blob: 8232327cceb84f9aea4938d12034ee7845c45e8c [file] [log] [blame]
#!/usr/bin/env python2
# Copyright 2014 The Chromium OS Authors. All rights reserved.
# Use of this source code is governed by a BSD-style license that can be
# found in the LICENSE file.
"""This module provides abstraction of audio data."""
from __future__ import absolute_import
from __future__ import division
from __future__ import print_function
import contextlib
import copy
import numpy as np
import struct
from six.moves import range
import six
"""The dict containing information on how to parse sample from raw data.
Keys: The sample format as in aplay command.
Values: A dict containing:
message: Human-readable sample format.
dtype_str: Data type used in numpy dtype. Check
https://docs.scipy.org/doc/numpy/reference/arrays.dtypes.html
for supported data type.
size_bytes: Number of bytes for one sample.
"""
SAMPLE_FORMATS = dict(
S32_LE=dict(
message='Signed 32-bit integer, little-endian',
dtype_str='<i',
size_bytes=4),
S16_LE=dict(
message='Signed 16-bit integer, little-endian',
dtype_str='<i',
size_bytes=2))
def get_maximum_value_from_sample_format(sample_format):
"""Gets the maximum value from sample format.
@param sample_format: A key in SAMPLE_FORMAT.
@returns: The maximum value the sample can hold + 1.
"""
size_bits = SAMPLE_FORMATS[sample_format]['size_bytes'] * 8
return 1 << (size_bits - 1)
class AudioRawDataError(Exception):
"""Error in AudioRawData."""
pass
class AudioRawData(object):
"""The abstraction of audio raw data.
@property channel: The number of channels.
@property channel_data: A list of lists containing samples in each channel.
E.g., The third sample in the second channel is
channel_data[1][2].
@property sample_format: The sample format which should be one of the keys
in audio_data.SAMPLE_FORMATS.
"""
def __init__(self, binary, channel, sample_format):
"""Initializes an AudioRawData.
@param binary: A string containing binary data. If binary is not None,
The samples in binary will be parsed and be filled into
channel_data.
@param channel: The number of channels.
@param sample_format: One of the keys in audio_data.SAMPLE_FORMATS.
"""
self.channel = channel
self.channel_data = [[] for _ in range(self.channel)]
self.sample_format = sample_format
if binary:
self.read_binary(binary)
def read_binary(self, binary):
"""Reads samples from binary and fills channel_data.
Reads samples of fixed width from binary string into a numpy array
and shapes them into each channel.
@param binary: A string containing binary data.
"""
sample_format_dict = SAMPLE_FORMATS[self.sample_format]
# The data type used in numpy fromstring function. For example,
# <i4 for 32-bit signed int.
np_dtype = '%s%d' % (sample_format_dict['dtype_str'],
sample_format_dict['size_bytes'])
# Reads data from a string into 1-D array.
np_array = np.fromstring(binary, dtype=np_dtype)
n_frames = len(np_array) // self.channel
# Reshape np_array into an array of shape (n_frames, channel).
np_array = np_array.reshape(n_frames, self.channel)
# Transpose np_arrya so it becomes of shape (channel, n_frames).
self.channel_data = np_array.transpose()