• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1#!/usr/bin/env python3
2# Copyright 2014 The Chromium OS Authors. All rights reserved.
3# Use of this source code is governed by a BSD-style license that can be
4# found in the LICENSE file.
5
6"""This module provides abstraction of audio data."""
7
8from __future__ import absolute_import
9from __future__ import division
10from __future__ import print_function
11import contextlib
12import copy
13import numpy as np
14import struct
15from six.moves import range
16import six
17
18
19"""The dict containing information on how to parse sample from raw data.
20
21Keys: The sample format as in aplay command.
22Values: A dict containing:
23    message: Human-readable sample format.
24    dtype_str: Data type used in numpy dtype.  Check
25               https://docs.scipy.org/doc/numpy/reference/arrays.dtypes.html
26               for supported data type.
27    size_bytes: Number of bytes for one sample.
28"""
# Note: dtype_str holds only the byte order and kind characters; the item
# size is taken from size_bytes when the numpy dtype string is assembled.
SAMPLE_FORMATS = {
        'S32_LE': {
                'message': 'Signed 32-bit integer, little-endian',
                'dtype_str': '<i',
                'size_bytes': 4,
        },
        'S16_LE': {
                'message': 'Signed 16-bit integer, little-endian',
                'dtype_str': '<i',
                'size_bytes': 2,
        },
}
38
39
def get_maximum_value_from_sample_format(sample_format):
    """Computes the exclusive upper bound of a signed sample's value range.

    For a sample that is N bits wide the result is 2^(N-1), i.e. one more
    than the largest value a signed N-bit sample can hold.

    @param sample_format: A key in SAMPLE_FORMATS.

    @returns: The maximum value the sample can hold + 1.

    """
    bytes_per_sample = SAMPLE_FORMATS[sample_format]['size_bytes']
    # One bit is reserved for the sign, hence the "- 1".
    magnitude_bits = 8 * bytes_per_sample - 1
    return 1 << magnitude_bits
50
51
class AudioRawDataError(Exception):
    """Exception type for errors related to AudioRawData."""
55
56
57class AudioRawData(object):
58    """The abstraction of audio raw data.
59
60    @property channel: The number of channels.
61    @property channel_data: A list of lists containing samples in each channel.
62                            E.g., The third sample in the second channel is
63                            channel_data[1][2].
64    @property sample_format: The sample format which should be one of the keys
65                             in audio_data.SAMPLE_FORMATS.
66    """
67    def __init__(self, binary, channel, sample_format):
68        """Initializes an AudioRawData.
69
70        @param binary: A string containing binary data. If binary is not None,
71                       The samples in binary will be parsed and be filled into
72                       channel_data.
73        @param channel: The number of channels.
74        @param sample_format: One of the keys in audio_data.SAMPLE_FORMATS.
75        """
76        self.channel = channel
77        self.channel_data = [[] for _ in range(self.channel)]
78        self.sample_format = sample_format
79        if binary:
80            self.read_binary(binary)
81
82
83    def read_binary(self, binary):
84        """Reads samples from binary and fills channel_data.
85
86        Reads samples of fixed width from binary string into a numpy array
87        and shapes them into each channel.
88
89        @param binary: A string containing binary data.
90        """
91        sample_format_dict = SAMPLE_FORMATS[self.sample_format]
92
93        # The data type used in numpy fromstring function. For example,
94        # <i4 for 32-bit signed int.
95        np_dtype = '%s%d' % (sample_format_dict['dtype_str'],
96                             sample_format_dict['size_bytes'])
97
98        # Reads data from a string into 1-D array.
99        np_array = np.fromstring(binary, dtype=np_dtype)
100        n_frames = len(np_array) // self.channel
101        # Reshape np_array into an array of shape (n_frames, channel).
102        np_array = np_array.reshape(n_frames, self.channel)
103        # Transpose np_arrya so it becomes of shape (channel, n_frames).
104        self.channel_data = np_array.transpose()
105