• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /*
2  *  Copyright (c) 2016 The WebRTC project authors. All Rights Reserved.
3  *
4  *  Use of this source code is governed by a BSD-style license
5  *  that can be found in the LICENSE file in the root of the source
6  *  tree. An additional intellectual property rights grant can be found
7  *  in the file PATENTS.  All contributing project authors may
8  *  be found in the AUTHORS file in the root of the source tree.
9  */
10 
11 #include "audio/audio_transport_impl.h"
12 
13 #include <algorithm>
14 #include <memory>
15 #include <utility>
16 
17 #include "audio/remix_resample.h"
18 #include "audio/utility/audio_frame_operations.h"
19 #include "call/audio_sender.h"
20 #include "modules/async_audio_processing/async_audio_processing.h"
21 #include "modules/audio_processing/include/audio_frame_proxies.h"
22 #include "rtc_base/checks.h"
23 #include "rtc_base/trace_event.h"
24 
25 namespace webrtc {
26 
27 namespace {
28 
29 // We want to process at the lowest sample rate and channel count possible
30 // without losing information. Choose the lowest native rate at least equal to
31 // the minimum of input and codec rates, choose lowest channel count, and
32 // configure the audio frame.
InitializeCaptureFrame(int input_sample_rate,int send_sample_rate_hz,size_t input_num_channels,size_t send_num_channels,AudioFrame * audio_frame)33 void InitializeCaptureFrame(int input_sample_rate,
34                             int send_sample_rate_hz,
35                             size_t input_num_channels,
36                             size_t send_num_channels,
37                             AudioFrame* audio_frame) {
38   RTC_DCHECK(audio_frame);
39   int min_processing_rate_hz = std::min(input_sample_rate, send_sample_rate_hz);
40   for (int native_rate_hz : AudioProcessing::kNativeSampleRatesHz) {
41     audio_frame->sample_rate_hz_ = native_rate_hz;
42     if (audio_frame->sample_rate_hz_ >= min_processing_rate_hz) {
43       break;
44     }
45   }
46   audio_frame->num_channels_ = std::min(input_num_channels, send_num_channels);
47 }
48 
ProcessCaptureFrame(uint32_t delay_ms,bool key_pressed,bool swap_stereo_channels,AudioProcessing * audio_processing,AudioFrame * audio_frame)49 void ProcessCaptureFrame(uint32_t delay_ms,
50                          bool key_pressed,
51                          bool swap_stereo_channels,
52                          AudioProcessing* audio_processing,
53                          AudioFrame* audio_frame) {
54   RTC_DCHECK(audio_frame);
55   if (audio_processing) {
56     audio_processing->set_stream_delay_ms(delay_ms);
57     audio_processing->set_stream_key_pressed(key_pressed);
58     int error = ProcessAudioFrame(audio_processing, audio_frame);
59 
60     RTC_DCHECK_EQ(0, error) << "ProcessStream() error: " << error;
61   }
62 
63   if (swap_stereo_channels) {
64     AudioFrameOperations::SwapStereoChannels(audio_frame);
65   }
66 }
67 
68 // Resample audio in `frame` to given sample rate preserving the
69 // channel count and place the result in `destination`.
Resample(const AudioFrame & frame,const int destination_sample_rate,PushResampler<int16_t> * resampler,int16_t * destination)70 int Resample(const AudioFrame& frame,
71              const int destination_sample_rate,
72              PushResampler<int16_t>* resampler,
73              int16_t* destination) {
74   TRACE_EVENT2("webrtc", "Resample", "frame sample rate", frame.sample_rate_hz_,
75                "destination_sample_rate", destination_sample_rate);
76   const int number_of_channels = static_cast<int>(frame.num_channels_);
77   const int target_number_of_samples_per_channel =
78       destination_sample_rate / 100;
79   resampler->InitializeIfNeeded(frame.sample_rate_hz_, destination_sample_rate,
80                                 number_of_channels);
81 
82   // TODO(yujo): make resampler take an AudioFrame, and add special case
83   // handling of muted frames.
84   return resampler->Resample(
85       frame.data(), frame.samples_per_channel_ * number_of_channels,
86       destination, number_of_channels * target_number_of_samples_per_channel);
87 }
88 }  // namespace
89 
AudioTransportImpl(AudioMixer * mixer,AudioProcessing * audio_processing,AsyncAudioProcessing::Factory * async_audio_processing_factory)90 AudioTransportImpl::AudioTransportImpl(
91     AudioMixer* mixer,
92     AudioProcessing* audio_processing,
93     AsyncAudioProcessing::Factory* async_audio_processing_factory)
94     : audio_processing_(audio_processing),
95       async_audio_processing_(
96           async_audio_processing_factory
97               ? async_audio_processing_factory->CreateAsyncAudioProcessing(
98                     [this](std::unique_ptr<AudioFrame> frame) {
99                       this->SendProcessedData(std::move(frame));
100                     })
101               : nullptr),
102       mixer_(mixer) {
103   RTC_DCHECK(mixer);
104 }
105 
~AudioTransportImpl()106 AudioTransportImpl::~AudioTransportImpl() {}
107 
RecordedDataIsAvailable(const void * audio_data,const size_t number_of_frames,const size_t bytes_per_sample,const size_t number_of_channels,const uint32_t sample_rate,const uint32_t audio_delay_milliseconds,const int32_t clock_drift,const uint32_t volume,const bool key_pressed,uint32_t & new_mic_volume)108 int32_t AudioTransportImpl::RecordedDataIsAvailable(
109     const void* audio_data,
110     const size_t number_of_frames,
111     const size_t bytes_per_sample,
112     const size_t number_of_channels,
113     const uint32_t sample_rate,
114     const uint32_t audio_delay_milliseconds,
115     const int32_t clock_drift,
116     const uint32_t volume,
117     const bool key_pressed,
118     uint32_t& new_mic_volume) {  // NOLINT: to avoid changing APIs
119   return RecordedDataIsAvailable(
120       audio_data, number_of_frames, bytes_per_sample, number_of_channels,
121       sample_rate, audio_delay_milliseconds, clock_drift, volume, key_pressed,
122       new_mic_volume, /* estimated_capture_time_ns */ 0);
123 }
124 
125 // Not used in Chromium. Process captured audio and distribute to all sending
126 // streams, and try to do this at the lowest possible sample rate.
RecordedDataIsAvailable(const void * audio_data,const size_t number_of_frames,const size_t bytes_per_sample,const size_t number_of_channels,const uint32_t sample_rate,const uint32_t audio_delay_milliseconds,const int32_t,const uint32_t,const bool key_pressed,uint32_t &,const int64_t estimated_capture_time_ns)127 int32_t AudioTransportImpl::RecordedDataIsAvailable(
128     const void* audio_data,
129     const size_t number_of_frames,
130     const size_t bytes_per_sample,
131     const size_t number_of_channels,
132     const uint32_t sample_rate,
133     const uint32_t audio_delay_milliseconds,
134     const int32_t /*clock_drift*/,
135     const uint32_t /*volume*/,
136     const bool key_pressed,
137     uint32_t& /*new_mic_volume*/,
138     const int64_t
139         estimated_capture_time_ns) {  // NOLINT: to avoid changing APIs
140   RTC_DCHECK(audio_data);
141   RTC_DCHECK_GE(number_of_channels, 1);
142   RTC_DCHECK_LE(number_of_channels, 2);
143   RTC_DCHECK_EQ(2 * number_of_channels, bytes_per_sample);
144   RTC_DCHECK_GE(sample_rate, AudioProcessing::NativeRate::kSampleRate8kHz);
145   // 100 = 1 second / data duration (10 ms).
146   RTC_DCHECK_EQ(number_of_frames * 100, sample_rate);
147   RTC_DCHECK_LE(bytes_per_sample * number_of_frames * number_of_channels,
148                 AudioFrame::kMaxDataSizeBytes);
149 
150   int send_sample_rate_hz = 0;
151   size_t send_num_channels = 0;
152   bool swap_stereo_channels = false;
153   {
154     MutexLock lock(&capture_lock_);
155     send_sample_rate_hz = send_sample_rate_hz_;
156     send_num_channels = send_num_channels_;
157     swap_stereo_channels = swap_stereo_channels_;
158   }
159 
160   std::unique_ptr<AudioFrame> audio_frame(new AudioFrame());
161   InitializeCaptureFrame(sample_rate, send_sample_rate_hz, number_of_channels,
162                          send_num_channels, audio_frame.get());
163   voe::RemixAndResample(static_cast<const int16_t*>(audio_data),
164                         number_of_frames, number_of_channels, sample_rate,
165                         &capture_resampler_, audio_frame.get());
166   ProcessCaptureFrame(audio_delay_milliseconds, key_pressed,
167                       swap_stereo_channels, audio_processing_,
168                       audio_frame.get());
169   audio_frame->set_absolute_capture_timestamp_ms(estimated_capture_time_ns /
170                                                  1000000);
171 
172   RTC_DCHECK_GT(audio_frame->samples_per_channel_, 0);
173   if (async_audio_processing_)
174     async_audio_processing_->Process(std::move(audio_frame));
175   else
176     SendProcessedData(std::move(audio_frame));
177 
178   return 0;
179 }
180 
SendProcessedData(std::unique_ptr<AudioFrame> audio_frame)181 void AudioTransportImpl::SendProcessedData(
182     std::unique_ptr<AudioFrame> audio_frame) {
183   TRACE_EVENT0("webrtc", "AudioTransportImpl::SendProcessedData");
184   RTC_DCHECK_GT(audio_frame->samples_per_channel_, 0);
185   MutexLock lock(&capture_lock_);
186   if (audio_senders_.empty())
187     return;
188 
189   auto it = audio_senders_.begin();
190   while (++it != audio_senders_.end()) {
191     auto audio_frame_copy = std::make_unique<AudioFrame>();
192     audio_frame_copy->CopyFrom(*audio_frame);
193     (*it)->SendAudioData(std::move(audio_frame_copy));
194   }
195   // Send the original frame to the first stream w/o copying.
196   (*audio_senders_.begin())->SendAudioData(std::move(audio_frame));
197 }
198 
199 // Mix all received streams, feed the result to the AudioProcessing module, then
200 // resample the result to the requested output rate.
NeedMorePlayData(const size_t nSamples,const size_t nBytesPerSample,const size_t nChannels,const uint32_t samplesPerSec,void * audioSamples,size_t & nSamplesOut,int64_t * elapsed_time_ms,int64_t * ntp_time_ms)201 int32_t AudioTransportImpl::NeedMorePlayData(const size_t nSamples,
202                                              const size_t nBytesPerSample,
203                                              const size_t nChannels,
204                                              const uint32_t samplesPerSec,
205                                              void* audioSamples,
206                                              size_t& nSamplesOut,
207                                              int64_t* elapsed_time_ms,
208                                              int64_t* ntp_time_ms) {
209   TRACE_EVENT0("webrtc", "AudioTransportImpl::SendProcessedData");
210   RTC_DCHECK_EQ(sizeof(int16_t) * nChannels, nBytesPerSample);
211   RTC_DCHECK_GE(nChannels, 1);
212   RTC_DCHECK_LE(nChannels, 2);
213   RTC_DCHECK_GE(
214       samplesPerSec,
215       static_cast<uint32_t>(AudioProcessing::NativeRate::kSampleRate8kHz));
216 
217   // 100 = 1 second / data duration (10 ms).
218   RTC_DCHECK_EQ(nSamples * 100, samplesPerSec);
219   RTC_DCHECK_LE(nBytesPerSample * nSamples * nChannels,
220                 AudioFrame::kMaxDataSizeBytes);
221 
222   mixer_->Mix(nChannels, &mixed_frame_);
223   *elapsed_time_ms = mixed_frame_.elapsed_time_ms_;
224   *ntp_time_ms = mixed_frame_.ntp_time_ms_;
225 
226   if (audio_processing_) {
227     const auto error =
228         ProcessReverseAudioFrame(audio_processing_, &mixed_frame_);
229     RTC_DCHECK_EQ(error, AudioProcessing::kNoError);
230   }
231 
232   nSamplesOut = Resample(mixed_frame_, samplesPerSec, &render_resampler_,
233                          static_cast<int16_t*>(audioSamples));
234   RTC_DCHECK_EQ(nSamplesOut, nChannels * nSamples);
235   return 0;
236 }
237 
238 // Used by Chromium - same as NeedMorePlayData() but because Chrome has its
239 // own APM instance, does not call audio_processing_->ProcessReverseStream().
PullRenderData(int bits_per_sample,int sample_rate,size_t number_of_channels,size_t number_of_frames,void * audio_data,int64_t * elapsed_time_ms,int64_t * ntp_time_ms)240 void AudioTransportImpl::PullRenderData(int bits_per_sample,
241                                         int sample_rate,
242                                         size_t number_of_channels,
243                                         size_t number_of_frames,
244                                         void* audio_data,
245                                         int64_t* elapsed_time_ms,
246                                         int64_t* ntp_time_ms) {
247   TRACE_EVENT2("webrtc", "AudioTransportImpl::PullRenderData", "sample_rate",
248                sample_rate, "number_of_frames", number_of_frames);
249   RTC_DCHECK_EQ(bits_per_sample, 16);
250   RTC_DCHECK_GE(number_of_channels, 1);
251   RTC_DCHECK_GE(sample_rate, AudioProcessing::NativeRate::kSampleRate8kHz);
252 
253   // 100 = 1 second / data duration (10 ms).
254   RTC_DCHECK_EQ(number_of_frames * 100, sample_rate);
255 
256   // 8 = bits per byte.
257   RTC_DCHECK_LE(bits_per_sample / 8 * number_of_frames * number_of_channels,
258                 AudioFrame::kMaxDataSizeBytes);
259   mixer_->Mix(number_of_channels, &mixed_frame_);
260   *elapsed_time_ms = mixed_frame_.elapsed_time_ms_;
261   *ntp_time_ms = mixed_frame_.ntp_time_ms_;
262 
263   auto output_samples = Resample(mixed_frame_, sample_rate, &render_resampler_,
264                                  static_cast<int16_t*>(audio_data));
265   RTC_DCHECK_EQ(output_samples, number_of_channels * number_of_frames);
266 }
267 
UpdateAudioSenders(std::vector<AudioSender * > senders,int send_sample_rate_hz,size_t send_num_channels)268 void AudioTransportImpl::UpdateAudioSenders(std::vector<AudioSender*> senders,
269                                             int send_sample_rate_hz,
270                                             size_t send_num_channels) {
271   MutexLock lock(&capture_lock_);
272   audio_senders_ = std::move(senders);
273   send_sample_rate_hz_ = send_sample_rate_hz;
274   send_num_channels_ = send_num_channels;
275 }
276 
SetStereoChannelSwapping(bool enable)277 void AudioTransportImpl::SetStereoChannelSwapping(bool enable) {
278   MutexLock lock(&capture_lock_);
279   swap_stereo_channels_ = enable;
280 }
281 
282 }  // namespace webrtc
283