1 /*
2 * Copyright 2018 The Android Open Source Project
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13 * See the License for the specific language governing permissions and
14 * limitations under the License.
15 */
16
17 #include <memory>
18 #include <oboe/Definitions.h>
19 #include "FFMpegExtractor.h"
20 #include "utils/logging.h"
21
// Size of the scratch buffer handed to FFmpeg for I/O.
// 1152 is the MP3 block size, see https://wiki.hydrogenaud.io/index.php?title=MP3
constexpr int kInternalBufferSize{1152};
23
read(void * opaque,uint8_t * buf,int buf_size)24 int read(void *opaque, uint8_t *buf, int buf_size) {
25
26 auto asset = (AAsset *) opaque;
27 int bytesRead = AAsset_read(asset, buf, (size_t)buf_size);
28 return bytesRead;
29 }
30
seek(void * opaque,int64_t offset,int whence)31 int64_t seek(void *opaque, int64_t offset, int whence){
32
33 auto asset = (AAsset*)opaque;
34
35 // See https://www.ffmpeg.org/doxygen/3.0/avio_8h.html#a427ff2a881637b47ee7d7f9e368be63f
36 if (whence == AVSEEK_SIZE) return AAsset_getLength(asset);
37 if (AAsset_seek(asset, offset, whence) == -1){
38 return -1;
39 } else {
40 return 0;
41 }
42 }
43
createAVIOContext(AAsset * asset,uint8_t * buffer,uint32_t bufferSize,AVIOContext ** avioContext)44 bool FFMpegExtractor::createAVIOContext(AAsset *asset, uint8_t *buffer, uint32_t bufferSize,
45 AVIOContext **avioContext) {
46
47 constexpr int isBufferWriteable = 0;
48
49 *avioContext = avio_alloc_context(
50 buffer, // internal buffer for FFmpeg to use
51 bufferSize, // For optimal decoding speed this should be the protocol block size
52 isBufferWriteable,
53 asset, // Will be passed to our callback functions as a (void *)
54 read, // Read callback function
55 nullptr, // Write callback function (not used)
56 seek); // Seek callback function
57
58 if (*avioContext == nullptr){
59 LOGE("Failed to create AVIO context");
60 return false;
61 } else {
62 return true;
63 }
64 }
65
66 bool
createAVFormatContext(AVIOContext * avioContext,AVFormatContext ** avFormatContext)67 FFMpegExtractor::createAVFormatContext(AVIOContext *avioContext, AVFormatContext **avFormatContext) {
68
69 *avFormatContext = avformat_alloc_context();
70 (*avFormatContext)->pb = avioContext;
71
72 if (*avFormatContext == nullptr){
73 LOGE("Failed to create AVFormatContext");
74 return false;
75 } else {
76 return true;
77 }
78 }
79
openAVFormatContext(AVFormatContext * avFormatContext)80 bool FFMpegExtractor::openAVFormatContext(AVFormatContext *avFormatContext) {
81
82 int result = avformat_open_input(&avFormatContext,
83 "", /* URL is left empty because we're providing our own I/O */
84 nullptr /* AVInputFormat *fmt */,
85 nullptr /* AVDictionary **options */
86 );
87
88 if (result == 0) {
89 return true;
90 } else {
91 LOGE("Failed to open file. Error code %s", av_err2str(result));
92 return false;
93 }
94 }
95
getStreamInfo(AVFormatContext * avFormatContext)96 bool FFMpegExtractor::getStreamInfo(AVFormatContext *avFormatContext) {
97
98 int result = avformat_find_stream_info(avFormatContext, nullptr);
99 if (result == 0 ){
100 return true;
101 } else {
102 LOGE("Failed to find stream info. Error code %s", av_err2str(result));
103 return false;
104 }
105 }
106
getBestAudioStream(AVFormatContext * avFormatContext)107 AVStream *FFMpegExtractor::getBestAudioStream(AVFormatContext *avFormatContext) {
108
109 int streamIndex = av_find_best_stream(avFormatContext, AVMEDIA_TYPE_AUDIO, -1, -1, nullptr, 0);
110
111 if (streamIndex < 0){
112 LOGE("Could not find stream");
113 return nullptr;
114 } else {
115 return avFormatContext->streams[streamIndex];
116 }
117 }
118
decode(AAsset * asset,uint8_t * targetData,AudioProperties targetProperties)119 int64_t FFMpegExtractor::decode(
120 AAsset *asset,
121 uint8_t *targetData,
122 AudioProperties targetProperties) {
123
124 LOGI("Decoder: FFMpeg");
125
126 int returnValue = -1; // -1 indicates error
127
128 // Create a buffer for FFmpeg to use for decoding (freed in the custom deleter below)
129 auto buffer = reinterpret_cast<uint8_t*>(av_malloc(kInternalBufferSize));
130
131 // Create an AVIOContext with a custom deleter
132 std::unique_ptr<AVIOContext, void(*)(AVIOContext *)> ioContext {
133 nullptr,
134 [](AVIOContext *c) {
135 av_free(c->buffer);
136 avio_context_free(&c);
137 }
138 };
139 {
140 AVIOContext *tmp = nullptr;
141 if (!createAVIOContext(asset, buffer, kInternalBufferSize, &tmp)){
142 LOGE("Could not create an AVIOContext");
143 return returnValue;
144 }
145 ioContext.reset(tmp);
146 }
147
148 // Create an AVFormatContext using the avformat_free_context as the deleter function
149 std::unique_ptr<AVFormatContext, decltype(&avformat_free_context)> formatContext {
150 nullptr,
151 &avformat_free_context
152 };
153 {
154 AVFormatContext *tmp;
155 if (!createAVFormatContext(ioContext.get(), &tmp)) return returnValue;
156 formatContext.reset(tmp);
157 }
158
159 if (!openAVFormatContext(formatContext.get())) return returnValue;
160
161 if (!getStreamInfo(formatContext.get())) return returnValue;
162
163 // Obtain the best audio stream to decode
164 AVStream *stream = getBestAudioStream(formatContext.get());
165 if (stream == nullptr || stream->codecpar == nullptr){
166 LOGE("Could not find a suitable audio stream to decode");
167 return returnValue;
168 }
169
170 printCodecParameters(stream->codecpar);
171
172 // Find the codec to decode this stream
173 AVCodec *codec = avcodec_find_decoder(stream->codecpar->codec_id);
174 if (!codec){
175 LOGE("Could not find codec with ID: %d", stream->codecpar->codec_id);
176 return returnValue;
177 }
178
179 // Create the codec context, specifying the deleter function
180 std::unique_ptr<AVCodecContext, void(*)(AVCodecContext *)> codecContext {
181 nullptr,
182 [](AVCodecContext *c) { avcodec_free_context(&c); }
183 };
184 {
185 AVCodecContext *tmp = avcodec_alloc_context3(codec);
186 if (!tmp){
187 LOGE("Failed to allocate codec context");
188 return returnValue;
189 }
190 codecContext.reset(tmp);
191 }
192
193 // Copy the codec parameters into the context
194 if (avcodec_parameters_to_context(codecContext.get(), stream->codecpar) < 0){
195 LOGE("Failed to copy codec parameters to codec context");
196 return returnValue;
197 }
198
199 // Open the codec
200 if (avcodec_open2(codecContext.get(), codec, nullptr) < 0){
201 LOGE("Could not open codec");
202 return returnValue;
203 }
204
205 // prepare resampler
206 int32_t outChannelLayout = (1 << targetProperties.channelCount) - 1;
207 LOGD("Channel layout %d", outChannelLayout);
208
209 SwrContext *swr = swr_alloc();
210 av_opt_set_int(swr, "in_channel_count", stream->codecpar->channels, 0);
211 av_opt_set_int(swr, "out_channel_count", targetProperties.channelCount, 0);
212 av_opt_set_int(swr, "in_channel_layout", stream->codecpar->channel_layout, 0);
213 av_opt_set_int(swr, "out_channel_layout", outChannelLayout, 0);
214 av_opt_set_int(swr, "in_sample_rate", stream->codecpar->sample_rate, 0);
215 av_opt_set_int(swr, "out_sample_rate", targetProperties.sampleRate, 0);
216 av_opt_set_int(swr, "in_sample_fmt", stream->codecpar->format, 0);
217 av_opt_set_sample_fmt(swr, "out_sample_fmt", AV_SAMPLE_FMT_FLT, 0);
218 av_opt_set_int(swr, "force_resampling", 1, 0);
219
220 // Check that resampler has been inited
221 int result = swr_init(swr);
222 if (result != 0){
223 LOGE("swr_init failed. Error: %s", av_err2str(result));
224 return returnValue;
225 };
226 if (!swr_is_initialized(swr)) {
227 LOGE("swr_is_initialized is false\n");
228 return returnValue;
229 }
230
231 // Prepare to read data
232 int bytesWritten = 0;
233 AVPacket avPacket; // Stores compressed audio data
234 av_init_packet(&avPacket);
235 AVFrame *decodedFrame = av_frame_alloc(); // Stores raw audio data
236 int bytesPerSample = av_get_bytes_per_sample((AVSampleFormat)stream->codecpar->format);
237
238 LOGD("Bytes per sample %d", bytesPerSample);
239
240 LOGD("DECODE START");
241
242 // While there is more data to read, read it into the avPacket
243 while (av_read_frame(formatContext.get(), &avPacket) == 0){
244
245 if (avPacket.stream_index == stream->index && avPacket.size > 0) {
246
247 // Pass our compressed data into the codec
248 result = avcodec_send_packet(codecContext.get(), &avPacket);
249 if (result != 0) {
250 LOGE("avcodec_send_packet error: %s", av_err2str(result));
251 goto cleanup;
252 }
253
254 // Retrieve our raw data from the codec
255 result = avcodec_receive_frame(codecContext.get(), decodedFrame);
256 if (result == AVERROR(EAGAIN)) {
257 // The codec needs more data before it can decode
258 LOGI("avcodec_receive_frame returned EAGAIN");
259 av_packet_unref(&avPacket);
260 continue;
261 } else if (result != 0) {
262 LOGE("avcodec_receive_frame error: %s", av_err2str(result));
263 goto cleanup;
264 }
265
266 // DO RESAMPLING
267 auto dst_nb_samples = (int32_t) av_rescale_rnd(
268 swr_get_delay(swr, decodedFrame->sample_rate) + decodedFrame->nb_samples,
269 targetProperties.sampleRate,
270 decodedFrame->sample_rate,
271 AV_ROUND_UP);
272
273 short *buffer1;
274 av_samples_alloc(
275 (uint8_t **) &buffer1,
276 nullptr,
277 targetProperties.channelCount,
278 dst_nb_samples,
279 AV_SAMPLE_FMT_FLT,
280 0);
281 int frame_count = swr_convert(
282 swr,
283 (uint8_t **) &buffer1,
284 dst_nb_samples,
285 (const uint8_t **) decodedFrame->data,
286 decodedFrame->nb_samples);
287
288 int64_t bytesToWrite = frame_count * sizeof(float) * targetProperties.channelCount;
289 memcpy(targetData + bytesWritten, buffer1, (size_t)bytesToWrite);
290 bytesWritten += bytesToWrite;
291 av_freep(&buffer1);
292
293 av_packet_unref(&avPacket);
294 }
295 }
296
297 av_frame_free(&decodedFrame);
298 LOGD("DECODE END");
299
300 returnValue = bytesWritten;
301
302 cleanup:
303 return returnValue;
304 }
305
printCodecParameters(AVCodecParameters * params)306 void FFMpegExtractor::printCodecParameters(AVCodecParameters *params) {
307
308 LOGD("Stream properties");
309 LOGD("Channels: %d", params->channels);
310 LOGD("Channel layout: %" PRId64, params->channel_layout);
311 LOGD("Sample rate: %d", params->sample_rate);
312 LOGD("Format: %s", av_get_sample_fmt_name((AVSampleFormat)params->format));
313 LOGD("Frame size: %d", params->frame_size);
314 }
315
316
317
318
319