1 /* Copyright (c) 2012 The Chromium OS Authors. All rights reserved.
2 * Use of this source code is governed by a BSD-style license that can be
3 * found in the LICENSE file.
4 */
5
6 /* For now just use speex, can add more resamplers later. */
7 #include <speex/speex_resampler.h>
8 #include <sys/param.h>
9 #include <syslog.h>
10 #include <endian.h>
11 #include <limits.h>
12 #include <math.h>
13
14 #include "cras_fmt_conv.h"
15 #include "cras_fmt_conv_ops.h"
16 #include "cras_audio_format.h"
17 #include "cras_util.h"
18 #include "linear_resampler.h"
19
20 /* The quality level is a value between 0 and 10. This is a tradeoff between
21 * performance, latency, and quality. */
22 #define SPEEX_QUALITY_LEVEL 4
23 /* Max number of converters, src, down/up mix, 2xformat, and linear resample. */
24 #define MAX_NUM_CONVERTERS 5
25 /* Channel index for stereo. */
26 #define STEREO_L 0
27 #define STEREO_R 1
28
29 typedef void (*sample_format_converter_t)(const uint8_t *in, size_t in_samples,
30 uint8_t *out);
31 typedef size_t (*channel_converter_t)(struct cras_fmt_conv *conv,
32 const uint8_t *in, size_t in_frames,
33 uint8_t *out);
34
35 /* Member data for the resampler. */
36 struct cras_fmt_conv {
37 SpeexResamplerState *speex_state;
38 channel_converter_t channel_converter;
39 float **ch_conv_mtx; /* Coefficient matrix for mixing channels. */
40 sample_format_converter_t in_format_converter;
41 sample_format_converter_t out_format_converter;
42 struct linear_resampler *resampler;
43 struct cras_audio_format in_fmt;
44 struct cras_audio_format out_fmt;
45 uint8_t *tmp_bufs[MAX_NUM_CONVERTERS - 1];
46 size_t tmp_buf_frames;
47 size_t pre_linear_resample;
48 size_t num_converters; /* Incremented once for SRC, channel, format. */
49 };
50
is_channel_layout_equal(const struct cras_audio_format * a,const struct cras_audio_format * b)51 static int is_channel_layout_equal(const struct cras_audio_format *a,
52 const struct cras_audio_format *b)
53 {
54 int ch;
55 for (ch = 0; ch < CRAS_CH_MAX; ch++)
56 if (a->channel_layout[ch] != b->channel_layout[ch])
57 return 0;
58
59 return 1;
60 }
61
62 /*
63 * Calculates the normalize_factor abs_sum(ci) from given coefficients.
64 * Since sum(ci / abs_sum(ci)) <= 1, this could prevent sample overflow while
65 * upmixing or downmixing.
66 */
normalize_factor(float * buf,size_t n)67 static float normalize_factor(float *buf, size_t n)
68 {
69 int i;
70 float abs_sum = 0.0;
71 for (i = 0; i < n; i++)
72 abs_sum += fabs(buf[i]);
73
74 return 1.0 / abs_sum;
75 }
76
77 /*
78 * Normalize all channels with the same factor to maintain
79 * the energy ratio between original channels.
80 */
normalize(float ** mtx,size_t m,size_t n,float factor)81 static void normalize(float **mtx, size_t m, size_t n, float factor)
82 {
83 int i, j;
84 for (i = 0; i < m; i++)
85 for (j = 0; j < n; j++)
86 mtx[i][j] *= factor;
87 }
88
89 /*
90 * Populates the down mix matrix by rules:
91 * 1. Front/side left(right) channel will mix to left(right) of
92 * full scale.
93 * 2. Center and LFE will be split equally to left and right.
94 * Rear
95 * 3. Rear left/right will split 1/4 of the power to opposite
96 * channel.
97 */
surround51_to_stereo_downmix_mtx(float ** mtx,int8_t layout[CRAS_CH_MAX])98 static void surround51_to_stereo_downmix_mtx(float **mtx,
99 int8_t layout[CRAS_CH_MAX])
100 {
101 if (layout[CRAS_CH_FC] != -1) {
102 mtx[STEREO_L][layout[CRAS_CH_FC]] = 0.707;
103 mtx[STEREO_R][layout[CRAS_CH_FC]] = 0.707;
104 }
105 if (layout[CRAS_CH_FL] != -1 && layout[CRAS_CH_FR] != -1) {
106 mtx[STEREO_L][layout[CRAS_CH_FL]] = 1.0;
107 mtx[STEREO_R][layout[CRAS_CH_FR]] = 1.0;
108 }
109 if (layout[CRAS_CH_SL] != -1 && layout[CRAS_CH_SR] != -1) {
110 mtx[STEREO_L][layout[CRAS_CH_SL]] = 1.0;
111 mtx[STEREO_R][layout[CRAS_CH_SR]] = 1.0;
112 }
113 if (layout[CRAS_CH_RL] != -1 && layout[CRAS_CH_RR] != -1) {
114 /* Split 1/4 power to the other side */
115 mtx[STEREO_L][layout[CRAS_CH_RL]] = 0.866;
116 mtx[STEREO_R][layout[CRAS_CH_RL]] = 0.5;
117 mtx[STEREO_R][layout[CRAS_CH_RR]] = 0.866;
118 mtx[STEREO_L][layout[CRAS_CH_RR]] = 0.5;
119 }
120 if (layout[CRAS_CH_LFE] != -1) {
121 mtx[STEREO_L][layout[CRAS_CH_LFE]] = 0.707;
122 mtx[STEREO_R][layout[CRAS_CH_LFE]] = 0.707;
123 }
124 normalize(mtx, 2, 6, normalize_factor(mtx[STEREO_L], 6));
125 }
126
127 /* Populates the down mix matrix by rules:
128 * 1. Front left(right) channel will mix to the front left(right) of
129 * full scale.
130 * 2. Rear and side left(right) channel will mix to the rear left(right) of
131 * full scale.
132 * 3. Center will be split equally to the front left and right.
133 * 4. LFE will be split equally to the other channels.
134 */
surround51_to_quad_downmix_mtx(float ** mtx,int8_t layout[CRAS_CH_MAX])135 static void surround51_to_quad_downmix_mtx(float **mtx,
136 int8_t layout[CRAS_CH_MAX])
137 {
138 if (layout[CRAS_CH_FL] != -1 && layout[CRAS_CH_FR] != -1) {
139 mtx[CRAS_CH_FL][layout[CRAS_CH_FL]] = 1.0;
140 mtx[CRAS_CH_FR][layout[CRAS_CH_FR]] = 1.0;
141 }
142 if (layout[CRAS_CH_RL] != -1 && layout[CRAS_CH_RR] != -1) {
143 mtx[CRAS_CH_RL][layout[CRAS_CH_RL]] = 1.0;
144 mtx[CRAS_CH_RR][layout[CRAS_CH_RR]] = 1.0;
145 }
146 if (layout[CRAS_CH_SL] != -1 && layout[CRAS_CH_SR] != -1) {
147 mtx[CRAS_CH_RL][layout[CRAS_CH_SL]] = 1.0;
148 mtx[CRAS_CH_RR][layout[CRAS_CH_SR]] = 1.0;
149 }
150 if (layout[CRAS_CH_FC] != -1) {
151 /* Split 1/2 power to the front L/R */
152 mtx[CRAS_CH_FL][layout[CRAS_CH_FC]] = 0.707;
153 mtx[CRAS_CH_FR][layout[CRAS_CH_FC]] = 0.707;
154 }
155 if (layout[CRAS_CH_LFE] != -1) {
156 /* Split 1/4 power to the other channel */
157 mtx[CRAS_CH_FL][layout[CRAS_CH_LFE]] = 0.5;
158 mtx[CRAS_CH_FR][layout[CRAS_CH_LFE]] = 0.5;
159 mtx[CRAS_CH_RL][layout[CRAS_CH_LFE]] = 0.5;
160 mtx[CRAS_CH_RR][layout[CRAS_CH_LFE]] = 0.5;
161 }
162
163 normalize(mtx, 4, 6, normalize_factor(mtx[CRAS_CH_FL], 6));
164 }
165
is_supported_format(const struct cras_audio_format * fmt)166 static int is_supported_format(const struct cras_audio_format *fmt)
167 {
168 if (!fmt)
169 return 0;
170
171 switch (fmt->format) {
172 case SND_PCM_FORMAT_U8:
173 case SND_PCM_FORMAT_S16_LE:
174 case SND_PCM_FORMAT_S24_3LE:
175 case SND_PCM_FORMAT_S24_LE:
176 case SND_PCM_FORMAT_S32_LE:
177 return 1;
178 default:
179 return 0;
180 }
181 }
182
mono_to_stereo(struct cras_fmt_conv * conv,const uint8_t * in,size_t in_frames,uint8_t * out)183 static size_t mono_to_stereo(struct cras_fmt_conv *conv, const uint8_t *in,
184 size_t in_frames, uint8_t *out)
185 {
186 return s16_mono_to_stereo(in, in_frames, out);
187 }
188
stereo_to_mono(struct cras_fmt_conv * conv,const uint8_t * in,size_t in_frames,uint8_t * out)189 static size_t stereo_to_mono(struct cras_fmt_conv *conv, const uint8_t *in,
190 size_t in_frames, uint8_t *out)
191 {
192 return s16_stereo_to_mono(in, in_frames, out);
193 }
194
mono_to_51(struct cras_fmt_conv * conv,const uint8_t * in,size_t in_frames,uint8_t * out)195 static size_t mono_to_51(struct cras_fmt_conv *conv, const uint8_t *in,
196 size_t in_frames, uint8_t *out)
197 {
198 size_t left, right, center;
199
200 left = conv->out_fmt.channel_layout[CRAS_CH_FL];
201 right = conv->out_fmt.channel_layout[CRAS_CH_FR];
202 center = conv->out_fmt.channel_layout[CRAS_CH_FC];
203
204 return s16_mono_to_51(left, right, center, in, in_frames, out);
205 }
206
stereo_to_51(struct cras_fmt_conv * conv,const uint8_t * in,size_t in_frames,uint8_t * out)207 static size_t stereo_to_51(struct cras_fmt_conv *conv, const uint8_t *in,
208 size_t in_frames, uint8_t *out)
209 {
210 size_t left, right, center;
211
212 left = conv->out_fmt.channel_layout[CRAS_CH_FL];
213 right = conv->out_fmt.channel_layout[CRAS_CH_FR];
214 center = conv->out_fmt.channel_layout[CRAS_CH_FC];
215
216 return s16_stereo_to_51(left, right, center, in, in_frames, out);
217 }
218
quad_to_51(struct cras_fmt_conv * conv,const uint8_t * in,size_t in_frames,uint8_t * out)219 static size_t quad_to_51(struct cras_fmt_conv *conv, const uint8_t *in,
220 size_t in_frames, uint8_t *out)
221 {
222 size_t fl, fr, rl, rr;
223
224 fl = conv->out_fmt.channel_layout[CRAS_CH_FL];
225 fr = conv->out_fmt.channel_layout[CRAS_CH_FR];
226 rl = conv->out_fmt.channel_layout[CRAS_CH_RL];
227 rr = conv->out_fmt.channel_layout[CRAS_CH_RR];
228
229 return s16_quad_to_51(fl, fr, rl, rr, in, in_frames, out);
230 }
231
_51_to_stereo(struct cras_fmt_conv * conv,const uint8_t * in,size_t in_frames,uint8_t * out)232 static size_t _51_to_stereo(struct cras_fmt_conv *conv, const uint8_t *in,
233 size_t in_frames, uint8_t *out)
234 {
235 return s16_51_to_stereo(in, in_frames, out);
236 }
237
_51_to_quad(struct cras_fmt_conv * conv,const uint8_t * in,size_t in_frames,uint8_t * out)238 static size_t _51_to_quad(struct cras_fmt_conv *conv, const uint8_t *in,
239 size_t in_frames, uint8_t *out)
240 {
241 return s16_51_to_quad(in, in_frames, out);
242 }
243
stereo_to_quad(struct cras_fmt_conv * conv,const uint8_t * in,size_t in_frames,uint8_t * out)244 static size_t stereo_to_quad(struct cras_fmt_conv *conv, const uint8_t *in,
245 size_t in_frames, uint8_t *out)
246 {
247 size_t front_left, front_right, rear_left, rear_right;
248
249 front_left = conv->out_fmt.channel_layout[CRAS_CH_FL];
250 front_right = conv->out_fmt.channel_layout[CRAS_CH_FR];
251 rear_left = conv->out_fmt.channel_layout[CRAS_CH_RL];
252 rear_right = conv->out_fmt.channel_layout[CRAS_CH_RR];
253
254 return s16_stereo_to_quad(front_left, front_right, rear_left,
255 rear_right, in, in_frames, out);
256 }
257
quad_to_stereo(struct cras_fmt_conv * conv,const uint8_t * in,size_t in_frames,uint8_t * out)258 static size_t quad_to_stereo(struct cras_fmt_conv *conv, const uint8_t *in,
259 size_t in_frames, uint8_t *out)
260 {
261 size_t front_left, front_right, rear_left, rear_right;
262
263 front_left = conv->in_fmt.channel_layout[CRAS_CH_FL];
264 front_right = conv->in_fmt.channel_layout[CRAS_CH_FR];
265 rear_left = conv->in_fmt.channel_layout[CRAS_CH_RL];
266 rear_right = conv->in_fmt.channel_layout[CRAS_CH_RR];
267
268 return s16_quad_to_stereo(front_left, front_right, rear_left,
269 rear_right, in, in_frames, out);
270 }
271
default_all_to_all(struct cras_fmt_conv * conv,const uint8_t * in,size_t in_frames,uint8_t * out)272 static size_t default_all_to_all(struct cras_fmt_conv *conv, const uint8_t *in,
273 size_t in_frames, uint8_t *out)
274 {
275 size_t num_in_ch, num_out_ch;
276
277 num_in_ch = conv->in_fmt.num_channels;
278 num_out_ch = conv->out_fmt.num_channels;
279
280 return s16_default_all_to_all(&conv->out_fmt, num_in_ch, num_out_ch, in,
281 in_frames, out);
282 }
283
284 // Fill min(in channels, out_channels), leave the rest 0s.
default_some_to_some(struct cras_fmt_conv * conv,const uint8_t * in,size_t in_frames,uint8_t * out)285 static size_t default_some_to_some(struct cras_fmt_conv *conv,
286 const uint8_t *in,
287 size_t in_frames,
288 uint8_t *out)
289 {
290 size_t num_in_ch, num_out_ch;
291
292 num_in_ch = conv->in_fmt.num_channels;
293 num_out_ch = conv->out_fmt.num_channels;
294
295 return s16_some_to_some(&conv->out_fmt, num_in_ch, num_out_ch, in,
296 in_frames, out);
297 }
298
convert_channels(struct cras_fmt_conv * conv,const uint8_t * in,size_t in_frames,uint8_t * out)299 static size_t convert_channels(struct cras_fmt_conv *conv, const uint8_t *in,
300 size_t in_frames, uint8_t *out)
301 {
302 float **ch_conv_mtx;
303 size_t num_in_ch, num_out_ch;
304
305 ch_conv_mtx = conv->ch_conv_mtx;
306 num_in_ch = conv->in_fmt.num_channels;
307 num_out_ch = conv->out_fmt.num_channels;
308
309 return s16_convert_channels(ch_conv_mtx, num_in_ch, num_out_ch, in,
310 in_frames, out);
311 }
312
313 /*
314 * Exported interface
315 */
316
cras_fmt_conv_create(const struct cras_audio_format * in,const struct cras_audio_format * out,size_t max_frames,size_t pre_linear_resample)317 struct cras_fmt_conv *cras_fmt_conv_create(const struct cras_audio_format *in,
318 const struct cras_audio_format *out,
319 size_t max_frames,
320 size_t pre_linear_resample)
321 {
322 struct cras_fmt_conv *conv;
323 int rc;
324 unsigned i;
325
326 conv = calloc(1, sizeof(*conv));
327 if (conv == NULL)
328 return NULL;
329 conv->in_fmt = *in;
330 conv->out_fmt = *out;
331 conv->tmp_buf_frames = max_frames;
332 conv->pre_linear_resample = pre_linear_resample;
333
334 if (!is_supported_format(in)) {
335 syslog(LOG_ERR, "Invalid input format %d", in->format);
336 cras_fmt_conv_destroy(&conv);
337 return NULL;
338 }
339
340 if (!is_supported_format(out)) {
341 syslog(LOG_ERR, "Invalid output format %d", out->format);
342 cras_fmt_conv_destroy(&conv);
343 return NULL;
344 }
345
346 /* Set up sample format conversion. */
347 /* TODO(dgreid) - modify channel and sample rate conversion so
348 * converting to s16 isnt necessary. */
349 if (in->format != SND_PCM_FORMAT_S16_LE) {
350 conv->num_converters++;
351 syslog(LOG_DEBUG, "Convert from format %d to %d.", in->format,
352 out->format);
353 switch (in->format) {
354 case SND_PCM_FORMAT_U8:
355 conv->in_format_converter = convert_u8_to_s16le;
356 break;
357 case SND_PCM_FORMAT_S24_LE:
358 conv->in_format_converter = convert_s24le_to_s16le;
359 break;
360 case SND_PCM_FORMAT_S32_LE:
361 conv->in_format_converter = convert_s32le_to_s16le;
362 break;
363 case SND_PCM_FORMAT_S24_3LE:
364 conv->in_format_converter = convert_s243le_to_s16le;
365 break;
366 default:
367 syslog(LOG_ERR, "Should never reachable");
368 break;
369 }
370 }
371 if (out->format != SND_PCM_FORMAT_S16_LE) {
372 conv->num_converters++;
373 syslog(LOG_DEBUG, "Convert from format %d to %d.", in->format,
374 out->format);
375 switch (out->format) {
376 case SND_PCM_FORMAT_U8:
377 conv->out_format_converter = convert_s16le_to_u8;
378 break;
379 case SND_PCM_FORMAT_S24_LE:
380 conv->out_format_converter = convert_s16le_to_s24le;
381 break;
382 case SND_PCM_FORMAT_S32_LE:
383 conv->out_format_converter = convert_s16le_to_s32le;
384 break;
385 case SND_PCM_FORMAT_S24_3LE:
386 conv->out_format_converter = convert_s16le_to_s243le;
387 break;
388 default:
389 syslog(LOG_ERR, "Should never reachable");
390 break;
391 }
392 }
393
394 /* Set up channel number conversion. */
395 if (in->num_channels != out->num_channels) {
396 conv->num_converters++;
397 syslog(LOG_DEBUG, "Convert from %zu to %zu channels.",
398 in->num_channels, out->num_channels);
399
400 /* Populate the conversion matrix base on in/out channel count
401 * and layout. */
402 if (in->num_channels == 1 && out->num_channels == 2) {
403 conv->channel_converter = mono_to_stereo;
404 } else if (in->num_channels == 1 && out->num_channels == 6) {
405 conv->channel_converter = mono_to_51;
406 } else if (in->num_channels == 2 && out->num_channels == 1) {
407 conv->channel_converter = stereo_to_mono;
408 } else if (in->num_channels == 2 && out->num_channels == 4) {
409 conv->channel_converter = stereo_to_quad;
410 } else if (in->num_channels == 4 && out->num_channels == 2) {
411 conv->channel_converter = quad_to_stereo;
412 } else if (in->num_channels == 2 && out->num_channels == 6) {
413 conv->channel_converter = stereo_to_51;
414 } else if (in->num_channels == 4 && out->num_channels == 6) {
415 conv->channel_converter = quad_to_51;
416 } else if (in->num_channels == 6 &&
417 (out->num_channels == 2 || out->num_channels == 4)) {
418 int in_channel_layout_set = 0;
419
420 /* Checks if channel_layout is set in the incoming format */
421 for (i = 0; i < CRAS_CH_MAX; i++)
422 if (in->channel_layout[i] != -1)
423 in_channel_layout_set = 1;
424
425 /* Use the conversion matrix based converter when a
426 * channel layout is set, or default to use existing
427 * converter to downmix to stereo */
428 if (in_channel_layout_set) {
429 conv->ch_conv_mtx =
430 cras_channel_conv_matrix_alloc(
431 in->num_channels,
432 out->num_channels);
433 if (conv->ch_conv_mtx == NULL) {
434 cras_fmt_conv_destroy(&conv);
435 return NULL;
436 }
437 conv->channel_converter = convert_channels;
438 if (out->num_channels == 4) {
439 surround51_to_quad_downmix_mtx(
440 conv->ch_conv_mtx,
441 conv->in_fmt.channel_layout);
442 } else {
443 surround51_to_stereo_downmix_mtx(
444 conv->ch_conv_mtx,
445 conv->in_fmt.channel_layout);
446 }
447 } else {
448 if (out->num_channels == 4)
449 conv->channel_converter = _51_to_quad;
450 else
451 conv->channel_converter = _51_to_stereo;
452 }
453 } else if (in->num_channels <= 8 && out->num_channels <= 8) {
454 // For average channel counts mix from all to all.
455 syslog(LOG_WARNING,
456 "Using all_to_all map for %zu to %zu",
457 in->num_channels, out->num_channels);
458 conv->channel_converter = default_all_to_all;
459 } else {
460 syslog(LOG_WARNING,
461 "Using some_to_some channel map for %zu to %zu",
462 in->num_channels, out->num_channels);
463 conv->channel_converter = default_some_to_some;
464 }
465 } else if (in->num_channels > 2 && !is_channel_layout_equal(in, out)) {
466 conv->num_converters++;
467 conv->ch_conv_mtx = cras_channel_conv_matrix_create(in, out);
468 if (conv->ch_conv_mtx == NULL) {
469 syslog(LOG_ERR,
470 "Failed to create channel conversion matrix."
471 "Fallback to default_all_to_all.");
472 conv->channel_converter = default_all_to_all;
473 } else {
474 conv->channel_converter = convert_channels;
475 }
476 }
477 /* Set up sample rate conversion. */
478 if (in->frame_rate != out->frame_rate) {
479 conv->num_converters++;
480 syslog(LOG_DEBUG, "Convert from %zu to %zu Hz.", in->frame_rate,
481 out->frame_rate);
482 conv->speex_state =
483 speex_resampler_init(out->num_channels, in->frame_rate,
484 out->frame_rate,
485 SPEEX_QUALITY_LEVEL, &rc);
486 if (conv->speex_state == NULL) {
487 syslog(LOG_ERR, "Fail to create speex:%zu %zu %zu %d",
488 out->num_channels, in->frame_rate,
489 out->frame_rate, rc);
490 cras_fmt_conv_destroy(&conv);
491 return NULL;
492 }
493 }
494
495 /*
496 * Set up linear resampler.
497 *
498 * Note: intended to give both src_rate and dst_rate the same value
499 * (i.e. out->frame_rate). They will be updated in runtime in
500 * update_estimated_rate() when the audio thread wants to adjust the
501 * rate for inaccurate device consumption rate.
502 */
503 conv->num_converters++;
504 conv->resampler =
505 linear_resampler_create(out->num_channels,
506 cras_get_format_bytes(out),
507 out->frame_rate, out->frame_rate);
508 if (conv->resampler == NULL) {
509 syslog(LOG_ERR, "Fail to create linear resampler");
510 cras_fmt_conv_destroy(&conv);
511 return NULL;
512 }
513
514 /* Need num_converters-1 temp buffers, the final converter renders
515 * directly into the output. */
516 for (i = 0; i < conv->num_converters - 1; i++) {
517 conv->tmp_bufs[i] = malloc(
518 max_frames * 4 * /* width in bytes largest format. */
519 MAX(in->num_channels, out->num_channels));
520 if (conv->tmp_bufs[i] == NULL) {
521 cras_fmt_conv_destroy(&conv);
522 return NULL;
523 }
524 }
525
526 assert(conv->num_converters <= MAX_NUM_CONVERTERS);
527
528 return conv;
529 }
530
cras_fmt_conv_destroy(struct cras_fmt_conv ** convp)531 void cras_fmt_conv_destroy(struct cras_fmt_conv **convp)
532 {
533 unsigned i;
534 struct cras_fmt_conv *conv = *convp;
535
536 if (conv->ch_conv_mtx)
537 cras_channel_conv_matrix_destroy(conv->ch_conv_mtx,
538 conv->out_fmt.num_channels);
539 if (conv->speex_state)
540 speex_resampler_destroy(conv->speex_state);
541 if (conv->resampler)
542 linear_resampler_destroy(conv->resampler);
543 for (i = 0; i < MAX_NUM_CONVERTERS - 1; i++)
544 free(conv->tmp_bufs[i]);
545 free(conv);
546 *convp = NULL;
547 }
548
cras_channel_remix_conv_create(unsigned int num_channels,const float * coefficient)549 struct cras_fmt_conv *cras_channel_remix_conv_create(unsigned int num_channels,
550 const float *coefficient)
551 {
552 struct cras_fmt_conv *conv;
553 unsigned out_ch, in_ch;
554
555 conv = calloc(1, sizeof(*conv));
556 if (conv == NULL)
557 return NULL;
558 conv->in_fmt.num_channels = num_channels;
559 conv->out_fmt.num_channels = num_channels;
560
561 conv->ch_conv_mtx =
562 cras_channel_conv_matrix_alloc(num_channels, num_channels);
563 /* Convert the coeffiencnt array to conversion matrix. */
564 for (out_ch = 0; out_ch < num_channels; out_ch++)
565 for (in_ch = 0; in_ch < num_channels; in_ch++)
566 conv->ch_conv_mtx[out_ch][in_ch] =
567 coefficient[in_ch + out_ch * num_channels];
568
569 conv->num_converters = 1;
570 conv->tmp_bufs[0] = malloc(4 * /* width in bytes largest format. */
571 num_channels);
572 return conv;
573 }
574
cras_channel_remix_convert(struct cras_fmt_conv * conv,const struct cras_audio_format * fmt,uint8_t * in_buf,size_t nframes)575 void cras_channel_remix_convert(struct cras_fmt_conv *conv,
576 const struct cras_audio_format *fmt,
577 uint8_t *in_buf, size_t nframes)
578 {
579 unsigned ch, fr;
580 int16_t *tmp = (int16_t *)conv->tmp_bufs[0];
581 int16_t *buf = (int16_t *)in_buf;
582
583 /*
584 * Skip remix for non S16_LE format.
585 * TODO(tzungbi): support 24 bits remix convert.
586 */
587 if (fmt->format != SND_PCM_FORMAT_S16_LE)
588 return;
589
590 /* Do remix only when input buffer has the same number of channels. */
591 if (fmt->num_channels != conv->in_fmt.num_channels)
592 return;
593
594 for (fr = 0; fr < nframes; fr++) {
595 for (ch = 0; ch < conv->in_fmt.num_channels; ch++)
596 tmp[ch] = s16_multiply_buf_with_coef(
597 conv->ch_conv_mtx[ch], buf,
598 conv->in_fmt.num_channels);
599 for (ch = 0; ch < conv->in_fmt.num_channels; ch++)
600 buf[ch] = tmp[ch];
601 buf += conv->in_fmt.num_channels;
602 }
603 }
604
605 const struct cras_audio_format *
cras_fmt_conv_in_format(const struct cras_fmt_conv * conv)606 cras_fmt_conv_in_format(const struct cras_fmt_conv *conv)
607 {
608 return &conv->in_fmt;
609 }
610
611 const struct cras_audio_format *
cras_fmt_conv_out_format(const struct cras_fmt_conv * conv)612 cras_fmt_conv_out_format(const struct cras_fmt_conv *conv)
613 {
614 return &conv->out_fmt;
615 }
616
cras_fmt_conv_in_frames_to_out(struct cras_fmt_conv * conv,size_t in_frames)617 size_t cras_fmt_conv_in_frames_to_out(struct cras_fmt_conv *conv,
618 size_t in_frames)
619 {
620 if (!conv)
621 return in_frames;
622
623 if (conv->pre_linear_resample)
624 in_frames = linear_resampler_in_frames_to_out(conv->resampler,
625 in_frames);
626 in_frames = cras_frames_at_rate(conv->in_fmt.frame_rate, in_frames,
627 conv->out_fmt.frame_rate);
628 if (!conv->pre_linear_resample)
629 in_frames = linear_resampler_in_frames_to_out(conv->resampler,
630 in_frames);
631 return in_frames;
632 }
633
cras_fmt_conv_out_frames_to_in(struct cras_fmt_conv * conv,size_t out_frames)634 size_t cras_fmt_conv_out_frames_to_in(struct cras_fmt_conv *conv,
635 size_t out_frames)
636 {
637 if (!conv)
638 return out_frames;
639 if (!conv->pre_linear_resample)
640 out_frames = linear_resampler_out_frames_to_in(conv->resampler,
641 out_frames);
642 out_frames = cras_frames_at_rate(conv->out_fmt.frame_rate, out_frames,
643 conv->in_fmt.frame_rate);
644 if (conv->pre_linear_resample)
645 out_frames = linear_resampler_out_frames_to_in(conv->resampler,
646 out_frames);
647 return out_frames;
648 }
649
cras_fmt_conv_set_linear_resample_rates(struct cras_fmt_conv * conv,float from,float to)650 void cras_fmt_conv_set_linear_resample_rates(struct cras_fmt_conv *conv,
651 float from, float to)
652 {
653 linear_resampler_set_rates(conv->resampler, from, to);
654 }
655
cras_fmt_conv_convert_frames(struct cras_fmt_conv * conv,const uint8_t * in_buf,uint8_t * out_buf,unsigned int * in_frames,size_t out_frames)656 size_t cras_fmt_conv_convert_frames(struct cras_fmt_conv *conv,
657 const uint8_t *in_buf, uint8_t *out_buf,
658 unsigned int *in_frames, size_t out_frames)
659 {
660 uint32_t fr_in, fr_out;
661 uint8_t *buffers[MAX_NUM_CONVERTERS + 1]; /* converters + out buffer. */
662 size_t buf_idx = 0;
663 static int logged_frames_dont_fit;
664 unsigned int used_converters = conv->num_converters;
665 unsigned int post_linear_resample = 0;
666 unsigned int pre_linear_resample = 0;
667 unsigned int linear_resample_fr = 0;
668
669 assert(conv);
670 assert(*in_frames <= conv->tmp_buf_frames);
671
672 if (linear_resampler_needed(conv->resampler)) {
673 post_linear_resample = !conv->pre_linear_resample;
674 pre_linear_resample = conv->pre_linear_resample;
675 }
676
677 /* If no SRC, then in_frames should = out_frames. */
678 if (conv->speex_state == NULL) {
679 fr_in = MIN(*in_frames, out_frames);
680 if (out_frames < *in_frames && !logged_frames_dont_fit) {
681 syslog(LOG_INFO, "fmt_conv: %u to %zu no SRC.",
682 *in_frames, out_frames);
683 logged_frames_dont_fit = 1;
684 }
685 } else {
686 fr_in = *in_frames;
687 }
688 fr_out = fr_in;
689
690 /* Set up a chain of buffers. The output buffer of the first conversion
691 * is used as input to the second and so forth, ending in the output
692 * buffer. */
693 if (!linear_resampler_needed(conv->resampler))
694 used_converters--;
695
696 buffers[4] = (uint8_t *)conv->tmp_bufs[3];
697 buffers[3] = (uint8_t *)conv->tmp_bufs[2];
698 buffers[2] = (uint8_t *)conv->tmp_bufs[1];
699 buffers[1] = (uint8_t *)conv->tmp_bufs[0];
700 buffers[0] = (uint8_t *)in_buf;
701 buffers[used_converters] = out_buf;
702
703 if (pre_linear_resample) {
704 linear_resample_fr = fr_in;
705 unsigned resample_limit = out_frames;
706
707 /* If there is a 2nd fmt conversion we should convert the
708 * resample limit and round it to the lower bound in order
709 * not to convert too many frames in the pre linear resampler.
710 */
711 if (conv->speex_state != NULL) {
712 resample_limit = resample_limit *
713 conv->in_fmt.frame_rate /
714 conv->out_fmt.frame_rate;
715 /*
716 * However if the limit frames count is less than
717 * |out_rate / in_rate|, the final limit value could be
718 * rounded to zero so it confuses linear resampler to
719 * do nothing. Make sure it's non-zero in that case.
720 */
721 if (resample_limit == 0)
722 resample_limit = 1;
723 }
724
725 resample_limit = MIN(resample_limit, conv->tmp_buf_frames);
726 fr_in = linear_resampler_resample(
727 conv->resampler, buffers[buf_idx], &linear_resample_fr,
728 buffers[buf_idx + 1], resample_limit);
729 buf_idx++;
730 }
731
732 /* If the input format isn't S16_LE convert to it. */
733 if (conv->in_fmt.format != SND_PCM_FORMAT_S16_LE) {
734 conv->in_format_converter(buffers[buf_idx],
735 fr_in * conv->in_fmt.num_channels,
736 (uint8_t *)buffers[buf_idx + 1]);
737 buf_idx++;
738 }
739
740 /* Then channel conversion. */
741 if (conv->channel_converter != NULL) {
742 conv->channel_converter(conv, buffers[buf_idx], fr_in,
743 buffers[buf_idx + 1]);
744 buf_idx++;
745 }
746
747 /* Then SRC. */
748 if (conv->speex_state != NULL) {
749 unsigned int out_limit = out_frames;
750
751 if (post_linear_resample)
752 out_limit = linear_resampler_out_frames_to_in(
753 conv->resampler, out_limit);
754 fr_out = cras_frames_at_rate(conv->in_fmt.frame_rate, fr_in,
755 conv->out_fmt.frame_rate);
756 if (fr_out > out_frames + 1 && !logged_frames_dont_fit) {
757 syslog(LOG_INFO,
758 "fmt_conv: put %u frames in %zu sized buffer",
759 fr_out, out_frames);
760 logged_frames_dont_fit = 1;
761 }
762 /* limit frames to the output size. */
763 fr_out = MIN(fr_out, out_limit);
764 speex_resampler_process_interleaved_int(
765 conv->speex_state, (int16_t *)buffers[buf_idx], &fr_in,
766 (int16_t *)buffers[buf_idx + 1], &fr_out);
767 buf_idx++;
768 }
769
770 if (post_linear_resample) {
771 linear_resample_fr = fr_out;
772 unsigned resample_limit = MIN(conv->tmp_buf_frames, out_frames);
773 fr_out = linear_resampler_resample(
774 conv->resampler, buffers[buf_idx], &linear_resample_fr,
775 buffers[buf_idx + 1], resample_limit);
776 buf_idx++;
777 }
778
779 /* If the output format isn't S16_LE convert to it. */
780 if (conv->out_fmt.format != SND_PCM_FORMAT_S16_LE) {
781 conv->out_format_converter(buffers[buf_idx],
782 fr_out * conv->out_fmt.num_channels,
783 (uint8_t *)buffers[buf_idx + 1]);
784 buf_idx++;
785 }
786
787 if (pre_linear_resample) {
788 *in_frames = linear_resample_fr;
789
790 /* When buffer sizes are small, there's a corner case that
791 * speex library resamples 0 frame to N-1 frames, where N
792 * is the integer ratio of output and input rate. For example,
793 * 16KHz to 48KHz. In this case fmt_conv should claim zero
794 * frames processed, instead of using the linear resampler
795 * processed frames count. Otherwise there will be a frame
796 * leak and, if accumulated, causes delay in multiple devices
797 * use case.
798 */
799 if (conv->speex_state && (fr_in == 0))
800 *in_frames = 0;
801 } else {
802 *in_frames = fr_in;
803 }
804 return fr_out;
805 }
806
cras_fmt_conversion_needed(const struct cras_fmt_conv * conv)807 int cras_fmt_conversion_needed(const struct cras_fmt_conv *conv)
808 {
809 return linear_resampler_needed(conv->resampler) ||
810 (conv->num_converters > 1);
811 }
812
813 /* If the server cannot provide the requested format, configures an audio format
814 * converter that handles transforming the input format to the format used by
815 * the server. */
config_format_converter(struct cras_fmt_conv ** conv,enum CRAS_STREAM_DIRECTION dir,const struct cras_audio_format * from,const struct cras_audio_format * to,unsigned int frames)816 int config_format_converter(struct cras_fmt_conv **conv,
817 enum CRAS_STREAM_DIRECTION dir,
818 const struct cras_audio_format *from,
819 const struct cras_audio_format *to,
820 unsigned int frames)
821 {
822 struct cras_audio_format target;
823
824 /* For input, preserve the channel count and layout of
825 * from format */
826 if (dir == CRAS_STREAM_INPUT) {
827 target = *from;
828 target.format = to->format;
829 target.frame_rate = to->frame_rate;
830 } else {
831 target = *to;
832 }
833
834 syslog(LOG_DEBUG,
835 "format convert: from:%d %zu %zu target: %d %zu %zu "
836 "frames = %u",
837 from->format, from->frame_rate, from->num_channels,
838 target.format, target.frame_rate, target.num_channels, frames);
839 *conv = cras_fmt_conv_create(from, &target, frames,
840 (dir == CRAS_STREAM_INPUT));
841 if (!*conv) {
842 syslog(LOG_ERR, "Failed to create format converter");
843 return -ENOMEM;
844 }
845
846 return 0;
847 }
848