• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /* Copyright (c) 2012 The Chromium OS Authors. All rights reserved.
2  * Use of this source code is governed by a BSD-style license that can be
3  * found in the LICENSE file.
4  */
5 
6 /* For now just use speex, can add more resamplers later. */
7 #include <speex/speex_resampler.h>
8 #include <sys/param.h>
9 #include <syslog.h>
10 #include <endian.h>
11 #include <limits.h>
12 
13 #include "cras_fmt_conv.h"
14 #include "cras_fmt_conv_ops.h"
15 #include "cras_audio_format.h"
16 #include "cras_util.h"
17 #include "linear_resampler.h"
18 
19 /* The quality level is a value between 0 and 10. This is a tradeoff between
20  * performance, latency, and quality. */
21 #define SPEEX_QUALITY_LEVEL 4
22 /* Max number of converters, src, down/up mix, 2xformat, and linear resample. */
23 #define MAX_NUM_CONVERTERS 5
24 /* Channel index for stereo. */
25 #define STEREO_L 0
26 #define STEREO_R 1
27 
28 typedef void (*sample_format_converter_t)(const uint8_t *in, size_t in_samples,
29 					  uint8_t *out);
30 typedef size_t (*channel_converter_t)(struct cras_fmt_conv *conv,
31 				      const uint8_t *in, size_t in_frames,
32 				      uint8_t *out);
33 
34 /* Member data for the resampler. */
35 struct cras_fmt_conv {
36 	SpeexResamplerState *speex_state;
37 	channel_converter_t channel_converter;
38 	float **ch_conv_mtx; /* Coefficient matrix for mixing channels. */
39 	sample_format_converter_t in_format_converter;
40 	sample_format_converter_t out_format_converter;
41 	struct linear_resampler *resampler;
42 	struct cras_audio_format in_fmt;
43 	struct cras_audio_format out_fmt;
44 	uint8_t *tmp_bufs[MAX_NUM_CONVERTERS - 1];
45 	size_t tmp_buf_frames;
46 	size_t pre_linear_resample;
47 	size_t num_converters; /* Incremented once for SRC, channel, format. */
48 };
49 
is_channel_layout_equal(const struct cras_audio_format * a,const struct cras_audio_format * b)50 static int is_channel_layout_equal(const struct cras_audio_format *a,
51 				   const struct cras_audio_format *b)
52 {
53 	int ch;
54 	for (ch = 0; ch < CRAS_CH_MAX; ch++)
55 		if (a->channel_layout[ch] != b->channel_layout[ch])
56 			return 0;
57 
58 	return 1;
59 }
60 
normalize_buf(float * buf,size_t size)61 static void normalize_buf(float *buf, size_t size)
62 {
63 	int i;
64 	float squre_sum = 0.0;
65 	for (i = 0; i < size; i++)
66 		squre_sum += buf[i] * buf[i];
67 	for (i = 0; i < size; i++)
68 		buf[i] /= squre_sum;
69 }
70 
71 /* Populates the down mix matrix by rules:
72  * 1. Front/side left(right) channel will mix to left(right) of
73  *    full scale.
74  * 2. Center and LFE will be split equally to left and right.
75  *    Rear
76  * 3. Rear left/right will split 1/4 of the power to opposite
77  *    channel.
78  */
surround51_to_stereo_downmix_mtx(float ** mtx,int8_t layout[CRAS_CH_MAX])79 static void surround51_to_stereo_downmix_mtx(float **mtx,
80 					     int8_t layout[CRAS_CH_MAX])
81 {
82 	if (layout[CRAS_CH_FC] != -1) {
83 		mtx[STEREO_L][layout[CRAS_CH_FC]] = 0.707;
84 		mtx[STEREO_R][layout[CRAS_CH_FC]] = 0.707;
85 	}
86 	if (layout[CRAS_CH_FL] != -1 && layout[CRAS_CH_FR] != -1) {
87 		mtx[STEREO_L][layout[CRAS_CH_FL]] = 1.0;
88 		mtx[STEREO_R][layout[CRAS_CH_FR]] = 1.0;
89 	}
90 	if (layout[CRAS_CH_SL] != -1 && layout[CRAS_CH_SR] != -1) {
91 		mtx[STEREO_L][layout[CRAS_CH_SL]] = 1.0;
92 		mtx[STEREO_R][layout[CRAS_CH_SR]] = 1.0;
93 	}
94 	if (layout[CRAS_CH_RL] != -1 && layout[CRAS_CH_RR] != -1) {
95 		/* Split 1/4 power to the other side */
96 		mtx[STEREO_L][layout[CRAS_CH_RL]] = 0.866;
97 		mtx[STEREO_R][layout[CRAS_CH_RL]] = 0.5;
98 		mtx[STEREO_R][layout[CRAS_CH_RR]] = 0.866;
99 		mtx[STEREO_L][layout[CRAS_CH_RR]] = 0.5;
100 	}
101 	if (layout[CRAS_CH_LFE] != -1) {
102 		mtx[STEREO_L][layout[CRAS_CH_LFE]] = 0.707;
103 		mtx[STEREO_R][layout[CRAS_CH_LFE]] = 0.707;
104 	}
105 
106 	normalize_buf(mtx[STEREO_L], 6);
107 	normalize_buf(mtx[STEREO_R], 6);
108 }
109 
is_supported_format(const struct cras_audio_format * fmt)110 static int is_supported_format(const struct cras_audio_format *fmt)
111 {
112 	if (!fmt)
113 		return 0;
114 
115 	switch (fmt->format) {
116 	case SND_PCM_FORMAT_U8:
117 	case SND_PCM_FORMAT_S16_LE:
118 	case SND_PCM_FORMAT_S24_3LE:
119 	case SND_PCM_FORMAT_S24_LE:
120 	case SND_PCM_FORMAT_S32_LE:
121 		return 1;
122 	default:
123 		return 0;
124 	}
125 }
126 
mono_to_stereo(struct cras_fmt_conv * conv,const uint8_t * in,size_t in_frames,uint8_t * out)127 static size_t mono_to_stereo(struct cras_fmt_conv *conv, const uint8_t *in,
128 			     size_t in_frames, uint8_t *out)
129 {
130 	return s16_mono_to_stereo(in, in_frames, out);
131 }
132 
stereo_to_mono(struct cras_fmt_conv * conv,const uint8_t * in,size_t in_frames,uint8_t * out)133 static size_t stereo_to_mono(struct cras_fmt_conv *conv, const uint8_t *in,
134 			     size_t in_frames, uint8_t *out)
135 {
136 	return s16_stereo_to_mono(in, in_frames, out);
137 }
138 
mono_to_51(struct cras_fmt_conv * conv,const uint8_t * in,size_t in_frames,uint8_t * out)139 static size_t mono_to_51(struct cras_fmt_conv *conv, const uint8_t *in,
140 			 size_t in_frames, uint8_t *out)
141 {
142 	size_t left, right, center;
143 
144 	left = conv->out_fmt.channel_layout[CRAS_CH_FL];
145 	right = conv->out_fmt.channel_layout[CRAS_CH_FR];
146 	center = conv->out_fmt.channel_layout[CRAS_CH_FC];
147 
148 	return s16_mono_to_51(left, right, center, in, in_frames, out);
149 }
150 
stereo_to_51(struct cras_fmt_conv * conv,const uint8_t * in,size_t in_frames,uint8_t * out)151 static size_t stereo_to_51(struct cras_fmt_conv *conv, const uint8_t *in,
152 			   size_t in_frames, uint8_t *out)
153 {
154 	size_t left, right, center;
155 
156 	left = conv->out_fmt.channel_layout[CRAS_CH_FL];
157 	right = conv->out_fmt.channel_layout[CRAS_CH_FR];
158 	center = conv->out_fmt.channel_layout[CRAS_CH_FC];
159 
160 	return s16_stereo_to_51(left, right, center, in, in_frames, out);
161 }
162 
_51_to_stereo(struct cras_fmt_conv * conv,const uint8_t * in,size_t in_frames,uint8_t * out)163 static size_t _51_to_stereo(struct cras_fmt_conv *conv, const uint8_t *in,
164 			    size_t in_frames, uint8_t *out)
165 {
166 	return s16_51_to_stereo(in, in_frames, out);
167 }
168 
stereo_to_quad(struct cras_fmt_conv * conv,const uint8_t * in,size_t in_frames,uint8_t * out)169 static size_t stereo_to_quad(struct cras_fmt_conv *conv, const uint8_t *in,
170 			     size_t in_frames, uint8_t *out)
171 {
172 	size_t front_left, front_right, rear_left, rear_right;
173 
174 	front_left = conv->out_fmt.channel_layout[CRAS_CH_FL];
175 	front_right = conv->out_fmt.channel_layout[CRAS_CH_FR];
176 	rear_left = conv->out_fmt.channel_layout[CRAS_CH_RL];
177 	rear_right = conv->out_fmt.channel_layout[CRAS_CH_RR];
178 
179 	return s16_stereo_to_quad(front_left, front_right, rear_left,
180 				  rear_right, in, in_frames, out);
181 }
182 
quad_to_stereo(struct cras_fmt_conv * conv,const uint8_t * in,size_t in_frames,uint8_t * out)183 static size_t quad_to_stereo(struct cras_fmt_conv *conv, const uint8_t *in,
184 			     size_t in_frames, uint8_t *out)
185 {
186 	size_t front_left, front_right, rear_left, rear_right;
187 
188 	front_left = conv->in_fmt.channel_layout[CRAS_CH_FL];
189 	front_right = conv->in_fmt.channel_layout[CRAS_CH_FR];
190 	rear_left = conv->in_fmt.channel_layout[CRAS_CH_RL];
191 	rear_right = conv->in_fmt.channel_layout[CRAS_CH_RR];
192 
193 	return s16_quad_to_stereo(front_left, front_right, rear_left,
194 				  rear_right, in, in_frames, out);
195 }
196 
default_all_to_all(struct cras_fmt_conv * conv,const uint8_t * in,size_t in_frames,uint8_t * out)197 static size_t default_all_to_all(struct cras_fmt_conv *conv, const uint8_t *in,
198 				 size_t in_frames, uint8_t *out)
199 {
200 	size_t num_in_ch, num_out_ch;
201 
202 	num_in_ch = conv->in_fmt.num_channels;
203 	num_out_ch = conv->out_fmt.num_channels;
204 
205 	return s16_default_all_to_all(&conv->out_fmt, num_in_ch, num_out_ch, in,
206 				      in_frames, out);
207 }
208 
convert_channels(struct cras_fmt_conv * conv,const uint8_t * in,size_t in_frames,uint8_t * out)209 static size_t convert_channels(struct cras_fmt_conv *conv, const uint8_t *in,
210 			       size_t in_frames, uint8_t *out)
211 {
212 	float **ch_conv_mtx;
213 	size_t num_in_ch, num_out_ch;
214 
215 	ch_conv_mtx = conv->ch_conv_mtx;
216 	num_in_ch = conv->in_fmt.num_channels;
217 	num_out_ch = conv->out_fmt.num_channels;
218 
219 	return s16_convert_channels(ch_conv_mtx, num_in_ch, num_out_ch, in,
220 				    in_frames, out);
221 }
222 
223 /*
224  * Exported interface
225  */
226 
cras_fmt_conv_create(const struct cras_audio_format * in,const struct cras_audio_format * out,size_t max_frames,size_t pre_linear_resample)227 struct cras_fmt_conv *cras_fmt_conv_create(const struct cras_audio_format *in,
228 					   const struct cras_audio_format *out,
229 					   size_t max_frames,
230 					   size_t pre_linear_resample)
231 {
232 	struct cras_fmt_conv *conv;
233 	int rc;
234 	unsigned i;
235 
236 	conv = calloc(1, sizeof(*conv));
237 	if (conv == NULL)
238 		return NULL;
239 	conv->in_fmt = *in;
240 	conv->out_fmt = *out;
241 	conv->tmp_buf_frames = max_frames;
242 	conv->pre_linear_resample = pre_linear_resample;
243 
244 	if (!is_supported_format(in)) {
245 		syslog(LOG_ERR, "Invalid input format %d", in->format);
246 		cras_fmt_conv_destroy(&conv);
247 		return NULL;
248 	}
249 
250 	if (!is_supported_format(out)) {
251 		syslog(LOG_ERR, "Invalid output format %d", out->format);
252 		cras_fmt_conv_destroy(&conv);
253 		return NULL;
254 	}
255 
256 	/* Set up sample format conversion. */
257 	/* TODO(dgreid) - modify channel and sample rate conversion so
258 	 * converting to s16 isnt necessary. */
259 	if (in->format != SND_PCM_FORMAT_S16_LE) {
260 		conv->num_converters++;
261 		syslog(LOG_DEBUG, "Convert from format %d to %d.", in->format,
262 		       out->format);
263 		switch (in->format) {
264 		case SND_PCM_FORMAT_U8:
265 			conv->in_format_converter = convert_u8_to_s16le;
266 			break;
267 		case SND_PCM_FORMAT_S24_LE:
268 			conv->in_format_converter = convert_s24le_to_s16le;
269 			break;
270 		case SND_PCM_FORMAT_S32_LE:
271 			conv->in_format_converter = convert_s32le_to_s16le;
272 			break;
273 		case SND_PCM_FORMAT_S24_3LE:
274 			conv->in_format_converter = convert_s243le_to_s16le;
275 			break;
276 		default:
277 			syslog(LOG_ERR, "Should never reachable");
278 			break;
279 		}
280 	}
281 	if (out->format != SND_PCM_FORMAT_S16_LE) {
282 		conv->num_converters++;
283 		syslog(LOG_DEBUG, "Convert from format %d to %d.", in->format,
284 		       out->format);
285 		switch (out->format) {
286 		case SND_PCM_FORMAT_U8:
287 			conv->out_format_converter = convert_s16le_to_u8;
288 			break;
289 		case SND_PCM_FORMAT_S24_LE:
290 			conv->out_format_converter = convert_s16le_to_s24le;
291 			break;
292 		case SND_PCM_FORMAT_S32_LE:
293 			conv->out_format_converter = convert_s16le_to_s32le;
294 			break;
295 		case SND_PCM_FORMAT_S24_3LE:
296 			conv->out_format_converter = convert_s16le_to_s243le;
297 			break;
298 		default:
299 			syslog(LOG_ERR, "Should never reachable");
300 			break;
301 		}
302 	}
303 
304 	/* Set up channel number conversion. */
305 	if (in->num_channels != out->num_channels) {
306 		conv->num_converters++;
307 		syslog(LOG_DEBUG, "Convert from %zu to %zu channels.",
308 		       in->num_channels, out->num_channels);
309 
310 		/* Populate the conversion matrix base on in/out channel count
311 		 * and layout. */
312 		if (in->num_channels == 1 && out->num_channels == 2) {
313 			conv->channel_converter = mono_to_stereo;
314 		} else if (in->num_channels == 1 && out->num_channels == 6) {
315 			conv->channel_converter = mono_to_51;
316 		} else if (in->num_channels == 2 && out->num_channels == 1) {
317 			conv->channel_converter = stereo_to_mono;
318 		} else if (in->num_channels == 2 && out->num_channels == 4) {
319 			conv->channel_converter = stereo_to_quad;
320 		} else if (in->num_channels == 4 && out->num_channels == 2) {
321 			conv->channel_converter = quad_to_stereo;
322 		} else if (in->num_channels == 2 && out->num_channels == 6) {
323 			conv->channel_converter = stereo_to_51;
324 		} else if (in->num_channels == 6 && out->num_channels == 2) {
325 			int in_channel_layout_set = 0;
326 
327 			/* Checks if channel_layout is set in the incoming format */
328 			for (i = 0; i < CRAS_CH_MAX; i++)
329 				if (in->channel_layout[i] != -1)
330 					in_channel_layout_set = 1;
331 
332 			/* Use the conversion matrix based converter when a
333 			 * channel layout is set, or default to use existing
334 			 * converter to downmix to stereo */
335 			if (in_channel_layout_set) {
336 				conv->ch_conv_mtx =
337 					cras_channel_conv_matrix_alloc(
338 						in->num_channels,
339 						out->num_channels);
340 				if (conv->ch_conv_mtx == NULL) {
341 					cras_fmt_conv_destroy(&conv);
342 					return NULL;
343 				}
344 				conv->channel_converter = convert_channels;
345 				surround51_to_stereo_downmix_mtx(
346 					conv->ch_conv_mtx,
347 					conv->in_fmt.channel_layout);
348 			} else {
349 				conv->channel_converter = _51_to_stereo;
350 			}
351 		} else {
352 			syslog(LOG_WARNING,
353 			       "Using default channel map for %zu to %zu",
354 			       in->num_channels, out->num_channels);
355 			conv->channel_converter = default_all_to_all;
356 		}
357 	} else if (in->num_channels > 2 && !is_channel_layout_equal(in, out)) {
358 		conv->num_converters++;
359 		conv->ch_conv_mtx = cras_channel_conv_matrix_create(in, out);
360 		if (conv->ch_conv_mtx == NULL) {
361 			syslog(LOG_ERR,
362 			       "Failed to create channel conversion matrix");
363 			cras_fmt_conv_destroy(&conv);
364 			return NULL;
365 		}
366 		conv->channel_converter = convert_channels;
367 	}
368 	/* Set up sample rate conversion. */
369 	if (in->frame_rate != out->frame_rate) {
370 		conv->num_converters++;
371 		syslog(LOG_DEBUG, "Convert from %zu to %zu Hz.", in->frame_rate,
372 		       out->frame_rate);
373 		conv->speex_state =
374 			speex_resampler_init(out->num_channels, in->frame_rate,
375 					     out->frame_rate,
376 					     SPEEX_QUALITY_LEVEL, &rc);
377 		if (conv->speex_state == NULL) {
378 			syslog(LOG_ERR, "Fail to create speex:%zu %zu %zu %d",
379 			       out->num_channels, in->frame_rate,
380 			       out->frame_rate, rc);
381 			cras_fmt_conv_destroy(&conv);
382 			return NULL;
383 		}
384 	}
385 
386 	/*
387 	 * Set up linear resampler.
388 	 *
389 	 * Note: intended to give both src_rate and dst_rate the same value
390 	 * (i.e. out->frame_rate).  They will be updated in runtime in
391 	 * update_estimated_rate() when the audio thread wants to adjust the
392 	 * rate for inaccurate device consumption rate.
393 	 */
394 	conv->num_converters++;
395 	conv->resampler =
396 		linear_resampler_create(out->num_channels,
397 					cras_get_format_bytes(out),
398 					out->frame_rate, out->frame_rate);
399 	if (conv->resampler == NULL) {
400 		syslog(LOG_ERR, "Fail to create linear resampler");
401 		cras_fmt_conv_destroy(&conv);
402 		return NULL;
403 	}
404 
405 	/* Need num_converters-1 temp buffers, the final converter renders
406 	 * directly into the output. */
407 	for (i = 0; i < conv->num_converters - 1; i++) {
408 		conv->tmp_bufs[i] = malloc(
409 			max_frames * 4 * /* width in bytes largest format. */
410 			MAX(in->num_channels, out->num_channels));
411 		if (conv->tmp_bufs[i] == NULL) {
412 			cras_fmt_conv_destroy(&conv);
413 			return NULL;
414 		}
415 	}
416 
417 	assert(conv->num_converters <= MAX_NUM_CONVERTERS);
418 
419 	return conv;
420 }
421 
cras_fmt_conv_destroy(struct cras_fmt_conv ** convp)422 void cras_fmt_conv_destroy(struct cras_fmt_conv **convp)
423 {
424 	unsigned i;
425 	struct cras_fmt_conv *conv = *convp;
426 
427 	if (conv->ch_conv_mtx)
428 		cras_channel_conv_matrix_destroy(conv->ch_conv_mtx,
429 						 conv->out_fmt.num_channels);
430 	if (conv->speex_state)
431 		speex_resampler_destroy(conv->speex_state);
432 	if (conv->resampler)
433 		linear_resampler_destroy(conv->resampler);
434 	for (i = 0; i < MAX_NUM_CONVERTERS - 1; i++)
435 		free(conv->tmp_bufs[i]);
436 	free(conv);
437 	*convp = NULL;
438 }
439 
cras_channel_remix_conv_create(unsigned int num_channels,const float * coefficient)440 struct cras_fmt_conv *cras_channel_remix_conv_create(unsigned int num_channels,
441 						     const float *coefficient)
442 {
443 	struct cras_fmt_conv *conv;
444 	unsigned out_ch, in_ch;
445 
446 	conv = calloc(1, sizeof(*conv));
447 	if (conv == NULL)
448 		return NULL;
449 	conv->in_fmt.num_channels = num_channels;
450 	conv->out_fmt.num_channels = num_channels;
451 
452 	conv->ch_conv_mtx =
453 		cras_channel_conv_matrix_alloc(num_channels, num_channels);
454 	/* Convert the coeffiencnt array to conversion matrix. */
455 	for (out_ch = 0; out_ch < num_channels; out_ch++)
456 		for (in_ch = 0; in_ch < num_channels; in_ch++)
457 			conv->ch_conv_mtx[out_ch][in_ch] =
458 				coefficient[in_ch + out_ch * num_channels];
459 
460 	conv->num_converters = 1;
461 	conv->tmp_bufs[0] = malloc(4 * /* width in bytes largest format. */
462 				   num_channels);
463 	return conv;
464 }
465 
cras_channel_remix_convert(struct cras_fmt_conv * conv,const struct cras_audio_format * fmt,uint8_t * in_buf,size_t nframes)466 void cras_channel_remix_convert(struct cras_fmt_conv *conv,
467 				const struct cras_audio_format *fmt,
468 				uint8_t *in_buf, size_t nframes)
469 {
470 	unsigned ch, fr;
471 	int16_t *tmp = (int16_t *)conv->tmp_bufs[0];
472 	int16_t *buf = (int16_t *)in_buf;
473 
474 	/*
475 	 * Skip remix for non S16_LE format.
476 	 * TODO(tzungbi): support 24 bits remix convert.
477 	 */
478 	if (fmt->format != SND_PCM_FORMAT_S16_LE)
479 		return;
480 
481 	/* Do remix only when input buffer has the same number of channels. */
482 	if (fmt->num_channels != conv->in_fmt.num_channels)
483 		return;
484 
485 	for (fr = 0; fr < nframes; fr++) {
486 		for (ch = 0; ch < conv->in_fmt.num_channels; ch++)
487 			tmp[ch] = s16_multiply_buf_with_coef(
488 				conv->ch_conv_mtx[ch], buf,
489 				conv->in_fmt.num_channels);
490 		for (ch = 0; ch < conv->in_fmt.num_channels; ch++)
491 			buf[ch] = tmp[ch];
492 		buf += conv->in_fmt.num_channels;
493 	}
494 }
495 
496 const struct cras_audio_format *
cras_fmt_conv_in_format(const struct cras_fmt_conv * conv)497 cras_fmt_conv_in_format(const struct cras_fmt_conv *conv)
498 {
499 	return &conv->in_fmt;
500 }
501 
502 const struct cras_audio_format *
cras_fmt_conv_out_format(const struct cras_fmt_conv * conv)503 cras_fmt_conv_out_format(const struct cras_fmt_conv *conv)
504 {
505 	return &conv->out_fmt;
506 }
507 
cras_fmt_conv_in_frames_to_out(struct cras_fmt_conv * conv,size_t in_frames)508 size_t cras_fmt_conv_in_frames_to_out(struct cras_fmt_conv *conv,
509 				      size_t in_frames)
510 {
511 	if (!conv)
512 		return in_frames;
513 
514 	if (conv->pre_linear_resample)
515 		in_frames = linear_resampler_in_frames_to_out(conv->resampler,
516 							      in_frames);
517 	in_frames = cras_frames_at_rate(conv->in_fmt.frame_rate, in_frames,
518 					conv->out_fmt.frame_rate);
519 	if (!conv->pre_linear_resample)
520 		in_frames = linear_resampler_in_frames_to_out(conv->resampler,
521 							      in_frames);
522 	return in_frames;
523 }
524 
cras_fmt_conv_out_frames_to_in(struct cras_fmt_conv * conv,size_t out_frames)525 size_t cras_fmt_conv_out_frames_to_in(struct cras_fmt_conv *conv,
526 				      size_t out_frames)
527 {
528 	if (!conv)
529 		return out_frames;
530 	if (!conv->pre_linear_resample)
531 		out_frames = linear_resampler_out_frames_to_in(conv->resampler,
532 							       out_frames);
533 	out_frames = cras_frames_at_rate(conv->out_fmt.frame_rate, out_frames,
534 					 conv->in_fmt.frame_rate);
535 	if (conv->pre_linear_resample)
536 		out_frames = linear_resampler_out_frames_to_in(conv->resampler,
537 							       out_frames);
538 	return out_frames;
539 }
540 
cras_fmt_conv_set_linear_resample_rates(struct cras_fmt_conv * conv,float from,float to)541 void cras_fmt_conv_set_linear_resample_rates(struct cras_fmt_conv *conv,
542 					     float from, float to)
543 {
544 	linear_resampler_set_rates(conv->resampler, from, to);
545 }
546 
cras_fmt_conv_convert_frames(struct cras_fmt_conv * conv,const uint8_t * in_buf,uint8_t * out_buf,unsigned int * in_frames,size_t out_frames)547 size_t cras_fmt_conv_convert_frames(struct cras_fmt_conv *conv,
548 				    const uint8_t *in_buf, uint8_t *out_buf,
549 				    unsigned int *in_frames, size_t out_frames)
550 {
551 	uint32_t fr_in, fr_out;
552 	uint8_t *buffers[MAX_NUM_CONVERTERS + 1]; /* converters + out buffer. */
553 	size_t buf_idx = 0;
554 	static int logged_frames_dont_fit;
555 	unsigned int used_converters = conv->num_converters;
556 	unsigned int post_linear_resample = 0;
557 	unsigned int pre_linear_resample = 0;
558 	unsigned int linear_resample_fr = 0;
559 
560 	assert(conv);
561 	assert(*in_frames <= conv->tmp_buf_frames);
562 
563 	if (linear_resampler_needed(conv->resampler)) {
564 		post_linear_resample = !conv->pre_linear_resample;
565 		pre_linear_resample = conv->pre_linear_resample;
566 	}
567 
568 	/* If no SRC, then in_frames should = out_frames. */
569 	if (conv->speex_state == NULL) {
570 		fr_in = MIN(*in_frames, out_frames);
571 		if (out_frames < *in_frames && !logged_frames_dont_fit) {
572 			syslog(LOG_INFO, "fmt_conv: %u to %zu no SRC.",
573 			       *in_frames, out_frames);
574 			logged_frames_dont_fit = 1;
575 		}
576 	} else {
577 		fr_in = *in_frames;
578 	}
579 	fr_out = fr_in;
580 
581 	/* Set up a chain of buffers.  The output buffer of the first conversion
582 	 * is used as input to the second and so forth, ending in the output
583 	 * buffer. */
584 	if (!linear_resampler_needed(conv->resampler))
585 		used_converters--;
586 
587 	buffers[4] = (uint8_t *)conv->tmp_bufs[3];
588 	buffers[3] = (uint8_t *)conv->tmp_bufs[2];
589 	buffers[2] = (uint8_t *)conv->tmp_bufs[1];
590 	buffers[1] = (uint8_t *)conv->tmp_bufs[0];
591 	buffers[0] = (uint8_t *)in_buf;
592 	buffers[used_converters] = out_buf;
593 
594 	if (pre_linear_resample) {
595 		linear_resample_fr = fr_in;
596 		unsigned resample_limit = out_frames;
597 
598 		/* If there is a 2nd fmt conversion we should convert the
599 		 * resample limit and round it to the lower bound in order
600 		 * not to convert too many frames in the pre linear resampler.
601 		 */
602 		if (conv->speex_state != NULL) {
603 			resample_limit = resample_limit *
604 					 conv->in_fmt.frame_rate /
605 					 conv->out_fmt.frame_rate;
606 			/*
607 			 * However if the limit frames count is less than
608 			 * |out_rate / in_rate|, the final limit value could be
609 			 * rounded to zero so it confuses linear resampler to
610 			 * do nothing. Make sure it's non-zero in that case.
611 			 */
612 			if (resample_limit == 0)
613 				resample_limit = 1;
614 		}
615 
616 		resample_limit = MIN(resample_limit, conv->tmp_buf_frames);
617 		fr_in = linear_resampler_resample(
618 			conv->resampler, buffers[buf_idx], &linear_resample_fr,
619 			buffers[buf_idx + 1], resample_limit);
620 		buf_idx++;
621 	}
622 
623 	/* If the input format isn't S16_LE convert to it. */
624 	if (conv->in_fmt.format != SND_PCM_FORMAT_S16_LE) {
625 		conv->in_format_converter(buffers[buf_idx],
626 					  fr_in * conv->in_fmt.num_channels,
627 					  (uint8_t *)buffers[buf_idx + 1]);
628 		buf_idx++;
629 	}
630 
631 	/* Then channel conversion. */
632 	if (conv->channel_converter != NULL) {
633 		conv->channel_converter(conv, buffers[buf_idx], fr_in,
634 					buffers[buf_idx + 1]);
635 		buf_idx++;
636 	}
637 
638 	/* Then SRC. */
639 	if (conv->speex_state != NULL) {
640 		unsigned int out_limit = out_frames;
641 
642 		if (post_linear_resample)
643 			out_limit = linear_resampler_out_frames_to_in(
644 				conv->resampler, out_limit);
645 		fr_out = cras_frames_at_rate(conv->in_fmt.frame_rate, fr_in,
646 					     conv->out_fmt.frame_rate);
647 		if (fr_out > out_frames + 1 && !logged_frames_dont_fit) {
648 			syslog(LOG_INFO,
649 			       "fmt_conv: put %u frames in %zu sized buffer",
650 			       fr_out, out_frames);
651 			logged_frames_dont_fit = 1;
652 		}
653 		/* limit frames to the output size. */
654 		fr_out = MIN(fr_out, out_limit);
655 		speex_resampler_process_interleaved_int(
656 			conv->speex_state, (int16_t *)buffers[buf_idx], &fr_in,
657 			(int16_t *)buffers[buf_idx + 1], &fr_out);
658 		buf_idx++;
659 	}
660 
661 	if (post_linear_resample) {
662 		linear_resample_fr = fr_out;
663 		unsigned resample_limit = MIN(conv->tmp_buf_frames, out_frames);
664 		fr_out = linear_resampler_resample(
665 			conv->resampler, buffers[buf_idx], &linear_resample_fr,
666 			buffers[buf_idx + 1], resample_limit);
667 		buf_idx++;
668 	}
669 
670 	/* If the output format isn't S16_LE convert to it. */
671 	if (conv->out_fmt.format != SND_PCM_FORMAT_S16_LE) {
672 		conv->out_format_converter(buffers[buf_idx],
673 					   fr_out * conv->out_fmt.num_channels,
674 					   (uint8_t *)buffers[buf_idx + 1]);
675 		buf_idx++;
676 	}
677 
678 	if (pre_linear_resample) {
679 		*in_frames = linear_resample_fr;
680 
681 		/* When buffer sizes are small, there's a corner case that
682 		 * speex library resamples 0 frame to N-1 frames, where N
683 		 * is the integer ratio of output and input rate. For example,
684 		 * 16KHz to 48KHz. In this case fmt_conv should claim zero
685 		 * frames processed, instead of using the linear resampler
686 		 * processed frames count. Otherwise there will be a frame
687 		 * leak and, if accumulated, causes delay in multiple devices
688 		 * use case.
689 		 */
690 		if (conv->speex_state && (fr_in == 0))
691 			*in_frames = 0;
692 	} else {
693 		*in_frames = fr_in;
694 	}
695 	return fr_out;
696 }
697 
cras_fmt_conversion_needed(const struct cras_fmt_conv * conv)698 int cras_fmt_conversion_needed(const struct cras_fmt_conv *conv)
699 {
700 	return linear_resampler_needed(conv->resampler) ||
701 	       (conv->num_converters > 1);
702 }
703 
704 /* If the server cannot provide the requested format, configures an audio format
705  * converter that handles transforming the input format to the format used by
706  * the server. */
config_format_converter(struct cras_fmt_conv ** conv,enum CRAS_STREAM_DIRECTION dir,const struct cras_audio_format * from,const struct cras_audio_format * to,unsigned int frames)707 int config_format_converter(struct cras_fmt_conv **conv,
708 			    enum CRAS_STREAM_DIRECTION dir,
709 			    const struct cras_audio_format *from,
710 			    const struct cras_audio_format *to,
711 			    unsigned int frames)
712 {
713 	struct cras_audio_format target;
714 
715 	/* For input, preserve the channel count and layout of
716 	 * from format */
717 	if (dir == CRAS_STREAM_INPUT) {
718 		target = *from;
719 		target.format = to->format;
720 		target.frame_rate = to->frame_rate;
721 	} else {
722 		target = *to;
723 	}
724 
725 	syslog(LOG_DEBUG,
726 	       "format convert: from:%d %zu %zu target: %d %zu %zu "
727 	       "frames = %u",
728 	       from->format, from->frame_rate, from->num_channels,
729 	       target.format, target.frame_rate, target.num_channels, frames);
730 	*conv = cras_fmt_conv_create(from, &target, frames,
731 				     (dir == CRAS_STREAM_INPUT));
732 	if (!*conv) {
733 		syslog(LOG_ERR, "Failed to create format converter");
734 		return -ENOMEM;
735 	}
736 
737 	return 0;
738 }
739