1 /* Copyright (c) 2007-2008 CSIRO
2 Copyright (c) 2007-2009 Xiph.Org Foundation
3 Copyright (c) 2008-2009 Gregory Maxwell
4 Written by Jean-Marc Valin and Gregory Maxwell */
5 /*
6 Redistribution and use in source and binary forms, with or without
7 modification, are permitted provided that the following conditions
8 are met:
9
10 - Redistributions of source code must retain the above copyright
11 notice, this list of conditions and the following disclaimer.
12
13 - Redistributions in binary form must reproduce the above copyright
14 notice, this list of conditions and the following disclaimer in the
15 documentation and/or other materials provided with the distribution.
16
17 THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
18 ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
19 LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
20 A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER
21 OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
22 EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
23 PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
24 PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
25 LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
26 NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
27 SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
28 */
29
30 #ifdef HAVE_CONFIG_H
31 #include "config.h"
32 #endif
33
34 #include <math.h>
35 #include "bands.h"
36 #include "modes.h"
37 #include "vq.h"
38 #include "cwrs.h"
39 #include "stack_alloc.h"
40 #include "os_support.h"
41 #include "mathops.h"
42 #include "rate.h"
43 #include "quant_bands.h"
44 #include "pitch.h"
45
hysteresis_decision(opus_val16 val,const opus_val16 * thresholds,const opus_val16 * hysteresis,int N,int prev)46 int hysteresis_decision(opus_val16 val, const opus_val16 *thresholds, const opus_val16 *hysteresis, int N, int prev)
47 {
48 int i;
49 for (i=0;i<N;i++)
50 {
51 if (val < thresholds[i])
52 break;
53 }
54 if (i>prev && val < thresholds[prev]+hysteresis[prev])
55 i=prev;
56 if (i<prev && val > thresholds[prev-1]-hysteresis[prev-1])
57 i=prev;
58 return i;
59 }
60
celt_lcg_rand(opus_uint32 seed)61 opus_uint32 celt_lcg_rand(opus_uint32 seed)
62 {
63 return 1664525 * seed + 1013904223;
64 }
65
66 /* This is a cos() approximation designed to be bit-exact on any platform. Bit exactness
67 with this approximation is important because it has an impact on the bit allocation */
bitexact_cos(opus_int16 x)68 static opus_int16 bitexact_cos(opus_int16 x)
69 {
70 opus_int32 tmp;
71 opus_int16 x2;
72 tmp = (4096+((opus_int32)(x)*(x)))>>13;
73 celt_assert(tmp<=32767);
74 x2 = tmp;
75 x2 = (32767-x2) + FRAC_MUL16(x2, (-7651 + FRAC_MUL16(x2, (8277 + FRAC_MUL16(-626, x2)))));
76 celt_assert(x2<=32766);
77 return 1+x2;
78 }
79
bitexact_log2tan(int isin,int icos)80 static int bitexact_log2tan(int isin,int icos)
81 {
82 int lc;
83 int ls;
84 lc=EC_ILOG(icos);
85 ls=EC_ILOG(isin);
86 icos<<=15-lc;
87 isin<<=15-ls;
88 return (ls-lc)*(1<<11)
89 +FRAC_MUL16(isin, FRAC_MUL16(isin, -2597) + 7932)
90 -FRAC_MUL16(icos, FRAC_MUL16(icos, -2597) + 7932);
91 }
92
93 #ifdef FIXED_POINT
94 /* Compute the amplitude (sqrt energy) in each of the bands */
compute_band_energies(const CELTMode * m,const celt_sig * X,celt_ener * bandE,int end,int C,int M)95 void compute_band_energies(const CELTMode *m, const celt_sig *X, celt_ener *bandE, int end, int C, int M)
96 {
97 int i, c, N;
98 const opus_int16 *eBands = m->eBands;
99 N = M*m->shortMdctSize;
100 c=0; do {
101 for (i=0;i<end;i++)
102 {
103 int j;
104 opus_val32 maxval=0;
105 opus_val32 sum = 0;
106
107 j=M*eBands[i]; do {
108 maxval = MAX32(maxval, X[j+c*N]);
109 maxval = MAX32(maxval, -X[j+c*N]);
110 } while (++j<M*eBands[i+1]);
111
112 if (maxval > 0)
113 {
114 int shift = celt_ilog2(maxval)-10;
115 j=M*eBands[i]; do {
116 sum = MAC16_16(sum, EXTRACT16(VSHR32(X[j+c*N],shift)),
117 EXTRACT16(VSHR32(X[j+c*N],shift)));
118 } while (++j<M*eBands[i+1]);
119 /* We're adding one here to ensure the normalized band isn't larger than unity norm */
120 bandE[i+c*m->nbEBands] = EPSILON+VSHR32(EXTEND32(celt_sqrt(sum)),-shift);
121 } else {
122 bandE[i+c*m->nbEBands] = EPSILON;
123 }
124 /*printf ("%f ", bandE[i+c*m->nbEBands]);*/
125 }
126 } while (++c<C);
127 /*printf ("\n");*/
128 }
129
130 /* Normalise each band such that the energy is one. */
normalise_bands(const CELTMode * m,const celt_sig * OPUS_RESTRICT freq,celt_norm * OPUS_RESTRICT X,const celt_ener * bandE,int end,int C,int M)131 void normalise_bands(const CELTMode *m, const celt_sig * OPUS_RESTRICT freq, celt_norm * OPUS_RESTRICT X, const celt_ener *bandE, int end, int C, int M)
132 {
133 int i, c, N;
134 const opus_int16 *eBands = m->eBands;
135 N = M*m->shortMdctSize;
136 c=0; do {
137 i=0; do {
138 opus_val16 g;
139 int j,shift;
140 opus_val16 E;
141 shift = celt_zlog2(bandE[i+c*m->nbEBands])-13;
142 E = VSHR32(bandE[i+c*m->nbEBands], shift);
143 g = EXTRACT16(celt_rcp(SHL32(E,3)));
144 j=M*eBands[i]; do {
145 X[j+c*N] = MULT16_16_Q15(VSHR32(freq[j+c*N],shift-1),g);
146 } while (++j<M*eBands[i+1]);
147 } while (++i<end);
148 } while (++c<C);
149 }
150
151 #else /* FIXED_POINT */
152 /* Compute the amplitude (sqrt energy) in each of the bands */
compute_band_energies(const CELTMode * m,const celt_sig * X,celt_ener * bandE,int end,int C,int M)153 void compute_band_energies(const CELTMode *m, const celt_sig *X, celt_ener *bandE, int end, int C, int M)
154 {
155 int i, c, N;
156 const opus_int16 *eBands = m->eBands;
157 N = M*m->shortMdctSize;
158 c=0; do {
159 for (i=0;i<end;i++)
160 {
161 int j;
162 opus_val32 sum = 1e-27f;
163 for (j=M*eBands[i];j<M*eBands[i+1];j++)
164 sum += X[j+c*N]*X[j+c*N];
165 bandE[i+c*m->nbEBands] = celt_sqrt(sum);
166 /*printf ("%f ", bandE[i+c*m->nbEBands]);*/
167 }
168 } while (++c<C);
169 /*printf ("\n");*/
170 }
171
172 /* Normalise each band such that the energy is one. */
normalise_bands(const CELTMode * m,const celt_sig * OPUS_RESTRICT freq,celt_norm * OPUS_RESTRICT X,const celt_ener * bandE,int end,int C,int M)173 void normalise_bands(const CELTMode *m, const celt_sig * OPUS_RESTRICT freq, celt_norm * OPUS_RESTRICT X, const celt_ener *bandE, int end, int C, int M)
174 {
175 int i, c, N;
176 const opus_int16 *eBands = m->eBands;
177 N = M*m->shortMdctSize;
178 c=0; do {
179 for (i=0;i<end;i++)
180 {
181 int j;
182 opus_val16 g = 1.f/(1e-27f+bandE[i+c*m->nbEBands]);
183 for (j=M*eBands[i];j<M*eBands[i+1];j++)
184 X[j+c*N] = freq[j+c*N]*g;
185 }
186 } while (++c<C);
187 }
188
189 #endif /* FIXED_POINT */
190
191 /* De-normalise the energy to produce the synthesis from the unit-energy bands */
denormalise_bands(const CELTMode * m,const celt_norm * OPUS_RESTRICT X,celt_sig * OPUS_RESTRICT freq,const opus_val16 * bandLogE,int start,int end,int C,int M)192 void denormalise_bands(const CELTMode *m, const celt_norm * OPUS_RESTRICT X,
193 celt_sig * OPUS_RESTRICT freq, const opus_val16 *bandLogE, int start, int end, int C, int M)
194 {
195 int i, c, N;
196 const opus_int16 *eBands = m->eBands;
197 N = M*m->shortMdctSize;
198 celt_assert2(C<=2, "denormalise_bands() not implemented for >2 channels");
199 c=0; do {
200 celt_sig * OPUS_RESTRICT f;
201 const celt_norm * OPUS_RESTRICT x;
202 f = freq+c*N;
203 x = X+c*N+M*eBands[start];
204 for (i=0;i<M*eBands[start];i++)
205 *f++ = 0;
206 for (i=start;i<end;i++)
207 {
208 int j, band_end;
209 opus_val16 g;
210 opus_val16 lg;
211 #ifdef FIXED_POINT
212 int shift;
213 #endif
214 j=M*eBands[i];
215 band_end = M*eBands[i+1];
216 lg = ADD16(bandLogE[i+c*m->nbEBands], SHL16((opus_val16)eMeans[i],6));
217 #ifdef FIXED_POINT
218 /* Handle the integer part of the log energy */
219 shift = 16-(lg>>DB_SHIFT);
220 if (shift>31)
221 {
222 shift=0;
223 g=0;
224 } else {
225 /* Handle the fractional part. */
226 g = celt_exp2_frac(lg&((1<<DB_SHIFT)-1));
227 }
228 #else
229 g = celt_exp2(lg);
230 #endif
231 do {
232 *f++ = SHR32(MULT16_16(*x++, g), shift);
233 } while (++j<band_end);
234 }
235 celt_assert(start <= end);
236 for (i=M*eBands[end];i<N;i++)
237 *f++ = 0;
238 } while (++c<C);
239 }
240
241 /* This prevents energy collapse for transients with multiple short MDCTs */
anti_collapse(const CELTMode * m,celt_norm * X_,unsigned char * collapse_masks,int LM,int C,int size,int start,int end,opus_val16 * logE,opus_val16 * prev1logE,opus_val16 * prev2logE,int * pulses,opus_uint32 seed)242 void anti_collapse(const CELTMode *m, celt_norm *X_, unsigned char *collapse_masks, int LM, int C, int size,
243 int start, int end, opus_val16 *logE, opus_val16 *prev1logE,
244 opus_val16 *prev2logE, int *pulses, opus_uint32 seed)
245 {
246 int c, i, j, k;
247 for (i=start;i<end;i++)
248 {
249 int N0;
250 opus_val16 thresh, sqrt_1;
251 int depth;
252 #ifdef FIXED_POINT
253 int shift;
254 opus_val32 thresh32;
255 #endif
256
257 N0 = m->eBands[i+1]-m->eBands[i];
258 /* depth in 1/8 bits */
259 depth = (1+pulses[i])/((m->eBands[i+1]-m->eBands[i])<<LM);
260
261 #ifdef FIXED_POINT
262 thresh32 = SHR32(celt_exp2(-SHL16(depth, 10-BITRES)),1);
263 thresh = MULT16_32_Q15(QCONST16(0.5f, 15), MIN32(32767,thresh32));
264 {
265 opus_val32 t;
266 t = N0<<LM;
267 shift = celt_ilog2(t)>>1;
268 t = SHL32(t, (7-shift)<<1);
269 sqrt_1 = celt_rsqrt_norm(t);
270 }
271 #else
272 thresh = .5f*celt_exp2(-.125f*depth);
273 sqrt_1 = celt_rsqrt(N0<<LM);
274 #endif
275
276 c=0; do
277 {
278 celt_norm *X;
279 opus_val16 prev1;
280 opus_val16 prev2;
281 opus_val32 Ediff;
282 opus_val16 r;
283 int renormalize=0;
284 prev1 = prev1logE[c*m->nbEBands+i];
285 prev2 = prev2logE[c*m->nbEBands+i];
286 if (C==1)
287 {
288 prev1 = MAX16(prev1,prev1logE[m->nbEBands+i]);
289 prev2 = MAX16(prev2,prev2logE[m->nbEBands+i]);
290 }
291 Ediff = EXTEND32(logE[c*m->nbEBands+i])-EXTEND32(MIN16(prev1,prev2));
292 Ediff = MAX32(0, Ediff);
293
294 #ifdef FIXED_POINT
295 if (Ediff < 16384)
296 {
297 opus_val32 r32 = SHR32(celt_exp2(-EXTRACT16(Ediff)),1);
298 r = 2*MIN16(16383,r32);
299 } else {
300 r = 0;
301 }
302 if (LM==3)
303 r = MULT16_16_Q14(23170, MIN32(23169, r));
304 r = SHR16(MIN16(thresh, r),1);
305 r = SHR32(MULT16_16_Q15(sqrt_1, r),shift);
306 #else
307 /* r needs to be multiplied by 2 or 2*sqrt(2) depending on LM because
308 short blocks don't have the same energy as long */
309 r = 2.f*celt_exp2(-Ediff);
310 if (LM==3)
311 r *= 1.41421356f;
312 r = MIN16(thresh, r);
313 r = r*sqrt_1;
314 #endif
315 X = X_+c*size+(m->eBands[i]<<LM);
316 for (k=0;k<1<<LM;k++)
317 {
318 /* Detect collapse */
319 if (!(collapse_masks[i*C+c]&1<<k))
320 {
321 /* Fill with noise */
322 for (j=0;j<N0;j++)
323 {
324 seed = celt_lcg_rand(seed);
325 X[(j<<LM)+k] = (seed&0x8000 ? r : -r);
326 }
327 renormalize = 1;
328 }
329 }
330 /* We just added some energy, so we need to renormalise */
331 if (renormalize)
332 renormalise_vector(X, N0<<LM, Q15ONE);
333 } while (++c<C);
334 }
335 }
336
intensity_stereo(const CELTMode * m,celt_norm * X,celt_norm * Y,const celt_ener * bandE,int bandID,int N)337 static void intensity_stereo(const CELTMode *m, celt_norm *X, celt_norm *Y, const celt_ener *bandE, int bandID, int N)
338 {
339 int i = bandID;
340 int j;
341 opus_val16 a1, a2;
342 opus_val16 left, right;
343 opus_val16 norm;
344 #ifdef FIXED_POINT
345 int shift = celt_zlog2(MAX32(bandE[i], bandE[i+m->nbEBands]))-13;
346 #endif
347 left = VSHR32(bandE[i],shift);
348 right = VSHR32(bandE[i+m->nbEBands],shift);
349 norm = EPSILON + celt_sqrt(EPSILON+MULT16_16(left,left)+MULT16_16(right,right));
350 a1 = DIV32_16(SHL32(EXTEND32(left),14),norm);
351 a2 = DIV32_16(SHL32(EXTEND32(right),14),norm);
352 for (j=0;j<N;j++)
353 {
354 celt_norm r, l;
355 l = X[j];
356 r = Y[j];
357 X[j] = MULT16_16_Q14(a1,l) + MULT16_16_Q14(a2,r);
358 /* Side is not encoded, no need to calculate */
359 }
360 }
361
stereo_split(celt_norm * X,celt_norm * Y,int N)362 static void stereo_split(celt_norm *X, celt_norm *Y, int N)
363 {
364 int j;
365 for (j=0;j<N;j++)
366 {
367 celt_norm r, l;
368 l = MULT16_16_Q15(QCONST16(.70710678f,15), X[j]);
369 r = MULT16_16_Q15(QCONST16(.70710678f,15), Y[j]);
370 X[j] = l+r;
371 Y[j] = r-l;
372 }
373 }
374
stereo_merge(celt_norm * X,celt_norm * Y,opus_val16 mid,int N)375 static void stereo_merge(celt_norm *X, celt_norm *Y, opus_val16 mid, int N)
376 {
377 int j;
378 opus_val32 xp=0, side=0;
379 opus_val32 El, Er;
380 opus_val16 mid2;
381 #ifdef FIXED_POINT
382 int kl, kr;
383 #endif
384 opus_val32 t, lgain, rgain;
385
386 /* Compute the norm of X+Y and X-Y as |X|^2 + |Y|^2 +/- sum(xy) */
387 dual_inner_prod(Y, X, Y, N, &xp, &side);
388 /* Compensating for the mid normalization */
389 xp = MULT16_32_Q15(mid, xp);
390 /* mid and side are in Q15, not Q14 like X and Y */
391 mid2 = SHR32(mid, 1);
392 El = MULT16_16(mid2, mid2) + side - 2*xp;
393 Er = MULT16_16(mid2, mid2) + side + 2*xp;
394 if (Er < QCONST32(6e-4f, 28) || El < QCONST32(6e-4f, 28))
395 {
396 for (j=0;j<N;j++)
397 Y[j] = X[j];
398 return;
399 }
400
401 #ifdef FIXED_POINT
402 kl = celt_ilog2(El)>>1;
403 kr = celt_ilog2(Er)>>1;
404 #endif
405 t = VSHR32(El, (kl-7)<<1);
406 lgain = celt_rsqrt_norm(t);
407 t = VSHR32(Er, (kr-7)<<1);
408 rgain = celt_rsqrt_norm(t);
409
410 #ifdef FIXED_POINT
411 if (kl < 7)
412 kl = 7;
413 if (kr < 7)
414 kr = 7;
415 #endif
416
417 for (j=0;j<N;j++)
418 {
419 celt_norm r, l;
420 /* Apply mid scaling (side is already scaled) */
421 l = MULT16_16_Q15(mid, X[j]);
422 r = Y[j];
423 X[j] = EXTRACT16(PSHR32(MULT16_16(lgain, SUB16(l,r)), kl+1));
424 Y[j] = EXTRACT16(PSHR32(MULT16_16(rgain, ADD16(l,r)), kr+1));
425 }
426 }
427
428 /* Decide whether we should spread the pulses in the current frame */
spreading_decision(const CELTMode * m,celt_norm * X,int * average,int last_decision,int * hf_average,int * tapset_decision,int update_hf,int end,int C,int M)429 int spreading_decision(const CELTMode *m, celt_norm *X, int *average,
430 int last_decision, int *hf_average, int *tapset_decision, int update_hf,
431 int end, int C, int M)
432 {
433 int i, c, N0;
434 int sum = 0, nbBands=0;
435 const opus_int16 * OPUS_RESTRICT eBands = m->eBands;
436 int decision;
437 int hf_sum=0;
438
439 celt_assert(end>0);
440
441 N0 = M*m->shortMdctSize;
442
443 if (M*(eBands[end]-eBands[end-1]) <= 8)
444 return SPREAD_NONE;
445 c=0; do {
446 for (i=0;i<end;i++)
447 {
448 int j, N, tmp=0;
449 int tcount[3] = {0,0,0};
450 celt_norm * OPUS_RESTRICT x = X+M*eBands[i]+c*N0;
451 N = M*(eBands[i+1]-eBands[i]);
452 if (N<=8)
453 continue;
454 /* Compute rough CDF of |x[j]| */
455 for (j=0;j<N;j++)
456 {
457 opus_val32 x2N; /* Q13 */
458
459 x2N = MULT16_16(MULT16_16_Q15(x[j], x[j]), N);
460 if (x2N < QCONST16(0.25f,13))
461 tcount[0]++;
462 if (x2N < QCONST16(0.0625f,13))
463 tcount[1]++;
464 if (x2N < QCONST16(0.015625f,13))
465 tcount[2]++;
466 }
467
468 /* Only include four last bands (8 kHz and up) */
469 if (i>m->nbEBands-4)
470 hf_sum += 32*(tcount[1]+tcount[0])/N;
471 tmp = (2*tcount[2] >= N) + (2*tcount[1] >= N) + (2*tcount[0] >= N);
472 sum += tmp*256;
473 nbBands++;
474 }
475 } while (++c<C);
476
477 if (update_hf)
478 {
479 if (hf_sum)
480 hf_sum /= C*(4-m->nbEBands+end);
481 *hf_average = (*hf_average+hf_sum)>>1;
482 hf_sum = *hf_average;
483 if (*tapset_decision==2)
484 hf_sum += 4;
485 else if (*tapset_decision==0)
486 hf_sum -= 4;
487 if (hf_sum > 22)
488 *tapset_decision=2;
489 else if (hf_sum > 18)
490 *tapset_decision=1;
491 else
492 *tapset_decision=0;
493 }
494 /*printf("%d %d %d\n", hf_sum, *hf_average, *tapset_decision);*/
495 celt_assert(nbBands>0); /*M*(eBands[end]-eBands[end-1]) <= 8 assures this*/
496 sum /= nbBands;
497 /* Recursive averaging */
498 sum = (sum+*average)>>1;
499 *average = sum;
500 /* Hysteresis */
501 sum = (3*sum + (((3-last_decision)<<7) + 64) + 2)>>2;
502 if (sum < 80)
503 {
504 decision = SPREAD_AGGRESSIVE;
505 } else if (sum < 256)
506 {
507 decision = SPREAD_NORMAL;
508 } else if (sum < 384)
509 {
510 decision = SPREAD_LIGHT;
511 } else {
512 decision = SPREAD_NONE;
513 }
514 #ifdef FUZZING
515 decision = rand()&0x3;
516 *tapset_decision=rand()%3;
517 #endif
518 return decision;
519 }
520
521 /* Indexing table for converting from natural Hadamard to ordery Hadamard
522 This is essentially a bit-reversed Gray, on top of which we've added
523 an inversion of the order because we want the DC at the end rather than
524 the beginning. The lines are for N=2, 4, 8, 16 */
525 static const int ordery_table[] = {
526 1, 0,
527 3, 0, 2, 1,
528 7, 0, 4, 3, 6, 1, 5, 2,
529 15, 0, 8, 7, 12, 3, 11, 4, 14, 1, 9, 6, 13, 2, 10, 5,
530 };
531
deinterleave_hadamard(celt_norm * X,int N0,int stride,int hadamard)532 static void deinterleave_hadamard(celt_norm *X, int N0, int stride, int hadamard)
533 {
534 int i,j;
535 VARDECL(celt_norm, tmp);
536 int N;
537 SAVE_STACK;
538 N = N0*stride;
539 ALLOC(tmp, N, celt_norm);
540 celt_assert(stride>0);
541 if (hadamard)
542 {
543 const int *ordery = ordery_table+stride-2;
544 for (i=0;i<stride;i++)
545 {
546 for (j=0;j<N0;j++)
547 tmp[ordery[i]*N0+j] = X[j*stride+i];
548 }
549 } else {
550 for (i=0;i<stride;i++)
551 for (j=0;j<N0;j++)
552 tmp[i*N0+j] = X[j*stride+i];
553 }
554 for (j=0;j<N;j++)
555 X[j] = tmp[j];
556 RESTORE_STACK;
557 }
558
interleave_hadamard(celt_norm * X,int N0,int stride,int hadamard)559 static void interleave_hadamard(celt_norm *X, int N0, int stride, int hadamard)
560 {
561 int i,j;
562 VARDECL(celt_norm, tmp);
563 int N;
564 SAVE_STACK;
565 N = N0*stride;
566 ALLOC(tmp, N, celt_norm);
567 if (hadamard)
568 {
569 const int *ordery = ordery_table+stride-2;
570 for (i=0;i<stride;i++)
571 for (j=0;j<N0;j++)
572 tmp[j*stride+i] = X[ordery[i]*N0+j];
573 } else {
574 for (i=0;i<stride;i++)
575 for (j=0;j<N0;j++)
576 tmp[j*stride+i] = X[i*N0+j];
577 }
578 for (j=0;j<N;j++)
579 X[j] = tmp[j];
580 RESTORE_STACK;
581 }
582
haar1(celt_norm * X,int N0,int stride)583 void haar1(celt_norm *X, int N0, int stride)
584 {
585 int i, j;
586 N0 >>= 1;
587 for (i=0;i<stride;i++)
588 for (j=0;j<N0;j++)
589 {
590 celt_norm tmp1, tmp2;
591 tmp1 = MULT16_16_Q15(QCONST16(.70710678f,15), X[stride*2*j+i]);
592 tmp2 = MULT16_16_Q15(QCONST16(.70710678f,15), X[stride*(2*j+1)+i]);
593 X[stride*2*j+i] = tmp1 + tmp2;
594 X[stride*(2*j+1)+i] = tmp1 - tmp2;
595 }
596 }
597
compute_qn(int N,int b,int offset,int pulse_cap,int stereo)598 static int compute_qn(int N, int b, int offset, int pulse_cap, int stereo)
599 {
600 static const opus_int16 exp2_table8[8] =
601 {16384, 17866, 19483, 21247, 23170, 25267, 27554, 30048};
602 int qn, qb;
603 int N2 = 2*N-1;
604 if (stereo && N==2)
605 N2--;
606 /* The upper limit ensures that in a stereo split with itheta==16384, we'll
607 always have enough bits left over to code at least one pulse in the
608 side; otherwise it would collapse, since it doesn't get folded. */
609 qb = IMIN(b-pulse_cap-(4<<BITRES), (b+N2*offset)/N2);
610
611 qb = IMIN(8<<BITRES, qb);
612
613 if (qb<(1<<BITRES>>1)) {
614 qn = 1;
615 } else {
616 qn = exp2_table8[qb&0x7]>>(14-(qb>>BITRES));
617 qn = (qn+1)>>1<<1;
618 }
619 celt_assert(qn <= 256);
620 return qn;
621 }
622
623 struct band_ctx {
624 int encode;
625 const CELTMode *m;
626 int i;
627 int intensity;
628 int spread;
629 int tf_change;
630 ec_ctx *ec;
631 opus_int32 remaining_bits;
632 const celt_ener *bandE;
633 opus_uint32 seed;
634 };
635
636 struct split_ctx {
637 int inv;
638 int imid;
639 int iside;
640 int delta;
641 int itheta;
642 int qalloc;
643 };
644
compute_theta(struct band_ctx * ctx,struct split_ctx * sctx,celt_norm * X,celt_norm * Y,int N,int * b,int B,int B0,int LM,int stereo,int * fill)645 static void compute_theta(struct band_ctx *ctx, struct split_ctx *sctx,
646 celt_norm *X, celt_norm *Y, int N, int *b, int B, int B0,
647 int LM,
648 int stereo, int *fill)
649 {
650 int qn;
651 int itheta=0;
652 int delta;
653 int imid, iside;
654 int qalloc;
655 int pulse_cap;
656 int offset;
657 opus_int32 tell;
658 int inv=0;
659 int encode;
660 const CELTMode *m;
661 int i;
662 int intensity;
663 ec_ctx *ec;
664 const celt_ener *bandE;
665
666 encode = ctx->encode;
667 m = ctx->m;
668 i = ctx->i;
669 intensity = ctx->intensity;
670 ec = ctx->ec;
671 bandE = ctx->bandE;
672
673 /* Decide on the resolution to give to the split parameter theta */
674 pulse_cap = m->logN[i]+LM*(1<<BITRES);
675 offset = (pulse_cap>>1) - (stereo&&N==2 ? QTHETA_OFFSET_TWOPHASE : QTHETA_OFFSET);
676 qn = compute_qn(N, *b, offset, pulse_cap, stereo);
677 if (stereo && i>=intensity)
678 qn = 1;
679 if (encode)
680 {
681 /* theta is the atan() of the ratio between the (normalized)
682 side and mid. With just that parameter, we can re-scale both
683 mid and side because we know that 1) they have unit norm and
684 2) they are orthogonal. */
685 itheta = stereo_itheta(X, Y, stereo, N);
686 }
687 tell = ec_tell_frac(ec);
688 if (qn!=1)
689 {
690 if (encode)
691 itheta = (itheta*qn+8192)>>14;
692
693 /* Entropy coding of the angle. We use a uniform pdf for the
694 time split, a step for stereo, and a triangular one for the rest. */
695 if (stereo && N>2)
696 {
697 int p0 = 3;
698 int x = itheta;
699 int x0 = qn/2;
700 int ft = p0*(x0+1) + x0;
701 /* Use a probability of p0 up to itheta=8192 and then use 1 after */
702 if (encode)
703 {
704 ec_encode(ec,x<=x0?p0*x:(x-1-x0)+(x0+1)*p0,x<=x0?p0*(x+1):(x-x0)+(x0+1)*p0,ft);
705 } else {
706 int fs;
707 fs=ec_decode(ec,ft);
708 if (fs<(x0+1)*p0)
709 x=fs/p0;
710 else
711 x=x0+1+(fs-(x0+1)*p0);
712 ec_dec_update(ec,x<=x0?p0*x:(x-1-x0)+(x0+1)*p0,x<=x0?p0*(x+1):(x-x0)+(x0+1)*p0,ft);
713 itheta = x;
714 }
715 } else if (B0>1 || stereo) {
716 /* Uniform pdf */
717 if (encode)
718 ec_enc_uint(ec, itheta, qn+1);
719 else
720 itheta = ec_dec_uint(ec, qn+1);
721 } else {
722 int fs=1, ft;
723 ft = ((qn>>1)+1)*((qn>>1)+1);
724 if (encode)
725 {
726 int fl;
727
728 fs = itheta <= (qn>>1) ? itheta + 1 : qn + 1 - itheta;
729 fl = itheta <= (qn>>1) ? itheta*(itheta + 1)>>1 :
730 ft - ((qn + 1 - itheta)*(qn + 2 - itheta)>>1);
731
732 ec_encode(ec, fl, fl+fs, ft);
733 } else {
734 /* Triangular pdf */
735 int fl=0;
736 int fm;
737 fm = ec_decode(ec, ft);
738
739 if (fm < ((qn>>1)*((qn>>1) + 1)>>1))
740 {
741 itheta = (isqrt32(8*(opus_uint32)fm + 1) - 1)>>1;
742 fs = itheta + 1;
743 fl = itheta*(itheta + 1)>>1;
744 }
745 else
746 {
747 itheta = (2*(qn + 1)
748 - isqrt32(8*(opus_uint32)(ft - fm - 1) + 1))>>1;
749 fs = qn + 1 - itheta;
750 fl = ft - ((qn + 1 - itheta)*(qn + 2 - itheta)>>1);
751 }
752
753 ec_dec_update(ec, fl, fl+fs, ft);
754 }
755 }
756 itheta = (opus_int32)itheta*16384/qn;
757 if (encode && stereo)
758 {
759 if (itheta==0)
760 intensity_stereo(m, X, Y, bandE, i, N);
761 else
762 stereo_split(X, Y, N);
763 }
764 /* NOTE: Renormalising X and Y *may* help fixed-point a bit at very high rate.
765 Let's do that at higher complexity */
766 } else if (stereo) {
767 if (encode)
768 {
769 inv = itheta > 8192;
770 if (inv)
771 {
772 int j;
773 for (j=0;j<N;j++)
774 Y[j] = -Y[j];
775 }
776 intensity_stereo(m, X, Y, bandE, i, N);
777 }
778 if (*b>2<<BITRES && ctx->remaining_bits > 2<<BITRES)
779 {
780 if (encode)
781 ec_enc_bit_logp(ec, inv, 2);
782 else
783 inv = ec_dec_bit_logp(ec, 2);
784 } else
785 inv = 0;
786 itheta = 0;
787 }
788 qalloc = ec_tell_frac(ec) - tell;
789 *b -= qalloc;
790
791 if (itheta == 0)
792 {
793 imid = 32767;
794 iside = 0;
795 *fill &= (1<<B)-1;
796 delta = -16384;
797 } else if (itheta == 16384)
798 {
799 imid = 0;
800 iside = 32767;
801 *fill &= ((1<<B)-1)<<B;
802 delta = 16384;
803 } else {
804 imid = bitexact_cos((opus_int16)itheta);
805 iside = bitexact_cos((opus_int16)(16384-itheta));
806 /* This is the mid vs side allocation that minimizes squared error
807 in that band. */
808 delta = FRAC_MUL16((N-1)<<7,bitexact_log2tan(iside,imid));
809 }
810
811 sctx->inv = inv;
812 sctx->imid = imid;
813 sctx->iside = iside;
814 sctx->delta = delta;
815 sctx->itheta = itheta;
816 sctx->qalloc = qalloc;
817 }
quant_band_n1(struct band_ctx * ctx,celt_norm * X,celt_norm * Y,int b,celt_norm * lowband_out)818 static unsigned quant_band_n1(struct band_ctx *ctx, celt_norm *X, celt_norm *Y, int b,
819 celt_norm *lowband_out)
820 {
821 #ifdef RESYNTH
822 int resynth = 1;
823 #else
824 int resynth = !ctx->encode;
825 #endif
826 int c;
827 int stereo;
828 celt_norm *x = X;
829 int encode;
830 ec_ctx *ec;
831
832 encode = ctx->encode;
833 ec = ctx->ec;
834
835 stereo = Y != NULL;
836 c=0; do {
837 int sign=0;
838 if (ctx->remaining_bits>=1<<BITRES)
839 {
840 if (encode)
841 {
842 sign = x[0]<0;
843 ec_enc_bits(ec, sign, 1);
844 } else {
845 sign = ec_dec_bits(ec, 1);
846 }
847 ctx->remaining_bits -= 1<<BITRES;
848 b-=1<<BITRES;
849 }
850 if (resynth)
851 x[0] = sign ? -NORM_SCALING : NORM_SCALING;
852 x = Y;
853 } while (++c<1+stereo);
854 if (lowband_out)
855 lowband_out[0] = SHR16(X[0],4);
856 return 1;
857 }
858
859 /* This function is responsible for encoding and decoding a mono partition.
860 It can split the band in two and transmit the energy difference with
861 the two half-bands. It can be called recursively so bands can end up being
862 split in 8 parts. */
quant_partition(struct band_ctx * ctx,celt_norm * X,int N,int b,int B,celt_norm * lowband,int LM,opus_val16 gain,int fill)863 static unsigned quant_partition(struct band_ctx *ctx, celt_norm *X,
864 int N, int b, int B, celt_norm *lowband,
865 int LM,
866 opus_val16 gain, int fill)
867 {
868 const unsigned char *cache;
869 int q;
870 int curr_bits;
871 int imid=0, iside=0;
872 int N_B=N;
873 int B0=B;
874 opus_val16 mid=0, side=0;
875 unsigned cm=0;
876 #ifdef RESYNTH
877 int resynth = 1;
878 #else
879 int resynth = !ctx->encode;
880 #endif
881 celt_norm *Y=NULL;
882 int encode;
883 const CELTMode *m;
884 int i;
885 int spread;
886 ec_ctx *ec;
887
888 encode = ctx->encode;
889 m = ctx->m;
890 i = ctx->i;
891 spread = ctx->spread;
892 ec = ctx->ec;
893
894 N_B /= B;
895
896 /* If we need 1.5 more bit than we can produce, split the band in two. */
897 cache = m->cache.bits + m->cache.index[(LM+1)*m->nbEBands+i];
898 if (LM != -1 && b > cache[cache[0]]+12 && N>2)
899 {
900 int mbits, sbits, delta;
901 int itheta;
902 int qalloc;
903 struct split_ctx sctx;
904 celt_norm *next_lowband2=NULL;
905 opus_int32 rebalance;
906
907 N >>= 1;
908 Y = X+N;
909 LM -= 1;
910 if (B==1)
911 fill = (fill&1)|(fill<<1);
912 B = (B+1)>>1;
913
914 compute_theta(ctx, &sctx, X, Y, N, &b, B, B0,
915 LM, 0, &fill);
916 imid = sctx.imid;
917 iside = sctx.iside;
918 delta = sctx.delta;
919 itheta = sctx.itheta;
920 qalloc = sctx.qalloc;
921 #ifdef FIXED_POINT
922 mid = imid;
923 side = iside;
924 #else
925 mid = (1.f/32768)*imid;
926 side = (1.f/32768)*iside;
927 #endif
928
929 /* Give more bits to low-energy MDCTs than they would otherwise deserve */
930 if (B0>1 && (itheta&0x3fff))
931 {
932 if (itheta > 8192)
933 /* Rough approximation for pre-echo masking */
934 delta -= delta>>(4-LM);
935 else
936 /* Corresponds to a forward-masking slope of 1.5 dB per 10 ms */
937 delta = IMIN(0, delta + (N<<BITRES>>(5-LM)));
938 }
939 mbits = IMAX(0, IMIN(b, (b-delta)/2));
940 sbits = b-mbits;
941 ctx->remaining_bits -= qalloc;
942
943 if (lowband)
944 next_lowband2 = lowband+N; /* >32-bit split case */
945
946 rebalance = ctx->remaining_bits;
947 if (mbits >= sbits)
948 {
949 cm = quant_partition(ctx, X, N, mbits, B,
950 lowband, LM,
951 MULT16_16_P15(gain,mid), fill);
952 rebalance = mbits - (rebalance-ctx->remaining_bits);
953 if (rebalance > 3<<BITRES && itheta!=0)
954 sbits += rebalance - (3<<BITRES);
955 cm |= quant_partition(ctx, Y, N, sbits, B,
956 next_lowband2, LM,
957 MULT16_16_P15(gain,side), fill>>B)<<(B0>>1);
958 } else {
959 cm = quant_partition(ctx, Y, N, sbits, B,
960 next_lowband2, LM,
961 MULT16_16_P15(gain,side), fill>>B)<<(B0>>1);
962 rebalance = sbits - (rebalance-ctx->remaining_bits);
963 if (rebalance > 3<<BITRES && itheta!=16384)
964 mbits += rebalance - (3<<BITRES);
965 cm |= quant_partition(ctx, X, N, mbits, B,
966 lowband, LM,
967 MULT16_16_P15(gain,mid), fill);
968 }
969 } else {
970 /* This is the basic no-split case */
971 q = bits2pulses(m, i, LM, b);
972 curr_bits = pulses2bits(m, i, LM, q);
973 ctx->remaining_bits -= curr_bits;
974
975 /* Ensures we can never bust the budget */
976 while (ctx->remaining_bits < 0 && q > 0)
977 {
978 ctx->remaining_bits += curr_bits;
979 q--;
980 curr_bits = pulses2bits(m, i, LM, q);
981 ctx->remaining_bits -= curr_bits;
982 }
983
984 if (q!=0)
985 {
986 int K = get_pulses(q);
987
988 /* Finally do the actual quantization */
989 if (encode)
990 {
991 cm = alg_quant(X, N, K, spread, B, ec
992 #ifdef RESYNTH
993 , gain
994 #endif
995 );
996 } else {
997 cm = alg_unquant(X, N, K, spread, B, ec, gain);
998 }
999 } else {
1000 /* If there's no pulse, fill the band anyway */
1001 int j;
1002 if (resynth)
1003 {
1004 unsigned cm_mask;
1005 /* B can be as large as 16, so this shift might overflow an int on a
1006 16-bit platform; use a long to get defined behavior.*/
1007 cm_mask = (unsigned)(1UL<<B)-1;
1008 fill &= cm_mask;
1009 if (!fill)
1010 {
1011 for (j=0;j<N;j++)
1012 X[j] = 0;
1013 } else {
1014 if (lowband == NULL)
1015 {
1016 /* Noise */
1017 for (j=0;j<N;j++)
1018 {
1019 ctx->seed = celt_lcg_rand(ctx->seed);
1020 X[j] = (celt_norm)((opus_int32)ctx->seed>>20);
1021 }
1022 cm = cm_mask;
1023 } else {
1024 /* Folded spectrum */
1025 for (j=0;j<N;j++)
1026 {
1027 opus_val16 tmp;
1028 ctx->seed = celt_lcg_rand(ctx->seed);
1029 /* About 48 dB below the "normal" folding level */
1030 tmp = QCONST16(1.0f/256, 10);
1031 tmp = (ctx->seed)&0x8000 ? tmp : -tmp;
1032 X[j] = lowband[j]+tmp;
1033 }
1034 cm = fill;
1035 }
1036 renormalise_vector(X, N, gain);
1037 }
1038 }
1039 }
1040 }
1041
1042 return cm;
1043 }
1044
1045
1046 /* This function is responsible for encoding and decoding a band for the mono case. */
quant_band(struct band_ctx * ctx,celt_norm * X,int N,int b,int B,celt_norm * lowband,int LM,celt_norm * lowband_out,opus_val16 gain,celt_norm * lowband_scratch,int fill)1047 static unsigned quant_band(struct band_ctx *ctx, celt_norm *X,
1048 int N, int b, int B, celt_norm *lowband,
1049 int LM, celt_norm *lowband_out,
1050 opus_val16 gain, celt_norm *lowband_scratch, int fill)
1051 {
1052 int N0=N;
1053 int N_B=N;
1054 int N_B0;
1055 int B0=B;
1056 int time_divide=0;
1057 int recombine=0;
1058 int longBlocks;
1059 unsigned cm=0;
1060 #ifdef RESYNTH
1061 int resynth = 1;
1062 #else
1063 int resynth = !ctx->encode;
1064 #endif
1065 int k;
1066 int encode;
1067 int tf_change;
1068
1069 encode = ctx->encode;
1070 tf_change = ctx->tf_change;
1071
1072 longBlocks = B0==1;
1073
1074 N_B /= B;
1075 N_B0 = N_B;
1076
1077 /* Special case for one sample */
1078 if (N==1)
1079 {
1080 return quant_band_n1(ctx, X, NULL, b, lowband_out);
1081 }
1082
1083 if (tf_change>0)
1084 recombine = tf_change;
1085 /* Band recombining to increase frequency resolution */
1086
1087 if (lowband_scratch && lowband && (recombine || ((N_B&1) == 0 && tf_change<0) || B0>1))
1088 {
1089 int j;
1090 for (j=0;j<N;j++)
1091 lowband_scratch[j] = lowband[j];
1092 lowband = lowband_scratch;
1093 }
1094
1095 for (k=0;k<recombine;k++)
1096 {
1097 static const unsigned char bit_interleave_table[16]={
1098 0,1,1,1,2,3,3,3,2,3,3,3,2,3,3,3
1099 };
1100 if (encode)
1101 haar1(X, N>>k, 1<<k);
1102 if (lowband)
1103 haar1(lowband, N>>k, 1<<k);
1104 fill = bit_interleave_table[fill&0xF]|bit_interleave_table[fill>>4]<<2;
1105 }
1106 B>>=recombine;
1107 N_B<<=recombine;
1108
1109 /* Increasing the time resolution */
1110 while ((N_B&1) == 0 && tf_change<0)
1111 {
1112 if (encode)
1113 haar1(X, N_B, B);
1114 if (lowband)
1115 haar1(lowband, N_B, B);
1116 fill |= fill<<B;
1117 B <<= 1;
1118 N_B >>= 1;
1119 time_divide++;
1120 tf_change++;
1121 }
1122 B0=B;
1123 N_B0 = N_B;
1124
1125 /* Reorganize the samples in time order instead of frequency order */
1126 if (B0>1)
1127 {
1128 if (encode)
1129 deinterleave_hadamard(X, N_B>>recombine, B0<<recombine, longBlocks);
1130 if (lowband)
1131 deinterleave_hadamard(lowband, N_B>>recombine, B0<<recombine, longBlocks);
1132 }
1133
1134 cm = quant_partition(ctx, X, N, b, B, lowband,
1135 LM, gain, fill);
1136
1137 /* This code is used by the decoder and by the resynthesis-enabled encoder */
1138 if (resynth)
1139 {
1140 /* Undo the sample reorganization going from time order to frequency order */
1141 if (B0>1)
1142 interleave_hadamard(X, N_B>>recombine, B0<<recombine, longBlocks);
1143
1144 /* Undo time-freq changes that we did earlier */
1145 N_B = N_B0;
1146 B = B0;
1147 for (k=0;k<time_divide;k++)
1148 {
1149 B >>= 1;
1150 N_B <<= 1;
1151 cm |= cm>>B;
1152 haar1(X, N_B, B);
1153 }
1154
1155 for (k=0;k<recombine;k++)
1156 {
1157 static const unsigned char bit_deinterleave_table[16]={
1158 0x00,0x03,0x0C,0x0F,0x30,0x33,0x3C,0x3F,
1159 0xC0,0xC3,0xCC,0xCF,0xF0,0xF3,0xFC,0xFF
1160 };
1161 cm = bit_deinterleave_table[cm];
1162 haar1(X, N0>>k, 1<<k);
1163 }
1164 B<<=recombine;
1165
1166 /* Scale output for later folding */
1167 if (lowband_out)
1168 {
1169 int j;
1170 opus_val16 n;
1171 n = celt_sqrt(SHL32(EXTEND32(N0),22));
1172 for (j=0;j<N0;j++)
1173 lowband_out[j] = MULT16_16_Q15(n,X[j]);
1174 }
1175 cm &= (1<<B)-1;
1176 }
1177 return cm;
1178 }
1179
1180
1181 /* This function is responsible for encoding and decoding a band for the stereo case. */
quant_band_stereo(struct band_ctx * ctx,celt_norm * X,celt_norm * Y,int N,int b,int B,celt_norm * lowband,int LM,celt_norm * lowband_out,celt_norm * lowband_scratch,int fill)1182 static unsigned quant_band_stereo(struct band_ctx *ctx, celt_norm *X, celt_norm *Y,
1183 int N, int b, int B, celt_norm *lowband,
1184 int LM, celt_norm *lowband_out,
1185 celt_norm *lowband_scratch, int fill)
1186 {
1187 int imid=0, iside=0;
1188 int inv = 0;
1189 opus_val16 mid=0, side=0;
1190 unsigned cm=0;
1191 #ifdef RESYNTH
1192 int resynth = 1;
1193 #else
1194 int resynth = !ctx->encode;
1195 #endif
1196 int mbits, sbits, delta;
1197 int itheta;
1198 int qalloc;
1199 struct split_ctx sctx;
1200 int orig_fill;
1201 int encode;
1202 ec_ctx *ec;
1203
1204 encode = ctx->encode;
1205 ec = ctx->ec;
1206
1207 /* Special case for one sample */
1208 if (N==1)
1209 {
1210 return quant_band_n1(ctx, X, Y, b, lowband_out);
1211 }
1212
1213 orig_fill = fill;
1214
1215 compute_theta(ctx, &sctx, X, Y, N, &b, B, B,
1216 LM, 1, &fill);
1217 inv = sctx.inv;
1218 imid = sctx.imid;
1219 iside = sctx.iside;
1220 delta = sctx.delta;
1221 itheta = sctx.itheta;
1222 qalloc = sctx.qalloc;
1223 #ifdef FIXED_POINT
1224 mid = imid;
1225 side = iside;
1226 #else
1227 mid = (1.f/32768)*imid;
1228 side = (1.f/32768)*iside;
1229 #endif
1230
1231 /* This is a special case for N=2 that only works for stereo and takes
1232 advantage of the fact that mid and side are orthogonal to encode
1233 the side with just one bit. */
1234 if (N==2)
1235 {
1236 int c;
1237 int sign=0;
1238 celt_norm *x2, *y2;
1239 mbits = b;
1240 sbits = 0;
1241 /* Only need one bit for the side. */
1242 if (itheta != 0 && itheta != 16384)
1243 sbits = 1<<BITRES;
1244 mbits -= sbits;
1245 c = itheta > 8192;
1246 ctx->remaining_bits -= qalloc+sbits;
1247
1248 x2 = c ? Y : X;
1249 y2 = c ? X : Y;
1250 if (sbits)
1251 {
1252 if (encode)
1253 {
1254 /* Here we only need to encode a sign for the side. */
1255 sign = x2[0]*y2[1] - x2[1]*y2[0] < 0;
1256 ec_enc_bits(ec, sign, 1);
1257 } else {
1258 sign = ec_dec_bits(ec, 1);
1259 }
1260 }
1261 sign = 1-2*sign;
1262 /* We use orig_fill here because we want to fold the side, but if
1263 itheta==16384, we'll have cleared the low bits of fill. */
1264 cm = quant_band(ctx, x2, N, mbits, B, lowband,
1265 LM, lowband_out, Q15ONE, lowband_scratch, orig_fill);
1266 /* We don't split N=2 bands, so cm is either 1 or 0 (for a fold-collapse),
1267 and there's no need to worry about mixing with the other channel. */
1268 y2[0] = -sign*x2[1];
1269 y2[1] = sign*x2[0];
1270 if (resynth)
1271 {
1272 celt_norm tmp;
1273 X[0] = MULT16_16_Q15(mid, X[0]);
1274 X[1] = MULT16_16_Q15(mid, X[1]);
1275 Y[0] = MULT16_16_Q15(side, Y[0]);
1276 Y[1] = MULT16_16_Q15(side, Y[1]);
1277 tmp = X[0];
1278 X[0] = SUB16(tmp,Y[0]);
1279 Y[0] = ADD16(tmp,Y[0]);
1280 tmp = X[1];
1281 X[1] = SUB16(tmp,Y[1]);
1282 Y[1] = ADD16(tmp,Y[1]);
1283 }
1284 } else {
1285 /* "Normal" split code */
1286 opus_int32 rebalance;
1287
1288 mbits = IMAX(0, IMIN(b, (b-delta)/2));
1289 sbits = b-mbits;
1290 ctx->remaining_bits -= qalloc;
1291
1292 rebalance = ctx->remaining_bits;
1293 if (mbits >= sbits)
1294 {
1295 /* In stereo mode, we do not apply a scaling to the mid because we need the normalized
1296 mid for folding later. */
1297 cm = quant_band(ctx, X, N, mbits, B,
1298 lowband, LM, lowband_out,
1299 Q15ONE, lowband_scratch, fill);
1300 rebalance = mbits - (rebalance-ctx->remaining_bits);
1301 if (rebalance > 3<<BITRES && itheta!=0)
1302 sbits += rebalance - (3<<BITRES);
1303
1304 /* For a stereo split, the high bits of fill are always zero, so no
1305 folding will be done to the side. */
1306 cm |= quant_band(ctx, Y, N, sbits, B,
1307 NULL, LM, NULL,
1308 side, NULL, fill>>B);
1309 } else {
1310 /* For a stereo split, the high bits of fill are always zero, so no
1311 folding will be done to the side. */
1312 cm = quant_band(ctx, Y, N, sbits, B,
1313 NULL, LM, NULL,
1314 side, NULL, fill>>B);
1315 rebalance = sbits - (rebalance-ctx->remaining_bits);
1316 if (rebalance > 3<<BITRES && itheta!=16384)
1317 mbits += rebalance - (3<<BITRES);
1318 /* In stereo mode, we do not apply a scaling to the mid because we need the normalized
1319 mid for folding later. */
1320 cm |= quant_band(ctx, X, N, mbits, B,
1321 lowband, LM, lowband_out,
1322 Q15ONE, lowband_scratch, fill);
1323 }
1324 }
1325
1326
1327 /* This code is used by the decoder and by the resynthesis-enabled encoder */
1328 if (resynth)
1329 {
1330 if (N!=2)
1331 stereo_merge(X, Y, mid, N);
1332 if (inv)
1333 {
1334 int j;
1335 for (j=0;j<N;j++)
1336 Y[j] = -Y[j];
1337 }
1338 }
1339 return cm;
1340 }
1341
1342
quant_all_bands(int encode,const CELTMode * m,int start,int end,celt_norm * X_,celt_norm * Y_,unsigned char * collapse_masks,const celt_ener * bandE,int * pulses,int shortBlocks,int spread,int dual_stereo,int intensity,int * tf_res,opus_int32 total_bits,opus_int32 balance,ec_ctx * ec,int LM,int codedBands,opus_uint32 * seed)1343 void quant_all_bands(int encode, const CELTMode *m, int start, int end,
1344 celt_norm *X_, celt_norm *Y_, unsigned char *collapse_masks, const celt_ener *bandE, int *pulses,
1345 int shortBlocks, int spread, int dual_stereo, int intensity, int *tf_res,
1346 opus_int32 total_bits, opus_int32 balance, ec_ctx *ec, int LM, int codedBands, opus_uint32 *seed)
1347 {
1348 int i;
1349 opus_int32 remaining_bits;
1350 const opus_int16 * OPUS_RESTRICT eBands = m->eBands;
1351 celt_norm * OPUS_RESTRICT norm, * OPUS_RESTRICT norm2;
1352 VARDECL(celt_norm, _norm);
1353 celt_norm *lowband_scratch;
1354 int B;
1355 int M;
1356 int lowband_offset;
1357 int update_lowband = 1;
1358 int C = Y_ != NULL ? 2 : 1;
1359 int norm_offset;
1360 #ifdef RESYNTH
1361 int resynth = 1;
1362 #else
1363 int resynth = !encode;
1364 #endif
1365 struct band_ctx ctx;
1366 SAVE_STACK;
1367
1368 M = 1<<LM;
1369 B = shortBlocks ? M : 1;
1370 norm_offset = M*eBands[start];
1371 /* No need to allocate norm for the last band because we don't need an
1372 output in that band. */
1373 ALLOC(_norm, C*(M*eBands[m->nbEBands-1]-norm_offset), celt_norm);
1374 norm = _norm;
1375 norm2 = norm + M*eBands[m->nbEBands-1]-norm_offset;
1376 /* We can use the last band as scratch space because we don't need that
1377 scratch space for the last band. */
1378 lowband_scratch = X_+M*eBands[m->nbEBands-1];
1379
1380 lowband_offset = 0;
1381 ctx.bandE = bandE;
1382 ctx.ec = ec;
1383 ctx.encode = encode;
1384 ctx.intensity = intensity;
1385 ctx.m = m;
1386 ctx.seed = *seed;
1387 ctx.spread = spread;
1388 for (i=start;i<end;i++)
1389 {
1390 opus_int32 tell;
1391 int b;
1392 int N;
1393 opus_int32 curr_balance;
1394 int effective_lowband=-1;
1395 celt_norm * OPUS_RESTRICT X, * OPUS_RESTRICT Y;
1396 int tf_change=0;
1397 unsigned x_cm;
1398 unsigned y_cm;
1399 int last;
1400
1401 ctx.i = i;
1402 last = (i==end-1);
1403
1404 X = X_+M*eBands[i];
1405 if (Y_!=NULL)
1406 Y = Y_+M*eBands[i];
1407 else
1408 Y = NULL;
1409 N = M*eBands[i+1]-M*eBands[i];
1410 tell = ec_tell_frac(ec);
1411
1412 /* Compute how many bits we want to allocate to this band */
1413 if (i != start)
1414 balance -= tell;
1415 remaining_bits = total_bits-tell-1;
1416 ctx.remaining_bits = remaining_bits;
1417 if (i <= codedBands-1)
1418 {
1419 curr_balance = balance / IMIN(3, codedBands-i);
1420 b = IMAX(0, IMIN(16383, IMIN(remaining_bits+1,pulses[i]+curr_balance)));
1421 } else {
1422 b = 0;
1423 }
1424
1425 if (resynth && M*eBands[i]-N >= M*eBands[start] && (update_lowband || lowband_offset==0))
1426 lowband_offset = i;
1427
1428 tf_change = tf_res[i];
1429 ctx.tf_change = tf_change;
1430 if (i>=m->effEBands)
1431 {
1432 X=norm;
1433 if (Y_!=NULL)
1434 Y = norm;
1435 lowband_scratch = NULL;
1436 }
1437 if (i==end-1)
1438 lowband_scratch = NULL;
1439
1440 /* Get a conservative estimate of the collapse_mask's for the bands we're
1441 going to be folding from. */
1442 if (lowband_offset != 0 && (spread!=SPREAD_AGGRESSIVE || B>1 || tf_change<0))
1443 {
1444 int fold_start;
1445 int fold_end;
1446 int fold_i;
1447 /* This ensures we never repeat spectral content within one band */
1448 effective_lowband = IMAX(0, M*eBands[lowband_offset]-norm_offset-N);
1449 fold_start = lowband_offset;
1450 while(M*eBands[--fold_start] > effective_lowband+norm_offset);
1451 fold_end = lowband_offset-1;
1452 while(M*eBands[++fold_end] < effective_lowband+norm_offset+N);
1453 x_cm = y_cm = 0;
1454 fold_i = fold_start; do {
1455 x_cm |= collapse_masks[fold_i*C+0];
1456 y_cm |= collapse_masks[fold_i*C+C-1];
1457 } while (++fold_i<fold_end);
1458 }
1459 /* Otherwise, we'll be using the LCG to fold, so all blocks will (almost
1460 always) be non-zero. */
1461 else
1462 x_cm = y_cm = (1<<B)-1;
1463
1464 if (dual_stereo && i==intensity)
1465 {
1466 int j;
1467
1468 /* Switch off dual stereo to do intensity. */
1469 dual_stereo = 0;
1470 if (resynth)
1471 for (j=0;j<M*eBands[i]-norm_offset;j++)
1472 norm[j] = HALF32(norm[j]+norm2[j]);
1473 }
1474 if (dual_stereo)
1475 {
1476 x_cm = quant_band(&ctx, X, N, b/2, B,
1477 effective_lowband != -1 ? norm+effective_lowband : NULL, LM,
1478 last?NULL:norm+M*eBands[i]-norm_offset, Q15ONE, lowband_scratch, x_cm);
1479 y_cm = quant_band(&ctx, Y, N, b/2, B,
1480 effective_lowband != -1 ? norm2+effective_lowband : NULL, LM,
1481 last?NULL:norm2+M*eBands[i]-norm_offset, Q15ONE, lowband_scratch, y_cm);
1482 } else {
1483 if (Y!=NULL)
1484 {
1485 x_cm = quant_band_stereo(&ctx, X, Y, N, b, B,
1486 effective_lowband != -1 ? norm+effective_lowband : NULL, LM,
1487 last?NULL:norm+M*eBands[i]-norm_offset, lowband_scratch, x_cm|y_cm);
1488 } else {
1489 x_cm = quant_band(&ctx, X, N, b, B,
1490 effective_lowband != -1 ? norm+effective_lowband : NULL, LM,
1491 last?NULL:norm+M*eBands[i]-norm_offset, Q15ONE, lowband_scratch, x_cm|y_cm);
1492 }
1493 y_cm = x_cm;
1494 }
1495 collapse_masks[i*C+0] = (unsigned char)x_cm;
1496 collapse_masks[i*C+C-1] = (unsigned char)y_cm;
1497 balance += pulses[i] + tell;
1498
1499 /* Update the folding position only as long as we have 1 bit/sample depth. */
1500 update_lowband = b>(N<<BITRES);
1501 }
1502 *seed = ctx.seed;
1503
1504 RESTORE_STACK;
1505 }
1506
1507