1 /* ------------------------------------------------------------------
2 * Copyright (C) 1998-2009 PacketVideo
3 *
4 * Licensed under the Apache License, Version 2.0 (the "License");
5 * you may not use this file except in compliance with the License.
6 * You may obtain a copy of the License at
7 *
8 * http://www.apache.org/licenses/LICENSE-2.0
9 *
10 * Unless required by applicable law or agreed to in writing, software
11 * distributed under the License is distributed on an "AS IS" BASIS,
12 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either
13 * express or implied.
14 * See the License for the specific language governing permissions
15 * and limitations under the License.
16 * -------------------------------------------------------------------
17 */
18 /*
19 ------------------------------------------------------------------------------
20
21 PacketVideo Corp.
22 MP3 Decoder Library
23
24 Filename: pvmp3_dct_16.cpp
25
26 Functions:
27 dct_16
28 pv_merge_in_place_N32
29 pv_split
30
31 Date: 09/21/2007
32
33 ------------------------------------------------------------------------------
34 REVISION HISTORY
35
36
37 Description:
38
39 ------------------------------------------------------------------------------
40 INPUT AND OUTPUT DEFINITIONS
41
42 dct_16
43
44 Input
45 int32 vec[], input vector length 16
46 Int flag processing direction: forward (1), backward ( 0)
47 Returns
48
49 int32 vec[], dct length 16
50
51 ------------------------------------------------------------------------------
52 INPUT AND OUTPUT DEFINITIONS
53
54 pv_merge_in_place_N32
55
56 Input
57 int32 vec[], input vector length 16
58
59 Returns
60
61 int32 vec[], merged output of two dct 16 to create a dct 32
62
63 ------------------------------------------------------------------------------
64 INPUT AND OUTPUT DEFINITIONS
65
66 pv_split
67
68 Input
69 int32 vec[], input vector length 16
70
71 Returns
72
73 int32 vec[], splitted even/odd and pre processing rotation
74
75 ------------------------------------------------------------------------------
76 FUNCTION DESCRIPTION
77
78 dct 16 and tools to assemble a dct32 output
79
80 ------------------------------------------------------------------------------
81 REQUIREMENTS
82
83
84 ------------------------------------------------------------------------------
85 REFERENCES
86
87 ------------------------------------------------------------------------------
88 PSEUDO-CODE
89
90 ------------------------------------------------------------------------------
91 */
92
93 #if ( !defined(PV_ARM_GCC_V5) && !defined(PV_ARM_GCC_V4) )
94 /*----------------------------------------------------------------------------
95 ; INCLUDES
96 ----------------------------------------------------------------------------*/
97
98 #include "pvmp3_dct_16.h"
99 #include "pv_mp3dec_fxd_op.h"
100
101 /*----------------------------------------------------------------------------
102 ; MACROS
103 ; Define module specific macros here
104 ----------------------------------------------------------------------------*/
105
106
107 /*----------------------------------------------------------------------------
108 ; DEFINES
109 ; Include all pre-processor statements here. Include conditional
110 ; compile variables also.
111 ----------------------------------------------------------------------------*/
112 #define Qfmt(a) (int32)((a)*((int32)1<<27))
113
114 /*----------------------------------------------------------------------------
115 ; LOCAL FUNCTION DEFINITIONS
116 ; Function Prototype declaration
117 ----------------------------------------------------------------------------*/
118
119 /*----------------------------------------------------------------------------
120 ; LOCAL STORE/BUFFER/POINTER DEFINITIONS
121 ; Variable declaration - defined here and used outside this module
122 ----------------------------------------------------------------------------*/
123 const int32 CosTable_dct32[16] =
124 {
125 Qfmt_31(0.50060299823520F) , Qfmt_31(0.50547095989754F) ,
126 Qfmt_31(0.51544730992262F) , Qfmt_31(0.53104259108978F) ,
127 Qfmt_31(0.55310389603444F) , Qfmt_31(0.58293496820613F) ,
128 Qfmt_31(0.62250412303566F) , Qfmt_31(0.67480834145501F) ,
129 Qfmt_31(0.74453627100230F) , Qfmt_31(0.83934964541553F) ,
130
131 Qfmt(0.97256823786196F) , Qfmt(1.16943993343288F) ,
132 Qfmt(1.48416461631417F) , Qfmt(2.05778100995341F) ,
133 Qfmt(3.40760841846872F) , Qfmt(10.19000812354803F)
134 };
135
136
137 /*----------------------------------------------------------------------------
138 ; EXTERNAL FUNCTION REFERENCES
139 ; Declare functions defined elsewhere and referenced in this module
140 ----------------------------------------------------------------------------*/
141
142 /*----------------------------------------------------------------------------
143 ; EXTERNAL GLOBAL STORE/BUFFER/POINTER REFERENCES
144 ; Declare variables used in this module but defined elsewhere
145 ----------------------------------------------------------------------------*/
146
147
148 /*----------------------------------------------------------------------------
149 ; FUNCTION CODE
150 ----------------------------------------------------------------------------*/
151
152 __attribute__((no_sanitize("integer")))
pvmp3_dct_16(int32 vec[],int32 flag)153 void pvmp3_dct_16(int32 vec[], int32 flag)
154 {
155 int32 tmp0;
156 int32 tmp1;
157 int32 tmp2;
158 int32 tmp3;
159 int32 tmp4;
160 int32 tmp5;
161 int32 tmp6;
162 int32 tmp7;
163 int32 tmp_o0;
164 int32 tmp_o1;
165 int32 tmp_o2;
166 int32 tmp_o3;
167 int32 tmp_o4;
168 int32 tmp_o5;
169 int32 tmp_o6;
170 int32 tmp_o7;
171 int32 itmp_e0;
172 int32 itmp_e1;
173 int32 itmp_e2;
174
175 /* split input vector */
176
177 tmp_o0 = fxp_mul32_Q32((vec[ 0] - vec[15]), Qfmt_31(0.50241928618816F));
178 tmp0 = vec[ 0] + vec[15];
179
180 tmp_o7 = fxp_mul32_Q32((vec[ 7] - vec[ 8]) << 3, Qfmt_31(0.63764357733614F));
181 tmp7 = vec[ 7] + vec[ 8];
182
183 itmp_e0 = fxp_mul32_Q32((tmp0 - tmp7), Qfmt_31(0.50979557910416F));
184 tmp7 = (tmp0 + tmp7);
185
186 tmp_o1 = fxp_mul32_Q32((vec[ 1] - vec[14]), Qfmt_31(0.52249861493969F));
187 tmp1 = vec[ 1] + vec[14];
188
189 tmp_o6 = fxp_mul32_Q32((vec[ 6] - vec[ 9]) << 1, Qfmt_31(0.86122354911916F));
190 tmp6 = vec[ 6] + vec[ 9];
191
192
193
194 itmp_e1 = (tmp1 + tmp6);
195 tmp6 = fxp_mul32_Q32((tmp1 - tmp6), Qfmt_31(0.60134488693505F));
196
197
198
199 tmp_o2 = fxp_mul32_Q32((vec[ 2] - vec[13]), Qfmt_31(0.56694403481636F));
200 tmp2 = vec[ 2] + vec[13];
201 tmp_o5 = fxp_mul32_Q32((vec[ 5] - vec[10]) << 1, Qfmt_31(0.53033884299517F));
202 tmp5 = vec[ 5] + vec[10];
203
204 itmp_e2 = (tmp2 + tmp5);
205 tmp5 = fxp_mul32_Q32((tmp2 - tmp5), Qfmt_31(0.89997622313642F));
206
207 tmp_o3 = fxp_mul32_Q32((vec[ 3] - vec[12]), Qfmt_31(0.64682178335999F));
208 tmp3 = vec[ 3] + vec[12];
209 tmp_o4 = fxp_mul32_Q32((vec[ 4] - vec[11]), Qfmt_31(0.78815462345125F));
210 tmp4 = vec[ 4] + vec[11];
211
212 tmp1 = (tmp3 + tmp4);
213 tmp4 = fxp_mul32_Q32((tmp3 - tmp4) << 2, Qfmt_31(0.64072886193538F));
214
215 /* split even part of tmp_e */
216
217 tmp0 = (tmp7 + tmp1);
218 tmp1 = fxp_mul32_Q32((tmp7 - tmp1), Qfmt_31(0.54119610014620F));
219
220 tmp3 = fxp_mul32_Q32((itmp_e1 - itmp_e2) << 1, Qfmt_31(0.65328148243819F));
221 tmp7 = (itmp_e1 + itmp_e2);
222
223 vec[ 0] = (tmp0 + tmp7) >> 1;
224 vec[ 8] = fxp_mul32_Q32((tmp0 - tmp7), Qfmt_31(0.70710678118655F));
225 tmp0 = fxp_mul32_Q32((tmp1 - tmp3) << 1, Qfmt_31(0.70710678118655F));
226 vec[ 4] = tmp1 + tmp3 + tmp0;
227 vec[12] = tmp0;
228
229 /* split odd part of tmp_e */
230
231 tmp1 = fxp_mul32_Q32((itmp_e0 - tmp4) << 1, Qfmt_31(0.54119610014620F));
232 tmp7 = itmp_e0 + tmp4;
233
234 tmp3 = fxp_mul32_Q32((tmp6 - tmp5) << 2, Qfmt_31(0.65328148243819F));
235 tmp6 += tmp5;
236
237 tmp4 = fxp_mul32_Q32((tmp7 - tmp6) << 1, Qfmt_31(0.70710678118655F));
238 tmp6 += tmp7;
239 tmp7 = fxp_mul32_Q32((tmp1 - tmp3) << 1, Qfmt_31(0.70710678118655F));
240
241 tmp1 += tmp3 + tmp7;
242 vec[ 2] = tmp1 + tmp6;
243 vec[ 6] = tmp1 + tmp4;
244 vec[10] = tmp7 + tmp4;
245 vec[14] = tmp7;
246
247
248 // dct8;
249
250 tmp1 = fxp_mul32_Q32((tmp_o0 - tmp_o7) << 1, Qfmt_31(0.50979557910416F));
251 tmp7 = tmp_o0 + tmp_o7;
252
253 tmp6 = tmp_o1 + tmp_o6;
254 tmp_o1 = fxp_mul32_Q32((tmp_o1 - tmp_o6) << 1, Qfmt_31(0.60134488693505F));
255
256 tmp5 = tmp_o2 + tmp_o5;
257 tmp_o5 = fxp_mul32_Q32((tmp_o2 - tmp_o5) << 1, Qfmt_31(0.89997622313642F));
258
259 tmp0 = fxp_mul32_Q32((tmp_o3 - tmp_o4) << 3, Qfmt_31(0.6407288619354F));
260 tmp4 = tmp_o3 + tmp_o4;
261
262 if (!flag)
263 {
264 tmp7 = -tmp7;
265 tmp1 = -tmp1;
266 tmp6 = -tmp6;
267 tmp_o1 = -tmp_o1;
268 tmp5 = -tmp5;
269 tmp_o5 = -tmp_o5;
270 tmp4 = -tmp4;
271 tmp0 = -tmp0;
272 }
273
274
275 tmp2 = fxp_mul32_Q32((tmp1 - tmp0) << 1, Qfmt_31(0.54119610014620F));
276 tmp0 += tmp1;
277 tmp1 = fxp_mul32_Q32((tmp7 - tmp4) << 1, Qfmt_31(0.54119610014620F));
278 tmp7 += tmp4;
279 tmp4 = fxp_mul32_Q32((tmp6 - tmp5) << 2, Qfmt_31(0.65328148243819F));
280 tmp6 += tmp5;
281 tmp5 = fxp_mul32_Q32((tmp_o1 - tmp_o5) << 2, Qfmt_31(0.65328148243819F));
282 tmp_o1 += tmp_o5;
283
284
285 vec[13] = fxp_mul32_Q32((tmp1 - tmp4) << 1, Qfmt_31(0.70710678118655F));
286 vec[ 5] = tmp1 + tmp4 + vec[13];
287
288 vec[ 9] = fxp_mul32_Q32((tmp7 - tmp6) << 1, Qfmt_31(0.70710678118655F));
289 vec[ 1] = tmp7 + tmp6;
290
291 tmp4 = fxp_mul32_Q32((tmp0 - tmp_o1) << 1, Qfmt_31(0.70710678118655F));
292 tmp0 += tmp_o1;
293 tmp6 = fxp_mul32_Q32((tmp2 - tmp5) << 1, Qfmt_31(0.70710678118655F));
294 tmp2 += tmp5 + tmp6;
295 tmp0 += tmp2;
296
297 vec[ 1] += tmp0;
298 vec[ 3] = tmp0 + vec[ 5];
299 tmp2 += tmp4;
300 vec[ 5] = tmp2 + vec[ 5];
301 vec[ 7] = tmp2 + vec[ 9];
302 tmp4 += tmp6;
303 vec[ 9] = tmp4 + vec[ 9];
304 vec[11] = tmp4 + vec[13];
305 vec[13] = tmp6 + vec[13];
306 vec[15] = tmp6;
307
308 }
309 /*----------------------------------------------------------------------------
310 ; FUNCTION CODE
311 ----------------------------------------------------------------------------*/
312 __attribute__((no_sanitize("integer")))
pvmp3_merge_in_place_N32(int32 vec[])313 void pvmp3_merge_in_place_N32(int32 vec[])
314 {
315
316
317 int32 temp0;
318 int32 temp1;
319 int32 temp2;
320 int32 temp3;
321
322 temp0 = vec[14];
323 vec[14] = vec[ 7];
324 temp1 = vec[12];
325 vec[12] = vec[ 6];
326 temp2 = vec[10];
327 vec[10] = vec[ 5];
328 temp3 = vec[ 8];
329 vec[ 8] = vec[ 4];
330 vec[ 6] = vec[ 3];
331 vec[ 4] = vec[ 2];
332 vec[ 2] = vec[ 1];
333
334 vec[ 1] = (vec[16] + vec[17]);
335 vec[16] = temp3;
336 vec[ 3] = (vec[18] + vec[17]);
337 vec[ 5] = (vec[19] + vec[18]);
338 vec[18] = vec[9];
339
340 vec[ 7] = (vec[20] + vec[19]);
341 vec[ 9] = (vec[21] + vec[20]);
342 vec[20] = temp2;
343 temp2 = vec[13];
344 temp3 = vec[11];
345 vec[11] = (vec[22] + vec[21]);
346 vec[13] = (vec[23] + vec[22]);
347 vec[22] = temp3;
348 temp3 = vec[15];
349
350 vec[15] = (vec[24] + vec[23]);
351 vec[17] = (vec[25] + vec[24]);
352 vec[19] = (vec[26] + vec[25]);
353 vec[21] = (vec[27] + vec[26]);
354 vec[23] = (vec[28] + vec[27]);
355 vec[24] = temp1;
356 vec[25] = (vec[29] + vec[28]);
357 vec[26] = temp2;
358 vec[27] = (vec[30] + vec[29]);
359 vec[28] = temp0;
360 vec[29] = (vec[30] + vec[31]);
361 vec[30] = temp3;
362 }
363
364
365 /*----------------------------------------------------------------------------
366 ; FUNCTION CODE
367 ----------------------------------------------------------------------------*/
368
369
370
371 __attribute__((no_sanitize("integer")))
pvmp3_split(int32 * vect)372 void pvmp3_split(int32 *vect)
373 {
374
375 int32 i;
376 const int32 *pt_cosTerms = &CosTable_dct32[15];
377 int32 *pt_vect = vect;
378 int32 *pt_vect_2 = pt_vect - 1;
379
380 for (i = 3; i != 0; i--)
381 {
382 int32 tmp2 = *(pt_vect);
383 int32 tmp1 = *(pt_vect_2);
384 int32 cosx = *(pt_cosTerms--);
385 *(pt_vect_2--) = (tmp1 + tmp2);
386 *(pt_vect++) = fxp_mul32_Q27((tmp1 - tmp2), cosx);
387
388 tmp2 = *(pt_vect);
389 tmp1 = *(pt_vect_2);
390 cosx = *(pt_cosTerms--);
391 *(pt_vect_2--) = (tmp1 + tmp2);
392 *(pt_vect++) = fxp_mul32_Q27((tmp1 - tmp2), cosx);
393
394 }
395
396 for (i = 5; i != 0; i--)
397 {
398 int32 tmp2 = *(pt_vect);
399 int32 tmp1 = *(pt_vect_2);
400 int32 cosx = *(pt_cosTerms--);
401 *(pt_vect_2--) = (tmp1 + tmp2);
402 *(pt_vect++) = fxp_mul32_Q32((tmp1 - tmp2) << 1, cosx);
403
404 tmp2 = *(pt_vect);
405 tmp1 = *(pt_vect_2);
406 cosx = *(pt_cosTerms--);
407 *(pt_vect_2--) = (tmp1 + tmp2);
408 *(pt_vect++) = fxp_mul32_Q32((tmp1 - tmp2) << 1, cosx);
409 }
410
411 }
412
413 #endif
414