1 /* ------------------------------------------------------------------
2  * Copyright (C) 1998-2009 PacketVideo
3  *
4  * Licensed under the Apache License, Version 2.0 (the "License");
5  * you may not use this file except in compliance with the License.
6  * You may obtain a copy of the License at
7  *
8  *      http://www.apache.org/licenses/LICENSE-2.0
9  *
10  * Unless required by applicable law or agreed to in writing, software
11  * distributed under the License is distributed on an "AS IS" BASIS,
12  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either
13  * express or implied.
14  * See the License for the specific language governing permissions
15  * and limitations under the License.
16  * -------------------------------------------------------------------
17  */
18 /*
19 ------------------------------------------------------------------------------
20 
21    PacketVideo Corp.
22    MP3 Decoder Library
23 
24    Filename: pvmp3_dct_16.cpp
25 
   Functions:
    pvmp3_dct_16
    pvmp3_merge_in_place_N32
    pvmp3_split
30 
31      Date: 09/21/2007
32 
33 ------------------------------------------------------------------------------
34  REVISION HISTORY
35 
36 
37  Description:
38 
39 ------------------------------------------------------------------------------
40  INPUT AND OUTPUT DEFINITIONS
41 
    pvmp3_dct_16

Input
    int32 vec[],        input vector length 16
    int32 flag          processing direction: forward (1), backward (0)
 Returns

    int32 vec[],        dct length 16
50 
51 ------------------------------------------------------------------------------
52  INPUT AND OUTPUT DEFINITIONS
53 
    pvmp3_merge_in_place_N32

Input
    int32 vec[],        input vector length 32 (vec[0..15] and vec[16..31]
                        are the two length 16 halves to be merged)

 Returns

    int32 vec[],        merged output of two dct 16 to create a dct 32
62 
63 ------------------------------------------------------------------------------
64  INPUT AND OUTPUT DEFINITIONS
65 
    pvmp3_split

Input
    int32 vect[],       pointer into the middle of the vector; elements
                        vect[-16] .. vect[15] are read and overwritten

 Returns

    int32 vect[],       split even/odd and pre processing rotation
74 
75 ------------------------------------------------------------------------------
76  FUNCTION DESCRIPTION
77 
78     dct 16 and tools to assemble a dct32 output
79 
80 ------------------------------------------------------------------------------
81  REQUIREMENTS
82 
83 
84 ------------------------------------------------------------------------------
85  REFERENCES
86 
87 ------------------------------------------------------------------------------
88  PSEUDO-CODE
89 
90 ------------------------------------------------------------------------------
91 */
92 
93 #if ( !defined(PV_ARM_GCC_V5) && !defined(PV_ARM_GCC_V4) )
94 /*----------------------------------------------------------------------------
95 ; INCLUDES
96 ----------------------------------------------------------------------------*/
97 
98 #include "pvmp3_dct_16.h"
99 #include "pv_mp3dec_fxd_op.h"
100 
101 /*----------------------------------------------------------------------------
102 ; MACROS
103 ; Define module specific macros here
104 ----------------------------------------------------------------------------*/
105 
106 
107 /*----------------------------------------------------------------------------
108 ; DEFINES
109 ; Include all pre-processor statements here. Include conditional
110 ; compile variables also.
111 ----------------------------------------------------------------------------*/
/* Convert a constant to fixed point with 27 fractional bits (value * 2^27),
 * truncated to int32. The whole expansion is parenthesized so the macro can
 * be used safely inside larger expressions. */
#define Qfmt(a)   ((int32)((a) * ((int32)1 << 27)))
113 
114 /*----------------------------------------------------------------------------
115 ; LOCAL FUNCTION DEFINITIONS
116 ; Function Prototype declaration
117 ----------------------------------------------------------------------------*/
118 
119 /*----------------------------------------------------------------------------
120 ; LOCAL STORE/BUFFER/POINTER DEFINITIONS
121 ; Variable declaration - defined here and used outside this module
122 ----------------------------------------------------------------------------*/
123 const int32 CosTable_dct32[16] =
124 {
125     Qfmt_31(0.50060299823520F) ,  Qfmt_31(0.50547095989754F) ,
126     Qfmt_31(0.51544730992262F) ,  Qfmt_31(0.53104259108978F) ,
127     Qfmt_31(0.55310389603444F) ,  Qfmt_31(0.58293496820613F) ,
128     Qfmt_31(0.62250412303566F) ,  Qfmt_31(0.67480834145501F) ,
129     Qfmt_31(0.74453627100230F) ,  Qfmt_31(0.83934964541553F) ,
130 
131     Qfmt(0.97256823786196F) ,  Qfmt(1.16943993343288F) ,
132     Qfmt(1.48416461631417F) ,  Qfmt(2.05778100995341F) ,
133     Qfmt(3.40760841846872F) ,  Qfmt(10.19000812354803F)
134 };
135 
136 
137 /*----------------------------------------------------------------------------
138 ; EXTERNAL FUNCTION REFERENCES
139 ; Declare functions defined elsewhere and referenced in this module
140 ----------------------------------------------------------------------------*/
141 
142 /*----------------------------------------------------------------------------
143 ; EXTERNAL GLOBAL STORE/BUFFER/POINTER REFERENCES
144 ; Declare variables used in this module but defined elsewhere
145 ----------------------------------------------------------------------------*/
146 
147 
148 /*----------------------------------------------------------------------------
149 ; FUNCTION CODE
150 ----------------------------------------------------------------------------*/
151 
152 __attribute__((no_sanitize("integer")))
pvmp3_dct_16(int32 vec[],int32 flag)153 void pvmp3_dct_16(int32 vec[], int32 flag)
154 {
155     int32 tmp0;
156     int32 tmp1;
157     int32 tmp2;
158     int32 tmp3;
159     int32 tmp4;
160     int32 tmp5;
161     int32 tmp6;
162     int32 tmp7;
163     int32 tmp_o0;
164     int32 tmp_o1;
165     int32 tmp_o2;
166     int32 tmp_o3;
167     int32 tmp_o4;
168     int32 tmp_o5;
169     int32 tmp_o6;
170     int32 tmp_o7;
171     int32 itmp_e0;
172     int32 itmp_e1;
173     int32 itmp_e2;
174 
175     /*  split input vector */
176 
177     tmp_o0 = fxp_mul32_Q32((vec[ 0] - vec[15]), Qfmt_31(0.50241928618816F));
178     tmp0   =  vec[ 0] + vec[15];
179 
180     tmp_o7 = fxp_mul32_Q32((vec[ 7] - vec[ 8]) << 3, Qfmt_31(0.63764357733614F));
181     tmp7   =  vec[ 7] + vec[ 8];
182 
183     itmp_e0    = fxp_mul32_Q32((tmp0 - tmp7), Qfmt_31(0.50979557910416F));
184     tmp7 = (tmp0 + tmp7);
185 
186     tmp_o1 = fxp_mul32_Q32((vec[ 1] - vec[14]), Qfmt_31(0.52249861493969F));
187     tmp1   =  vec[ 1] + vec[14];
188 
189     tmp_o6 = fxp_mul32_Q32((vec[ 6] - vec[ 9]) << 1, Qfmt_31(0.86122354911916F));
190     tmp6   =  vec[ 6] + vec[ 9];
191 
192 
193 
194     itmp_e1 = (tmp1 + tmp6);
195     tmp6    = fxp_mul32_Q32((tmp1 - tmp6), Qfmt_31(0.60134488693505F));
196 
197 
198 
199     tmp_o2 = fxp_mul32_Q32((vec[ 2] - vec[13]), Qfmt_31(0.56694403481636F));
200     tmp2   =  vec[ 2] + vec[13];
201     tmp_o5 = fxp_mul32_Q32((vec[ 5] - vec[10]) << 1, Qfmt_31(0.53033884299517F));
202     tmp5   =  vec[ 5] + vec[10];
203 
204     itmp_e2 = (tmp2 + tmp5);
205     tmp5    = fxp_mul32_Q32((tmp2 - tmp5), Qfmt_31(0.89997622313642F));
206 
207     tmp_o3 = fxp_mul32_Q32((vec[ 3] - vec[12]), Qfmt_31(0.64682178335999F));
208     tmp3   =  vec[ 3] + vec[12];
209     tmp_o4 = fxp_mul32_Q32((vec[ 4] - vec[11]), Qfmt_31(0.78815462345125F));
210     tmp4   =  vec[ 4] + vec[11];
211 
212     tmp1   = (tmp3 + tmp4);
213     tmp4   =  fxp_mul32_Q32((tmp3 - tmp4) << 2, Qfmt_31(0.64072886193538F));
214 
215     /*  split even part of tmp_e */
216 
217     tmp0 = (tmp7 + tmp1);
218     tmp1 = fxp_mul32_Q32((tmp7 - tmp1), Qfmt_31(0.54119610014620F));
219 
220     tmp3 = fxp_mul32_Q32((itmp_e1 - itmp_e2) << 1, Qfmt_31(0.65328148243819F));
221     tmp7 = (itmp_e1 + itmp_e2);
222 
223     vec[ 0]  = (tmp0 + tmp7) >> 1;
224     vec[ 8]  = fxp_mul32_Q32((tmp0 - tmp7), Qfmt_31(0.70710678118655F));
225     tmp0     = fxp_mul32_Q32((tmp1 - tmp3) << 1, Qfmt_31(0.70710678118655F));
226     vec[ 4]  =  tmp1 + tmp3 + tmp0;
227     vec[12]  =  tmp0;
228 
229     /*  split odd part of tmp_e */
230 
231     tmp1 = fxp_mul32_Q32((itmp_e0 - tmp4) << 1, Qfmt_31(0.54119610014620F));
232     tmp7 = itmp_e0 + tmp4;
233 
234     tmp3  = fxp_mul32_Q32((tmp6 - tmp5) << 2, Qfmt_31(0.65328148243819F));
235     tmp6 += tmp5;
236 
237     tmp4  = fxp_mul32_Q32((tmp7 - tmp6) << 1, Qfmt_31(0.70710678118655F));
238     tmp6 += tmp7;
239     tmp7  = fxp_mul32_Q32((tmp1 - tmp3) << 1, Qfmt_31(0.70710678118655F));
240 
241     tmp1    +=  tmp3 + tmp7;
242     vec[ 2]  =  tmp1 + tmp6;
243     vec[ 6]  =  tmp1 + tmp4;
244     vec[10]  =  tmp7 + tmp4;
245     vec[14]  =  tmp7;
246 
247 
248     // dct8;
249 
250     tmp1 = fxp_mul32_Q32((tmp_o0 - tmp_o7) << 1, Qfmt_31(0.50979557910416F));
251     tmp7 = tmp_o0 + tmp_o7;
252 
253     tmp6   = tmp_o1 + tmp_o6;
254     tmp_o1 = fxp_mul32_Q32((tmp_o1 - tmp_o6) << 1, Qfmt_31(0.60134488693505F));
255 
256     tmp5   = tmp_o2 + tmp_o5;
257     tmp_o5 = fxp_mul32_Q32((tmp_o2 - tmp_o5) << 1, Qfmt_31(0.89997622313642F));
258 
259     tmp0 = fxp_mul32_Q32((tmp_o3 - tmp_o4) << 3, Qfmt_31(0.6407288619354F));
260     tmp4 = tmp_o3 + tmp_o4;
261 
262     if (!flag)
263     {
264         tmp7   = -tmp7;
265         tmp1   = -tmp1;
266         tmp6   = -tmp6;
267         tmp_o1 = -tmp_o1;
268         tmp5   = -tmp5;
269         tmp_o5 = -tmp_o5;
270         tmp4   = -tmp4;
271         tmp0   = -tmp0;
272     }
273 
274 
275     tmp2     =  fxp_mul32_Q32((tmp1 -   tmp0) << 1, Qfmt_31(0.54119610014620F));
276     tmp0    +=  tmp1;
277     tmp1     =  fxp_mul32_Q32((tmp7 -   tmp4) << 1, Qfmt_31(0.54119610014620F));
278     tmp7    +=  tmp4;
279     tmp4     =  fxp_mul32_Q32((tmp6 -   tmp5) << 2, Qfmt_31(0.65328148243819F));
280     tmp6    +=  tmp5;
281     tmp5     =  fxp_mul32_Q32((tmp_o1 - tmp_o5) << 2, Qfmt_31(0.65328148243819F));
282     tmp_o1  += tmp_o5;
283 
284 
285     vec[13]  =  fxp_mul32_Q32((tmp1 -   tmp4) << 1, Qfmt_31(0.70710678118655F));
286     vec[ 5]  =  tmp1 + tmp4 + vec[13];
287 
288     vec[ 9]  =  fxp_mul32_Q32((tmp7 -   tmp6) << 1, Qfmt_31(0.70710678118655F));
289     vec[ 1]  =  tmp7 + tmp6;
290 
291     tmp4     =  fxp_mul32_Q32((tmp0 - tmp_o1) << 1, Qfmt_31(0.70710678118655F));
292     tmp0    +=  tmp_o1;
293     tmp6     =  fxp_mul32_Q32((tmp2 -   tmp5) << 1, Qfmt_31(0.70710678118655F));
294     tmp2    +=  tmp5 + tmp6;
295     tmp0    +=  tmp2;
296 
297     vec[ 1] += tmp0;
298     vec[ 3]  = tmp0 + vec[ 5];
299     tmp2    += tmp4;
300     vec[ 5]  = tmp2 + vec[ 5];
301     vec[ 7]  = tmp2 + vec[ 9];
302     tmp4    += tmp6;
303     vec[ 9]  = tmp4 + vec[ 9];
304     vec[11]  = tmp4 + vec[13];
305     vec[13]  = tmp6 + vec[13];
306     vec[15]  = tmp6;
307 
308 }
309 /*----------------------------------------------------------------------------
310 ; FUNCTION CODE
311 ----------------------------------------------------------------------------*/
312 __attribute__((no_sanitize("integer")))
pvmp3_merge_in_place_N32(int32 vec[])313 void pvmp3_merge_in_place_N32(int32 vec[])
314 {
315 
316 
317     int32 temp0;
318     int32 temp1;
319     int32 temp2;
320     int32 temp3;
321 
322     temp0   = vec[14];
323     vec[14] = vec[ 7];
324     temp1   = vec[12];
325     vec[12] = vec[ 6];
326     temp2   = vec[10];
327     vec[10] = vec[ 5];
328     temp3   = vec[ 8];
329     vec[ 8] = vec[ 4];
330     vec[ 6] = vec[ 3];
331     vec[ 4] = vec[ 2];
332     vec[ 2] = vec[ 1];
333 
334     vec[ 1] = (vec[16] + vec[17]);
335     vec[16] = temp3;
336     vec[ 3] = (vec[18] + vec[17]);
337     vec[ 5] = (vec[19] + vec[18]);
338     vec[18] = vec[9];
339 
340     vec[ 7] = (vec[20] + vec[19]);
341     vec[ 9] = (vec[21] + vec[20]);
342     vec[20] = temp2;
343     temp2   = vec[13];
344     temp3   = vec[11];
345     vec[11] = (vec[22] + vec[21]);
346     vec[13] = (vec[23] + vec[22]);
347     vec[22] = temp3;
348     temp3   = vec[15];
349 
350     vec[15] = (vec[24] + vec[23]);
351     vec[17] = (vec[25] + vec[24]);
352     vec[19] = (vec[26] + vec[25]);
353     vec[21] = (vec[27] + vec[26]);
354     vec[23] = (vec[28] + vec[27]);
355     vec[24] = temp1;
356     vec[25] = (vec[29] + vec[28]);
357     vec[26] = temp2;
358     vec[27] = (vec[30] + vec[29]);
359     vec[28] = temp0;
360     vec[29] = (vec[30] + vec[31]);
361     vec[30] = temp3;
362 }
363 
364 
365 /*----------------------------------------------------------------------------
366 ; FUNCTION CODE
367 ----------------------------------------------------------------------------*/
368 
369 
370 
371 __attribute__((no_sanitize("integer")))
pvmp3_split(int32 * vect)372 void pvmp3_split(int32 *vect)
373 {
374 
375     int32 i;
376     const int32 *pt_cosTerms = &CosTable_dct32[15];
377     int32 *pt_vect   = vect;
378     int32 *pt_vect_2 = pt_vect - 1;
379 
380     for (i = 3; i != 0; i--)
381     {
382         int32 tmp2 = *(pt_vect);
383         int32 tmp1 = *(pt_vect_2);
384         int32 cosx = *(pt_cosTerms--);
385         *(pt_vect_2--) = (tmp1  + tmp2);
386         *(pt_vect++)   = fxp_mul32_Q27((tmp1 - tmp2), cosx);
387 
388         tmp2 = *(pt_vect);
389         tmp1 = *(pt_vect_2);
390         cosx = *(pt_cosTerms--);
391         *(pt_vect_2--) = (tmp1  + tmp2);
392         *(pt_vect++)   = fxp_mul32_Q27((tmp1 - tmp2), cosx);
393 
394     }
395 
396     for (i = 5; i != 0; i--)
397     {
398         int32 tmp2 = *(pt_vect);
399         int32 tmp1 = *(pt_vect_2);
400         int32 cosx = *(pt_cosTerms--);
401         *(pt_vect_2--) = (tmp1  + tmp2);
402         *(pt_vect++) = fxp_mul32_Q32((tmp1 - tmp2) << 1, cosx);
403 
404         tmp2 = *(pt_vect);
405         tmp1 = *(pt_vect_2);
406         cosx = *(pt_cosTerms--);
407         *(pt_vect_2--) = (tmp1  + tmp2);
408         *(pt_vect++) = fxp_mul32_Q32((tmp1 - tmp2) << 1, cosx);
409     }
410 
411 }
412 
413 #endif
414