/* ------------------------------------------------------------------
 * Copyright (C) 1998-2009 PacketVideo
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either
 * express or implied.
 * See the License for the specific language governing permissions
 * and limitations under the License.
 * -------------------------------------------------------------------
 */
/*

 Filename: dct64.c

------------------------------------------------------------------------------
 REVISION HISTORY


 Who:                                   Date: MM/DD/YYYY
 Description:

------------------------------------------------------------------------------
 INPUT AND OUTPUT DEFINITIONS

    Int32 x             32-bit integer input length 64

------------------------------------------------------------------------------
 FUNCTION DESCRIPTION

    Implement dct of length 64

------------------------------------------------------------------------------
 REQUIREMENTS


------------------------------------------------------------------------------
 REFERENCES

------------------------------------------------------------------------------
 PSEUDO-CODE

------------------------------------------------------------------------------
*/


/*----------------------------------------------------------------------------
; INCLUDES
----------------------------------------------------------------------------*/

#ifdef AAC_PLUS

#include "dct16.h"
#include "dct64.h"

#include "pv_audio_type_defs.h"
#include "synthesis_sub_band.h"

#include "fxp_mul32.h"


/*----------------------------------------------------------------------------
; MACROS
; Define module specific macros here
----------------------------------------------------------------------------*/


/*----------------------------------------------------------------------------
; DEFINES
; Include all pre-processor statements here. Include conditional
; compile variables also.
----------------------------------------------------------------------------*/

/*
 * Qfmt(a)   : converts the constant a to an integer scaled by 2^26,
 *             adding +/-0.5 before the truncating cast so the result is
 *             rounded to nearest.
 * Qfmt31(a) : converts the constant a to an integer scaled by 0x7FFFFFFF
 *             (truncating cast, no rounding term).
 *
 * The argument and the whole expansion are parenthesized so the macros
 * stay correct if they are ever used with a compound expression or inside
 * a larger expression.
 */
#define Qfmt(a)     ((Int32)((a) * ((Int32)1 << 26) + ((a) >= 0 ? 0.5F : -0.5F)))
#define Qfmt31(a)   ((Int32)((a) * 0x7FFFFFFF))

/*
 * Fixed-point multiplier table used by the butterflies in this file.
 *
 *   [ 0..19]  scaled with Qfmt31
 *   [20..31]  scaled with Qfmt (2^26)
 *   [32..47]  scaled with Qfmt (2^26)
 *
 * The values of entries [0..31] match 1 / (2 * cos((2k + 1) * pi / 128))
 * for k = 0..31, and entries [32..47] match
 * 1 / (2 * cos((2k + 1) * pi / 64)) for k = 0..15.
 *
 * Users of the table must pick the multiply routine that matches the
 * scaling of the entry they read (see dct_64()).
 */
const Int32 CosTable_48[48] =
{
    /* [0..19]: Qfmt31 */
    Qfmt31(0.50015063602065F),  Qfmt31(0.50135845244641F),
    Qfmt31(0.50378872568104F),  Qfmt31(0.50747117207256F),
    Qfmt31(0.51245147940822F),  Qfmt31(0.51879271310533F),
    Qfmt31(0.52657731515427F),  Qfmt31(0.53590981690799F),
    Qfmt31(0.54692043798551F),  Qfmt31(0.55976981294708F),
    Qfmt31(0.57465518403266F),  Qfmt31(0.59181853585742F),
    Qfmt31(0.61155734788251F),  Qfmt31(0.63423893668840F),
    Qfmt31(0.66031980781371F),  Qfmt31(0.69037212820021F),
    Qfmt31(0.72512052237720F),  Qfmt31(0.76549416497309F),
    Qfmt31(0.81270209081449F),  Qfmt31(0.86834471522335F),

    /* [20..31]: Qfmt */
    Qfmt(0.93458359703641F),    Qfmt(1.01440826499705F),
    Qfmt(1.11207162057972F),    Qfmt(1.23383273797657F),
    Qfmt(1.38929395863283F),    Qfmt(1.59397228338563F),
    Qfmt(1.87467598000841F),    Qfmt(2.28205006800516F),
    Qfmt(2.92462842815822F),    Qfmt(4.08461107812925F),
    Qfmt(6.79675071167363F),    Qfmt(20.37387816723145F),   /* 32 */

    /* [32..47]: Qfmt */
    Qfmt(0.50060299823520F),    Qfmt(0.50547095989754F),
    Qfmt(0.51544730992262F),    Qfmt(0.53104259108978F),
    Qfmt(0.55310389603444F),    Qfmt(0.58293496820613F),
    Qfmt(0.62250412303566F),    Qfmt(0.67480834145501F),
    Qfmt(0.74453627100230F),    Qfmt(0.83934964541553F),
    Qfmt(0.97256823786196F),    Qfmt(1.16943993343288F),
    Qfmt(1.48416461631417F),    Qfmt(2.05778100995341F),
    Qfmt(3.40760841846872F),    Qfmt(10.19000812354803F)
};

/*----------------------------------------------------------------------------
; LOCAL FUNCTION DEFINITIONS
; Function Prototype declaration
----------------------------------------------------------------------------*/
/*---------------------------------------------------------------------------- ; LOCAL STORE/BUFFER/POINTER DEFINITIONS ; Variable declaration - defined here and used outside this module ----------------------------------------------------------------------------*/ /*---------------------------------------------------------------------------- ; EXTERNAL FUNCTION REFERENCES ; Declare functions defined elsewhere and referenced in this module ----------------------------------------------------------------------------*/ /*---------------------------------------------------------------------------- ; EXTERNAL GLOBAL STORE/BUFFER/POINTER REFERENCES ; Declare variables used in this module but defined elsewhere ----------------------------------------------------------------------------*/ /*---------------------------------------------------------------------------- ; FUNCTION CODE ----------------------------------------------------------------------------*/ /*---------------------------------------------------------------------------- ; dct_64 ----------------------------------------------------------------------------*/ void pv_split_LC(Int32 *vector, Int32 *temp_o) { Int32 i; Int32 *pt_vector = &vector[0]; Int32 *pt_vector_N_1 = &vector[31]; const Int32 *pt_cosTerms = &CosTable_48[32]; Int32 *pt_temp_o = temp_o; Int32 tmp1; Int32 tmp2; Int32 tmp3; tmp1 = *(pt_vector); tmp2 = *(pt_vector_N_1--); for (i = 16; i != 0; i--) { tmp3 = *(pt_cosTerms++); *(pt_vector++) = tmp1 + tmp2; *(pt_temp_o++) = fxp_mul32_Q26((tmp1 - tmp2), tmp3); tmp1 = *(pt_vector); tmp2 = *(pt_vector_N_1--); } } #ifdef HQ_SBR void dct_64(Int32 vec[], Int32 *scratch_mem) { Int32 *temp_e1; Int32 *temp_o1; Int32 *pt_vec; Int i; Int32 aux1; Int32 aux2; Int32 aux3; Int32 aux4; const Int32 *cosTerms = &CosTable_48[31]; temp_o1 = &vec[32]; temp_e1 = temp_o1 - 1; for (i = 6; i != 0; i--) { aux1 = *(temp_e1); aux2 = *(temp_o1); aux3 = *(cosTerms--); *(temp_e1--) = aux1 + aux2; *(temp_o1++) = 
fxp_mul32_Q26((aux1 - aux2), aux3); aux1 = *(temp_e1); aux2 = *(temp_o1); aux3 = *(cosTerms--); *(temp_e1--) = aux1 + aux2; *(temp_o1++) = fxp_mul32_Q26((aux1 - aux2), aux3); } for (i = 10; i != 0; i--) { aux1 = *(temp_e1); aux2 = *(temp_o1); aux3 = *(cosTerms--); *(temp_e1--) = aux1 + aux2; *(temp_o1++) = fxp_mul32_Q31((aux1 - aux2), aux3) << 1; aux1 = *(temp_e1); aux2 = *(temp_o1); aux3 = *(cosTerms--); *(temp_e1--) = aux1 + aux2; *(temp_o1++) = fxp_mul32_Q31((aux1 - aux2), aux3) << 1; } pv_split(&vec[16]); dct_16(&vec[16], 0); dct_16(vec, 1); // Even terms pv_merge_in_place_N32(vec); pv_split_z(&vec[32]); dct_16(&vec[32], 1); // Even terms dct_16(&vec[48], 0); pv_merge_in_place_N32(&vec[32]); aux1 = vec[32]; aux3 = vec[33]; aux4 = vec[ 1]; /* vec[ 1] */ /* -----------------------------------*/ aux1 = vec[32] + vec[33]; vec[ 0] += aux1; vec[ 1] += aux1; aux1 = vec[34]; aux2 = vec[ 2]; /* vec[ 2] */ aux3 += aux1; vec[ 2] = aux4 + aux3; aux4 = vec[ 3]; /* vec[ 3] */ vec[ 3] = aux2 + aux3; aux3 = vec[35]; /* -----------------------------------*/ aux1 += aux3; vec[32] = vec[ 4]; vec[33] = vec[ 5]; vec[ 4] = aux2 + aux1; vec[ 5] = aux4 + aux1; aux1 = vec[36]; aux2 = vec[32]; /* vec[ 4] */ aux3 += aux1; vec[34] = vec[ 6]; vec[35] = vec[ 7]; vec[ 6] = aux4 + aux3; vec[ 7] = aux2 + aux3; aux3 = vec[37]; aux4 = vec[33]; /* vec[ 5] */ /* -----------------------------------*/ aux1 += aux3; vec[32] = vec[ 8]; vec[33] = vec[ 9]; vec[ 8] = aux2 + aux1; vec[ 9] = aux4 + aux1; aux1 = vec[38]; aux2 = vec[34]; /* vec[ 6] */ aux3 += aux1; vec[34] = vec[10]; vec[10] = aux4 + aux3; aux4 = vec[35]; /* vec[ 7] */ vec[35] = vec[11]; vec[11] = aux2 + aux3; aux3 = vec[39]; /* -----------------------------------*/ aux1 += aux3; vec[36] = vec[12]; vec[37] = vec[13]; vec[12] = aux2 + aux1; vec[13] = aux4 + aux1; aux1 = vec[40]; aux2 = vec[32]; /* vec[ 8] */ aux3 += aux1; vec[32] = vec[14]; vec[14] = aux4 + aux3; aux4 = vec[33]; /* vec[ 9] */ vec[33] = vec[15]; vec[15] = aux2 + aux3; aux3 = 
vec[41]; /* -----------------------------------*/ aux1 += aux3; vec[38] = vec[16]; vec[39] = vec[17]; vec[16] = aux2 + aux1; vec[17] = aux4 + aux1; aux1 = vec[42]; aux2 = vec[34]; /* vec[10] */ aux3 += aux1; vec[34] = vec[18]; vec[18] = aux4 + aux3; aux4 = vec[35]; /* vec[11] */ vec[35] = vec[19]; vec[19] = aux2 + aux3; aux3 = vec[43]; /* -----------------------------------*/ aux1 += aux3; vec[40] = vec[20]; vec[41] = vec[21]; vec[20] = aux2 + aux1; vec[21] = aux4 + aux1; aux1 = vec[44]; aux2 = vec[36]; /* vec[12] */ aux3 += aux1; vec[42] = vec[22]; vec[43] = vec[23]; vec[22] = aux4 + aux3; vec[23] = aux2 + aux3; aux3 = vec[45]; aux4 = vec[37]; /* vec[13] */ /* -----------------------------------*/ scratch_mem[0] = vec[24]; scratch_mem[1] = vec[25]; aux1 += aux3; vec[24] = aux2 + aux1; vec[25] = aux4 + aux1; aux1 = vec[46]; aux2 = vec[32]; /* vec[14] */ scratch_mem[2] = vec[26]; scratch_mem[3] = vec[27]; aux3 += aux1; vec[26] = aux4 + aux3; vec[27] = aux2 + aux3; aux3 = vec[47]; aux4 = vec[33]; /* vec[15] */ /* -----------------------------------*/ scratch_mem[4] = vec[28]; scratch_mem[5] = vec[29]; aux1 += aux3; vec[28] = aux2 + aux1; vec[29] = aux4 + aux1; aux1 = vec[48]; aux2 = vec[38]; /* vec[16] */ scratch_mem[6] = vec[30]; scratch_mem[7] = vec[31]; aux3 += aux1; vec[30] = aux4 + aux3; vec[31] = aux2 + aux3; aux3 = vec[49]; aux4 = vec[39]; /* vec[17] */ /* -----------------------------------*/ aux1 += aux3; vec[32] = aux2 + aux1; vec[33] = aux4 + aux1; aux1 = vec[50]; aux2 = vec[34]; /* vec[18] */ aux3 += aux1; vec[34] = aux4 + aux3; aux4 = vec[35]; /* vec[19] */ vec[35] = aux2 + aux3; aux3 = vec[51]; /* -----------------------------------*/ aux1 += aux3; vec[36] = aux2 + aux1; vec[37] = aux4 + aux1; aux1 = vec[52]; aux2 = vec[40]; /* vec[20] */ aux3 += aux1; vec[38] = aux4 + aux3; vec[39] = aux2 + aux3; aux3 = vec[53]; aux4 = vec[41]; /* vec[21] */ /* -----------------------------------*/ aux1 += aux3; vec[40] = aux2 + aux1; vec[41] = aux4 + aux1; aux1 = 
vec[54]; aux2 = vec[42]; /* vec[22] */ aux3 += aux1; vec[42] = aux4 + aux3; aux4 = vec[43]; /* vec[23] */ vec[43] = aux2 + aux3; aux3 = vec[55]; /* -----------------------------------*/ pt_vec = &vec[44]; temp_o1 = &vec[56]; temp_e1 = &scratch_mem[0]; for (i = 4; i != 0; i--) { aux1 += aux3; *(pt_vec++) = aux2 + aux1; *(pt_vec++) = aux4 + aux1; aux1 = *(temp_o1++); aux3 += aux1; aux2 = *(temp_e1++); *(pt_vec++) = aux4 + aux3; *(pt_vec++) = aux2 + aux3; aux3 = *(temp_o1++); aux4 = *(temp_e1++); } aux1 += aux3; vec[60] = aux2 + aux1; vec[61] = aux4 + aux1; vec[62] = aux4 + aux3; } #endif /*---------------------------------------------------------------------------- ; pv_split ----------------------------------------------------------------------------*/ void pv_split(Int32 *temp_o) { Int32 i; const Int32 *pt_cosTerms = &CosTable_48[47]; Int32 *pt_temp_o = temp_o; Int32 *pt_temp_e = pt_temp_o - 1; Int32 tmp1; Int32 tmp2; Int32 cosx; for (i = 8; i != 0; i--) { tmp2 = *(pt_temp_o); tmp1 = *(pt_temp_e); cosx = *(pt_cosTerms--); *(pt_temp_e--) = tmp1 + tmp2; *(pt_temp_o++) = fxp_mul32_Q26((tmp1 - tmp2), cosx); tmp1 = *(pt_temp_e); tmp2 = *(pt_temp_o); cosx = *(pt_cosTerms--); *(pt_temp_e--) = tmp1 + tmp2; *(pt_temp_o++) = fxp_mul32_Q26((tmp1 - tmp2), cosx); } } void pv_split_z(Int32 *vector) { Int32 i; Int32 *pt_vector = &vector[31]; const Int32 *pt_cosTerms = &CosTable_48[32]; Int32 *pt_temp_e = vector; Int32 tmp1; Int32 tmp2; Int32 cosx; for (i = 8; i != 0; i--) { tmp1 = *(pt_vector); tmp2 = *(pt_temp_e); cosx = *(pt_cosTerms++); *(pt_temp_e++) = tmp1 + tmp2; *(pt_vector--) = fxp_mul32_Q26((tmp1 - tmp2), cosx); tmp2 = *(pt_temp_e); tmp1 = *(pt_vector); cosx = *(pt_cosTerms++); *(pt_temp_e++) = tmp1 + tmp2; *(pt_vector--) = fxp_mul32_Q26((tmp1 - tmp2), cosx); } } void pv_merge_in_place_N32(Int32 vec[]) { Int32 temp[4]; temp[0] = vec[14]; vec[14] = vec[ 7]; temp[1] = vec[12]; vec[12] = vec[ 6]; temp[2] = vec[10]; vec[10] = vec[ 5]; temp[3] = vec[ 8]; vec[ 8] = vec[ 4]; 
vec[ 6] = vec[ 3]; vec[ 4] = vec[ 2]; vec[ 2] = vec[ 1]; vec[ 1] = vec[16] + vec[17]; vec[16] = temp[3]; vec[ 3] = vec[18] + vec[17]; vec[ 5] = vec[19] + vec[18]; vec[18] = vec[9]; temp[3] = vec[11]; vec[ 7] = vec[20] + vec[19]; vec[ 9] = vec[21] + vec[20]; vec[20] = temp[2]; temp[2] = vec[13]; vec[11] = vec[22] + vec[21]; vec[13] = vec[23] + vec[22]; vec[22] = temp[3]; temp[3] = vec[15]; vec[15] = vec[24] + vec[23]; vec[17] = vec[25] + vec[24]; vec[19] = vec[26] + vec[25]; vec[21] = vec[27] + vec[26]; vec[23] = vec[28] + vec[27]; vec[25] = vec[29] + vec[28]; vec[27] = vec[30] + vec[29]; vec[29] = vec[30] + vec[31]; vec[24] = temp[1]; vec[26] = temp[2]; vec[28] = temp[0]; vec[30] = temp[3]; } #endif