// Scale factors B0..B7.
// For k = 1..7 the value is 1 / (cos(pi*k/16) * sqrt(2)), as noted on each line.
// B0 is plain 1.0 and does NOT follow that formula (k = 0 would give 1/sqrt(2));
// B4 is exactly 1.0 because cos(pi/4) * sqrt(2) == 1.
// NOTE(review): the place where these factors are consumed is not visible in
// this excerpt - presumably a per-coefficient post-scaling table; confirm
// against the full file.
40 #define B0 1.000000000000000000000000000000000000
41 #define B1 0.720959822006947913789091890943021267 // (cos(pi*1/16)sqrt(2))^-1
42 #define B2 0.765366864730179543456919968060797734 // (cos(pi*2/16)sqrt(2))^-1
43 #define B3 0.850430094767256448766702844371412325 // (cos(pi*3/16)sqrt(2))^-1
44 #define B4 1.000000000000000000000000000000000000 // (cos(pi*4/16)sqrt(2))^-1
45 #define B5 1.272758580572833938461007018281767032 // (cos(pi*5/16)sqrt(2))^-1
46 #define B6 1.847759065022573512256366378793576574 // (cos(pi*6/16)sqrt(2))^-1
47 #define B7 3.624509785411551372409941227504289587 // (cos(pi*7/16)sqrt(2))^-1
// Multipliers used inside the transform loops.
// A2, A4 and A5 feed the z2/z4 products:
//     z2 = tmp4*(A2+A5) - tmp6*A5
//     z4 = tmp6*(A4-A5) + tmp4*A5
// Note the definition order (A5 comes before A4) and that no A3 is defined here.
// A1 relies on M_SQRT1_2 (1/sqrt(2)) being provided by the math header.
// NOTE(review): the use of A1 is not visible in this excerpt - confirm in the
// full file.
49 #define A1 M_SQRT1_2 // cos(pi*4/16)
50 #define A2 0.54119610014619698435 // cos(pi*6/16)sqrt(2)
51 #define A5 0.38268343236508977170 // cos(pi*6/16)
52 #define A4 1.30656296487637652774 // cos(pi*2/16)sqrt(2)
67 FLOAT tmp0, tmp1, tmp2, tmp3, tmp4, tmp5, tmp6, tmp7;
68 FLOAT tmp10, tmp11, tmp12, tmp13;
69 FLOAT z2, z4, z11, z13;
72 for (
i=0;
i<8*8;
i+=8) {
87 temp[0 +
i]= tmp10 + tmp11;
88 temp[4 +
i]= tmp10 - tmp11;
92 temp[2 +
i]= tmp13 + tmp12;
93 temp[6 +
i]= tmp13 - tmp12;
99 z2= tmp4*(
A2+
A5) - tmp6*
A5;
100 z4= tmp6*(
A4-
A5) + tmp4*
A5;
107 temp[5 +
i]= z13 + z2;
108 temp[3 +
i]= z13 - z2;
109 temp[1 +
i]= z11 + z4;
110 temp[7 +
i]= z11 - z4;
116 FLOAT tmp0, tmp1, tmp2, tmp3, tmp4, tmp5, tmp6, tmp7;
117 FLOAT tmp10, tmp11, tmp12, tmp13;
118 FLOAT z2, z4, z11, z13;
126 for (
i=0;
i<8;
i++) {
153 z2= tmp4*(
A2+
A5) - tmp6*
A5;
154 z4= tmp6*(
A4-
A5) + tmp4*
A5;
170 FLOAT tmp0, tmp1, tmp2, tmp3, tmp4, tmp5, tmp6, tmp7;
171 FLOAT tmp10, tmp11, tmp12, tmp13;
179 for (
i=0;
i<8;
i++) {