xref: /utopia/UTPA2-700.0.x/modules/ojpd_vdec_v1/api/jpeg/cmodel/src/idct.c (revision 53ee8cc121a030b8d368113ac3e966b4705770ef)
1*53ee8cc1Swenshuai.xi //<MStar Software>
2*53ee8cc1Swenshuai.xi //******************************************************************************
3*53ee8cc1Swenshuai.xi // MStar Software
4*53ee8cc1Swenshuai.xi // Copyright (c) 2010 - 2012 MStar Semiconductor, Inc. All rights reserved.
5*53ee8cc1Swenshuai.xi // All software, firmware and related documentation herein ("MStar Software") are
6*53ee8cc1Swenshuai.xi // intellectual property of MStar Semiconductor, Inc. ("MStar") and protected by
7*53ee8cc1Swenshuai.xi // law, including, but not limited to, copyright law and international treaties.
8*53ee8cc1Swenshuai.xi // Any use, modification, reproduction, retransmission, or republication of all
9*53ee8cc1Swenshuai.xi // or part of MStar Software is expressly prohibited, unless prior written
10*53ee8cc1Swenshuai.xi // permission has been granted by MStar.
11*53ee8cc1Swenshuai.xi //
12*53ee8cc1Swenshuai.xi // By accessing, browsing and/or using MStar Software, you acknowledge that you
13*53ee8cc1Swenshuai.xi // have read, understood, and agree, to be bound by below terms ("Terms") and to
14*53ee8cc1Swenshuai.xi // comply with all applicable laws and regulations:
15*53ee8cc1Swenshuai.xi //
16*53ee8cc1Swenshuai.xi // 1. MStar shall retain any and all right, ownership and interest to MStar
17*53ee8cc1Swenshuai.xi //    Software and any modification/derivatives thereof.
18*53ee8cc1Swenshuai.xi //    No right, ownership, or interest to MStar Software and any
19*53ee8cc1Swenshuai.xi //    modification/derivatives thereof is transferred to you under Terms.
20*53ee8cc1Swenshuai.xi //
21*53ee8cc1Swenshuai.xi // 2. You understand that MStar Software might include, incorporate or be
22*53ee8cc1Swenshuai.xi //    supplied together with third party`s software and the use of MStar
23*53ee8cc1Swenshuai.xi //    Software may require additional licenses from third parties.
24*53ee8cc1Swenshuai.xi //    Therefore, you hereby agree it is your sole responsibility to separately
25*53ee8cc1Swenshuai.xi //    obtain any and all third party right and license necessary for your use of
26*53ee8cc1Swenshuai.xi //    such third party`s software.
27*53ee8cc1Swenshuai.xi //
28*53ee8cc1Swenshuai.xi // 3. MStar Software and any modification/derivatives thereof shall be deemed as
29*53ee8cc1Swenshuai.xi //    MStar`s confidential information and you agree to keep MStar`s
30*53ee8cc1Swenshuai.xi //    confidential information in strictest confidence and not disclose to any
31*53ee8cc1Swenshuai.xi //    third party.
32*53ee8cc1Swenshuai.xi //
33*53ee8cc1Swenshuai.xi // 4. MStar Software is provided on an "AS IS" basis without warranties of any
34*53ee8cc1Swenshuai.xi //    kind. Any warranties are hereby expressly disclaimed by MStar, including
35*53ee8cc1Swenshuai.xi //    without limitation, any warranties of merchantability, non-infringement of
36*53ee8cc1Swenshuai.xi //    intellectual property rights, fitness for a particular purpose, error free
37*53ee8cc1Swenshuai.xi //    and in conformity with any international standard.  You agree to waive any
38*53ee8cc1Swenshuai.xi //    claim against MStar for any loss, damage, cost or expense that you may
39*53ee8cc1Swenshuai.xi //    incur related to your use of MStar Software.
40*53ee8cc1Swenshuai.xi //    In no event shall MStar be liable for any direct, indirect, incidental or
41*53ee8cc1Swenshuai.xi //    consequential damages, including without limitation, lost of profit or
42*53ee8cc1Swenshuai.xi //    revenues, lost or damage of data, and unauthorized system use.
43*53ee8cc1Swenshuai.xi //    You agree that this Section 4 shall still apply without being affected
44*53ee8cc1Swenshuai.xi //    even if MStar Software has been modified by MStar in accordance with your
45*53ee8cc1Swenshuai.xi //    request or instruction for your use, except otherwise agreed by both
46*53ee8cc1Swenshuai.xi //    parties in writing.
47*53ee8cc1Swenshuai.xi //
48*53ee8cc1Swenshuai.xi // 5. If requested, MStar may from time to time provide technical supports or
49*53ee8cc1Swenshuai.xi //    services in relation with MStar Software to you for your use of
50*53ee8cc1Swenshuai.xi //    MStar Software in conjunction with your or your customer`s product
51*53ee8cc1Swenshuai.xi //    ("Services").
52*53ee8cc1Swenshuai.xi //    You understand and agree that, except otherwise agreed by both parties in
53*53ee8cc1Swenshuai.xi //    writing, Services are provided on an "AS IS" basis and the warranty
54*53ee8cc1Swenshuai.xi //    disclaimer set forth in Section 4 above shall apply.
55*53ee8cc1Swenshuai.xi //
56*53ee8cc1Swenshuai.xi // 6. Nothing contained herein shall be construed as by implication, estoppels
57*53ee8cc1Swenshuai.xi //    or otherwise:
58*53ee8cc1Swenshuai.xi //    (a) conferring any license or right to use MStar name, trademark, service
59*53ee8cc1Swenshuai.xi //        mark, symbol or any other identification;
60*53ee8cc1Swenshuai.xi //    (b) obligating MStar or any of its affiliates to furnish any person,
61*53ee8cc1Swenshuai.xi //        including without limitation, you and your customers, any assistance
62*53ee8cc1Swenshuai.xi //        of any kind whatsoever, or any information; or
63*53ee8cc1Swenshuai.xi //    (c) conferring any license or right under any intellectual property right.
64*53ee8cc1Swenshuai.xi //
65*53ee8cc1Swenshuai.xi // 7. These terms shall be governed by and construed in accordance with the laws
66*53ee8cc1Swenshuai.xi //    of Taiwan, R.O.C., excluding its conflict of law rules.
67*53ee8cc1Swenshuai.xi //    Any and all dispute arising out hereof or related hereto shall be finally
68*53ee8cc1Swenshuai.xi //    settled by arbitration referred to the Chinese Arbitration Association,
69*53ee8cc1Swenshuai.xi //    Taipei in accordance with the ROC Arbitration Law and the Arbitration
70*53ee8cc1Swenshuai.xi //    Rules of the Association by three (3) arbitrators appointed in accordance
71*53ee8cc1Swenshuai.xi //    with the said Rules.
72*53ee8cc1Swenshuai.xi //    The place of arbitration shall be in Taipei, Taiwan and the language shall
73*53ee8cc1Swenshuai.xi //    be English.
74*53ee8cc1Swenshuai.xi //    The arbitration award shall be final and binding to both parties.
75*53ee8cc1Swenshuai.xi //
76*53ee8cc1Swenshuai.xi //******************************************************************************
77*53ee8cc1Swenshuai.xi //<MStar Software>
78*53ee8cc1Swenshuai.xi //
79*53ee8cc1Swenshuai.xi // 2D IDCT
80*53ee8cc1Swenshuai.xi // Derived from an older version of the IJG's JPEG software.
81*53ee8cc1Swenshuai.xi // Downloadable from: www.ijg.org
82*53ee8cc1Swenshuai.xi // This module is going to be replaced with a faster (and
83*53ee8cc1Swenshuai.xi // uncopyrighted) version.
84*53ee8cc1Swenshuai.xi // I am unable to find the original file from which this code was derived.
85*53ee8cc1Swenshuai.xi // I have included the copyright notice included with latest IJG version of this
86*53ee8cc1Swenshuai.xi // module.
87*53ee8cc1Swenshuai.xi //
88*53ee8cc1Swenshuai.xi 
89*53ee8cc1Swenshuai.xi /*
90*53ee8cc1Swenshuai.xi  * jidctint.c
91*53ee8cc1Swenshuai.xi  *
92*53ee8cc1Swenshuai.xi  * Copyright (C) 1991-1998, Thomas G. Lane.
93*53ee8cc1Swenshuai.xi  * This file is part of the Independent JPEG Group's software.
94*53ee8cc1Swenshuai.xi  * For conditions of distribution and use, see the accompanying README file.
95*53ee8cc1Swenshuai.xi  *
96*53ee8cc1Swenshuai.xi  * This file contains a slow-but-accurate integer implementation of the
97*53ee8cc1Swenshuai.xi  * inverse DCT (Discrete Cosine Transform).  In the IJG code, this routine
98*53ee8cc1Swenshuai.xi  * must also perform dequantization of the input coefficients.
99*53ee8cc1Swenshuai.xi  *
100*53ee8cc1Swenshuai.xi  * A 2-D IDCT can be done by 1-D IDCT on each column followed by 1-D IDCT
101*53ee8cc1Swenshuai.xi  * on each row (or vice versa, but it's more convenient to emit a row at
102*53ee8cc1Swenshuai.xi  * a time).  Direct algorithms are also available, but they are much more
103*53ee8cc1Swenshuai.xi  * complex and seem not to be any faster when reduced to code.
104*53ee8cc1Swenshuai.xi  *
105*53ee8cc1Swenshuai.xi  * This implementation is based on an algorithm described in
106*53ee8cc1Swenshuai.xi  *   C. Loeffler, A. Ligtenberg and G. Moschytz, "Practical Fast 1-D DCT
107*53ee8cc1Swenshuai.xi  *   Algorithms with 11 Multiplications", Proc. Int'l. Conf. on Acoustics,
108*53ee8cc1Swenshuai.xi  *   Speech, and Signal Processing 1989 (ICASSP '89), pp. 988-991.
109*53ee8cc1Swenshuai.xi  * The primary algorithm described there uses 11 multiplies and 29 adds.
110*53ee8cc1Swenshuai.xi  * We use their alternate method with 12 multiplies and 32 adds.
111*53ee8cc1Swenshuai.xi  * The advantage of this method is that no data path contains more than one
112*53ee8cc1Swenshuai.xi  * multiplication; this allows a very simple and accurate implementation in
113*53ee8cc1Swenshuai.xi  * scaled fixed-point arithmetic, with a minimal number of shifts.
114*53ee8cc1Swenshuai.xi  */
115*53ee8cc1Swenshuai.xi 
116*53ee8cc1Swenshuai.xi /*----------------------------------------------------------------------------*/
117*53ee8cc1Swenshuai.xi #include "jpegmain.h"
118*53ee8cc1Swenshuai.xi #include "apiJPEG.h"
119*53ee8cc1Swenshuai.xi /*----------------------------------------------------------------------------*/
/*
 * Fixed-point configuration.
 *
 * CONST_BITS  - number of fractional bits carried by the FIX_* multipliers.
 * PASS1_BITS  - extra fractional bits kept in the intermediate results that
 *               the first 1-D pass hands to the second pass.
 * SCALEDONE   - the value 1 in the S32 working type.
 * CONST_SCALE - 1.0 expressed with CONST_BITS fractional bits.
 * FIX(x)      - converts the real constant x to fixed point, rounding to the
 *               nearest integer (intended for positive constants).
 */
#define CONST_BITS  13
#define PASS1_BITS  2
#define SCALEDONE ((S32) 1)
#define CONST_SCALE (SCALEDONE << CONST_BITS)
#define FIX(x)  ((S32) ((x) * CONST_SCALE + 0.5))
/*----------------------------------------------------------------------------*/
/*
 * Precomputed FIX() values for CONST_BITS == 13.  They are spelled out as
 * integer literals so that no floating-point arithmetic is needed to build
 * the constants; they must be regenerated if CONST_BITS changes.
 */
#define FIX_0_298631336  ((S32)  2446)        /* FIX(0.298631336) */
#define FIX_0_390180644  ((S32)  3196)        /* FIX(0.390180644) */
#define FIX_0_541196100  ((S32)  4433)        /* FIX(0.541196100) */
#define FIX_0_765366865  ((S32)  6270)        /* FIX(0.765366865) */
#define FIX_0_899976223  ((S32)  7373)        /* FIX(0.899976223) */
#define FIX_1_175875602  ((S32)  9633)        /* FIX(1.175875602) */
#define FIX_1_501321110  ((S32)  12299)       /* FIX(1.501321110) */
#define FIX_1_847759065  ((S32)  15137)       /* FIX(1.847759065) */
#define FIX_1_961570560  ((S32)  16069)       /* FIX(1.961570560) */
#define FIX_2_053119869  ((S32)  16819)       /* FIX(2.053119869) */
#define FIX_2_562915447  ((S32)  20995)       /* FIX(2.562915447) */
#define FIX_3_072711026  ((S32)  25172)       /* FIX(3.072711026) */
/*----------------------------------------------------------------------------*/
/*
 * Drop n fractional bits from x: adds half of the final unit (1 << (n-1))
 * and then shifts right by n.  For negative x this relies on the compiler
 * implementing >> on signed values as an arithmetic shift.
 */
#define DESCALE(x,n)  (((x) + (SCALEDONE << ((n)-1))) >> (n))
/*----------------------------------------------------------------------------*/
/* Plain integer multiply of a variable by a fixed-point constant. */
#define MULTIPLY(var,cnst)  ((var) * (cnst))
/*
 * Saturate the 16-bit signed lvalue i to 0..255 in place: negative values
 * become 0 and values above 255 become 255 (relies on an arithmetic right
 * shift of the complemented value).
 *
 * The expansion is a complete compound statement, so it can be written
 * either as "clamp( x );" or as "clamp( x )" without a trailing semicolon,
 * and it cannot capture a following "else".  The argument is evaluated more
 * than once, so it must not have side effects.
 */
#define clamp(i) { if ( (i) & 0xFF00 ) { (i) = ( ( ( ~(i) ) >> 15 ) & 0xFF ); } }
143*53ee8cc1Swenshuai.xi 
144*53ee8cc1Swenshuai.xi /*----------------------------------------------------------------------------*/
idct(JPEG_BLOCK_TYPE * data,U8 * Pdst_ptr)145*53ee8cc1Swenshuai.xi void idct( JPEG_BLOCK_TYPE *data, U8 *Pdst_ptr )
146*53ee8cc1Swenshuai.xi {
147*53ee8cc1Swenshuai.xi     S32 tmp0, tmp1, tmp2, tmp3;
148*53ee8cc1Swenshuai.xi     S32 tmp10, tmp11, tmp12, tmp13;
149*53ee8cc1Swenshuai.xi     S32 z1, z2, z3, z4, z5;
150*53ee8cc1Swenshuai.xi     register JPEG_BLOCK_TYPE *dataptr;
151*53ee8cc1Swenshuai.xi     int rowctr;
152*53ee8cc1Swenshuai.xi 
153*53ee8cc1Swenshuai.xi     //kevinhuang, use an internal array in idct to avoid memcpy to save time
154*53ee8cc1Swenshuai.xi     JPEG_BLOCK_TYPE workspace[64];
155*53ee8cc1Swenshuai.xi     JPEG_BLOCK_TYPE *wsptr;
156*53ee8cc1Swenshuai.xi //printf("idct::idct\n");
157*53ee8cc1Swenshuai.xi     dataptr = data;
158*53ee8cc1Swenshuai.xi     wsptr = workspace;
159*53ee8cc1Swenshuai.xi     for ( rowctr = 8 - 1; rowctr >= 0; rowctr-- )
160*53ee8cc1Swenshuai.xi     {
161*53ee8cc1Swenshuai.xi         if ( ( dataptr[1] | dataptr[2] | dataptr[3] | dataptr[4] | dataptr[5] | dataptr[6] | dataptr[7] ) == 0 )
162*53ee8cc1Swenshuai.xi         {
163*53ee8cc1Swenshuai.xi             S16 dcval = ( S16 )( dataptr[0] << PASS1_BITS );
164*53ee8cc1Swenshuai.xi 
165*53ee8cc1Swenshuai.xi             wsptr[0] = dcval;
166*53ee8cc1Swenshuai.xi             wsptr[1] = dcval;
167*53ee8cc1Swenshuai.xi             wsptr[2] = dcval;
168*53ee8cc1Swenshuai.xi             wsptr[3] = dcval;
169*53ee8cc1Swenshuai.xi             wsptr[4] = dcval;
170*53ee8cc1Swenshuai.xi             wsptr[5] = dcval;
171*53ee8cc1Swenshuai.xi             wsptr[6] = dcval;
172*53ee8cc1Swenshuai.xi             wsptr[7] = dcval;
173*53ee8cc1Swenshuai.xi 
174*53ee8cc1Swenshuai.xi             dataptr += 8;       /* advance pointer to next row */
175*53ee8cc1Swenshuai.xi             wsptr += 8;
176*53ee8cc1Swenshuai.xi             continue;
177*53ee8cc1Swenshuai.xi         }
178*53ee8cc1Swenshuai.xi 
179*53ee8cc1Swenshuai.xi         z2 = ( S32 )dataptr[2];
180*53ee8cc1Swenshuai.xi         z3 = ( S32 )dataptr[6];
181*53ee8cc1Swenshuai.xi 
182*53ee8cc1Swenshuai.xi         z1 = MULTIPLY( z2 + z3, FIX_0_541196100 );
183*53ee8cc1Swenshuai.xi         tmp2 = z1 + MULTIPLY( z3, -FIX_1_847759065 );
184*53ee8cc1Swenshuai.xi         tmp3 = z1 + MULTIPLY( z2, FIX_0_765366865 );
185*53ee8cc1Swenshuai.xi 
186*53ee8cc1Swenshuai.xi         tmp0 = ( ( S32 )dataptr[0] + ( S32 )dataptr[4] ) << CONST_BITS;
187*53ee8cc1Swenshuai.xi         tmp1 = ( ( S32 )dataptr[0] - ( S32 )dataptr[4] ) << CONST_BITS;
188*53ee8cc1Swenshuai.xi 
189*53ee8cc1Swenshuai.xi         tmp10 = tmp0 + tmp3;
190*53ee8cc1Swenshuai.xi         tmp13 = tmp0 - tmp3;
191*53ee8cc1Swenshuai.xi         tmp11 = tmp1 + tmp2;
192*53ee8cc1Swenshuai.xi         tmp12 = tmp1 - tmp2;
193*53ee8cc1Swenshuai.xi 
194*53ee8cc1Swenshuai.xi         tmp0 = ( S32 )dataptr[7];
195*53ee8cc1Swenshuai.xi         tmp1 = ( S32 )dataptr[5];
196*53ee8cc1Swenshuai.xi         tmp2 = ( S32 )dataptr[3];
197*53ee8cc1Swenshuai.xi         tmp3 = ( S32 )dataptr[1];
198*53ee8cc1Swenshuai.xi 
199*53ee8cc1Swenshuai.xi         z1 = tmp0 + tmp3;
200*53ee8cc1Swenshuai.xi         z2 = tmp1 + tmp2;
201*53ee8cc1Swenshuai.xi         z3 = tmp0 + tmp2;
202*53ee8cc1Swenshuai.xi         z4 = tmp1 + tmp3;
203*53ee8cc1Swenshuai.xi         z5 = MULTIPLY( z3 + z4, FIX_1_175875602 );
204*53ee8cc1Swenshuai.xi 
205*53ee8cc1Swenshuai.xi         tmp0 = MULTIPLY( tmp0, FIX_0_298631336 );
206*53ee8cc1Swenshuai.xi         tmp1 = MULTIPLY( tmp1, FIX_2_053119869 );
207*53ee8cc1Swenshuai.xi         tmp2 = MULTIPLY( tmp2, FIX_3_072711026 );
208*53ee8cc1Swenshuai.xi         tmp3 = MULTIPLY( tmp3, FIX_1_501321110 );
209*53ee8cc1Swenshuai.xi         z1 = MULTIPLY( z1, -FIX_0_899976223 );
210*53ee8cc1Swenshuai.xi         z2 = MULTIPLY( z2, -FIX_2_562915447 );
211*53ee8cc1Swenshuai.xi         z3 = MULTIPLY( z3, -FIX_1_961570560 );
212*53ee8cc1Swenshuai.xi         z4 = MULTIPLY( z4, -FIX_0_390180644 );
213*53ee8cc1Swenshuai.xi 
214*53ee8cc1Swenshuai.xi         z3 += z5;
215*53ee8cc1Swenshuai.xi         z4 += z5;
216*53ee8cc1Swenshuai.xi 
217*53ee8cc1Swenshuai.xi         tmp0 += z1 + z3;
218*53ee8cc1Swenshuai.xi         tmp1 += z2 + z4;
219*53ee8cc1Swenshuai.xi         tmp2 += z2 + z3;
220*53ee8cc1Swenshuai.xi         tmp3 += z1 + z4;
221*53ee8cc1Swenshuai.xi 
222*53ee8cc1Swenshuai.xi         wsptr[0] = ( S16 )DESCALE( tmp10 + tmp3, CONST_BITS - PASS1_BITS );
223*53ee8cc1Swenshuai.xi         wsptr[7] = ( S16 )DESCALE( tmp10 - tmp3, CONST_BITS - PASS1_BITS );
224*53ee8cc1Swenshuai.xi         wsptr[1] = ( S16 )DESCALE( tmp11 + tmp2, CONST_BITS - PASS1_BITS );
225*53ee8cc1Swenshuai.xi         wsptr[6] = ( S16 )DESCALE( tmp11 - tmp2, CONST_BITS - PASS1_BITS );
226*53ee8cc1Swenshuai.xi         wsptr[2] = ( S16 )DESCALE( tmp12 + tmp1, CONST_BITS - PASS1_BITS );
227*53ee8cc1Swenshuai.xi         wsptr[5] = ( S16 )DESCALE( tmp12 - tmp1, CONST_BITS - PASS1_BITS );
228*53ee8cc1Swenshuai.xi         wsptr[3] = ( S16 )DESCALE( tmp13 + tmp0, CONST_BITS - PASS1_BITS );
229*53ee8cc1Swenshuai.xi         wsptr[4] = ( S16 )DESCALE( tmp13 - tmp0, CONST_BITS - PASS1_BITS );
230*53ee8cc1Swenshuai.xi 
231*53ee8cc1Swenshuai.xi         dataptr += 8;
232*53ee8cc1Swenshuai.xi         wsptr += 8;
233*53ee8cc1Swenshuai.xi     }
234*53ee8cc1Swenshuai.xi 
235*53ee8cc1Swenshuai.xi     dataptr = workspace;
236*53ee8cc1Swenshuai.xi     for ( rowctr = 8 - 1; rowctr >= 0; rowctr-- )
237*53ee8cc1Swenshuai.xi     {
238*53ee8cc1Swenshuai.xi         S16 i;
239*53ee8cc1Swenshuai.xi 
240*53ee8cc1Swenshuai.xi         if ( ( dataptr[8 * 1] | dataptr[8 * 2] | dataptr[8 * 3] | dataptr[8 * 4] | dataptr[8 * 5] | dataptr[8 * 6] | dataptr[8 * 7] ) == 0 )
241*53ee8cc1Swenshuai.xi         {
242*53ee8cc1Swenshuai.xi             S16 dcval = ( S16 )DESCALE( ( S32 )dataptr[0], PASS1_BITS + 3 ) + 128;
243*53ee8cc1Swenshuai.xi             /*
244*53ee8cc1Swenshuai.xi             if ((dcval) < 0)
245*53ee8cc1Swenshuai.xi               dcval = 0;
246*53ee8cc1Swenshuai.xi             else if (dcval > 255)
247*53ee8cc1Swenshuai.xi               dcval = 255;
248*53ee8cc1Swenshuai.xi             */
249*53ee8cc1Swenshuai.xi             clamp( dcval );
250*53ee8cc1Swenshuai.xi 
251*53ee8cc1Swenshuai.xi             Pdst_ptr[8 * 0] = ( U8 )dcval;
252*53ee8cc1Swenshuai.xi             Pdst_ptr[8 * 1] = ( U8 )dcval;
253*53ee8cc1Swenshuai.xi             Pdst_ptr[8 * 2] = ( U8 )dcval;
254*53ee8cc1Swenshuai.xi             Pdst_ptr[8 * 3] = ( U8 )dcval;
255*53ee8cc1Swenshuai.xi             Pdst_ptr[8 * 4] = ( U8 )dcval;
256*53ee8cc1Swenshuai.xi             Pdst_ptr[8 * 5] = ( U8 )dcval;
257*53ee8cc1Swenshuai.xi             Pdst_ptr[8 * 6] = ( U8 )dcval;
258*53ee8cc1Swenshuai.xi             Pdst_ptr[8 * 7] = ( U8 )dcval;
259*53ee8cc1Swenshuai.xi 
260*53ee8cc1Swenshuai.xi             dataptr++;
261*53ee8cc1Swenshuai.xi             Pdst_ptr++;
262*53ee8cc1Swenshuai.xi             continue;
263*53ee8cc1Swenshuai.xi         }
264*53ee8cc1Swenshuai.xi 
265*53ee8cc1Swenshuai.xi         z2 = ( S32 )dataptr[8 * 2];
266*53ee8cc1Swenshuai.xi         z3 = ( S32 )dataptr[8 * 6];
267*53ee8cc1Swenshuai.xi 
268*53ee8cc1Swenshuai.xi         z1 = MULTIPLY( z2 + z3, FIX_0_541196100 );
269*53ee8cc1Swenshuai.xi         tmp2 = z1 + MULTIPLY( z3, -FIX_1_847759065 );
270*53ee8cc1Swenshuai.xi         tmp3 = z1 + MULTIPLY( z2, FIX_0_765366865 );
271*53ee8cc1Swenshuai.xi 
272*53ee8cc1Swenshuai.xi         tmp0 = ( ( S32 )dataptr[8 * 0] + ( S32 )dataptr[8 * 4] ) << CONST_BITS;
273*53ee8cc1Swenshuai.xi         tmp1 = ( ( S32 )dataptr[8 * 0] - ( S32 )dataptr[8 * 4] ) << CONST_BITS;
274*53ee8cc1Swenshuai.xi 
275*53ee8cc1Swenshuai.xi         tmp10 = tmp0 + tmp3;
276*53ee8cc1Swenshuai.xi         tmp13 = tmp0 - tmp3;
277*53ee8cc1Swenshuai.xi         tmp11 = tmp1 + tmp2;
278*53ee8cc1Swenshuai.xi         tmp12 = tmp1 - tmp2;
279*53ee8cc1Swenshuai.xi 
280*53ee8cc1Swenshuai.xi         tmp0 = ( S32 )dataptr[8 * 7];
281*53ee8cc1Swenshuai.xi         tmp1 = ( S32 )dataptr[8 * 5];
282*53ee8cc1Swenshuai.xi         tmp2 = ( S32 )dataptr[8 * 3];
283*53ee8cc1Swenshuai.xi         tmp3 = ( S32 )dataptr[8 * 1];
284*53ee8cc1Swenshuai.xi 
285*53ee8cc1Swenshuai.xi         z1 = tmp0 + tmp3;
286*53ee8cc1Swenshuai.xi         z2 = tmp1 + tmp2;
287*53ee8cc1Swenshuai.xi         z3 = tmp0 + tmp2;
288*53ee8cc1Swenshuai.xi         z4 = tmp1 + tmp3;
289*53ee8cc1Swenshuai.xi         z5 = MULTIPLY( z3 + z4, FIX_1_175875602 );
290*53ee8cc1Swenshuai.xi 
291*53ee8cc1Swenshuai.xi         tmp0 = MULTIPLY( tmp0, FIX_0_298631336 );
292*53ee8cc1Swenshuai.xi         tmp1 = MULTIPLY( tmp1, FIX_2_053119869 );
293*53ee8cc1Swenshuai.xi         tmp2 = MULTIPLY( tmp2, FIX_3_072711026 );
294*53ee8cc1Swenshuai.xi         tmp3 = MULTIPLY( tmp3, FIX_1_501321110 );
295*53ee8cc1Swenshuai.xi         z1 = MULTIPLY( z1, -FIX_0_899976223 );
296*53ee8cc1Swenshuai.xi         z2 = MULTIPLY( z2, -FIX_2_562915447 );
297*53ee8cc1Swenshuai.xi         z3 = MULTIPLY( z3, -FIX_1_961570560 );
298*53ee8cc1Swenshuai.xi         z4 = MULTIPLY( z4, -FIX_0_390180644 );
299*53ee8cc1Swenshuai.xi 
300*53ee8cc1Swenshuai.xi         z3 += z5;
301*53ee8cc1Swenshuai.xi         z4 += z5;
302*53ee8cc1Swenshuai.xi 
303*53ee8cc1Swenshuai.xi         tmp0 += z1 + z3;
304*53ee8cc1Swenshuai.xi         tmp1 += z2 + z4;
305*53ee8cc1Swenshuai.xi         tmp2 += z2 + z3;
306*53ee8cc1Swenshuai.xi         tmp3 += z1 + z4;
307*53ee8cc1Swenshuai.xi 
308*53ee8cc1Swenshuai.xi         i = ( S16 )DESCALE( tmp10 + tmp3, CONST_BITS + PASS1_BITS + 3 ) + 128;
309*53ee8cc1Swenshuai.xi         clamp( i )
310*53ee8cc1Swenshuai.xi         Pdst_ptr[8 * 0] = ( U8 )i;
311*53ee8cc1Swenshuai.xi 
312*53ee8cc1Swenshuai.xi         i = ( S16 )DESCALE( tmp10 - tmp3, CONST_BITS + PASS1_BITS + 3 ) + 128;
313*53ee8cc1Swenshuai.xi         clamp( i )
314*53ee8cc1Swenshuai.xi         Pdst_ptr[8 * 7] = ( U8 )i;
315*53ee8cc1Swenshuai.xi 
316*53ee8cc1Swenshuai.xi         i = ( S16 )DESCALE( tmp11 + tmp2, CONST_BITS + PASS1_BITS + 3 ) + 128;
317*53ee8cc1Swenshuai.xi         clamp( i )
318*53ee8cc1Swenshuai.xi         Pdst_ptr[8 * 1] = ( U8 )i;
319*53ee8cc1Swenshuai.xi 
320*53ee8cc1Swenshuai.xi         i = ( S16 )DESCALE( tmp11 - tmp2, CONST_BITS + PASS1_BITS + 3 ) + 128;
321*53ee8cc1Swenshuai.xi         clamp( i )
322*53ee8cc1Swenshuai.xi         Pdst_ptr[8 * 6] = ( U8 )i;
323*53ee8cc1Swenshuai.xi 
324*53ee8cc1Swenshuai.xi         i = ( S16 )DESCALE( tmp12 + tmp1, CONST_BITS + PASS1_BITS + 3 ) + 128;
325*53ee8cc1Swenshuai.xi         clamp( i )
326*53ee8cc1Swenshuai.xi         Pdst_ptr[8 * 2] = ( U8 )i;
327*53ee8cc1Swenshuai.xi 
328*53ee8cc1Swenshuai.xi         i = ( S16 )DESCALE( tmp12 - tmp1, CONST_BITS + PASS1_BITS + 3 ) + 128;
329*53ee8cc1Swenshuai.xi         clamp( i )
330*53ee8cc1Swenshuai.xi         Pdst_ptr[8 * 5] = ( U8 )i;
331*53ee8cc1Swenshuai.xi 
332*53ee8cc1Swenshuai.xi         i = ( S16 )DESCALE( tmp13 + tmp0, CONST_BITS + PASS1_BITS + 3 ) + 128;
333*53ee8cc1Swenshuai.xi         clamp( i )
334*53ee8cc1Swenshuai.xi         Pdst_ptr[8 * 3] = ( U8 )i;
335*53ee8cc1Swenshuai.xi 
336*53ee8cc1Swenshuai.xi         i = ( S16 )DESCALE( tmp13 - tmp0, CONST_BITS + PASS1_BITS + 3 ) + 128;
337*53ee8cc1Swenshuai.xi         clamp( i )
338*53ee8cc1Swenshuai.xi         Pdst_ptr[8 * 4] = ( U8 )i;
339*53ee8cc1Swenshuai.xi 
340*53ee8cc1Swenshuai.xi         dataptr++;
341*53ee8cc1Swenshuai.xi         Pdst_ptr++;
342*53ee8cc1Swenshuai.xi     }
343*53ee8cc1Swenshuai.xi }
344*53ee8cc1Swenshuai.xi /*----------------------------------------------------------------------------*/
345*53ee8cc1Swenshuai.xi 
346