idct.c
上传用户:zhongxx05
上传日期:2007-06-06
资源大小:33641k
文件大小:43k
- /* ***** BEGIN LICENSE BLOCK *****
- * Version: RCSL 1.0/RPSL 1.0
- *
- * Portions Copyright (c) 1995-2002 RealNetworks, Inc. All Rights Reserved.
- *
- * The contents of this file, and the files included with this file, are
- * subject to the current version of the RealNetworks Public Source License
- * Version 1.0 (the "RPSL") available at
- * http://www.helixcommunity.org/content/rpsl unless you have licensed
- * the file under the RealNetworks Community Source License Version 1.0
- * (the "RCSL") available at http://www.helixcommunity.org/content/rcsl,
- * in which case the RCSL will apply. You may also obtain the license terms
- * directly from RealNetworks. You may not use this file except in
- * compliance with the RPSL or, if you have a valid RCSL with RealNetworks
- * applicable to this file, the RCSL. Please see the applicable RPSL or
- * RCSL for the rights, obligations and limitations governing use of the
- * contents of the file.
- *
- * This file is part of the Helix DNA Technology. RealNetworks is the
- * developer of the Original Code and owns the copyrights in the portions
- * it created.
- *
- * This file, and the files included with this file, is distributed and made
- * available on an 'AS IS' basis, WITHOUT WARRANTY OF ANY KIND, EITHER
- * EXPRESS OR IMPLIED, AND REALNETWORKS HEREBY DISCLAIMS ALL SUCH WARRANTIES,
- * INCLUDING WITHOUT LIMITATION, ANY WARRANTIES OF MERCHANTABILITY, FITNESS
- * FOR A PARTICULAR PURPOSE, QUIET ENJOYMENT OR NON-INFRINGEMENT.
- *
- * Technology Compatibility Kit Test Suite(s) Location:
- * http://www.helixcommunity.org/content/tck
- *
- * Contributor(s):
- *
- * ***** END LICENSE BLOCK ***** */
- #include <math.h>
- #include "dllindex.h"
- #include "h261defs.h"
- #include "h261func.h"
- #include "clip.h"
- #include "h263plus.h"
- #ifdef _MACINTOSH
- #include <string.h> // for memset
- #endif
- #ifndef UNREFERENCED_PARAMETER
- #define UNREFERENCED_PARAMETER(x) (x) = (x)
- #endif
- extern S16 Recon [QUANT_MAX - QUANT_MIN + 1] [N_SYM_INDICES];
- // Function prototypes
- static void init_inv_dct (void);
- static void Fix_PTel_S4000_mismatch( void );
- static void truncate_more( S32 * idct_tab_entry );
- static void idct2_goertzel( SYMBOL sym[], int nsym, S32 x[8][4],
- S16 recon[], int intra, int clean, int idct_class );
- static int idct2_energy_test( SYMBOL sym[], int nsym,
- S16 recon[] );
- static void recon_intra_dc( U8 index, S32 vec[8]);
- static void recon_dc( S32 y, S32 vec[8]);
- static void recon_hor_ac( S32 y, S32 vec[8]);
- static void recon_vert_ac( S32 y, S32 vec[8]);
- static void update( S32 x[8], S32 index, S32 table[][8*8*8]);
- static double dctfunc (int freq, int index);
- static S32 dct_tab_entry (double x, double y);
- static S32 combine (S32 iy, S32 ix);
- extern void idct2_advanced_intra( SYMBOL sym[], int nsym, S32 x[8][4], S16 recon[],
- U8 rDCpred, S8 rACpred[8], U8 rDCstore[1], S8 rACstore[8],
- U8 cDCpred, S8 cACpred[8], U8 cDCstore[1], S8 cACstore[8],
- int predtype, int fixedDC, int leftBoundary, int upperBoundary);
- #define PI 3.141592654
- #define FRACBITS 6 /* Fractional bits in IDCT computation */
- #define SCALE_FACTOR 64. /* 2**FRACBITS */
- #define MAX_DCT_INDEX 1024
- #define IDCT_NTAB1_BITS 5
- #define IDCT_NTAB1_SIZE 32 /* 2**NTAB1_BITS entries in table for small values */
- #define IDCT_NTAB2_SIZE ((MAX_DCT_INDEX - 1) / IDCT_NTAB1_SIZE)
- /* Entries to handle values > NTAB1_SIZE */
- #define PIXEL_MIN 0
- #define PIXEL_MAX 255
- #define CLIPMARGIN 300
- #define CLIPMIN (PIXEL_MIN - CLIPMARGIN)
- #define CLIPMAX (PIXEL_MAX + CLIPMARGIN)
- #define N_DCT_INDEX 1024
- // Reconstruction levels for QUANT = 1,2,..,31
- S16 Recon [QUANT_MAX - QUANT_MIN + 1] [N_SYM_INDICES];
- // Define zigzag scanning pattern
- static int ZigZag[64] = { 0, 1, 5, 6, 14, 15, 27, 28,
- 2, 4, 7, 13, 16, 26, 29, 42,
- 3, 8, 12, 17, 25, 30, 41, 43,
- 9, 11, 18, 24, 31, 40, 44, 53,
- 10, 19, 23, 32, 39, 45, 52, 54,
- 20, 22, 33, 38, 46, 51, 55, 60,
- 21, 34, 37, 47, 50, 56, 59, 61,
- 35, 36, 48, 49, 57, 58, 62, 63
- };
- static int InvZZ[64];
- static S32 idct_tab [(IDCT_NTAB1_SIZE + IDCT_NTAB2_SIZE)][8*8][8];
- /* LUT for all coeffs; [amplitude][zigzag position][] */
- static S32 dc_tab [MAX_DCT_INDEX]; /* LUT for DC coeff */
- static S32 hor_ac_tab [MAX_DCT_INDEX][2]; /* LUT for 1st hor AC coeff */
- static S32 vert_ac_tab [MAX_DCT_INDEX][4]; /* LUT for 1st vert AC coeff */
- static S32 intra_dc_tab[N_SYM_INDICES]; /* LUT for INTRA DC coeff */
- PIXEL clip[(CLIPMAX-CLIPMIN+1)]; /* LUT to limit to 0-255 */
- static int even_odd_index[8*8]; /* Classify zigzag pos. as even or odd */
- extern void InitReconTables( void )
- {
- int level, index, quant;
- // QUANT=1 => 3,5,7,...
- // QUANT=2 => 5,9,13,...
- // QUANT=3 => 9,15,21,...
- // QUANT=4 => 11,19,27,...
- for (quant = QUANT_MIN; quant <= QUANT_MAX; quant++) {
- index = (quant + 1) / 2;
- for (level = 1; level < N_SYM_INDICES/2; level++) {
- index += quant;
- index = min( index, N_DCT_INDEX);
- Recon [quant - QUANT_MIN] [level] = index;
- Recon [quant - QUANT_MIN] [N_SYM_INDICES-level] = -index;
- }
- Recon [quant - QUANT_MIN] [0] = 0;
- }
- /* Generate zigzag table */
- for (index = 0; index < 64; index++) {
- InvZZ[ ZigZag[index] ] = index;
- }
- init_inv_dct();
- return;
- }
- // Idct2 - Reconstruct DCT coeffs, perform IDCT, and clip to allowed pixel range */
- // Requires nsym > 0
- extern void Idct2( SYMBOL sym[], int nsym, PIXEL x[], int xdim, S16 recon[], int clean)
- {
- union {
- S16 bshort[8][8];
- S32 blong[8][4];
- } block; /* Output from IDCT */
- int intra;
- int idct_class;
- idct_class = GENERAL; /* assume the general case */
- /* look for situations involving specific involving 1,2,3 symbols */
- if (sym[0].type==0)
- {
- switch (nsym)
- {
- case 1:
- idct_class = DC_ONLY;
- break;
- case 2:
- if (sym[1].type == 0)
- idct_class = DC_AC_H;
- if (sym[1].type == 1)
- idct_class = DC_AC_V;
- break;
- case 3:
- if ( (sym[1].type | sym[2].type) == 0)
- idct_class = DC_3;
- break;
- }
- }
- intra = YES;
- switch (idct_class)
- {
- case DC_ONLY:
- {
- idct2_goertzel( sym, nsym, block.blong, recon, intra, clean, DC_ONLY);
- idct2_clip(x, xdim, block.blong, DC_ONLY);
- break;
- }
- case DC_AC_H:
- {
- idct2_goertzel( sym, nsym, block.blong, recon, intra, clean, DC_AC_H);
- idct2_clip(x, xdim, block.blong, DC_AC_H);
- break;
- }
- case DC_AC_V:
- {
- idct2_goertzel( sym, nsym, block.blong, recon, intra, clean, DC_AC_V);
- idct2_clip(x, xdim, block.blong, GENERAL);
- break;
- }
- case DC_3:
- {
- idct2_goertzel( sym, nsym, block.blong, recon, intra, clean, DC_3);
- idct2_clip(x, xdim, block.blong, GENERAL);
- break;
- }
- default:
- {
- idct2_goertzel( sym, nsym, block.blong, recon, intra, clean, GENERAL);
- idct2_clip(x, xdim, block.blong, GENERAL);
- }
- }
- return;
- }
- // Idct2Sum - Reconstruct DCT coeffs, perform IDCT, add to predition,
- // and clip to allowed pixel range. Requires nsym > 0
- extern void Idct2Sum( SYMBOL sym[], int nsym, PIXEL x[], int xdim, S16 recon[],int clean)
- {
- union {
- S16 bshort[8][8];
- S32 blong[8][4];
- } block; /* Output from IDCT */
- int intra;
- int idct_class;
-
- idct_class = GENERAL; /* assume the general case */
- /* look for situations involving specific involving 1,2,3 symbols */
- if (sym[0].type==0)
- {
- switch (nsym)
- {
- case 1:
- idct_class = DC_ONLY;
- break;
- case 2:
- if (sym[1].type == 0)
- idct_class = DC_AC_H;
- if (sym[1].type == 1)
- idct_class = DC_AC_V;
- break;
- case 3:
- if ( (sym[1].type | sym[2].type) == 0)
- idct_class = DC_3;
- break;
- }
- }
- intra = NO;
- // if (clean == YES || (idct2_energy_test( sym, nsym, recon) > 20)){
- // activate this for sleazy IDCT in decoder
- //
- switch (idct_class)
- {
- case DC_ONLY:
- {
- idct2_goertzel( sym, nsym, block.blong, recon, intra, clean, DC_ONLY);
- idct2sum_clip(x, xdim, block.blong, DC_ONLY);
- break;
- }
- case DC_AC_H:
- {
- idct2_goertzel( sym, nsym, block.blong, recon, intra, clean, DC_AC_H);
- idct2sum_clip(x, xdim, block.blong, DC_AC_H);
- break;
- }
- case DC_AC_V:
- {
- idct2_goertzel( sym, nsym, block.blong, recon, intra, clean, DC_AC_V);
- idct2sum_clip(x, xdim, block.blong, GENERAL);
- break;
- }
- case DC_3:
- {
- idct2_goertzel( sym, nsym, block.blong, recon, intra, clean, DC_3);
- idct2sum_clip(x, xdim, block.blong, GENERAL);
- break;
- }
- default:
- {
- idct2_goertzel( sym, nsym, block.blong, recon, intra, clean, GENERAL);
- idct2sum_clip(x, xdim, block.blong, GENERAL);
- }
- }
- // } // activate this for sleazy IDCT in decoder
- return;
- }
- // Idct2_s16 - Reconstruct DCT coeffs, perform IDCT, and write as signed 16-bit values
- // Set output block to zero if nsym=0
- extern void Idct2_s16( int intra, SYMBOL sym[], int nsym, S16 x[], int xdim, S16 recon[] )
- {
- int i, clean = YES;
- union {
- S16 bshort[8][8];
- S32 blong[8][4];
- } block; /* Output from IDCT */
- if (nsym == 0) {
- for (i = 0; i < 8; i++) {
- S32 * px = (S32 *)x;
- px[0] = px[1] = px[2] = px[3] = 0;
- x += xdim;
- }
- return;
- }
- idct2_goertzel( sym, nsym, block.blong, recon, intra, clean, GENERAL);
- // Shift out fractional bits
- for (i = 0; i < 8; i++) {
- x[i*xdim + 0] = block.bshort[i][0] >> FRACBITS;
- x[i*xdim + 1] = block.bshort[i][1] >> FRACBITS;
- x[i*xdim + 2] = block.bshort[i][2] >> FRACBITS;
- x[i*xdim + 3] = block.bshort[i][3] >> FRACBITS;
- x[i*xdim + 4] = block.bshort[i][7] >> FRACBITS;
- x[i*xdim + 5] = block.bshort[i][6] >> FRACBITS;
- x[i*xdim + 6] = block.bshort[i][5] >> FRACBITS;
- x[i*xdim + 7] = block.bshort[i][4] >> FRACBITS;
- }
- }
- // Initialize tables for inverse DCT
- // Note: This routine has not been optimized for speed
- static void init_inv_dct (void)
- {
- int i,j,m,n, index, zzpos;
- double magn; /* amplitude of DCT coefficient */
- static double bfunc[8][8][4][4]; /* DCT basis functions [vert freq][hor freq][][] */
- for (n=0; n < 8; n++) { /* Construct 2-D basis functions */
- for (m=0; m < 8; m++) {
- for (j=0; j < 4; j++) {
- for (i=0; i < 4; i++) {
- bfunc[n][m][j][i] = SCALE_FACTOR * dctfunc(n,j) * dctfunc(m,i);
- }
- }
- }
- }
- // Initialize table for INTRA DC coeff reconstruction */
- for (index = 0; index < N_SYM_INDICES; index++) {
- magn = 8 * index;
- //printf( "Init index = %d magn = %f n", index, magn);
- intra_dc_tab [index] = dct_tab_entry (magn * bfunc[0][0][0][0],
- magn * bfunc[0][0][0][1]);
- }
- // 128 is represented by index=255
- index = 255;
- magn = 8 * 128;
- //printf( "Init index = %d magn = %f n", index, magn);
- intra_dc_tab [index] = dct_tab_entry (magn * bfunc[0][0][0][0],
- magn * bfunc[0][0][0][1]);
-
- // Initialize tables for DC and first two AC coeffs
- for (index = 0; index < MAX_DCT_INDEX; index++) {
- magn = 2*index + 1;
- //printf( "Init index = %d magn = %f n", index, magn);
- dc_tab [index] = dct_tab_entry (magn * bfunc[0][0][0][0],
- magn * bfunc[0][0][0][1]);
- for (i = 0; i < 2; i++) {
- hor_ac_tab [index][i]
- = dct_tab_entry (magn * bfunc[0][1][0][2*i],
- magn * bfunc[0][1][0][2*i+1]);
- }
- for (j = 0; j < 4; j++) {
- vert_ac_tab [index][j]
- = dct_tab_entry (magn * bfunc[1][0][j][0],
- magn * bfunc[1][0][j][1]);
- }
- }
- // Initialize table for all coeffs
- for (index = 0; index < IDCT_NTAB1_SIZE; index++) {
- magn = 2*index + 1;
- //printf( "Init index = %d magn = %f n", index, magn);
- for (zzpos = 0; zzpos < 8*8; zzpos++) {
- n = InvZZ[zzpos] / 8;
- m = InvZZ[zzpos] % 8;
- for (j=0; j < 4; j++) {
- for (i=0; i < 2; i++) {
- idct_tab [index][zzpos][2*j+i]
- = dct_tab_entry (magn * bfunc[n][m][j][2*i],
- magn * bfunc[n][m][j][2*i+1]);
- }
- }
- }
- }
- for (index = 0; index < IDCT_NTAB2_SIZE; index++) {
- magn = 2 * IDCT_NTAB1_SIZE * (index + 1);
- //printf( "Init index = %d magn = %f n", index+IDCT_NTAB1_SIZE, magn);
- for (zzpos = 0; zzpos < 8*8; zzpos++) {
- n = InvZZ[zzpos] / 8;
- m = InvZZ[zzpos] % 8;
- for (j=0; j < 4; j++) {
- for (i=0; i < 2; i++) {
- idct_tab [index + IDCT_NTAB1_SIZE][zzpos][2*j+i]
- = dct_tab_entry (magn * bfunc[n][m][j][2*i],
- magn * bfunc[n][m][j][2*i+1]);
- }
- }
- }
- }
- // Modify tables for index=1 to truncate more values to zero
- Fix_PTel_S4000_mismatch();
- // LUT to clip to allowed range for PIXEL
- for (i = CLIPMIN; i <= CLIPMAX; i++) {
- clip[i-CLIPMIN] = max( PIXEL_MIN, min( PIXEL_MAX, i));
- }
- // Classify zigzag position as even or odd, horizontally and vertically
- for (zzpos = 0; zzpos < 8*8; zzpos++) {
- n = InvZZ[zzpos] / 8;
- m = InvZZ[zzpos] % 8;
- even_odd_index[zzpos] = 2 * (n % 2) + m % 2;
- }
- #ifdef DO_H263_PLUS
- InitAdvancedIntraTables();
- #endif
- return;
- }
- // Fix_PTel_S4000_mismatch - Modify tables for index=1 to truncate more
- // values to zero. This improves the quality when communicating with a
- // system that has an IDCT mismatch problem (PTel S-4000, bug #250)
- static void Fix_PTel_S4000_mismatch( void )
- {
- int index, i, j, zzpos;
-
- index = 1;
- for (i = 0; i < 2; i++) {
- truncate_more( &hor_ac_tab [index][i] );
- }
- for (j = 0; j < 4; j++) {
- truncate_more( &vert_ac_tab [index][j] );
- }
- for (zzpos = 0; zzpos < 8*8; zzpos++) {
- for (j=0; j < 4; j++) {
- for (i=0; i < 2; i++) {
- truncate_more( &idct_tab [index][zzpos][2*j+i] );
- }
- }
- }
- return;
- }
- // truncate_more
- static void truncate_more( S32 * idct_tab_entry )
- {
- #define ONE_HALF (1 << (FRACBITS - 1))
- #define PTEL_FIX_INTERVAL (3) // Set to 0 if no fix needed
- S32 halfword[2];
- int i;
-
- halfword[0] = *idct_tab_entry >> 16; // Upper part of word
- halfword[1] = (*idct_tab_entry << 16) >> 16; // Lower part of word
- for (i = 0; i < 2; ++i) {
- if (halfword[i] >= ONE_HALF && halfword[i] < ONE_HALF + PTEL_FIX_INTERVAL) {
- halfword[i] = ONE_HALF - 1;
- } else if (halfword[i] <= -ONE_HALF && halfword[i] > -(ONE_HALF + PTEL_FIX_INTERVAL)) {
- halfword[i] = -(ONE_HALF - 1);
- }
- }
- *idct_tab_entry = (halfword[0] << 16) | (halfword[1] & 0xffff);
- return;
- }
-
- #ifdef WHY_IS_THIS_HERE
- static int idct2_energy_test( SYMBOL sym[], int nsym,
- S16 recon[] )
- {
- int isym, zzpos;
- int temp;
- isym = 0;
- temp = 0;
- zzpos = sym[0].type;
- while (isym < nsym && zzpos < 10) {
- temp += abs((int) recon[(U8)sym[isym].value]);
- isym++;
- zzpos += 1 + sym[isym].type;
- }
- return(temp);
- }
- #endif
- static void idct2_goertzel( SYMBOL sym[], int nsym, S32 x[8][4],
- S16 recon[], int intra, int clean, int idct_class)
- {
- int i, zzpos, isym;
- S32 even_odd[4][8]; /* Accumulate even/even, even/odd, odd/even, odd/odd */
- S32 temp[4]; /* Used in final butterfly computations */
- #ifdef LITTLE_ENDIAN
- char msg[120]; /* Flawfinder: ignore */
- int LUT_index;
- #endif
- UNREFERENCED_PARAMETER(clean);
- // The four special class implementations are specific to LITTLE_ENDIAN.
- #ifdef LITTLE_ENDIAN
- switch (idct_class)
- {
- case GENERAL:
- {
- memset(even_odd, 0, 128);
- isym = 0;
- zzpos = sym[0].type;
- // Reconstruct DC coeff
- if (intra == YES) {
- recon_intra_dc( (U8) sym[0].value, even_odd[0]);
- isym++;
- zzpos += 1 + sym[isym].type;
- }
- else if (zzpos == 0) {
- recon_dc( (S32) recon[(U8)sym[0].value], even_odd[0]);
- isym++;
- zzpos += 1 + sym[isym].type;
- }
- // Init even/odd: reconstruct first hor. AC coeff
- if (isym < nsym && zzpos == 1) {
- recon_hor_ac( (S32) recon[(U8)sym[isym].value], even_odd[1]);
- isym++;
- zzpos += 1 + sym[isym].type;
- }
- // Init odd/even: reconstruct first vert. AC coeff
- if (isym < nsym && zzpos == 2) {
- recon_vert_ac( (S32) recon[(U8)sym[isym].value], even_odd[2]);
- isym++;
- zzpos += 1 + sym[isym].type;
- }
- // Reconstruct remaining coeffs
- // if (clean == YES) { // activate this for sleazy IDCT decoder
- while (isym < nsym) {
- //printf(" Calling update with zzpos = %dn", zzpos);
- update( &even_odd[ even_odd_index[zzpos]] [0],
- (S32) recon[(U8)sym[isym].value],
- (long (*)[512]) &idct_tab[0][zzpos][0]);
- isym++;
- zzpos += 1 + sym[isym].type;
- }
- // } // activate this for sleazy IDCT decoder
- // else {
- //
- // Sleazy reconstruction
- //
- // while (isym < nsym && zzpos < 10) {
- // //printf(" Calling update with zzpos = %dn", zzpos);
- // update( &even_odd[ even_odd_index[zzpos]] [0],
- // (S32) recon[(U8)sym[isym].value],
- // (U32 (*)[8*8*8])&idct_tab[0][zzpos][0]);
- // isym++;
- // zzpos += 1 + sym[isym].type;
- // }
- // }
- }
- break;
- case DC_ONLY:
- case DC_AC_H:
- case DC_AC_V:
- case DC_3:
- {
- isym = 0;
- zzpos = sym[0].type;
- // Reconstruct DC coeff
- if (intra == YES)
- {
- LUT_index = (U8)sym[0].value;
- even_odd[0][0] = intra_dc_tab[LUT_index];
- isym++;
- zzpos += 1 + sym[isym].type;
- }
- else if (zzpos == 0)
- {
- LUT_index = (S32)recon[(U8)sym[0].value];
- if (LUT_index>0)
- even_odd[0][0] = dc_tab[LUT_index-1];
- else if (LUT_index<0)
- even_odd[0][0] = -dc_tab[-LUT_index-1];
- else
- {
- //sprintf(msg, "ERROR:recon_dc called with arg=0");
- //H261ErrMsg(msg);
- }
- isym++;
- zzpos += 1 + sym[isym].type;
- }
- // Init even/odd: reconstruct first hor. AC coeff
- if (isym < nsym && zzpos == 1) {
- recon_hor_ac( (S32) recon[(U8)sym[isym].value], even_odd[1]);
- isym++;
- zzpos += 1 + sym[isym].type;
- }
- // Init odd/even: reconstruct first vert. AC coeff
- if (isym < nsym && zzpos == 2) {
- recon_vert_ac( (S32) recon[(U8)sym[isym].value], even_odd[2]);
- isym++;
- zzpos += 1 + sym[isym].type;
- }
- }
- break;
-
- default:
- break;
- }
- #else
- memset(even_odd, 0, 128);
- isym = 0;
- zzpos = sym[0].type;
- // Reconstruct DC coeff
- if (intra == YES) {
- recon_intra_dc( (U8) sym[0].value, even_odd[0]);
- isym++;
- zzpos += 1 + sym[isym].type;
- }
- else if (zzpos == 0) {
- recon_dc( (S32) recon[(U8)sym[0].value], even_odd[0]);
- isym++;
- zzpos += 1 + sym[isym].type;
- }
- // Init even/odd: reconstruct first hor. AC coeff
- if (isym < nsym && zzpos == 1) {
- recon_hor_ac( (S32) recon[(U8)sym[isym].value], even_odd[1]);
- isym++;
- zzpos += 1 + sym[isym].type;
- }
- // Init odd/even: reconstruct first vert. AC coeff
- if (isym < nsym && zzpos == 2) {
- recon_vert_ac( (S32) recon[(U8)sym[isym].value], even_odd[2]);
- isym++;
- zzpos += 1 + sym[isym].type;
- }
- // Reconstruct remaining coeffs
- // if (clean == YES) { // activate this for sleazy IDCT decoder
- while (isym < nsym) {
- //printf(" Calling update with zzpos = %dn", zzpos);
- update( &even_odd[ even_odd_index[zzpos]] [0],
- (S32) recon[(U8)sym[isym].value],
- (S32 (*)[8*8*8]) &idct_tab[0][zzpos][0]);
- isym++;
- zzpos += 1 + sym[isym].type;
- }
- // } // activate this for sleazy IDCT decoder
- // else {
- //
- // Sleazy reconstruction
- //
- // while (isym < nsym && zzpos < 10) {
- // //printf(" Calling update with zzpos = %dn", zzpos);
- // update( &even_odd[ even_odd_index[zzpos]] [0],
- // (S32) recon[(U8)sym[isym].value],
- // (U32 (*)[8*8*8]) &idct_tab[0][zzpos][0]);
- // isym++;
- // zzpos += 1 + sym[isym].type;
- // }
- // }
- #endif
- #ifdef LITTLE_ENDIAN
- // Final butterflies
- switch (idct_class)
- {
- // DC only case
- case DC_ONLY:
- {
- temp[0] = even_odd[0][0];
- temp[0] += (0x10001L << (FRACBITS-1));
- x[0][0] = temp[0];
- }
- break;
-
- // DC + 1 horizontal AC case
- case DC_AC_H:
- {
- temp[0] = even_odd[0][0];
-
- temp[0] += (0x10001L << (FRACBITS-1));
-
- x[0][0] = temp[0] + even_odd[1][0];
- x[0][2] = temp[0] - even_odd[1][0];
- x[0][1] = temp[0] + even_odd[1][1];
- x[0][3] = temp[0] - even_odd[1][1];
- }
- break;
- // DC + 1 vertical AC case
- case DC_AC_V:
- {
- for (i = 0; i < 4; i++)
- {
- temp[0] = even_odd[0][0] + even_odd[2][2*i];
- temp[1] = even_odd[0][0] - even_odd[2][2*i];
- temp[0] += (0x10001L << (FRACBITS-1));
- temp[1] += (0x10001L << (FRACBITS-1));
- x[i][0] = temp[0];
- x[i][1] = temp[0];
- x[i][2] = temp[0];
- x[i][3] = temp[0];
- x[7-i][0] = temp[1];
- x[7-i][1] = temp[1];
- x[7-i][2] = temp[1];
- x[7-i][3] = temp[1];
- }
- }
- break;
- // DC + 1 vertical AC + 1 horizontal AC case
- case DC_3:
- {
- for (i = 0; i < 4; i++)
- {
- temp[0] = even_odd[0][0] + even_odd[2][2*i];
- temp[2] = even_odd[0][0] - even_odd[2][2*i];
- temp[0] += (0x10001L << (FRACBITS-1));
- temp[2] += (0x10001L << (FRACBITS-1));
- x[i][0] = temp[0] + even_odd[1][2*i];
- x[i][2] = temp[0] - even_odd[1][2*i];
- x[7-i][0] = temp[2] + even_odd[1][2*i];
- x[7-i][2] = temp[2] - even_odd[1][2*i];
- x[i][1] = temp[0] + even_odd[1][2*i+1];
- x[i][3] = temp[0] - even_odd[1][2*i+1];
- x[7-i][1] = temp[2] + even_odd[1][2*i+1];
- x[7-i][3] = temp[2] - even_odd[1][2*i+1];
- }
- }
- break;
- case GENERAL:
- {
- for (i = 0; i < 4; i++)
- {
- // j=0
- temp[0] = even_odd[0][2*i] + even_odd[2][2*i];
- temp[2] = even_odd[0][2*i] - even_odd[2][2*i];
- temp[1] = even_odd[1][2*i] + even_odd[3][2*i];
- temp[3] = even_odd[1][2*i] - even_odd[3][2*i];
- temp[0] += (0x10001L << (FRACBITS-1)); /* Round */
- x[i][0] = temp[0] + temp[1];
- x[i][2] = temp[0] - temp[1];
- temp[2] += (0x10001L << (FRACBITS-1)); /* Round */
- x[7-i][0] = temp[2] + temp[3];
- x[7-i][2] = temp[2] - temp[3];
- // j=1
- temp[0] = even_odd[0][2*i+1] + even_odd[2][2*i+1];
- temp[2] = even_odd[0][2*i+1] - even_odd[2][2*i+1];
- temp[1] = even_odd[1][2*i+1] + even_odd[3][2*i+1];
- temp[3] = even_odd[1][2*i+1] - even_odd[3][2*i+1];
- temp[0] += (0x10001L << (FRACBITS-1)); /* Round */
- x[i][1] = temp[0] + temp[1];
- x[i][3] = temp[0] - temp[1];
- temp[2] += (0x10001L << (FRACBITS-1)); /* Round */
- x[7-i][1] = temp[2] + temp[3];
- x[7-i][3] = temp[2] - temp[3];
- }
- }
- break;
-
- default:
- break;
- }
- #else
- {
- for (i = 0; i < 4; i++)
- {
- // j=0
- temp[0] = even_odd[0][2*i] + even_odd[2][2*i];
- temp[2] = even_odd[0][2*i] - even_odd[2][2*i];
- temp[1] = even_odd[1][2*i] + even_odd[3][2*i];
- temp[3] = even_odd[1][2*i] - even_odd[3][2*i];
- temp[0] += (0x10001L << (FRACBITS-1)); /* Round */
- x[i][0] = temp[0] + temp[1];
- x[i][2] = temp[0] - temp[1];
- temp[2] += (0x10001L << (FRACBITS-1)); /* Round */
- x[7-i][0] = temp[2] + temp[3];
- x[7-i][2] = temp[2] - temp[3];
- // j=1
- temp[0] = even_odd[0][2*i+1] + even_odd[2][2*i+1];
- temp[2] = even_odd[0][2*i+1] - even_odd[2][2*i+1];
- temp[1] = even_odd[1][2*i+1] + even_odd[3][2*i+1];
- temp[3] = even_odd[1][2*i+1] - even_odd[3][2*i+1];
- temp[0] += (0x10001L << (FRACBITS-1)); /* Round */
- x[i][1] = temp[0] + temp[1];
- x[i][3] = temp[0] - temp[1];
- temp[2] += (0x10001L << (FRACBITS-1)); /* Round */
- x[7-i][1] = temp[2] + temp[3];
- x[7-i][3] = temp[2] - temp[3];
- }
- }
- #endif
- return;
- }
- #ifdef DO_H263_PLUS
- // recon_advanced_intra_dc - Reconstruct DC coeff in INTRA block
- static void recon_advanced_intra_dc( U8 index, S32 vec[8])
- {
- int j, temp;
- double bfunc;
- bfunc = SCALE_FACTOR * dctfunc(0,0) * dctfunc(0,0);
- temp = 8 * index;
- temp = dct_tab_entry( temp * bfunc, temp * bfunc);
- for (j = 0; j < 8; j++) {
- vec[j] = temp;
- }
- return;
- }
- //
- // Quick implementation of intra prediction
- //
- extern void idct2_advanced_intra( SYMBOL sym[], int nsym, S32 x[8][4], S16 recon[],
- U8 rDCpred, S8 rACpred[8], U8 rDCstore[1], S8 rACstore[8],
- U8 cDCpred, S8 cACpred[8], U8 cDCstore[1], S8 cACstore[8],
- int predtype, int fixedDC, int leftBoundary, int upperBoundary)
- {
- int i, pos, isym;
- S32 even_odd[4][8]; /* Accumulate even/even, even/odd, odd/even, odd/odd */
- S32 temp[4]; /* Used in final butterfly computations */
- int skip;
- S8 value;
- int *scan_to_zz;
- int *inv_scan_order;
- memset(even_odd, 0, 128);
-
- // in advanced intra mode, the AC and DC are coded in the same way, so it
- // is possible for the DC residual to be zero and the first symbol to
- // have a non-trivial zero run
- if(nsym) {
- if(sym[0].type) {
- value = 0;
- isym = 0;
- skip = sym[0].type - 1; // we'll take care of DC outside the loop
- } else {
- value = sym[0].value;
- isym = 1;
- skip = sym[isym].type;
- }
- } else {
- value = 0;
- isym = 0;
- skip = 0;
- }
- // Reconstruct DC coeff
- switch(predtype) {
- case ADV_INTRA_PRED_DC_ONLY:
- scan_to_zz = &zigzag_to_zigzag[0];
- inv_scan_order = &InvZZ[0];
- rDCstore[0] = cDCstore[0] = (U8)(value + ((
- (upperBoundary ? cDCpred : rDCpred) + // use row predictor unless on upper boundary
- (leftBoundary ? rDCpred : cDCpred) + // use column predictor unless on left boundary
- 1)>>1) );
- break;
- case ADV_INTRA_PRED_COLUMN:
- scan_to_zz = &alt_ver_to_zigzag[0];
- inv_scan_order = &inv_alt_ver_scan_no_reorder[0];
- rDCstore[0] = cDCstore[0] = (U8)(value + cDCpred);
- break;
- case ADV_INTRA_PRED_ROW:
- scan_to_zz = &alt_hor_to_zigzag[0];
- inv_scan_order = &inv_alt_hor_scan_no_reorder[0];
- rDCstore[0] = cDCstore[0] = (U8)(value + rDCpred);
- break;
- case ADV_INTRA_PRED_NONE:
- scan_to_zz = &zigzag_to_zigzag[0];
- inv_scan_order = &InvZZ[0];
- rDCstore[0] = cDCstore[0] = (U8)(value);
- break;
- }
- // We deviate from the H.263+ spec and the standard H.263 8-bit INTRA_DC quantizer
- // for small quantizer values so that we avoid problems with the dynamic range
- // getting too small
- if(fixedDC) {
- recon_advanced_intra_dc( rDCstore[0], even_odd[0]);
- } else {
- if(rDCstore[0]) update( &even_odd[even_odd_index[0]][0],
- (S32) recon[rDCstore[0]],
- (S32 (*)[8*8*8]) &idct_tab[0][0][0]);
- }
- for(pos=1; pos<64; pos++)
- {
- // compute the quantized AC coefficient
- if(skip || isym>=nsym) {
- value = 0;
- skip--;
- } else {
- value = sym[isym++].value;
- skip = sym[isym].type;
- }
- // row predict and store reconstructed
- if(inv_scan_order[pos] < 8) {
- if(predtype == ADV_INTRA_PRED_ROW)
- value += rACpred[inv_scan_order[pos]];
- rACstore[inv_scan_order[pos]] = value;
- }
- // col predict and store reconstructed
- if((inv_scan_order[pos] & 7) == 0) {
- if(predtype == ADV_INTRA_PRED_COLUMN)
- value += cACpred[inv_scan_order[pos]>>3];
- cACstore[inv_scan_order[pos]>>3] = value;
- }
-
- // note that both even_odd_index and idct_tab assume that we are indexing
- // by zigzag order; hence the conversion of the variable pos
- if(value) update( &even_odd[ even_odd_index[scan_to_zz[pos]]] [0],
- (S32) recon[ (U8)value],
- (S32 (*)[8*8*8]) &idct_tab[0][scan_to_zz[pos]][0]);
- }
- // Do the final butterfly
- for (i = 0; i < 4; i++)
- {
- // j=0
- temp[0] = even_odd[0][2*i] + even_odd[2][2*i];
- temp[2] = even_odd[0][2*i] - even_odd[2][2*i];
- temp[1] = even_odd[1][2*i] + even_odd[3][2*i];
- temp[3] = even_odd[1][2*i] - even_odd[3][2*i];
- temp[0] += (0x10001L << (FRACBITS-1)); /* Round */
- x[i][0] = temp[0] + temp[1];
- x[i][2] = temp[0] - temp[1];
- temp[2] += (0x10001L << (FRACBITS-1)); /* Round */
- x[7-i][0] = temp[2] + temp[3];
- x[7-i][2] = temp[2] - temp[3];
- // j=1
- temp[0] = even_odd[0][2*i+1] + even_odd[2][2*i+1];
- temp[2] = even_odd[0][2*i+1] - even_odd[2][2*i+1];
- temp[1] = even_odd[1][2*i+1] + even_odd[3][2*i+1];
- temp[3] = even_odd[1][2*i+1] - even_odd[3][2*i+1];
- temp[0] += (0x10001L << (FRACBITS-1)); /* Round */
- x[i][1] = temp[0] + temp[1];
- x[i][3] = temp[0] - temp[1];
- temp[2] += (0x10001L << (FRACBITS-1)); /* Round */
- x[7-i][1] = temp[2] + temp[3];
- x[7-i][3] = temp[2] - temp[3];
- }
- return;
- }
- // Idct2 - Reconstruct DCT coeffs, perform IDCT, and clip to allowed pixel range */
- // Requires nsym > 0
- extern void Idct2AdvancedIntra( SYMBOL sym[], int nsym, PIXEL x[], int xdim, S16 recon[],
- U8 rDCpred, S8 rACpred[8], U8 rDCstore[1], S8 rACstore[8],
- U8 cDCpred, S8 cACpred[8], U8 cDCstore[1], S8 cACstore[8],
- int predtype, int fixedDC, int leftBoundary, int upperBoundary)
- {
- union {
- S16 bshort[8][8];
- S32 blong[8][4];
- } block; /* Output from IDCT */
- idct2_advanced_intra( sym, nsym, block.blong, recon,
- rDCpred, rACpred, rDCstore, rACstore,
- cDCpred, cACpred, cDCstore, cACstore,
- predtype, fixedDC,leftBoundary,upperBoundary);
- idct2_clip(x, xdim, block.blong, GENERAL);
- return;
- }
- #endif
- // recon_intra_dc - Reconstruct DC coeff in INTRA block
- static void recon_intra_dc( U8 index, S32 vec[8])
- {
- int j, temp;
-
- temp = intra_dc_tab [index];
- for (j = 0; j < 8; j++) {
- vec[j] = temp;
- }
- return;
- }
- // recon_dc - Reconstruct DC coeff
- static void recon_dc( S32 y, S32 vec[8])
- {
- int j, temp;
- char msg[120]; /* Flawfinder: ignore */
-
- if (y > 0) {
- temp = dc_tab[ y - 1 ];
- } else if (y < 0) {
- temp = -dc_tab[ -y - 1 ];
- } else {
- //sprintf( msg, "ERROR: recon_dc called with arg=0");
- //H261ErrMsg( msg );
- }
- for (j = 0; j < 8; j++) {
- vec[j] = temp;
- }
- return;
- }
- // recon_hor_ac - Reconstruct first hor. AC coeff
- static void recon_hor_ac( S32 y, S32 vec[8])
- {
- int j, temp0, temp1;
- char msg[120]; /* Flawfinder: ignore */
-
- if (y > 0) {
- temp0 = hor_ac_tab[ y - 1 ] [0];
- temp1 = hor_ac_tab[ y - 1 ] [1];
- } else if (y < 0) {
- temp0 = -hor_ac_tab[ -y - 1 ] [0];
- temp1 = -hor_ac_tab[ -y - 1 ] [1];
- } else {
- //sprintf( msg, "ERROR: recon_hor_ac called with arg=0");
- //H261ErrMsg( msg );
- }
- for (j = 0; j < 8; j += 2) {
- vec[j] = temp0;
- vec[j+1] = temp1;
- }
- return;
- }
- // recon_vert_ac - Reconstruct first vert. AC coeff
- static void recon_vert_ac( S32 y, S32 vec[8])
- {
- int j, temp, index;
- char msg[120]; /* Flawfinder: ignore */
-
- if (y > 0) {
- for (j = 0; j < 4; j++) {
- vec[2*j] = vert_ac_tab[ y - 1 ] [j];
- vec[2*j+1] = vert_ac_tab[ y - 1 ] [j];
- }
- } else if (y < 0) {
- index = -y - 1;
- for (j = 0; j < 4; j++) {
- temp = -vert_ac_tab[ index ] [j];
- vec[2*j] = temp;
- vec[2*j+1] = temp;
- }
- } else {
- //sprintf( msg, "ERROR: recon_vert_ac called with arg=0");
- //H261ErrMsg( msg );
- }
- return;
- }
- static void update( S32 x[8], S32 index, S32 table[][8*8*8])
- {
- int tab1_index, tab2_index;
- char msg[120]; /* Flawfinder: ignore */
-
- //printf( "Entered updaten" );
- if (index > 0) {
- index -= 1;
- tab1_index = index & ((0x1L << IDCT_NTAB1_BITS) - 1); /* index % SIZE */
- tab2_index = index >> IDCT_NTAB1_BITS;
- //printf( "update plus: tab2 = %d tab1 = %dn", tab2_index, tab1_index);
- //printf( "x0 = %d table = %dn", x[0], table[tab1_index][0]);
- x[0] += table [tab1_index][0];
- x[1] += table [tab1_index][1];
- x[2] += table [tab1_index][2];
- x[3] += table [tab1_index][3];
- x[4] += table [tab1_index][4];
- x[5] += table [tab1_index][5];
- x[6] += table [tab1_index][6];
- x[7] += table [tab1_index][7];
- if (tab2_index != 0) {
- //printf( "x0 = %d table = %dn", x[0],
- // table[tab2_index - 1 + IDCT_NTAB1_SIZE][0]);
- x[0] += table [tab2_index - 1 + IDCT_NTAB1_SIZE][0];
- x[1] += table [tab2_index - 1 + IDCT_NTAB1_SIZE][1];
- x[2] += table [tab2_index - 1 + IDCT_NTAB1_SIZE][2];
- x[3] += table [tab2_index - 1 + IDCT_NTAB1_SIZE][3];
- x[4] += table [tab2_index - 1 + IDCT_NTAB1_SIZE][4];
- x[5] += table [tab2_index - 1 + IDCT_NTAB1_SIZE][5];
- x[6] += table [tab2_index - 1 + IDCT_NTAB1_SIZE][6];
- x[7] += table [tab2_index - 1 + IDCT_NTAB1_SIZE][7];
- //printf( "x0 = %dn", x[0]);
- }
- } else if (index < 0) {
- index = -index - 1;
- tab1_index = index & ((0x1L << IDCT_NTAB1_BITS) - 1); /* index % SIZE */
- tab2_index = index >> IDCT_NTAB1_BITS;
- //printf( "update minus: tab2 = %d tab1 = %dn", tab2_index, tab1_index);
- x[0] -= table [tab1_index][0];
- x[1] -= table [tab1_index][1];
- x[2] -= table [tab1_index][2];
- x[3] -= table [tab1_index][3];
- x[4] -= table [tab1_index][4];
- x[5] -= table [tab1_index][5];
- x[6] -= table [tab1_index][6];
- x[7] -= table [tab1_index][7];
- if (tab2_index != 0) {
- x[0] -= table [tab2_index - 1 + IDCT_NTAB1_SIZE][0];
- x[1] -= table [tab2_index - 1 + IDCT_NTAB1_SIZE][1];
- x[2] -= table [tab2_index - 1 + IDCT_NTAB1_SIZE][2];
- x[3] -= table [tab2_index - 1 + IDCT_NTAB1_SIZE][3];
- x[4] -= table [tab2_index - 1 + IDCT_NTAB1_SIZE][4];
- x[5] -= table [tab2_index - 1 + IDCT_NTAB1_SIZE][5];
- x[6] -= table [tab2_index - 1 + IDCT_NTAB1_SIZE][6];
- x[7] -= table [tab2_index - 1 + IDCT_NTAB1_SIZE][7];
- }
- } else if (index == 0) {
- //sprintf( msg, "ERROR: update called with arg=0");
- //H261ErrMsg( msg );
- }
- return;
- }
- static double dctfunc (int freq, int index)
- {
- if (freq == 0) {
- return (1./sqrt(8.));
- }
- return ( cos(PI*freq*(index+0.5)/8.) / 2.);
- }
- // Turn off "warning C4244: '=' : conversion from 'double ' to 'long ',
- // possible loss of data" for MSVC 4.0
- #pragma message("Turning off ConvFromDblToLong Warning")
- #pragma warning(disable:4244)
- // Round x and y; put x in lower halfword, y in upper halfword (if little-endian)
- static S32 dct_tab_entry (double x, double y)
- {
- S32 ix, iy;
- ix = x * 65536.; /* Mult by 2**16 */
- iy = y * 65536.;
- #ifdef LITTLE_ENDIAN /* x in lower halfword, y in upper */
- return (combine (iy, ix));
- #elif defined BIG_ENDIAN /* x in upper halfword, y in lower */
- return (combine (ix, iy));
- #else
- # error
- #endif
- }
- // Turn back on "warning C4244: '=' : conversion from 'double ' to 'long ',
- // possible loss of data" for MSVC 4.0
- #pragma warning(default:4244)
- // iy in upper halfword, ix>>16 in lower
- static S32 combine (S32 iy, S32 ix)
- {
- S32 low_tab, high_tab;
- // Note: this should not be a big-endian problem because calls to this function
- // exchange the order of ix and iy as needed. (Though wouldn't it have been
- // simpler to make the change here?) tkent
- low_tab = (ix + 0x8000L) >> 16 & 0x0000ffffL;
- high_tab = iy + 0x8000L - low_tab;
- high_tab &= 0xffff0000L;
- return (low_tab | high_tab);
- }