1*7dd7cddfSDavid du Colombier /* 2*7dd7cddfSDavid du Colombier * jdct.h 3*7dd7cddfSDavid du Colombier * 4*7dd7cddfSDavid du Colombier * Copyright (C) 1994-1996, Thomas G. Lane. 5*7dd7cddfSDavid du Colombier * This file is part of the Independent JPEG Group's software. 6*7dd7cddfSDavid du Colombier * For conditions of distribution and use, see the accompanying README file. 7*7dd7cddfSDavid du Colombier * 8*7dd7cddfSDavid du Colombier * This include file contains common declarations for the forward and 9*7dd7cddfSDavid du Colombier * inverse DCT modules. These declarations are private to the DCT managers 10*7dd7cddfSDavid du Colombier * (jcdctmgr.c, jddctmgr.c) and the individual DCT algorithms. 11*7dd7cddfSDavid du Colombier * The individual DCT algorithms are kept in separate files to ease 12*7dd7cddfSDavid du Colombier * machine-dependent tuning (e.g., assembly coding). 13*7dd7cddfSDavid du Colombier */ 14*7dd7cddfSDavid du Colombier 15*7dd7cddfSDavid du Colombier 16*7dd7cddfSDavid du Colombier /* 17*7dd7cddfSDavid du Colombier * A forward DCT routine is given a pointer to a work area of type DCTELEM[]; 18*7dd7cddfSDavid du Colombier * the DCT is to be performed in-place in that buffer. Type DCTELEM is int 19*7dd7cddfSDavid du Colombier * for 8-bit samples, INT32 for 12-bit samples. (NOTE: Floating-point DCT 20*7dd7cddfSDavid du Colombier * implementations use an array of type FAST_FLOAT, instead.) 21*7dd7cddfSDavid du Colombier * The DCT inputs are expected to be signed (range +-CENTERJSAMPLE). 22*7dd7cddfSDavid du Colombier * The DCT outputs are returned scaled up by a factor of 8; they therefore 23*7dd7cddfSDavid du Colombier * have a range of +-8K for 8-bit data, +-128K for 12-bit data. This 24*7dd7cddfSDavid du Colombier * convention improves accuracy in integer implementations and saves some 25*7dd7cddfSDavid du Colombier * work in floating-point ones. 26*7dd7cddfSDavid du Colombier * Quantization of the output coefficients is done by jcdctmgr.c. 27*7dd7cddfSDavid du Colombier */ 28*7dd7cddfSDavid du Colombier 29*7dd7cddfSDavid du Colombier #if BITS_IN_JSAMPLE == 8 30*7dd7cddfSDavid du Colombier typedef int DCTELEM; /* 16 or 32 bits is fine */ 31*7dd7cddfSDavid du Colombier #else 32*7dd7cddfSDavid du Colombier typedef INT32 DCTELEM; /* must have 32 bits */ 33*7dd7cddfSDavid du Colombier #endif 34*7dd7cddfSDavid du Colombier 35*7dd7cddfSDavid du Colombier typedef JMETHOD(void, forward_DCT_method_ptr, (DCTELEM * data)); 36*7dd7cddfSDavid du Colombier typedef JMETHOD(void, float_DCT_method_ptr, (FAST_FLOAT * data)); 37*7dd7cddfSDavid du Colombier 38*7dd7cddfSDavid du Colombier 39*7dd7cddfSDavid du Colombier /* 40*7dd7cddfSDavid du Colombier * An inverse DCT routine is given a pointer to the input JBLOCK and a pointer 41*7dd7cddfSDavid du Colombier * to an output sample array. The routine must dequantize the input data as 42*7dd7cddfSDavid du Colombier * well as perform the IDCT; for dequantization, it uses the multiplier table 43*7dd7cddfSDavid du Colombier * pointed to by compptr->dct_table. The output data is to be placed into the 44*7dd7cddfSDavid du Colombier * sample array starting at a specified column. (Any row offset needed will 45*7dd7cddfSDavid du Colombier * be applied to the array pointer before it is passed to the IDCT code.) 46*7dd7cddfSDavid du Colombier * Note that the number of samples emitted by the IDCT routine is 47*7dd7cddfSDavid du Colombier * DCT_scaled_size * DCT_scaled_size. 48*7dd7cddfSDavid du Colombier */ 49*7dd7cddfSDavid du Colombier 50*7dd7cddfSDavid du Colombier /* typedef inverse_DCT_method_ptr is declared in jpegint.h */ 51*7dd7cddfSDavid du Colombier 52*7dd7cddfSDavid du Colombier /* 53*7dd7cddfSDavid du Colombier * Each IDCT routine has its own ideas about the best dct_table element type. 54*7dd7cddfSDavid du Colombier */ 55*7dd7cddfSDavid du Colombier 56*7dd7cddfSDavid du Colombier typedef MULTIPLIER ISLOW_MULT_TYPE; /* short or int, whichever is faster */ 57*7dd7cddfSDavid du Colombier #if BITS_IN_JSAMPLE == 8 58*7dd7cddfSDavid du Colombier typedef MULTIPLIER IFAST_MULT_TYPE; /* 16 bits is OK, use short if faster */ 59*7dd7cddfSDavid du Colombier #define IFAST_SCALE_BITS 2 /* fractional bits in scale factors */ 60*7dd7cddfSDavid du Colombier #else 61*7dd7cddfSDavid du Colombier typedef INT32 IFAST_MULT_TYPE; /* need 32 bits for scaled quantizers */ 62*7dd7cddfSDavid du Colombier #define IFAST_SCALE_BITS 13 /* fractional bits in scale factors */ 63*7dd7cddfSDavid du Colombier #endif 64*7dd7cddfSDavid du Colombier typedef FAST_FLOAT FLOAT_MULT_TYPE; /* preferred floating type */ 65*7dd7cddfSDavid du Colombier 66*7dd7cddfSDavid du Colombier 67*7dd7cddfSDavid du Colombier /* 68*7dd7cddfSDavid du Colombier * Each IDCT routine is responsible for range-limiting its results and 69*7dd7cddfSDavid du Colombier * converting them to unsigned form (0..MAXJSAMPLE). The raw outputs could 70*7dd7cddfSDavid du Colombier * be quite far out of range if the input data is corrupt, so a bulletproof 71*7dd7cddfSDavid du Colombier * range-limiting step is required. We use a mask-and-table-lookup method 72*7dd7cddfSDavid du Colombier * to do the combined operations quickly. See the comments with 73*7dd7cddfSDavid du Colombier * prepare_range_limit_table (in jdmaster.c) for more info. 74*7dd7cddfSDavid du Colombier */ 75*7dd7cddfSDavid du Colombier 76*7dd7cddfSDavid du Colombier #define IDCT_range_limit(cinfo) ((cinfo)->sample_range_limit + CENTERJSAMPLE) 77*7dd7cddfSDavid du Colombier 78*7dd7cddfSDavid du Colombier #define RANGE_MASK (MAXJSAMPLE * 4 + 3) /* 2 bits wider than legal samples */ 79*7dd7cddfSDavid du Colombier 80*7dd7cddfSDavid du Colombier 81*7dd7cddfSDavid du Colombier /* Short forms of external names for systems with brain-damaged linkers. */ 82*7dd7cddfSDavid du Colombier 83*7dd7cddfSDavid du Colombier #ifdef NEED_SHORT_EXTERNAL_NAMES 84*7dd7cddfSDavid du Colombier #define jpeg_fdct_islow jFDislow 85*7dd7cddfSDavid du Colombier #define jpeg_fdct_ifast jFDifast 86*7dd7cddfSDavid du Colombier #define jpeg_fdct_float jFDfloat 87*7dd7cddfSDavid du Colombier #define jpeg_idct_islow jRDislow 88*7dd7cddfSDavid du Colombier #define jpeg_idct_ifast jRDifast 89*7dd7cddfSDavid du Colombier #define jpeg_idct_float jRDfloat 90*7dd7cddfSDavid du Colombier #define jpeg_idct_4x4 jRD4x4 91*7dd7cddfSDavid du Colombier #define jpeg_idct_2x2 jRD2x2 92*7dd7cddfSDavid du Colombier #define jpeg_idct_1x1 jRD1x1 93*7dd7cddfSDavid du Colombier #endif /* NEED_SHORT_EXTERNAL_NAMES */ 94*7dd7cddfSDavid du Colombier 95*7dd7cddfSDavid du Colombier /* Extern declarations for the forward and inverse DCT routines. */ 96*7dd7cddfSDavid du Colombier 97*7dd7cddfSDavid du Colombier EXTERN(void) jpeg_fdct_islow JPP((DCTELEM * data)); 98*7dd7cddfSDavid du Colombier EXTERN(void) jpeg_fdct_ifast JPP((DCTELEM * data)); 99*7dd7cddfSDavid du Colombier EXTERN(void) jpeg_fdct_float JPP((FAST_FLOAT * data)); 100*7dd7cddfSDavid du Colombier 101*7dd7cddfSDavid du Colombier EXTERN(void) jpeg_idct_islow 102*7dd7cddfSDavid du Colombier JPP((j_decompress_ptr cinfo, jpeg_component_info * compptr, 103*7dd7cddfSDavid du Colombier JCOEFPTR coef_block, JSAMPARRAY output_buf, JDIMENSION output_col)); 104*7dd7cddfSDavid du Colombier EXTERN(void) jpeg_idct_ifast 105*7dd7cddfSDavid du Colombier JPP((j_decompress_ptr cinfo, jpeg_component_info * compptr, 106*7dd7cddfSDavid du Colombier JCOEFPTR coef_block, JSAMPARRAY output_buf, JDIMENSION output_col)); 107*7dd7cddfSDavid du Colombier EXTERN(void) jpeg_idct_float 108*7dd7cddfSDavid du Colombier JPP((j_decompress_ptr cinfo, jpeg_component_info * compptr, 109*7dd7cddfSDavid du Colombier JCOEFPTR coef_block, JSAMPARRAY output_buf, JDIMENSION output_col)); 110*7dd7cddfSDavid du Colombier EXTERN(void) jpeg_idct_4x4 111*7dd7cddfSDavid du Colombier JPP((j_decompress_ptr cinfo, jpeg_component_info * compptr, 112*7dd7cddfSDavid du Colombier JCOEFPTR coef_block, JSAMPARRAY output_buf, JDIMENSION output_col)); 113*7dd7cddfSDavid du Colombier EXTERN(void) jpeg_idct_2x2 114*7dd7cddfSDavid du Colombier JPP((j_decompress_ptr cinfo, jpeg_component_info * compptr, 115*7dd7cddfSDavid du Colombier JCOEFPTR coef_block, JSAMPARRAY output_buf, JDIMENSION output_col)); 116*7dd7cddfSDavid du Colombier EXTERN(void) jpeg_idct_1x1 117*7dd7cddfSDavid du Colombier JPP((j_decompress_ptr cinfo, jpeg_component_info * compptr, 118*7dd7cddfSDavid du Colombier JCOEFPTR coef_block, JSAMPARRAY output_buf, JDIMENSION output_col)); 119*7dd7cddfSDavid du Colombier 120*7dd7cddfSDavid du Colombier 121*7dd7cddfSDavid du Colombier /* 122*7dd7cddfSDavid du Colombier * Macros for handling fixed-point arithmetic; these are used by many 123*7dd7cddfSDavid du Colombier * but not all of the DCT/IDCT modules. 124*7dd7cddfSDavid du Colombier * 125*7dd7cddfSDavid du Colombier * All values are expected to be of type INT32. 126*7dd7cddfSDavid du Colombier * Fractional constants are scaled left by CONST_BITS bits. 127*7dd7cddfSDavid du Colombier * CONST_BITS is defined within each module using these macros, 128*7dd7cddfSDavid du Colombier * and may differ from one module to the next. 129*7dd7cddfSDavid du Colombier */ 130*7dd7cddfSDavid du Colombier 131*7dd7cddfSDavid du Colombier #define ONE ((INT32) 1) 132*7dd7cddfSDavid du Colombier #define CONST_SCALE (ONE << CONST_BITS) 133*7dd7cddfSDavid du Colombier 134*7dd7cddfSDavid du Colombier /* Convert a positive real constant to an integer scaled by CONST_SCALE. 135*7dd7cddfSDavid du Colombier * Caution: some C compilers fail to reduce "FIX(constant)" at compile time, 136*7dd7cddfSDavid du Colombier * thus causing a lot of useless floating-point operations at run time. 137*7dd7cddfSDavid du Colombier */ 138*7dd7cddfSDavid du Colombier 139*7dd7cddfSDavid du Colombier #define FIX(x) ((INT32) ((x) * CONST_SCALE + 0.5)) 140*7dd7cddfSDavid du Colombier 141*7dd7cddfSDavid du Colombier /* Descale and correctly round an INT32 value that's scaled by N bits. 142*7dd7cddfSDavid du Colombier * We assume RIGHT_SHIFT rounds towards minus infinity, so adding 143*7dd7cddfSDavid du Colombier * the fudge factor is correct for either sign of X. 144*7dd7cddfSDavid du Colombier */ 145*7dd7cddfSDavid du Colombier 146*7dd7cddfSDavid du Colombier #define DESCALE(x,n) RIGHT_SHIFT((x) + (ONE << ((n)-1)), n) 147*7dd7cddfSDavid du Colombier 148*7dd7cddfSDavid du Colombier /* Multiply an INT32 variable by an INT32 constant to yield an INT32 result. 149*7dd7cddfSDavid du Colombier * This macro is used only when the two inputs will actually be no more than 150*7dd7cddfSDavid du Colombier * 16 bits wide, so that a 16x16->32 bit multiply can be used instead of a 151*7dd7cddfSDavid du Colombier * full 32x32 multiply. This provides a useful speedup on many machines. 152*7dd7cddfSDavid du Colombier * Unfortunately there is no way to specify a 16x16->32 multiply portably 153*7dd7cddfSDavid du Colombier * in C, but some C compilers will do the right thing if you provide the 154*7dd7cddfSDavid du Colombier * correct combination of casts. 155*7dd7cddfSDavid du Colombier */ 156*7dd7cddfSDavid du Colombier 157*7dd7cddfSDavid du Colombier #ifdef SHORTxSHORT_32 /* may work if 'int' is 32 bits */ 158*7dd7cddfSDavid du Colombier #define MULTIPLY16C16(var,const) (((INT16) (var)) * ((INT16) (const))) 159*7dd7cddfSDavid du Colombier #endif 160*7dd7cddfSDavid du Colombier #ifdef SHORTxLCONST_32 /* known to work with Microsoft C 6.0 */ 161*7dd7cddfSDavid du Colombier #define MULTIPLY16C16(var,const) (((INT16) (var)) * ((INT32) (const))) 162*7dd7cddfSDavid du Colombier #endif 163*7dd7cddfSDavid du Colombier 164*7dd7cddfSDavid du Colombier #ifndef MULTIPLY16C16 /* default definition */ 165*7dd7cddfSDavid du Colombier #define MULTIPLY16C16(var,const) ((var) * (const)) 166*7dd7cddfSDavid du Colombier #endif 167*7dd7cddfSDavid du Colombier 168*7dd7cddfSDavid du Colombier /* Same except both inputs are variables. */ 169*7dd7cddfSDavid du Colombier 170*7dd7cddfSDavid du Colombier #ifdef SHORTxSHORT_32 /* may work if 'int' is 32 bits */ 171*7dd7cddfSDavid du Colombier #define MULTIPLY16V16(var1,var2) (((INT16) (var1)) * ((INT16) (var2))) 172*7dd7cddfSDavid du Colombier #endif 173*7dd7cddfSDavid du Colombier 174*7dd7cddfSDavid du Colombier #ifndef MULTIPLY16V16 /* default definition */ 175*7dd7cddfSDavid du Colombier #define MULTIPLY16V16(var1,var2) ((var1) * (var2)) 176*7dd7cddfSDavid du Colombier #endif 177