package org.jcodec.common.dct;
import java.nio.ShortBuffer;
/**
* This class is part of JCodec ( www.jcodec.org )
* This software is distributed under FreeBSD License
*
* @author Alex Zhukov
*
*/
public class FfmpegIntDct {
private static final int DCTSIZE = 8;
private static final int DCTSIZE_6 = DCTSIZE * 6;
private static final int DCTSIZE_5 = DCTSIZE * 5;
private static final int DCTSIZE_4 = DCTSIZE * 4;
private static final int DCTSIZE_3 = DCTSIZE * 3;
private static final int DCTSIZE_2 = DCTSIZE * 2;
private static final int DCTSIZE_1 = DCTSIZE * 1;
private static final int DCTSIZE_7 = DCTSIZE * 7;
private static final int DCTSIZE_0 = DCTSIZE * 0;
private static final int PASS1_BITS = 2;
private static final int CONST_BITS = 13;
private static final int D1 = CONST_BITS - PASS1_BITS;
private static final int D2 = CONST_BITS + PASS1_BITS + 3;
private static final int ONEHALF_11 = (1 << (D1 - 1));
private static final int ONEHALF_18 = (1 << (D2 - 1));
public short[] decode(short[] orig) {
ShortBuffer data = ShortBuffer.wrap(orig);
pass1(data);
pass2(data);
return orig;
}
private static ShortBuffer advance(ShortBuffer dataptr, int size) {
dataptr.position(dataptr.position() + size);
return dataptr.slice();
}
/*
* Unlike our decoder where we approximate the FIXes, we need to use exact
* ones here or successive P-frames will drift too much with Reference frame
* coding
*/
private final static short FIX_0_211164243 = 1730;
private final static short FIX_0_275899380 = 2260;
private final static short FIX_0_298631336 = 2446;
private final static short FIX_0_390180644 = 3196;
private final static short FIX_0_509795579 = 4176;
private final static short FIX_0_541196100 = 4433;
private final static short FIX_0_601344887 = 4926;
private final static short FIX_0_765366865 = 6270;
private final static short FIX_0_785694958 = 6436;
private final static short FIX_0_899976223 = 7373;
private final static short FIX_1_061594337 = 8697;
private final static short FIX_1_111140466 = 9102;
private final static short FIX_1_175875602 = 9633;
private final static short FIX_1_306562965 = 10703;
private final static short FIX_1_387039845 = 11363;
private final static short FIX_1_451774981 = 11893;
private final static short FIX_1_501321110 = 12299;
private final static short FIX_1_662939225 = 13623;
private final static short FIX_1_847759065 = 15137;
private final static short FIX_1_961570560 = 16069;
private final static short FIX_2_053119869 = 16819;
private final static short FIX_2_172734803 = 17799;
private final static short FIX_2_562915447 = 20995;
private final static short FIX_3_072711026 = 25172;
/* Pass 1: process rows. */
/* Note results are scaled up by sqrt(8) compared to a true IDCT; */
/* furthermore, we scale the results by 2PASS1_BITS. */
private final static void pass1(ShortBuffer data) {
int z1;
int tmp2;
int tmp3;
int tmp0;
int tmp1;
int tmp10;
int tmp13;
int tmp11;
int tmp12;
int z2;
int z3;
int z4;
int z5;
ShortBuffer dataptr = data.duplicate();
for (int rowctr = DCTSIZE - 1; rowctr >= 0; rowctr--) {
/*
* Due to quantization, we will usually find that many of the input
* coefficients are zero, especially the AC terms. We can exploit
* this by short-circuiting the IDCT calculation for any row in
* which all the AC terms are zero. In that case each output is
* equal to the DC coefficient (with scale factor as needed). With
* typical images and quantization tables, half or more of the row
* DCT calculations can be simplified this way.
*/
// register int *idataptr = (int*)dataptr;
/*
* WARNING: we do the same permutation as MMX idct to simplify the
* video core
*/
int d0 = dataptr.get(0);
int d2 = dataptr.get(1);
int d4 = dataptr.get(2);
int d6 = dataptr.get(3);
int d1 = dataptr.get(4);
int d3 = dataptr.get(5);
int d5 = dataptr.get(6);
int d7 = dataptr.get(7);
if ((d1 | d2 | d3 | d4 | d5 | d6 | d7) == 0) {
/* AC terms all zero */
if (d0 != 0) {
/* Compute a 32 bit value to assign. */
int dcval = (int) (d0 << PASS1_BITS);
for (int i = 0; i < 8; i++) {
dataptr.put(i, (short) dcval);
}
}
/*
* advance pointer to next row
*/
dataptr = advance(dataptr, DCTSIZE);
continue;
}
/* Even part: reverse the even part of the forward DCT. */
/* The rotator is sqrt(2)c(-6). */
if (d6 != 0) {
if (d2 != 0) {
/* d0 != 0, d2 != 0, d4 != 0, d6 != 0 */
z1 = MULTIPLY(d2 + d6, FIX_0_541196100);
tmp2 = z1 + MULTIPLY(-d6, FIX_1_847759065);
tmp3 = z1 + MULTIPLY(d2, FIX_0_765366865);
tmp0 = (d0 + d4) << CONST_BITS;
tmp1 = (d0 - d4) << CONST_BITS;
tmp10 = tmp0 + tmp3;
tmp13 = tmp0 - tmp3;
tmp11 = tmp1 + tmp2;
tmp12 = tmp1 - tmp2;
} else {
/* d0 != 0, d2 == 0, d4 != 0, d6 != 0 */
tmp2 = MULTIPLY(-d6, FIX_1_306562965);
tmp3 = MULTIPLY(d6, FIX_0_541196100);
tmp0 = (d0 + d4) << CONST_BITS;
tmp1 = (d0 - d4) << CONST_BITS;
tmp10 = tmp0 + tmp3;
tmp13 = tmp0 - tmp3;
tmp11 = tmp1 + tmp2;
tmp12 = tmp1 - tmp2;
}
} else {
if (d2 != 0) {
/* d0 != 0, d2 != 0, d4 != 0, d6 == 0 */
tmp2 = MULTIPLY(d2, FIX_0_541196100);
tmp3 = MULTIPLY(d2, FIX_1_306562965);
tmp0 = (d0 + d4) << CONST_BITS;
tmp1 = (d0 - d4) << CONST_BITS;
tmp10 = tmp0 + tmp3;
tmp13 = tmp0 - tmp3;
tmp11 = tmp1 + tmp2;
tmp12 = tmp1 - tmp2;
} else {
/* d0 != 0, d2 == 0, d4 != 0, d6 == 0 */
tmp10 = tmp13 = (d0 + d4) << CONST_BITS;
tmp11 = tmp12 = (d0 - d4) << CONST_BITS;
}
}
/*
* Odd part per figure 8; the matrix is unitary and hence its
* transpose is its inverse. i0..i3 are y7,y5,y3,y1 respectively.
*/
if (d7 != 0) {
if (d5 != 0) {
if (d3 != 0) {
if (d1 != 0) {
/* d1 != 0, d3 != 0, d5 != 0, d7 != 0 */
z1 = d7 + d1;
z2 = d5 + d3;
z3 = d7 + d3;
z4 = d5 + d1;
z5 = MULTIPLY(z3 + z4, FIX_1_175875602);
tmp0 = MULTIPLY(d7, FIX_0_298631336);
tmp1 = MULTIPLY(d5, FIX_2_053119869);
tmp2 = MULTIPLY(d3, FIX_3_072711026);
tmp3 = MULTIPLY(d1, FIX_1_501321110);
z1 = MULTIPLY(-z1, FIX_0_899976223);
z2 = MULTIPLY(-z2, FIX_2_562915447);
z3 = MULTIPLY(-z3, FIX_1_961570560);
z4 = MULTIPLY(-z4, FIX_0_390180644);
z3 += z5;
z4 += z5;
tmp0 += z1 + z3;
tmp1 += z2 + z4;
tmp2 += z2 + z3;
tmp3 += z1 + z4;
} else {
/* d1 == 0, d3 != 0, d5 != 0, d7 != 0 */
z2 = d5 + d3;
z3 = d7 + d3;
z5 = MULTIPLY(z3 + d5, FIX_1_175875602);
tmp0 = MULTIPLY(d7, FIX_0_298631336);
tmp1 = MULTIPLY(d5, FIX_2_053119869);
tmp2 = MULTIPLY(d3, FIX_3_072711026);
z1 = MULTIPLY(-d7, FIX_0_899976223);
z2 = MULTIPLY(-z2, FIX_2_562915447);
z3 = MULTIPLY(-z3, FIX_1_961570560);
z4 = MULTIPLY(-d5, FIX_0_390180644);
z3 += z5;
z4 += z5;
tmp0 += z1 + z3;
tmp1 += z2 + z4;
tmp2 += z2 + z3;
tmp3 = z1 + z4;
}
} else {
if (d1 != 0) {
/* d1 != 0, d3 == 0, d5 != 0, d7 != 0 */
z1 = d7 + d1;
z4 = d5 + d1;
z5 = MULTIPLY(d7 + z4, FIX_1_175875602);
tmp0 = MULTIPLY(d7, FIX_0_298631336);
tmp1 = MULTIPLY(d5, FIX_2_053119869);
tmp3 = MULTIPLY(d1, FIX_1_501321110);
z1 = MULTIPLY(-z1, FIX_0_899976223);
z2 = MULTIPLY(-d5, FIX_2_562915447);
z3 = MULTIPLY(-d7, FIX_1_961570560);
z4 = MULTIPLY(-z4, FIX_0_390180644);
z3 += z5;
z4 += z5;
tmp0 += z1 + z3;
tmp1 += z2 + z4;
tmp2 = z2 + z3;
tmp3 += z1 + z4;
} else {
/* d1 == 0, d3 == 0, d5 != 0, d7 != 0 */
tmp0 = MULTIPLY(-d7, FIX_0_601344887);
z1 = MULTIPLY(-d7, FIX_0_899976223);
z3 = MULTIPLY(-d7, FIX_1_961570560);
tmp1 = MULTIPLY(-d5, FIX_0_509795579);
z2 = MULTIPLY(-d5, FIX_2_562915447);
z4 = MULTIPLY(-d5, FIX_0_390180644);
z5 = MULTIPLY(d5 + d7, FIX_1_175875602);
z3 += z5;
z4 += z5;
tmp0 += z3;
tmp1 += z4;
tmp2 = z2 + z3;
tmp3 = z1 + z4;
}
}
} else {
if (d3 != 0) {
if (d1 != 0) {
/* d1 != 0, d3 != 0, d5 == 0, d7 != 0 */
z1 = d7 + d1;
z3 = d7 + d3;
z5 = MULTIPLY(z3 + d1, FIX_1_175875602);
tmp0 = MULTIPLY(d7, FIX_0_298631336);
tmp2 = MULTIPLY(d3, FIX_3_072711026);
tmp3 = MULTIPLY(d1, FIX_1_501321110);
z1 = MULTIPLY(-z1, FIX_0_899976223);
z2 = MULTIPLY(-d3, FIX_2_562915447);
z3 = MULTIPLY(-z3, FIX_1_961570560);
z4 = MULTIPLY(-d1, FIX_0_390180644);
z3 += z5;
z4 += z5;
tmp0 += z1 + z3;
tmp1 = z2 + z4;
tmp2 += z2 + z3;
tmp3 += z1 + z4;
} else {
/* d1 == 0, d3 != 0, d5 == 0, d7 != 0 */
z3 = d7 + d3;
tmp0 = MULTIPLY(-d7, FIX_0_601344887);
z1 = MULTIPLY(-d7, FIX_0_899976223);
tmp2 = MULTIPLY(d3, FIX_0_509795579);
z2 = MULTIPLY(-d3, FIX_2_562915447);
z5 = MULTIPLY(z3, FIX_1_175875602);
z3 = MULTIPLY(-z3, FIX_0_785694958);
tmp0 += z3;
tmp1 = z2 + z5;
tmp2 += z3;
tmp3 = z1 + z5;
}
} else {
if (d1 != 0) {
/* d1 != 0, d3 == 0, d5 == 0, d7 != 0 */
z1 = d7 + d1;
z5 = MULTIPLY(z1, FIX_1_175875602);
z1 = MULTIPLY(z1, FIX_0_275899380);
z3 = MULTIPLY(-d7, FIX_1_961570560);
tmp0 = MULTIPLY(-d7, FIX_1_662939225);
z4 = MULTIPLY(-d1, FIX_0_390180644);
tmp3 = MULTIPLY(d1, FIX_1_111140466);
tmp0 += z1;
tmp1 = z4 + z5;
tmp2 = z3 + z5;
tmp3 += z1;
} else {
/* d1 == 0, d3 == 0, d5 == 0, d7 != 0 */
tmp0 = MULTIPLY(-d7, FIX_1_387039845);
tmp1 = MULTIPLY(d7, FIX_1_175875602);
tmp2 = MULTIPLY(-d7, FIX_0_785694958);
tmp3 = MULTIPLY(d7, FIX_0_275899380);
}
}
}
} else {
if (d5 != 0) {
if (d3 != 0) {
if (d1 != 0) {
/* d1 != 0, d3 != 0, d5 != 0, d7 == 0 */
z2 = d5 + d3;
z4 = d5 + d1;
z5 = MULTIPLY(d3 + z4, FIX_1_175875602);
tmp1 = MULTIPLY(d5, FIX_2_053119869);
tmp2 = MULTIPLY(d3, FIX_3_072711026);
tmp3 = MULTIPLY(d1, FIX_1_501321110);
z1 = MULTIPLY(-d1, FIX_0_899976223);
z2 = MULTIPLY(-z2, FIX_2_562915447);
z3 = MULTIPLY(-d3, FIX_1_961570560);
z4 = MULTIPLY(-z4, FIX_0_390180644);
z3 += z5;
z4 += z5;
tmp0 = z1 + z3;
tmp1 += z2 + z4;
tmp2 += z2 + z3;
tmp3 += z1 + z4;
} else {
/* d1 == 0, d3 != 0, d5 != 0, d7 == 0 */
z2 = d5 + d3;
z5 = MULTIPLY(z2, FIX_1_175875602);
tmp1 = MULTIPLY(d5, FIX_1_662939225);
z4 = MULTIPLY(-d5, FIX_0_390180644);
z2 = MULTIPLY(-z2, FIX_1_387039845);
tmp2 = MULTIPLY(d3, FIX_1_111140466);
z3 = MULTIPLY(-d3, FIX_1_961570560);
tmp0 = z3 + z5;
tmp1 += z2;
tmp2 += z2;
tmp3 = z4 + z5;
}
} else {
if (d1 != 0) {
/* d1 != 0, d3 == 0, d5 != 0, d7 == 0 */
z4 = d5 + d1;
z5 = MULTIPLY(z4, FIX_1_175875602);
z1 = MULTIPLY(-d1, FIX_0_899976223);
tmp3 = MULTIPLY(d1, FIX_0_601344887);
tmp1 = MULTIPLY(-d5, FIX_0_509795579);
z2 = MULTIPLY(-d5, FIX_2_562915447);
z4 = MULTIPLY(z4, FIX_0_785694958);
tmp0 = z1 + z5;
tmp1 += z4;
tmp2 = z2 + z5;
tmp3 += z4;
} else {
/* d1 == 0, d3 == 0, d5 != 0, d7 == 0 */
tmp0 = MULTIPLY(d5, FIX_1_175875602);
tmp1 = MULTIPLY(d5, FIX_0_275899380);
tmp2 = MULTIPLY(-d5, FIX_1_387039845);
tmp3 = MULTIPLY(d5, FIX_0_785694958);
}
}
} else {
if (d3 != 0) {
if (d1 != 0) {
/* d1 != 0, d3 != 0, d5 == 0, d7 == 0 */
z5 = d1 + d3;
tmp3 = MULTIPLY(d1, FIX_0_211164243);
tmp2 = MULTIPLY(-d3, FIX_1_451774981);
z1 = MULTIPLY(d1, FIX_1_061594337);
z2 = MULTIPLY(-d3, FIX_2_172734803);
z4 = MULTIPLY(z5, FIX_0_785694958);
z5 = MULTIPLY(z5, FIX_1_175875602);
tmp0 = z1 - z4;
tmp1 = z2 + z4;
tmp2 += z5;
tmp3 += z5;
} else {
/* d1 == 0, d3 != 0, d5 == 0, d7 == 0 */
tmp0 = MULTIPLY(-d3, FIX_0_785694958);
tmp1 = MULTIPLY(-d3, FIX_1_387039845);
tmp2 = MULTIPLY(-d3, FIX_0_275899380);
tmp3 = MULTIPLY(d3, FIX_1_175875602);
}
} else {
if (d1 != 0) {
/* d1 != 0, d3 == 0, d5 == 0, d7 == 0 */
tmp0 = MULTIPLY(d1, FIX_0_275899380);
tmp1 = MULTIPLY(d1, FIX_0_785694958);
tmp2 = MULTIPLY(d1, FIX_1_175875602);
tmp3 = MULTIPLY(d1, FIX_1_387039845);
} else {
/* d1 == 0, d3 == 0, d5 == 0, d7 == 0 */
tmp0 = tmp1 = tmp2 = tmp3 = 0;
}
}
}
}
/* Final output stage: inputs are tmp10..tmp13, tmp0..tmp3 */
dataptr.put(0, DESCALE11(tmp10 + tmp3));
dataptr.put(7, DESCALE11(tmp10 - tmp3));
dataptr.put(1, DESCALE11(tmp11 + tmp2));
dataptr.put(6, DESCALE11(tmp11 - tmp2));
dataptr.put(2, DESCALE11(tmp12 + tmp1));
dataptr.put(5, DESCALE11(tmp12 - tmp1));
dataptr.put(3, DESCALE11(tmp13 + tmp0));
dataptr.put(4, DESCALE11(tmp13 - tmp0));
dataptr = advance(dataptr, DCTSIZE); /* advance pointer to next row */
}
}
private static int MULTIPLY(int x, short y) {
return y * (short) x;
}
/**
* Perform the inverse DCT on one block of coefficients.
*/
private final static void pass2(ShortBuffer data) {
int tmp0, tmp1, tmp2, tmp3;
int tmp10, tmp11, tmp12, tmp13;
int z1, z2, z3, z4, z5;
int d0, d1, d2, d3, d4, d5, d6, d7;
ShortBuffer dataptr = data.duplicate();
/* Pass 2: process columns. */
/* Note that we must descale the results by a factor of 8 == 23, */
/* and also undo the PASS1_BITS scaling. */
for (int rowctr = DCTSIZE - 1; rowctr >= 0; rowctr--) {
/*
* Columns of zeroes can be exploited in the same way as we did with
* rows. However, the row calculation has created many nonzero AC
* terms, so the simplification applies less often (typically 5% to
* 10% of the time). On machines with very fast multiplication, it's
* possible that the test takes more time than it's worth. In that
* case this section may be commented out.
*/
d0 = dataptr.get(DCTSIZE_0);
d1 = dataptr.get(DCTSIZE_1);
d2 = dataptr.get(DCTSIZE_2);
d3 = dataptr.get(DCTSIZE_3);
d4 = dataptr.get(DCTSIZE_4);
d5 = dataptr.get(DCTSIZE_5);
d6 = dataptr.get(DCTSIZE_6);
d7 = dataptr.get(DCTSIZE_7);
/* Even part: reverse the even part of the forward DCT. */
/* The rotator is sqrt(2)c(-6). */
if (d6 != 0) {
if (d2 != 0) {
/* d0 != 0, d2 != 0, d4 != 0, d6 != 0 */
z1 = MULTIPLY(d2 + d6, FIX_0_541196100);
tmp2 = z1 + MULTIPLY(-d6, FIX_1_847759065);
tmp3 = z1 + MULTIPLY(d2, FIX_0_765366865);
tmp0 = (d0 + d4) << CONST_BITS;
tmp1 = (d0 - d4) << CONST_BITS;
tmp10 = tmp0 + tmp3;
tmp13 = tmp0 - tmp3;
tmp11 = tmp1 + tmp2;
tmp12 = tmp1 - tmp2;
} else {
/* d0 != 0, d2 == 0, d4 != 0, d6 != 0 */
tmp2 = MULTIPLY(-d6, FIX_1_306562965);
tmp3 = MULTIPLY(d6, FIX_0_541196100);
tmp0 = (d0 + d4) << CONST_BITS;
tmp1 = (d0 - d4) << CONST_BITS;
tmp10 = tmp0 + tmp3;
tmp13 = tmp0 - tmp3;
tmp11 = tmp1 + tmp2;
tmp12 = tmp1 - tmp2;
}
} else {
if (d2 != 0) {
/* d0 != 0, d2 != 0, d4 != 0, d6 == 0 */
tmp2 = MULTIPLY(d2, FIX_0_541196100);
tmp3 = MULTIPLY(d2, FIX_1_306562965);
tmp0 = (d0 + d4) << CONST_BITS;
tmp1 = (d0 - d4) << CONST_BITS;
tmp10 = tmp0 + tmp3;
tmp13 = tmp0 - tmp3;
tmp11 = tmp1 + tmp2;
tmp12 = tmp1 - tmp2;
} else {
/* d0 != 0, d2 == 0, d4 != 0, d6 == 0 */
tmp10 = tmp13 = (d0 + d4) << CONST_BITS;
tmp11 = tmp12 = (d0 - d4) << CONST_BITS;
}
}
/*
* Odd part per figure 8; the matrix is unitary and hence its
* transpose is its inverse. i0..i3 are y7,y5,y3,y1 respectively.
*/
if (d7 != 0) {
if (d5 != 0) {
if (d3 != 0) {
if (d1 != 0) {
/* d1 != 0, d3 != 0, d5 != 0, d7 != 0 */
z1 = d7 + d1;
z2 = d5 + d3;
z3 = d7 + d3;
z4 = d5 + d1;
z5 = MULTIPLY(z3 + z4, FIX_1_175875602);
tmp0 = MULTIPLY(d7, FIX_0_298631336);
tmp1 = MULTIPLY(d5, FIX_2_053119869);
tmp2 = MULTIPLY(d3, FIX_3_072711026);
tmp3 = MULTIPLY(d1, FIX_1_501321110);
z1 = MULTIPLY(-z1, FIX_0_899976223);
z2 = MULTIPLY(-z2, FIX_2_562915447);
z3 = MULTIPLY(-z3, FIX_1_961570560);
z4 = MULTIPLY(-z4, FIX_0_390180644);
z3 += z5;
z4 += z5;
tmp0 += z1 + z3;
tmp1 += z2 + z4;
tmp2 += z2 + z3;
tmp3 += z1 + z4;
} else {
/* d1 == 0, d3 != 0, d5 != 0, d7 != 0 */
z1 = d7;
z2 = d5 + d3;
z3 = d7 + d3;
z5 = MULTIPLY(z3 + d5, FIX_1_175875602);
tmp0 = MULTIPLY(d7, FIX_0_298631336);
tmp1 = MULTIPLY(d5, FIX_2_053119869);
tmp2 = MULTIPLY(d3, FIX_3_072711026);
z1 = MULTIPLY(-d7, FIX_0_899976223);
z2 = MULTIPLY(-z2, FIX_2_562915447);
z3 = MULTIPLY(-z3, FIX_1_961570560);
z4 = MULTIPLY(-d5, FIX_0_390180644);
z3 += z5;
z4 += z5;
tmp0 += z1 + z3;
tmp1 += z2 + z4;
tmp2 += z2 + z3;
tmp3 = z1 + z4;
}
} else {
if (d1 != 0) {
/* d1 != 0, d3 == 0, d5 != 0, d7 != 0 */
z1 = d7 + d1;
z2 = d5;
z3 = d7;
z4 = d5 + d1;
z5 = MULTIPLY(z3 + z4, FIX_1_175875602);
tmp0 = MULTIPLY(d7, FIX_0_298631336);
tmp1 = MULTIPLY(d5, FIX_2_053119869);
tmp3 = MULTIPLY(d1, FIX_1_501321110);
z1 = MULTIPLY(-z1, FIX_0_899976223);
z2 = MULTIPLY(-d5, FIX_2_562915447);
z3 = MULTIPLY(-d7, FIX_1_961570560);
z4 = MULTIPLY(-z4, FIX_0_390180644);
z3 += z5;
z4 += z5;
tmp0 += z1 + z3;
tmp1 += z2 + z4;
tmp2 = z2 + z3;
tmp3 += z1 + z4;
} else {
/* d1 == 0, d3 == 0, d5 != 0, d7 != 0 */
tmp0 = MULTIPLY(-d7, FIX_0_601344887);
z1 = MULTIPLY(-d7, FIX_0_899976223);
z3 = MULTIPLY(-d7, FIX_1_961570560);
tmp1 = MULTIPLY(-d5, FIX_0_509795579);
z2 = MULTIPLY(-d5, FIX_2_562915447);
z4 = MULTIPLY(-d5, FIX_0_390180644);
z5 = MULTIPLY(d5 + d7, FIX_1_175875602);
z3 += z5;
z4 += z5;
tmp0 += z3;
tmp1 += z4;
tmp2 = z2 + z3;
tmp3 = z1 + z4;
}
}
} else {
if (d3 != 0) {
if (d1 != 0) {
/* d1 != 0, d3 != 0, d5 == 0, d7 != 0 */
z1 = d7 + d1;
z3 = d7 + d3;
z5 = MULTIPLY(z3 + d1, FIX_1_175875602);
tmp0 = MULTIPLY(d7, FIX_0_298631336);
tmp2 = MULTIPLY(d3, FIX_3_072711026);
tmp3 = MULTIPLY(d1, FIX_1_501321110);
z1 = MULTIPLY(-z1, FIX_0_899976223);
z2 = MULTIPLY(-d3, FIX_2_562915447);
z3 = MULTIPLY(-z3, FIX_1_961570560);
z4 = MULTIPLY(-d1, FIX_0_390180644);
z3 += z5;
z4 += z5;
tmp0 += z1 + z3;
tmp1 = z2 + z4;
tmp2 += z2 + z3;
tmp3 += z1 + z4;
} else {
/* d1 == 0, d3 != 0, d5 == 0, d7 != 0 */
z3 = d7 + d3;
tmp0 = MULTIPLY(-d7, FIX_0_601344887);
z1 = MULTIPLY(-d7, FIX_0_899976223);
tmp2 = MULTIPLY(d3, FIX_0_509795579);
z2 = MULTIPLY(-d3, FIX_2_562915447);
z5 = MULTIPLY(z3, FIX_1_175875602);
z3 = MULTIPLY(-z3, FIX_0_785694958);
tmp0 += z3;
tmp1 = z2 + z5;
tmp2 += z3;
tmp3 = z1 + z5;
}
} else {
if (d1 != 0) {
/* d1 != 0, d3 == 0, d5 == 0, d7 != 0 */
z1 = d7 + d1;
z5 = MULTIPLY(z1, FIX_1_175875602);
z1 = MULTIPLY(z1, FIX_0_275899380);
z3 = MULTIPLY(-d7, FIX_1_961570560);
tmp0 = MULTIPLY(-d7, FIX_1_662939225);
z4 = MULTIPLY(-d1, FIX_0_390180644);
tmp3 = MULTIPLY(d1, FIX_1_111140466);
tmp0 += z1;
tmp1 = z4 + z5;
tmp2 = z3 + z5;
tmp3 += z1;
} else {
/* d1 == 0, d3 == 0, d5 == 0, d7 != 0 */
tmp0 = MULTIPLY(-d7, FIX_1_387039845);
tmp1 = MULTIPLY(d7, FIX_1_175875602);
tmp2 = MULTIPLY(-d7, FIX_0_785694958);
tmp3 = MULTIPLY(d7, FIX_0_275899380);
}
}
}
} else {
if (d5 != 0) {
if (d3 != 0) {
if (d1 != 0) {
/* d1 != 0, d3 != 0, d5 != 0, d7 == 0 */
z2 = d5 + d3;
z4 = d5 + d1;
z5 = MULTIPLY(d3 + z4, FIX_1_175875602);
tmp1 = MULTIPLY(d5, FIX_2_053119869);
tmp2 = MULTIPLY(d3, FIX_3_072711026);
tmp3 = MULTIPLY(d1, FIX_1_501321110);
z1 = MULTIPLY(-d1, FIX_0_899976223);
z2 = MULTIPLY(-z2, FIX_2_562915447);
z3 = MULTIPLY(-d3, FIX_1_961570560);
z4 = MULTIPLY(-z4, FIX_0_390180644);
z3 += z5;
z4 += z5;
tmp0 = z1 + z3;
tmp1 += z2 + z4;
tmp2 += z2 + z3;
tmp3 += z1 + z4;
} else {
/* d1 == 0, d3 != 0, d5 != 0, d7 == 0 */
z2 = d5 + d3;
z5 = MULTIPLY(z2, FIX_1_175875602);
tmp1 = MULTIPLY(d5, FIX_1_662939225);
z4 = MULTIPLY(-d5, FIX_0_390180644);
z2 = MULTIPLY(-z2, FIX_1_387039845);
tmp2 = MULTIPLY(d3, FIX_1_111140466);
z3 = MULTIPLY(-d3, FIX_1_961570560);
tmp0 = z3 + z5;
tmp1 += z2;
tmp2 += z2;
tmp3 = z4 + z5;
}
} else {
if (d1 != 0) {
/* d1 != 0, d3 == 0, d5 != 0, d7 == 0 */
z4 = d5 + d1;
z5 = MULTIPLY(z4, FIX_1_175875602);
z1 = MULTIPLY(-d1, FIX_0_899976223);
tmp3 = MULTIPLY(d1, FIX_0_601344887);
tmp1 = MULTIPLY(-d5, FIX_0_509795579);
z2 = MULTIPLY(-d5, FIX_2_562915447);
z4 = MULTIPLY(z4, FIX_0_785694958);
tmp0 = z1 + z5;
tmp1 += z4;
tmp2 = z2 + z5;
tmp3 += z4;
} else {
/* d1 == 0, d3 == 0, d5 != 0, d7 == 0 */
tmp0 = MULTIPLY(d5, FIX_1_175875602);
tmp1 = MULTIPLY(d5, FIX_0_275899380);
tmp2 = MULTIPLY(-d5, FIX_1_387039845);
tmp3 = MULTIPLY(d5, FIX_0_785694958);
}
}
} else {
if (d3 != 0) {
if (d1 != 0) {
/* d1 != 0, d3 != 0, d5 == 0, d7 == 0 */
z5 = d1 + d3;
tmp3 = MULTIPLY(d1, FIX_0_211164243);
tmp2 = MULTIPLY(-d3, FIX_1_451774981);
z1 = MULTIPLY(d1, FIX_1_061594337);
z2 = MULTIPLY(-d3, FIX_2_172734803);
z4 = MULTIPLY(z5, FIX_0_785694958);
z5 = MULTIPLY(z5, FIX_1_175875602);
tmp0 = z1 - z4;
tmp1 = z2 + z4;
tmp2 += z5;
tmp3 += z5;
} else {
/* d1 == 0, d3 != 0, d5 == 0, d7 == 0 */
tmp0 = MULTIPLY(-d3, FIX_0_785694958);
tmp1 = MULTIPLY(-d3, FIX_1_387039845);
tmp2 = MULTIPLY(-d3, FIX_0_275899380);
tmp3 = MULTIPLY(d3, FIX_1_175875602);
}
} else {
if (d1 != 0) {
/* d1 != 0, d3 == 0, d5 == 0, d7 == 0 */
tmp0 = MULTIPLY(d1, FIX_0_275899380);
tmp1 = MULTIPLY(d1, FIX_0_785694958);
tmp2 = MULTIPLY(d1, FIX_1_175875602);
tmp3 = MULTIPLY(d1, FIX_1_387039845);
} else {
/* d1 == 0, d3 == 0, d5 == 0, d7 == 0 */
tmp0 = tmp1 = tmp2 = tmp3 = 0;
}
}
}
}
/* Final output stage: inputs are tmp10..tmp13, tmp0..tmp3 */
dataptr.put(DCTSIZE_0, DESCALE18(tmp10 + tmp3));
dataptr.put(DCTSIZE_7, DESCALE18(tmp10 - tmp3));
dataptr.put(DCTSIZE_1, DESCALE18(tmp11 + tmp2));
dataptr.put(DCTSIZE_6, DESCALE18(tmp11 - tmp2));
dataptr.put(DCTSIZE_2, DESCALE18(tmp12 + tmp1));
dataptr.put(DCTSIZE_5, DESCALE18(tmp12 - tmp1));
dataptr.put(DCTSIZE_3, DESCALE18(tmp13 + tmp0));
dataptr.put(DCTSIZE_4, DESCALE18(tmp13 - tmp0));
dataptr = advance(dataptr, 1); /* advance pointer to next column */
}
}
private final static int DESCALE(int x, int n) {
return ((x) + (1 << ((n) - 1))) >> n;
}
private final static short DESCALE11(int x) {
return (short) ((x + ONEHALF_11) >> 11);
}
private final static short DESCALE18(int x) {
return (short) ((x + ONEHALF_18) >> 18);
}
}