# HG changeset patch # User nickols_k # Date 1011635202 0 # Node ID 1fe6b64feefb2728f02897d19ce45d6d68571ec4 # Parent 73df666cacc7f7d21f3860d8e0d6425510ff075f Small simple idct improvement for Alpha by Falk Hueffner diff -r 73df666cacc7 -r 1fe6b64feefb simple_idct.c --- a/simple_idct.c Sun Jan 20 14:48:02 2002 +0000 +++ b/simple_idct.c Mon Jan 21 17:46:42 2002 +0000 @@ -104,6 +104,7 @@ } #ifdef ARCH_ALPHA +/* 0: all entries 0, 1: only first entry nonzero, 2: otherwise */ static int inline idctRowCondDC(int16_t *row) { int_fast32_t a0, a1, a2, a3, b0, b1, b2, b3; @@ -201,7 +202,7 @@ row[6] = (a1 - b1) >> ROW_SHIFT; row[7] = (a0 - b0) >> ROW_SHIFT; - return 1; + return 2; } #else /* not ARCH_ALPHA */ static int inline idctRowCondDC (int16_t * row) @@ -547,16 +548,33 @@ idctSparse2Col(block + i); } #elif defined(ARCH_ALPHA) - int shortcut = 1; + int rowsZero = 1; /* all rows except row 0 zero */ + int rowsConstant = 1; /* all rows consist of a constant value */ for (i = 0; i < 8; i++) { - int anynonzero = idctRowCondDC(block + 8 * i); - if (i > 0 && anynonzero) - shortcut = 0; + int sparseness = idctRowCondDC(block + 8 * i); + + if (i > 0 && sparseness > 0) + rowsZero = 0; + if (sparseness == 2) + rowsConstant = 0; } - if (shortcut) { - idctCol2(block); + if (rowsZero) { + idctCol2(block); + } else if (rowsConstant) { + uint64_t *lblock = (uint64_t *) block; + + idctSparseCol(block); + for (i = 0; i < 8; i++) { + uint64_t v = (uint16_t) block[i * 8]; + + v += v << 16; + v += v << 32; + lblock[0] = v; + lblock[1] = v; + lblock += 2; + } } else { for (i = 0; i < 8; i++) idctSparseCol(block + i);