libavcodec.hg: faandct.c annotate

annotate faandct.c @ 6411:5d50e8a7eb09 libavcodec

Alternative and faster (on gcc x86) plane rotation.

author	michael
date	Tue, 26 Feb 2008 15:52:37 +0000
parents	72e573046758
children	b72f6c4cee12

rev	line source
1557 5d53c03186a1 floating point AAN DCT michael parents: diff changeset	1 /*
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	2 * Floating point AAN DCT
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	3 * Copyright (c) 2003 Michael Niedermayer <michaelni@gmx.at>
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	4 *
5214 470601203f44 Group all copyright and author notices together. diego parents: 4283 diff changeset	5 * this implementation is based upon the IJG integer AAN DCT (see jfdctfst.c)
470601203f44 Group all copyright and author notices together. diego parents: 4283 diff changeset	6 *
3947 c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library' diego parents: 3036 diff changeset	7 * This file is part of FFmpeg.
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library' diego parents: 3036 diff changeset	8 *
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library' diego parents: 3036 diff changeset	9 * FFmpeg is free software; you can redistribute it and/or
1557 5d53c03186a1 floating point AAN DCT michael parents: diff changeset	10 * modify it under the terms of the GNU Lesser General Public
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	11 * License as published by the Free Software Foundation; either
3947 c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library' diego parents: 3036 diff changeset	12 * version 2.1 of the License, or (at your option) any later version.
1557 5d53c03186a1 floating point AAN DCT michael parents: diff changeset	13 *
3947 c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library' diego parents: 3036 diff changeset	14 * FFmpeg is distributed in the hope that it will be useful,
1557 5d53c03186a1 floating point AAN DCT michael parents: diff changeset	15 * but WITHOUT ANY WARRANTY; without even the implied warranty of
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	16 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	17 * Lesser General Public License for more details.
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	18 *
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	19 * You should have received a copy of the GNU Lesser General Public
3947 c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library' diego parents: 3036 diff changeset	20 * License along with FFmpeg; if not, write to the Free Software
3036 0b546eab515d Update licensing information: The FSF changed postal address. diego parents: 2979 diff changeset	21 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
6397 094f507b952b Allow use of my AAN DCT under BSD, AMD has agreed to write and contribute michael parents: 5214 diff changeset	22 *
094f507b952b Allow use of my AAN DCT under BSD, AMD has agreed to write and contribute michael parents: 5214 diff changeset	23 * The AAN DCT in this file except ff_faandct248() can also be used under the
6398 0a50abd54b7f Clarify which BSD license. michael parents: 6397 diff changeset	24 * new (3 clause) BSD license.
1557 5d53c03186a1 floating point AAN DCT michael parents: diff changeset	25 */
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	26
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	27 /**
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	28 * @file faandct.c
2967 ef2149182f1c COSMETICS: Remove all trailing whitespace. diego parents: 2024 diff changeset	29 * @brief
1557 5d53c03186a1 floating point AAN DCT michael parents: diff changeset	30 * Floating point AAN DCT
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	31 * @author Michael Niedermayer <michaelni@gmx.at>
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	32 */
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	33
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	34 #include "dsputil.h"
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	35 #include "faandct.h"
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	36
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	37 #define FLOAT float
1562 bf452704100f optionally merge postscale into quantization table for the float aan dct michael parents: 1561 diff changeset	38 #ifdef FAAN_POSTSCALE
bf452704100f optionally merge postscale into quantization table for the float aan dct michael parents: 1561 diff changeset	39 # define SCALE(x) postscale[x]
bf452704100f optionally merge postscale into quantization table for the float aan dct michael parents: 1561 diff changeset	40 #else
bf452704100f optionally merge postscale into quantization table for the float aan dct michael parents: 1561 diff changeset	41 # define SCALE(x) 1
bf452704100f optionally merge postscale into quantization table for the float aan dct michael parents: 1561 diff changeset	42 #endif
1557 5d53c03186a1 floating point AAN DCT michael parents: diff changeset	43
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	44 //numbers generated by simple c code (not as accurate as they could be)
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	45 /*
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	46 for(i=0; i<8; i++){
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	47 printf("#define B%d %1.20llf\n", i, (long double)1.0/(cosl(i*acosl(-1.0)/(long double)16.0)*sqrtl(2)));
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	48 }
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	49 */
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	50 #define B0 1.00000000000000000000
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	51 #define B1 0.72095982200694791383 // (cos(pi*1/16)sqrt(2))^-1
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	52 #define B2 0.76536686473017954350 // (cos(pi*2/16)sqrt(2))^-1
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	53 #define B3 0.85043009476725644878 // (cos(pi*3/16)sqrt(2))^-1
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	54 #define B4 1.00000000000000000000 // (cos(pi*4/16)sqrt(2))^-1
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	55 #define B5 1.27275858057283393842 // (cos(pi*5/16)sqrt(2))^-1
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	56 #define B6 1.84775906502257351242 // (cos(pi*6/16)sqrt(2))^-1
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	57 #define B7 3.62450978541155137218 // (cos(pi*7/16)sqrt(2))^-1
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	58
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	59
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	60 #define A1 0.70710678118654752438 // cos(pi*4/16)
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	61 #define A2 0.54119610014619698435 // cos(pi*6/16)sqrt(2)
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	62 #define A5 0.38268343236508977170 // cos(pi*6/16)
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	63 #define A4 1.30656296487637652774 // cos(pi*2/16)sqrt(2)
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	64
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	65 static FLOAT postscale[64]={
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	66 B0*B0, B0*B1, B0*B2, B0*B3, B0*B4, B0*B5, B0*B6, B0*B7,
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	67 B1*B0, B1*B1, B1*B2, B1*B3, B1*B4, B1*B5, B1*B6, B1*B7,
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	68 B2*B0, B2*B1, B2*B2, B2*B3, B2*B4, B2*B5, B2*B6, B2*B7,
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	69 B3*B0, B3*B1, B3*B2, B3*B3, B3*B4, B3*B5, B3*B6, B3*B7,
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	70 B4*B0, B4*B1, B4*B2, B4*B3, B4*B4, B4*B5, B4*B6, B4*B7,
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	71 B5*B0, B5*B1, B5*B2, B5*B3, B5*B4, B5*B5, B5*B6, B5*B7,
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	72 B6*B0, B6*B1, B6*B2, B6*B3, B6*B4, B6*B5, B6*B6, B6*B7,
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	73 B7*B0, B7*B1, B7*B2, B7*B3, B7*B4, B7*B5, B7*B6, B7*B7,
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	74 };
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	75
4283 d6f83e2f8804 rename always_inline to av_always_inline and move to common.h mru parents: 3947 diff changeset	76 static av_always_inline void row_fdct(FLOAT temp[64], DCTELEM * data)
1557 5d53c03186a1 floating point AAN DCT michael parents: diff changeset	77 {
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	78 FLOAT tmp0, tmp1, tmp2, tmp3, tmp4, tmp5, tmp6, tmp7;
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	79 FLOAT tmp10, tmp11, tmp12, tmp13;
6410 72e573046758 Get rid of another useless variable. michael parents: 6409 diff changeset	80 FLOAT z2, z4, z5, z11, z13;
1557 5d53c03186a1 floating point AAN DCT michael parents: diff changeset	81 int i;
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	82
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	83 for (i=0; i<8*8; i+=8) {
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	84 tmp0= data[0 + i] + data[7 + i];
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	85 tmp7= data[0 + i] - data[7 + i];
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	86 tmp1= data[1 + i] + data[6 + i];
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	87 tmp6= data[1 + i] - data[6 + i];
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	88 tmp2= data[2 + i] + data[5 + i];
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	89 tmp5= data[2 + i] - data[5 + i];
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	90 tmp3= data[3 + i] + data[4 + i];
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	91 tmp4= data[3 + i] - data[4 + i];
2967 ef2149182f1c COSMETICS: Remove all trailing whitespace. diego parents: 2024 diff changeset	92
1557 5d53c03186a1 floating point AAN DCT michael parents: diff changeset	93 tmp10= tmp0 + tmp3;
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	94 tmp13= tmp0 - tmp3;
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	95 tmp11= tmp1 + tmp2;
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	96 tmp12= tmp1 - tmp2;
2967 ef2149182f1c COSMETICS: Remove all trailing whitespace. diego parents: 2024 diff changeset	97
1557 5d53c03186a1 floating point AAN DCT michael parents: diff changeset	98 temp[0 + i]= tmp10 + tmp11;
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	99 temp[4 + i]= tmp10 - tmp11;
2967 ef2149182f1c COSMETICS: Remove all trailing whitespace. diego parents: 2024 diff changeset	100
6408 7af599600f2d One variable less. No real change to the actual code. michael parents: 6398 diff changeset	101 tmp12 += tmp13;
7af599600f2d One variable less. No real change to the actual code. michael parents: 6398 diff changeset	102 tmp12 *= A1;
7af599600f2d One variable less. No real change to the actual code. michael parents: 6398 diff changeset	103 temp[2 + i]= tmp13 + tmp12;
7af599600f2d One variable less. No real change to the actual code. michael parents: 6398 diff changeset	104 temp[6 + i]= tmp13 - tmp12;
2967 ef2149182f1c COSMETICS: Remove all trailing whitespace. diego parents: 2024 diff changeset	105
6409 813ff53ed933 Avoid a=b+c but rather use a+=b (gcc is too stupid to do this itself), michael parents: 6408 diff changeset	106 tmp4 += tmp5;
813ff53ed933 Avoid a=b+c but rather use a+=b (gcc is too stupid to do this itself), michael parents: 6408 diff changeset	107 tmp5 += tmp6;
813ff53ed933 Avoid a=b+c but rather use a+=b (gcc is too stupid to do this itself), michael parents: 6408 diff changeset	108 tmp6 += tmp7;
1557 5d53c03186a1 floating point AAN DCT michael parents: diff changeset	109
6411 5d50e8a7eb09 Alternative and faster (on gcc x86) plane rotation. michael parents: 6410 diff changeset	110 #if 0
6409 813ff53ed933 Avoid a=b+c but rather use a+=b (gcc is too stupid to do this itself), michael parents: 6408 diff changeset	111 z5= (tmp4 - tmp6) * A5;
813ff53ed933 Avoid a=b+c but rather use a+=b (gcc is too stupid to do this itself), michael parents: 6408 diff changeset	112 z2= tmp4*A2 + z5;
813ff53ed933 Avoid a=b+c but rather use a+=b (gcc is too stupid to do this itself), michael parents: 6408 diff changeset	113 z4= tmp6*A4 + z5;
6411 5d50e8a7eb09 Alternative and faster (on gcc x86) plane rotation. michael parents: 6410 diff changeset	114 #else
5d50e8a7eb09 Alternative and faster (on gcc x86) plane rotation. michael parents: 6410 diff changeset	115 z2= tmp4*(A2+A5) - tmp6*A5;
5d50e8a7eb09 Alternative and faster (on gcc x86) plane rotation. michael parents: 6410 diff changeset	116 z4= tmp6*(A4-A5) + tmp4*A5;
5d50e8a7eb09 Alternative and faster (on gcc x86) plane rotation. michael parents: 6410 diff changeset	117 #endif
6410 72e573046758 Get rid of another useless variable. michael parents: 6409 diff changeset	118 tmp5*=A1;
1557 5d53c03186a1 floating point AAN DCT michael parents: diff changeset	119
6410 72e573046758 Get rid of another useless variable. michael parents: 6409 diff changeset	120 z11= tmp7 + tmp5;
72e573046758 Get rid of another useless variable. michael parents: 6409 diff changeset	121 z13= tmp7 - tmp5;
1557 5d53c03186a1 floating point AAN DCT michael parents: diff changeset	122
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	123 temp[5 + i]= z13 + z2;
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	124 temp[3 + i]= z13 - z2;
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	125 temp[1 + i]= z11 + z4;
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	126 temp[7 + i]= z11 - z4;
2967 ef2149182f1c COSMETICS: Remove all trailing whitespace. diego parents: 2024 diff changeset	127 }
1589 eb26d190cf5a move identical code into its own function michael parents: 1571 diff changeset	128 }
eb26d190cf5a move identical code into its own function michael parents: 1571 diff changeset	129
eb26d190cf5a move identical code into its own function michael parents: 1571 diff changeset	130 void ff_faandct(DCTELEM * data)
eb26d190cf5a move identical code into its own function michael parents: 1571 diff changeset	131 {
eb26d190cf5a move identical code into its own function michael parents: 1571 diff changeset	132 FLOAT tmp0, tmp1, tmp2, tmp3, tmp4, tmp5, tmp6, tmp7;
eb26d190cf5a move identical code into its own function michael parents: 1571 diff changeset	133 FLOAT tmp10, tmp11, tmp12, tmp13;
6410 72e573046758 Get rid of another useless variable. michael parents: 6409 diff changeset	134 FLOAT z2, z4, z5, z11, z13;
1589 eb26d190cf5a move identical code into its own function michael parents: 1571 diff changeset	135 FLOAT temp[64];
eb26d190cf5a move identical code into its own function michael parents: 1571 diff changeset	136 int i;
eb26d190cf5a move identical code into its own function michael parents: 1571 diff changeset	137
eb26d190cf5a move identical code into its own function michael parents: 1571 diff changeset	138 emms_c();
eb26d190cf5a move identical code into its own function michael parents: 1571 diff changeset	139
eb26d190cf5a move identical code into its own function michael parents: 1571 diff changeset	140 row_fdct(temp, data);
1557 5d53c03186a1 floating point AAN DCT michael parents: diff changeset	141
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	142 for (i=0; i<8; i++) {
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	143 tmp0= temp[8*0 + i] + temp[8*7 + i];
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	144 tmp7= temp[8*0 + i] - temp[8*7 + i];
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	145 tmp1= temp[8*1 + i] + temp[8*6 + i];
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	146 tmp6= temp[8*1 + i] - temp[8*6 + i];
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	147 tmp2= temp[8*2 + i] + temp[8*5 + i];
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	148 tmp5= temp[8*2 + i] - temp[8*5 + i];
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	149 tmp3= temp[8*3 + i] + temp[8*4 + i];
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	150 tmp4= temp[8*3 + i] - temp[8*4 + i];
2967 ef2149182f1c COSMETICS: Remove all trailing whitespace. diego parents: 2024 diff changeset	151
1557 5d53c03186a1 floating point AAN DCT michael parents: diff changeset	152 tmp10= tmp0 + tmp3;
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	153 tmp13= tmp0 - tmp3;
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	154 tmp11= tmp1 + tmp2;
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	155 tmp12= tmp1 - tmp2;
2967 ef2149182f1c COSMETICS: Remove all trailing whitespace. diego parents: 2024 diff changeset	156
1563 820e06c6ca9b 4.9-RC FreeBSD doesnt like lrint() so change to lrintf(), not that bsd supports that but we emulate it ... michael parents: 1562 diff changeset	157 data[8*0 + i]= lrintf(SCALE(8*0 + i) * (tmp10 + tmp11));
820e06c6ca9b 4.9-RC FreeBSD doesnt like lrint() so change to lrintf(), not that bsd supports that but we emulate it ... michael parents: 1562 diff changeset	158 data[8*4 + i]= lrintf(SCALE(8*4 + i) * (tmp10 - tmp11));
2967 ef2149182f1c COSMETICS: Remove all trailing whitespace. diego parents: 2024 diff changeset	159
6408 7af599600f2d One variable less. No real change to the actual code. michael parents: 6398 diff changeset	160 tmp12 += tmp13;
7af599600f2d One variable less. No real change to the actual code. michael parents: 6398 diff changeset	161 tmp12 *= A1;
7af599600f2d One variable less. No real change to the actual code. michael parents: 6398 diff changeset	162 data[8*2 + i]= lrintf(SCALE(8*2 + i) * (tmp13 + tmp12));
7af599600f2d One variable less. No real change to the actual code. michael parents: 6398 diff changeset	163 data[8*6 + i]= lrintf(SCALE(8*6 + i) * (tmp13 - tmp12));
2967 ef2149182f1c COSMETICS: Remove all trailing whitespace. diego parents: 2024 diff changeset	164
6409 813ff53ed933 Avoid a=b+c but rather use a+=b (gcc is too stupid to do this itself), michael parents: 6408 diff changeset	165 tmp4 += tmp5;
813ff53ed933 Avoid a=b+c but rather use a+=b (gcc is too stupid to do this itself), michael parents: 6408 diff changeset	166 tmp5 += tmp6;
813ff53ed933 Avoid a=b+c but rather use a+=b (gcc is too stupid to do this itself), michael parents: 6408 diff changeset	167 tmp6 += tmp7;
1557 5d53c03186a1 floating point AAN DCT michael parents: diff changeset	168
6411 5d50e8a7eb09 Alternative and faster (on gcc x86) plane rotation. michael parents: 6410 diff changeset	169 #if 0
6409 813ff53ed933 Avoid a=b+c but rather use a+=b (gcc is too stupid to do this itself), michael parents: 6408 diff changeset	170 z5= (tmp4 - tmp6) * A5;
813ff53ed933 Avoid a=b+c but rather use a+=b (gcc is too stupid to do this itself), michael parents: 6408 diff changeset	171 z2= tmp4*A2 + z5;
813ff53ed933 Avoid a=b+c but rather use a+=b (gcc is too stupid to do this itself), michael parents: 6408 diff changeset	172 z4= tmp6*A4 + z5;
6411 5d50e8a7eb09 Alternative and faster (on gcc x86) plane rotation. michael parents: 6410 diff changeset	173 #else
5d50e8a7eb09 Alternative and faster (on gcc x86) plane rotation. michael parents: 6410 diff changeset	174 z2= tmp4*(A2+A5) - tmp6*A5;
5d50e8a7eb09 Alternative and faster (on gcc x86) plane rotation. michael parents: 6410 diff changeset	175 z4= tmp6*(A4-A5) + tmp4*A5;
5d50e8a7eb09 Alternative and faster (on gcc x86) plane rotation. michael parents: 6410 diff changeset	176 #endif
6410 72e573046758 Get rid of another useless variable. michael parents: 6409 diff changeset	177 tmp5*=A1;
1557 5d53c03186a1 floating point AAN DCT michael parents: diff changeset	178
6410 72e573046758 Get rid of another useless variable. michael parents: 6409 diff changeset	179 z11= tmp7 + tmp5;
72e573046758 Get rid of another useless variable. michael parents: 6409 diff changeset	180 z13= tmp7 - tmp5;
1557 5d53c03186a1 floating point AAN DCT michael parents: diff changeset	181
1563 820e06c6ca9b 4.9-RC FreeBSD doesnt like lrint() so change to lrintf(), not that bsd supports that but we emulate it ... michael parents: 1562 diff changeset	182 data[8*5 + i]= lrintf(SCALE(8*5 + i) * (z13 + z2));
820e06c6ca9b 4.9-RC FreeBSD doesnt like lrint() so change to lrintf(), not that bsd supports that but we emulate it ... michael parents: 1562 diff changeset	183 data[8*3 + i]= lrintf(SCALE(8*3 + i) * (z13 - z2));
820e06c6ca9b 4.9-RC FreeBSD doesnt like lrint() so change to lrintf(), not that bsd supports that but we emulate it ... michael parents: 1562 diff changeset	184 data[8*1 + i]= lrintf(SCALE(8*1 + i) * (z11 + z4));
820e06c6ca9b 4.9-RC FreeBSD doesnt like lrint() so change to lrintf(), not that bsd supports that but we emulate it ... michael parents: 1562 diff changeset	185 data[8*7 + i]= lrintf(SCALE(8*7 + i) * (z11 - z4));
1557 5d53c03186a1 floating point AAN DCT michael parents: diff changeset	186 }
5d53c03186a1 floating point AAN DCT michael parents: diff changeset	187 }
1571 aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	188
aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	189 void ff_faandct248(DCTELEM * data)
aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	190 {
aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	191 FLOAT tmp0, tmp1, tmp2, tmp3, tmp4, tmp5, tmp6, tmp7;
aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	192 FLOAT tmp10, tmp11, tmp12, tmp13;
aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	193 FLOAT temp[64];
aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	194 int i;
aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	195
aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	196 emms_c();
aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	197
1589 eb26d190cf5a move identical code into its own function michael parents: 1571 diff changeset	198 row_fdct(temp, data);
1571 aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	199
aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	200 for (i=0; i<8; i++) {
aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	201 tmp0 = temp[8*0 + i] + temp[8*1 + i];
aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	202 tmp1 = temp[8*2 + i] + temp[8*3 + i];
aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	203 tmp2 = temp[8*4 + i] + temp[8*5 + i];
aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	204 tmp3 = temp[8*6 + i] + temp[8*7 + i];
aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	205 tmp4 = temp[8*0 + i] - temp[8*1 + i];
aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	206 tmp5 = temp[8*2 + i] - temp[8*3 + i];
aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	207 tmp6 = temp[8*4 + i] - temp[8*5 + i];
aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	208 tmp7 = temp[8*6 + i] - temp[8*7 + i];
2967 ef2149182f1c COSMETICS: Remove all trailing whitespace. diego parents: 2024 diff changeset	209
1571 aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	210 tmp10 = tmp0 + tmp3;
aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	211 tmp11 = tmp1 + tmp2;
aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	212 tmp12 = tmp1 - tmp2;
aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	213 tmp13 = tmp0 - tmp3;
2967 ef2149182f1c COSMETICS: Remove all trailing whitespace. diego parents: 2024 diff changeset	214
1571 aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	215 data[8*0 + i] = lrintf(SCALE(8*0 + i) * (tmp10 + tmp11));
aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	216 data[8*4 + i] = lrintf(SCALE(8*4 + i) * (tmp10 - tmp11));
2967 ef2149182f1c COSMETICS: Remove all trailing whitespace. diego parents: 2024 diff changeset	217
6408 7af599600f2d One variable less. No real change to the actual code. michael parents: 6398 diff changeset	218 tmp12 += tmp13;
7af599600f2d One variable less. No real change to the actual code. michael parents: 6398 diff changeset	219 tmp12 *= A1;
7af599600f2d One variable less. No real change to the actual code. michael parents: 6398 diff changeset	220 data[8*2 + i] = lrintf(SCALE(8*2 + i) * (tmp13 + tmp12));
7af599600f2d One variable less. No real change to the actual code. michael parents: 6398 diff changeset	221 data[8*6 + i] = lrintf(SCALE(8*6 + i) * (tmp13 - tmp12));
2967 ef2149182f1c COSMETICS: Remove all trailing whitespace. diego parents: 2024 diff changeset	222
1571 aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	223 tmp10 = tmp4 + tmp7;
2979 bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting diego parents: 2967 diff changeset	224 tmp11 = tmp5 + tmp6;
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting diego parents: 2967 diff changeset	225 tmp12 = tmp5 - tmp6;
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting diego parents: 2967 diff changeset	226 tmp13 = tmp4 - tmp7;
1571 aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	227
2979 bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting diego parents: 2967 diff changeset	228 data[8*1 + i] = lrintf(SCALE(8*0 + i) * (tmp10 + tmp11));
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting diego parents: 2967 diff changeset	229 data[8*5 + i] = lrintf(SCALE(8*4 + i) * (tmp10 - tmp11));
1571 aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	230
6408 7af599600f2d One variable less. No real change to the actual code. michael parents: 6398 diff changeset	231 tmp12 += tmp13;
7af599600f2d One variable less. No real change to the actual code. michael parents: 6398 diff changeset	232 tmp12 *= A1;
7af599600f2d One variable less. No real change to the actual code. michael parents: 6398 diff changeset	233 data[8*3 + i] = lrintf(SCALE(8*2 + i) * (tmp13 + tmp12));
7af599600f2d One variable less. No real change to the actual code. michael parents: 6398 diff changeset	234 data[8*7 + i] = lrintf(SCALE(8*6 + i) * (tmp13 - tmp12));
1571 aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	235 }
aa4dc16c0f18 * adding integer/floating point AAN implementations for DCT 2-4-8 romansh parents: 1563 diff changeset	236 }

Mercurial > libavcodec.hg

annotate faandct.c @ 6411:5d50e8a7eb09 libavcodec