Mercurial > libavcodec.hg
annotate dsputil.c @ 12043:f9a0bd0888a4 libavcodec
mpegaudio: call ff_mpegaudiodec_init_mmx() only from float decoder
The mmx code is floating-point only, and this function does not know
from which decoder it is called. Without this change, the integer
decoder only "works" because the size of the context struct is smaller
in this case, and the mmx init function writes the function pointer
outside the allocated context.
author | mru |
---|---|
date | Thu, 01 Jul 2010 23:21:17 +0000 |
parents | fdafbcef52f5 |
children | 8b28e74de2c0 |
rev | line source |
---|---|
/*
 * DSP utils
 * Copyright (c) 2000, 2001 Fabrice Bellard
 * Copyright (c) 2002-2004 Michael Niedermayer <michaelni@gmx.at>
 *
 * gmc & q-pel & 32/64 bit based MC by Michael Niedermayer <michaelni@gmx.at>
 *
 * This file is part of FFmpeg.
 *
 * FFmpeg is free software; you can redistribute it and/or
 * modify it under the terms of the GNU Lesser General Public
 * License as published by the Free Software Foundation; either
 * version 2.1 of the License, or (at your option) any later version.
 *
 * FFmpeg is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
 * Lesser General Public License for more details.
 *
 * You should have received a copy of the GNU Lesser General Public
 * License along with FFmpeg; if not, write to the Free Software
 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
 */

/**
 * @file
 * DSP utils
 */
2967 | 29 |
0 | 30 #include "avcodec.h" |
31 #include "dsputil.h" | |
1092 | 32 #include "simple_idct.h" |
1557 | 33 #include "faandct.h" |
6407 | 34 #include "faanidct.h" |
8627
d6bab465b82c
moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents:
8596
diff
changeset
|
35 #include "mathops.h" |
10748
36611425fedb
Add required header #includes for mpegvideo.h and config.h.
diego
parents:
10644
diff
changeset
|
36 #include "mpegvideo.h" |
36611425fedb
Add required header #includes for mpegvideo.h and config.h.
diego
parents:
10644
diff
changeset
|
37 #include "config.h" |
11375
84963c795459
Move some prototypes from dsputil.c to reasonable header files
mru
parents:
11369
diff
changeset
|
38 #include "lpc.h" |
84963c795459
Move some prototypes from dsputil.c to reasonable header files
mru
parents:
11369
diff
changeset
|
39 #include "ac3dec.h" |
84963c795459
Move some prototypes from dsputil.c to reasonable header files
mru
parents:
11369
diff
changeset
|
40 #include "vorbis.h" |
84963c795459
Move some prototypes from dsputil.c to reasonable header files
mru
parents:
11369
diff
changeset
|
41 #include "png.h" |
11921 | 42 #include "vp8dsp.h" |
676 | 43 |
4176 | 44 uint8_t ff_cropTbl[256 + 2 * MAX_NEG_CROP] = {0, }; |
4179 | 45 uint32_t ff_squareTbl[512] = {0, }; |
0 | 46 |
6387 | 47 // 0x7f7f7f7f or 0x7f7f7f7f7f7f7f7f or whatever, depending on the cpu's native arithmetic size |
48 #define pb_7f (~0UL/255 * 0x7f) | |
49 #define pb_80 (~0UL/255 * 0x80) | |
6385 | 50 |
1064 | 51 const uint8_t ff_zigzag_direct[64] = { |
706
e65798d228ea
idct permutation cleanup, idct can be selected per context now
michaelni
parents:
689
diff
changeset
|
52 0, 1, 8, 16, 9, 2, 3, 10, |
e65798d228ea
idct permutation cleanup, idct can be selected per context now
michaelni
parents:
689
diff
changeset
|
53 17, 24, 32, 25, 18, 11, 4, 5, |
34 | 54 12, 19, 26, 33, 40, 48, 41, 34, |
706
e65798d228ea
idct permutation cleanup, idct can be selected per context now
michaelni
parents:
689
diff
changeset
|
55 27, 20, 13, 6, 7, 14, 21, 28, |
34 | 56 35, 42, 49, 56, 57, 50, 43, 36, |
57 29, 22, 15, 23, 30, 37, 44, 51, | |
58 58, 59, 52, 45, 38, 31, 39, 46, | |
59 53, 60, 61, 54, 47, 55, 62, 63 | |
60 }; | |
61 | |
1567 | 62 /* Specific zigzag scan for 248 idct. NOTE that unlike the |
63 specification, we interleave the fields */ | |
64 const uint8_t ff_zigzag248_direct[64] = { | |
65 0, 8, 1, 9, 16, 24, 2, 10, | |
66 17, 25, 32, 40, 48, 56, 33, 41, | |
67 18, 26, 3, 11, 4, 12, 19, 27, | |
68 34, 42, 49, 57, 50, 58, 35, 43, | |
69 20, 28, 5, 13, 6, 14, 21, 29, | |
70 36, 44, 51, 59, 52, 60, 37, 45, | |
71 22, 30, 7, 15, 23, 31, 38, 46, | |
72 53, 61, 54, 62, 39, 47, 55, 63, | |
73 }; | |
74 | |
220 | 75 /* not permutated inverse zigzag_direct + 1 for MMX quantizer */ |
11369 | 76 DECLARE_ALIGNED(16, uint16_t, inv_zigzag_direct16)[64]; |
220 | 77 |
1064 | 78 const uint8_t ff_alternate_horizontal_scan[64] = { |
2967 | 79 0, 1, 2, 3, 8, 9, 16, 17, |
34 | 80 10, 11, 4, 5, 6, 7, 15, 14, |
2967 | 81 13, 12, 19, 18, 24, 25, 32, 33, |
34 | 82 26, 27, 20, 21, 22, 23, 28, 29, |
2967 | 83 30, 31, 34, 35, 40, 41, 48, 49, |
34 | 84 42, 43, 36, 37, 38, 39, 44, 45, |
2967 | 85 46, 47, 50, 51, 56, 57, 58, 59, |
34 | 86 52, 53, 54, 55, 60, 61, 62, 63, |
87 }; | |
88 | |
1064 | 89 const uint8_t ff_alternate_vertical_scan[64] = { |
2967 | 90 0, 8, 16, 24, 1, 9, 2, 10, |
34 | 91 17, 25, 32, 40, 48, 56, 57, 49, |
2967 | 92 41, 33, 26, 18, 3, 11, 4, 12, |
34 | 93 19, 27, 34, 42, 50, 58, 35, 43, |
2967 | 94 51, 59, 20, 28, 5, 13, 6, 14, |
34 | 95 21, 29, 36, 44, 52, 60, 37, 45, |
2967 | 96 53, 61, 22, 30, 7, 15, 23, 31, |
34 | 97 38, 46, 54, 62, 39, 47, 55, 63, |
98 }; | |
99 | |
10207 | 100 /* a*inverse[b]>>32 == a/b for all 0<=a<=16909558 && 2<=b<=256 |
101 * for a>16909558, is an overestimate by less than 1 part in 1<<24 */ | |
102 const uint32_t ff_inverse[257]={ | |
2967 | 103 0, 4294967295U,2147483648U,1431655766, 1073741824, 858993460, 715827883, 613566757, |
104 536870912, 477218589, 429496730, 390451573, 357913942, 330382100, 306783379, 286331154, | |
105 268435456, 252645136, 238609295, 226050911, 214748365, 204522253, 195225787, 186737709, | |
106 178956971, 171798692, 165191050, 159072863, 153391690, 148102321, 143165577, 138547333, | |
107 134217728, 130150525, 126322568, 122713352, 119304648, 116080198, 113025456, 110127367, | |
108 107374183, 104755300, 102261127, 99882961, 97612894, 95443718, 93368855, 91382283, | |
109 89478486, 87652394, 85899346, 84215046, 82595525, 81037119, 79536432, 78090315, | |
110 76695845, 75350304, 74051161, 72796056, 71582789, 70409300, 69273667, 68174085, | |
111 67108864, 66076420, 65075263, 64103990, 63161284, 62245903, 61356676, 60492498, | |
112 59652324, 58835169, 58040099, 57266231, 56512728, 55778797, 55063684, 54366675, | |
113 53687092, 53024288, 52377650, 51746594, 51130564, 50529028, 49941481, 49367441, | |
114 48806447, 48258060, 47721859, 47197443, 46684428, 46182445, 45691142, 45210183, | |
115 44739243, 44278014, 43826197, 43383509, 42949673, 42524429, 42107523, 41698712, | |
116 41297763, 40904451, 40518560, 40139882, 39768216, 39403370, 39045158, 38693400, | |
117 38347923, 38008561, 37675152, 37347542, 37025581, 36709123, 36398028, 36092163, | |
118 35791395, 35495598, 35204650, 34918434, 34636834, 34359739, 34087043, 33818641, | |
119 33554432, 33294321, 33038210, 32786010, 32537632, 32292988, 32051995, 31814573, | |
120 31580642, 31350127, 31122952, 30899046, 30678338, 30460761, 30246249, 30034737, | |
121 29826162, 29620465, 29417585, 29217465, 29020050, 28825284, 28633116, 28443493, | |
122 28256364, 28071682, 27889399, 27709467, 27531842, 27356480, 27183338, 27012373, | |
123 26843546, 26676816, 26512144, 26349493, 26188825, 26030105, 25873297, 25718368, | |
124 25565282, 25414008, 25264514, 25116768, 24970741, 24826401, 24683721, 24542671, | |
125 24403224, 24265352, 24129030, 23994231, 23860930, 23729102, 23598722, 23469767, | |
126 23342214, 23216040, 23091223, 22967740, 22845571, 22724695, 22605092, 22486740, | |
127 22369622, 22253717, 22139007, 22025474, 21913099, 21801865, 21691755, 21582751, | |
128 21474837, 21367997, 21262215, 21157475, 21053762, 20951060, 20849356, 20748635, | |
129 20648882, 20550083, 20452226, 20355296, 20259280, 20164166, 20069941, 19976593, | |
130 19884108, 19792477, 19701685, 19611723, 19522579, 19434242, 19346700, 19259944, | |
131 19173962, 19088744, 19004281, 18920561, 18837576, 18755316, 18673771, 18592933, | |
132 18512791, 18433337, 18354562, 18276457, 18199014, 18122225, 18046082, 17970575, | |
133 17895698, 17821442, 17747799, 17674763, 17602325, 17530479, 17459217, 17388532, | |
220 | 134 17318417, 17248865, 17179870, 17111424, 17043522, 16976156, 16909321, 16843010, |
10207 | 135 16777216 |
220 | 136 }; |
137 | |
1092 | 138 /* Input permutation for the simple_idct_mmx */ |
139 static const uint8_t simple_mmx_permutation[64]={ | |
2979 | 140 0x00, 0x08, 0x04, 0x09, 0x01, 0x0C, 0x05, 0x0D, |
141 0x10, 0x18, 0x14, 0x19, 0x11, 0x1C, 0x15, 0x1D, | |
142 0x20, 0x28, 0x24, 0x29, 0x21, 0x2C, 0x25, 0x2D, | |
143 0x12, 0x1A, 0x16, 0x1B, 0x13, 0x1E, 0x17, 0x1F, | |
144 0x02, 0x0A, 0x06, 0x0B, 0x03, 0x0E, 0x07, 0x0F, | |
145 0x30, 0x38, 0x34, 0x39, 0x31, 0x3C, 0x35, 0x3D, | |
146 0x22, 0x2A, 0x26, 0x2B, 0x23, 0x2E, 0x27, 0x2F, | |
147 0x32, 0x3A, 0x36, 0x3B, 0x33, 0x3E, 0x37, 0x3F, | |
1092 | 148 }; |
149 | |
6600
c3213c91124c
Add a new IDCT permutation, used in xvid_sse2 and possibly future similar IDCTs.
astrange
parents:
6450
diff
changeset
|
150 static const uint8_t idct_sse2_row_perm[8] = {0, 4, 1, 5, 2, 6, 3, 7}; |
c3213c91124c
Add a new IDCT permutation, used in xvid_sse2 and possibly future similar IDCTs.
astrange
parents:
6450
diff
changeset
|
151 |
6438 | 152 void ff_init_scantable(uint8_t *permutation, ScanTable *st, const uint8_t *src_scantable){ |
153 int i; | |
154 int end; | |
155 | |
156 st->scantable= src_scantable; | |
157 | |
158 for(i=0; i<64; i++){ | |
159 int j; | |
160 j = src_scantable[i]; | |
161 st->permutated[i] = permutation[j]; | |
8590 | 162 #if ARCH_PPC |
6438 | 163 st->inverse[j] = i; |
164 #endif | |
165 } | |
166 | |
167 end=-1; | |
168 for(i=0; i<64; i++){ | |
169 int j; | |
170 j = st->permutated[i]; | |
171 if(j>end) end=j; | |
172 st->raster_end[i]= end; | |
173 } | |
174 } | |
175 | |
1064 | 176 static int pix_sum_c(uint8_t * pix, int line_size) |
612 | 177 { |
178 int s, i, j; | |
179 | |
180 s = 0; | |
181 for (i = 0; i < 16; i++) { | |
2979 | 182 for (j = 0; j < 16; j += 8) { |
183 s += pix[0]; | |
184 s += pix[1]; | |
185 s += pix[2]; | |
186 s += pix[3]; | |
187 s += pix[4]; | |
188 s += pix[5]; | |
189 s += pix[6]; | |
190 s += pix[7]; | |
191 pix += 8; | |
192 } | |
193 pix += line_size - 16; | |
612 | 194 } |
195 return s; | |
196 } | |
197 | |
1064 | 198 static int pix_norm1_c(uint8_t * pix, int line_size) |
612 | 199 { |
200 int s, i, j; | |
4179 | 201 uint32_t *sq = ff_squareTbl + 256; |
612 | 202 |
203 s = 0; | |
204 for (i = 0; i < 16; i++) { | |
2979 | 205 for (j = 0; j < 16; j += 8) { |
997
4dfe15ae0078
sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents:
996
diff
changeset
|
206 #if 0 |
2979 | 207 s += sq[pix[0]]; |
208 s += sq[pix[1]]; | |
209 s += sq[pix[2]]; | |
210 s += sq[pix[3]]; | |
211 s += sq[pix[4]]; | |
212 s += sq[pix[5]]; | |
213 s += sq[pix[6]]; | |
214 s += sq[pix[7]]; | |
997
4dfe15ae0078
sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents:
996
diff
changeset
|
215 #else |
4dfe15ae0078
sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents:
996
diff
changeset
|
216 #if LONG_MAX > 2147483647 |
2979 | 217 register uint64_t x=*(uint64_t*)pix; |
218 s += sq[x&0xff]; | |
219 s += sq[(x>>8)&0xff]; | |
220 s += sq[(x>>16)&0xff]; | |
221 s += sq[(x>>24)&0xff]; | |
997
4dfe15ae0078
sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents:
996
diff
changeset
|
222 s += sq[(x>>32)&0xff]; |
4dfe15ae0078
sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents:
996
diff
changeset
|
223 s += sq[(x>>40)&0xff]; |
4dfe15ae0078
sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents:
996
diff
changeset
|
224 s += sq[(x>>48)&0xff]; |
4dfe15ae0078
sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents:
996
diff
changeset
|
225 s += sq[(x>>56)&0xff]; |
4dfe15ae0078
sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents:
996
diff
changeset
|
226 #else |
2979 | 227 register uint32_t x=*(uint32_t*)pix; |
228 s += sq[x&0xff]; | |
229 s += sq[(x>>8)&0xff]; | |
230 s += sq[(x>>16)&0xff]; | |
231 s += sq[(x>>24)&0xff]; | |
997
4dfe15ae0078
sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents:
996
diff
changeset
|
232 x=*(uint32_t*)(pix+4); |
4dfe15ae0078
sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents:
996
diff
changeset
|
233 s += sq[x&0xff]; |
4dfe15ae0078
sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents:
996
diff
changeset
|
234 s += sq[(x>>8)&0xff]; |
4dfe15ae0078
sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents:
996
diff
changeset
|
235 s += sq[(x>>16)&0xff]; |
4dfe15ae0078
sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents:
996
diff
changeset
|
236 s += sq[(x>>24)&0xff]; |
4dfe15ae0078
sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents:
996
diff
changeset
|
237 #endif |
4dfe15ae0078
sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents:
996
diff
changeset
|
238 #endif |
2979 | 239 pix += 8; |
240 } | |
241 pix += line_size - 16; | |
612 | 242 } |
243 return s; | |
244 } | |
245 | |
6241 | 246 static void bswap_buf(uint32_t *dst, const uint32_t *src, int w){ |
1273 | 247 int i; |
2967 | 248 |
1273 | 249 for(i=0; i+8<=w; i+=8){ |
250 dst[i+0]= bswap_32(src[i+0]); | |
251 dst[i+1]= bswap_32(src[i+1]); | |
252 dst[i+2]= bswap_32(src[i+2]); | |
253 dst[i+3]= bswap_32(src[i+3]); | |
254 dst[i+4]= bswap_32(src[i+4]); | |
255 dst[i+5]= bswap_32(src[i+5]); | |
256 dst[i+6]= bswap_32(src[i+6]); | |
257 dst[i+7]= bswap_32(src[i+7]); | |
258 } | |
259 for(;i<w; i++){ | |
260 dst[i+0]= bswap_32(src[i+0]); | |
261 } | |
262 } | |
612 | 263 |
2184 | 264 static int sse4_c(void *v, uint8_t * pix1, uint8_t * pix2, int line_size, int h) |
265 { | |
266 int s, i; | |
4179 | 267 uint32_t *sq = ff_squareTbl + 256; |
2184 | 268 |
269 s = 0; | |
270 for (i = 0; i < h; i++) { | |
271 s += sq[pix1[0] - pix2[0]]; | |
272 s += sq[pix1[1] - pix2[1]]; | |
273 s += sq[pix1[2] - pix2[2]]; | |
274 s += sq[pix1[3] - pix2[3]]; | |
275 pix1 += line_size; | |
276 pix2 += line_size; | |
277 } | |
278 return s; | |
279 } | |
280 | |
1708 | 281 static int sse8_c(void *v, uint8_t * pix1, uint8_t * pix2, int line_size, int h) |
936 | 282 { |
283 int s, i; | |
4179 | 284 uint32_t *sq = ff_squareTbl + 256; |
936 | 285 |
286 s = 0; | |
1708 | 287 for (i = 0; i < h; i++) { |
936 | 288 s += sq[pix1[0] - pix2[0]]; |
289 s += sq[pix1[1] - pix2[1]]; | |
290 s += sq[pix1[2] - pix2[2]]; | |
291 s += sq[pix1[3] - pix2[3]]; | |
292 s += sq[pix1[4] - pix2[4]]; | |
293 s += sq[pix1[5] - pix2[5]]; | |
294 s += sq[pix1[6] - pix2[6]]; | |
295 s += sq[pix1[7] - pix2[7]]; | |
296 pix1 += line_size; | |
297 pix2 += line_size; | |
298 } | |
299 return s; | |
300 } | |
301 | |
1708 | 302 static int sse16_c(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h) |
884 | 303 { |
1012
7a5038ec769b
sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents:
1011
diff
changeset
|
304 int s, i; |
4179 | 305 uint32_t *sq = ff_squareTbl + 256; |
884 | 306 |
307 s = 0; | |
1708 | 308 for (i = 0; i < h; i++) { |
1012
7a5038ec769b
sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents:
1011
diff
changeset
|
309 s += sq[pix1[ 0] - pix2[ 0]]; |
7a5038ec769b
sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents:
1011
diff
changeset
|
310 s += sq[pix1[ 1] - pix2[ 1]]; |
7a5038ec769b
sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents:
1011
diff
changeset
|
311 s += sq[pix1[ 2] - pix2[ 2]]; |
7a5038ec769b
sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents:
1011
diff
changeset
|
312 s += sq[pix1[ 3] - pix2[ 3]]; |
7a5038ec769b
sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents:
1011
diff
changeset
|
313 s += sq[pix1[ 4] - pix2[ 4]]; |
7a5038ec769b
sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents:
1011
diff
changeset
|
314 s += sq[pix1[ 5] - pix2[ 5]]; |
7a5038ec769b
sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents:
1011
diff
changeset
|
315 s += sq[pix1[ 6] - pix2[ 6]]; |
7a5038ec769b
sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents:
1011
diff
changeset
|
316 s += sq[pix1[ 7] - pix2[ 7]]; |
7a5038ec769b
sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents:
1011
diff
changeset
|
317 s += sq[pix1[ 8] - pix2[ 8]]; |
7a5038ec769b
sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents:
1011
diff
changeset
|
318 s += sq[pix1[ 9] - pix2[ 9]]; |
7a5038ec769b
sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents:
1011
diff
changeset
|
319 s += sq[pix1[10] - pix2[10]]; |
7a5038ec769b
sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents:
1011
diff
changeset
|
320 s += sq[pix1[11] - pix2[11]]; |
7a5038ec769b
sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents:
1011
diff
changeset
|
321 s += sq[pix1[12] - pix2[12]]; |
7a5038ec769b
sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents:
1011
diff
changeset
|
322 s += sq[pix1[13] - pix2[13]]; |
7a5038ec769b
sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents:
1011
diff
changeset
|
323 s += sq[pix1[14] - pix2[14]]; |
7a5038ec769b
sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents:
1011
diff
changeset
|
324 s += sq[pix1[15] - pix2[15]]; |
997
4dfe15ae0078
sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents:
996
diff
changeset
|
325 |
1012
7a5038ec769b
sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents:
1011
diff
changeset
|
326 pix1 += line_size; |
7a5038ec769b
sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents:
1011
diff
changeset
|
327 pix2 += line_size; |
884 | 328 } |
329 return s; | |
330 } | |
331 | |
6437 | 332 /* draw the edges of width 'w' of an image of size width, height */ |
333 //FIXME check that this is ok for mpeg4 interlaced | |
334 static void draw_edges_c(uint8_t *buf, int wrap, int width, int height, int w) | |
335 { | |
336 uint8_t *ptr, *last_line; | |
337 int i; | |
338 | |
339 last_line = buf + (height - 1) * wrap; | |
340 for(i=0;i<w;i++) { | |
341 /* top and bottom */ | |
342 memcpy(buf - (i + 1) * wrap, buf, width); | |
343 memcpy(last_line + (i + 1) * wrap, last_line, width); | |
344 } | |
345 /* left and right */ | |
346 ptr = buf; | |
347 for(i=0;i<height;i++) { | |
348 memset(ptr - w, ptr[0], w); | |
349 memset(ptr + width, ptr[width-1], w); | |
350 ptr += wrap; | |
351 } | |
352 /* corners */ | |
353 for(i=0;i<w;i++) { | |
354 memset(buf - (i + 1) * wrap - w, buf[0], w); /* top left */ | |
355 memset(buf - (i + 1) * wrap + width, buf[width-1], w); /* top right */ | |
356 memset(last_line + (i + 1) * wrap - w, last_line[0], w); /* top left */ | |
357 memset(last_line + (i + 1) * wrap + width, last_line[width-1], w); /* top right */ | |
358 } | |
359 } | |
360 | |
6445 | 361 /** |
12024 | 362 * Copy a rectangular area of samples to a temporary buffer and replicate the border samples. |
6445 | 363 * @param buf destination buffer |
364 * @param src source buffer | |
365 * @param linesize number of bytes between 2 vertically adjacent samples in both the source and destination buffers | |
366 * @param block_w width of block | |
367 * @param block_h height of block | |
368 * @param src_x x coordinate of the top left sample of the block in the source buffer | |
369 * @param src_y y coordinate of the top left sample of the block in the source buffer | |
370 * @param w width of the source buffer | |
371 * @param h height of the source buffer | |
372 */ | |
11784 | 373 void ff_emulated_edge_mc(uint8_t *buf, const uint8_t *src, int linesize, int block_w, int block_h, |
6445 | 374 int src_x, int src_y, int w, int h){ |
375 int x, y; | |
376 int start_y, start_x, end_y, end_x; | |
377 | |
378 if(src_y>= h){ | |
379 src+= (h-1-src_y)*linesize; | |
380 src_y=h-1; | |
381 }else if(src_y<=-block_h){ | |
382 src+= (1-block_h-src_y)*linesize; | |
383 src_y=1-block_h; | |
384 } | |
385 if(src_x>= w){ | |
386 src+= (w-1-src_x); | |
387 src_x=w-1; | |
388 }else if(src_x<=-block_w){ | |
389 src+= (1-block_w-src_x); | |
390 src_x=1-block_w; | |
391 } | |
392 | |
393 start_y= FFMAX(0, -src_y); | |
394 start_x= FFMAX(0, -src_x); | |
395 end_y= FFMIN(block_h, h-src_y); | |
396 end_x= FFMIN(block_w, w-src_x); | |
397 | |
398 // copy existing part | |
399 for(y=start_y; y<end_y; y++){ | |
400 for(x=start_x; x<end_x; x++){ | |
401 buf[x + y*linesize]= src[x + y*linesize]; | |
402 } | |
403 } | |
404 | |
405 //top | |
406 for(y=0; y<start_y; y++){ | |
407 for(x=start_x; x<end_x; x++){ | |
408 buf[x + y*linesize]= buf[x + start_y*linesize]; | |
409 } | |
410 } | |
411 | |
412 //bottom | |
413 for(y=end_y; y<block_h; y++){ | |
414 for(x=start_x; x<end_x; x++){ | |
415 buf[x + y*linesize]= buf[x + (end_y-1)*linesize]; | |
416 } | |
417 } | |
418 | |
419 for(y=0; y<block_h; y++){ | |
420 //left | |
421 for(x=0; x<start_x; x++){ | |
422 buf[x + y*linesize]= buf[start_x + y*linesize]; | |
423 } | |
424 | |
425 //right | |
426 for(x=end_x; x<block_w; x++){ | |
427 buf[x + y*linesize]= buf[end_x - 1 + y*linesize]; | |
428 } | |
429 } | |
430 } | |
431 | |
1064 | 432 static void get_pixels_c(DCTELEM *restrict block, const uint8_t *pixels, int line_size) |
0 | 433 { |
434 int i; | |
435 | |
436 /* read the pixels */ | |
437 for(i=0;i<8;i++) { | |
516 | 438 block[0] = pixels[0]; |
439 block[1] = pixels[1]; | |
440 block[2] = pixels[2]; | |
441 block[3] = pixels[3]; | |
442 block[4] = pixels[4]; | |
443 block[5] = pixels[5]; | |
444 block[6] = pixels[6]; | |
445 block[7] = pixels[7]; | |
446 pixels += line_size; | |
447 block += 8; | |
0 | 448 } |
449 } | |
450 | |
1064 | 451 static void diff_pixels_c(DCTELEM *restrict block, const uint8_t *s1, |
2979 | 452 const uint8_t *s2, int stride){ |
324 | 453 int i; |
454 | |
455 /* read the pixels */ | |
456 for(i=0;i<8;i++) { | |
516 | 457 block[0] = s1[0] - s2[0]; |
458 block[1] = s1[1] - s2[1]; | |
459 block[2] = s1[2] - s2[2]; | |
460 block[3] = s1[3] - s2[3]; | |
461 block[4] = s1[4] - s2[4]; | |
462 block[5] = s1[5] - s2[5]; | |
463 block[6] = s1[6] - s2[6]; | |
464 block[7] = s1[7] - s2[7]; | |
324 | 465 s1 += stride; |
466 s2 += stride; | |
516 | 467 block += 8; |
324 | 468 } |
469 } | |
470 | |
471 | |
1064 | 472 static void put_pixels_clamped_c(const DCTELEM *block, uint8_t *restrict pixels, |
2979 | 473 int line_size) |
0 | 474 { |
475 int i; | |
4176 | 476 uint8_t *cm = ff_cropTbl + MAX_NEG_CROP; |
2967 | 477 |
0 | 478 /* read the pixels */ |
479 for(i=0;i<8;i++) { | |
516 | 480 pixels[0] = cm[block[0]]; |
481 pixels[1] = cm[block[1]]; | |
482 pixels[2] = cm[block[2]]; | |
483 pixels[3] = cm[block[3]]; | |
484 pixels[4] = cm[block[4]]; | |
485 pixels[5] = cm[block[5]]; | |
486 pixels[6] = cm[block[6]]; | |
487 pixels[7] = cm[block[7]]; | |
488 | |
489 pixels += line_size; | |
490 block += 8; | |
0 | 491 } |
492 } | |
493 | |
2256 | 494 static void put_pixels_clamped4_c(const DCTELEM *block, uint8_t *restrict pixels, |
2979 | 495 int line_size) |
2256 | 496 { |
497 int i; | |
4176 | 498 uint8_t *cm = ff_cropTbl + MAX_NEG_CROP; |
2967 | 499 |
2256 | 500 /* read the pixels */ |
501 for(i=0;i<4;i++) { | |
502 pixels[0] = cm[block[0]]; | |
503 pixels[1] = cm[block[1]]; | |
504 pixels[2] = cm[block[2]]; | |
505 pixels[3] = cm[block[3]]; | |
506 | |
507 pixels += line_size; | |
508 block += 8; | |
509 } | |
510 } | |
511 | |
2257 | 512 static void put_pixels_clamped2_c(const DCTELEM *block, uint8_t *restrict pixels, |
2979 | 513 int line_size) |
2257 | 514 { |
515 int i; | |
4176 | 516 uint8_t *cm = ff_cropTbl + MAX_NEG_CROP; |
2967 | 517 |
2257 | 518 /* read the pixels */ |
519 for(i=0;i<2;i++) { | |
520 pixels[0] = cm[block[0]]; | |
521 pixels[1] = cm[block[1]]; | |
522 | |
523 pixels += line_size; | |
524 block += 8; | |
525 } | |
526 } | |
527 | |
2967 | 528 static void put_signed_pixels_clamped_c(const DCTELEM *block, |
1984
ef919e9ef73e
separate out put_signed_pixels_clamped() into its own function and
melanson
parents:
1977
diff
changeset
|
529 uint8_t *restrict pixels, |
ef919e9ef73e
separate out put_signed_pixels_clamped() into its own function and
melanson
parents:
1977
diff
changeset
|
530 int line_size) |
ef919e9ef73e
separate out put_signed_pixels_clamped() into its own function and
melanson
parents:
1977
diff
changeset
|
531 { |
ef919e9ef73e
separate out put_signed_pixels_clamped() into its own function and
melanson
parents:
1977
diff
changeset
|
532 int i, j; |
ef919e9ef73e
separate out put_signed_pixels_clamped() into its own function and
melanson
parents:
1977
diff
changeset
|
533 |
ef919e9ef73e
separate out put_signed_pixels_clamped() into its own function and
melanson
parents:
1977
diff
changeset
|
534 for (i = 0; i < 8; i++) { |
ef919e9ef73e
separate out put_signed_pixels_clamped() into its own function and
melanson
parents:
1977
diff
changeset
|
535 for (j = 0; j < 8; j++) { |
ef919e9ef73e
separate out put_signed_pixels_clamped() into its own function and
melanson
parents:
1977
diff
changeset
|
536 if (*block < -128) |
ef919e9ef73e
separate out put_signed_pixels_clamped() into its own function and
melanson
parents:
1977
diff
changeset
|
537 *pixels = 0; |
ef919e9ef73e
separate out put_signed_pixels_clamped() into its own function and
melanson
parents:
1977
diff
changeset
|
538 else if (*block > 127) |
ef919e9ef73e
separate out put_signed_pixels_clamped() into its own function and
melanson
parents:
1977
diff
changeset
|
539 *pixels = 255; |
ef919e9ef73e
separate out put_signed_pixels_clamped() into its own function and
melanson
parents:
1977
diff
changeset
|
540 else |
ef919e9ef73e
separate out put_signed_pixels_clamped() into its own function and
melanson
parents:
1977
diff
changeset
|
541 *pixels = (uint8_t)(*block + 128); |
ef919e9ef73e
separate out put_signed_pixels_clamped() into its own function and
melanson
parents:
1977
diff
changeset
|
542 block++; |
ef919e9ef73e
separate out put_signed_pixels_clamped() into its own function and
melanson
parents:
1977
diff
changeset
|
543 pixels++; |
ef919e9ef73e
separate out put_signed_pixels_clamped() into its own function and
melanson
parents:
1977
diff
changeset
|
544 } |
ef919e9ef73e
separate out put_signed_pixels_clamped() into its own function and
melanson
parents:
1977
diff
changeset
|
545 pixels += (line_size - 8); |
ef919e9ef73e
separate out put_signed_pixels_clamped() into its own function and
melanson
parents:
1977
diff
changeset
|
546 } |
ef919e9ef73e
separate out put_signed_pixels_clamped() into its own function and
melanson
parents:
1977
diff
changeset
|
547 } |
ef919e9ef73e
separate out put_signed_pixels_clamped() into its own function and
melanson
parents:
1977
diff
changeset
|
548 |
11231 | 549 static void put_pixels_nonclamped_c(const DCTELEM *block, uint8_t *restrict pixels, |
550 int line_size) | |
551 { | |
552 int i; | |
553 | |
554 /* read the pixels */ | |
555 for(i=0;i<8;i++) { | |
556 pixels[0] = block[0]; | |
557 pixels[1] = block[1]; | |
558 pixels[2] = block[2]; | |
559 pixels[3] = block[3]; | |
560 pixels[4] = block[4]; | |
561 pixels[5] = block[5]; | |
562 pixels[6] = block[6]; | |
563 pixels[7] = block[7]; | |
564 | |
565 pixels += line_size; | |
566 block += 8; | |
567 } | |
568 } | |
569 | |
1064 | 570 static void add_pixels_clamped_c(const DCTELEM *block, uint8_t *restrict pixels, |
516 | 571 int line_size) |
0 | 572 { |
573 int i; | |
4176 | 574 uint8_t *cm = ff_cropTbl + MAX_NEG_CROP; |
2967 | 575 |
0 | 576 /* read the pixels */ |
577 for(i=0;i<8;i++) { | |
516 | 578 pixels[0] = cm[pixels[0] + block[0]]; |
579 pixels[1] = cm[pixels[1] + block[1]]; | |
580 pixels[2] = cm[pixels[2] + block[2]]; | |
581 pixels[3] = cm[pixels[3] + block[3]]; | |
582 pixels[4] = cm[pixels[4] + block[4]]; | |
583 pixels[5] = cm[pixels[5] + block[5]]; | |
584 pixels[6] = cm[pixels[6] + block[6]]; | |
585 pixels[7] = cm[pixels[7] + block[7]]; | |
586 pixels += line_size; | |
587 block += 8; | |
0 | 588 } |
589 } | |
2256 | 590 |
591 static void add_pixels_clamped4_c(const DCTELEM *block, uint8_t *restrict pixels, | |
592 int line_size) | |
593 { | |
594 int i; | |
4176 | 595 uint8_t *cm = ff_cropTbl + MAX_NEG_CROP; |
2967 | 596 |
2256 | 597 /* read the pixels */ |
598 for(i=0;i<4;i++) { | |
599 pixels[0] = cm[pixels[0] + block[0]]; | |
600 pixels[1] = cm[pixels[1] + block[1]]; | |
601 pixels[2] = cm[pixels[2] + block[2]]; | |
602 pixels[3] = cm[pixels[3] + block[3]]; | |
603 pixels += line_size; | |
604 block += 8; | |
605 } | |
606 } | |
2257 | 607 |
608 static void add_pixels_clamped2_c(const DCTELEM *block, uint8_t *restrict pixels, | |
609 int line_size) | |
610 { | |
611 int i; | |
4176 | 612 uint8_t *cm = ff_cropTbl + MAX_NEG_CROP; |
2967 | 613 |
2257 | 614 /* read the pixels */ |
615 for(i=0;i<2;i++) { | |
616 pixels[0] = cm[pixels[0] + block[0]]; | |
617 pixels[1] = cm[pixels[1] + block[1]]; | |
618 pixels += line_size; | |
619 block += 8; | |
620 } | |
621 } | |
2763 | 622 |
623 static void add_pixels8_c(uint8_t *restrict pixels, DCTELEM *block, int line_size) | |
624 { | |
625 int i; | |
626 for(i=0;i<8;i++) { | |
627 pixels[0] += block[0]; | |
628 pixels[1] += block[1]; | |
629 pixels[2] += block[2]; | |
630 pixels[3] += block[3]; | |
631 pixels[4] += block[4]; | |
632 pixels[5] += block[5]; | |
633 pixels[6] += block[6]; | |
634 pixels[7] += block[7]; | |
635 pixels += line_size; | |
636 block += 8; | |
637 } | |
638 } | |
639 | |
640 static void add_pixels4_c(uint8_t *restrict pixels, DCTELEM *block, int line_size) | |
641 { | |
642 int i; | |
643 for(i=0;i<4;i++) { | |
644 pixels[0] += block[0]; | |
645 pixels[1] += block[1]; | |
646 pixels[2] += block[2]; | |
647 pixels[3] += block[3]; | |
648 pixels += line_size; | |
649 block += 4; | |
650 } | |
651 } | |
652 | |
4988
689490842cf5
factor sum_abs_dctelem out of dct_sad, and simd it.
lorenm
parents:
4749
diff
changeset
|
653 static int sum_abs_dctelem_c(DCTELEM *block) |
689490842cf5
factor sum_abs_dctelem out of dct_sad, and simd it.
lorenm
parents:
4749
diff
changeset
|
654 { |
689490842cf5
factor sum_abs_dctelem out of dct_sad, and simd it.
lorenm
parents:
4749
diff
changeset
|
655 int sum=0, i; |
689490842cf5
factor sum_abs_dctelem out of dct_sad, and simd it.
lorenm
parents:
4749
diff
changeset
|
656 for(i=0; i<64; i++) |
689490842cf5
factor sum_abs_dctelem out of dct_sad, and simd it.
lorenm
parents:
4749
diff
changeset
|
657 sum+= FFABS(block[i]); |
689490842cf5
factor sum_abs_dctelem out of dct_sad, and simd it.
lorenm
parents:
4749
diff
changeset
|
658 return sum; |
689490842cf5
factor sum_abs_dctelem out of dct_sad, and simd it.
lorenm
parents:
4749
diff
changeset
|
659 } |
689490842cf5
factor sum_abs_dctelem out of dct_sad, and simd it.
lorenm
parents:
4749
diff
changeset
|
660 |
static void fill_block16_c(uint8_t *block, uint8_t value, int line_size, int h)
{
    /* Fill h rows of 16 bytes each with `value`; consecutive rows are
     * line_size bytes apart. */
    int row;

    for (row = 0; row < h; row++, block += line_size)
        memset(block, value, 16);
}
670 | |
static void fill_block8_c(uint8_t *block, uint8_t value, int line_size, int h)
{
    /* Fill h rows of 8 bytes each with `value`; consecutive rows are
     * line_size bytes apart. */
    int row;

    for (row = 0; row < h; row++, block += line_size)
        memset(block, value, 8);
}
680 | |
static void scale_block_c(const uint8_t src[64]/*align 8*/, uint8_t *dst/*align 8*/, int linesize)
{
    /* Upscale an 8x8 block to 16x16: every source pixel becomes a 2x2
     * square.  Each pair of identical output rows is written through
     * 16-bit stores; multiplying a byte by 0x0101 duplicates it into
     * both halves of the uint16_t. */
    uint16_t *row_top = (uint16_t *) dst;
    uint16_t *row_bot = (uint16_t *)(dst + linesize);
    int x, y;

    for (y = 0; y < 8; y++) {
        for (x = 0; x < 8; x++)
            row_top[x] = row_bot[x] = src[x] * 0x0101;
        src     += 8;
        row_top += linesize; /* uint16_t elements, i.e. two output rows */
        row_bot += linesize;
    }
}
696 | |
385 | 697 #if 0 |
698 | |
699 #define PIXOP2(OPNAME, OP) \ | |
651 | 700 static void OPNAME ## _pixels(uint8_t *block, const uint8_t *pixels, int line_size, int h)\ |
385 | 701 {\ |
702 int i;\ | |
703 for(i=0; i<h; i++){\ | |
5520
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
704 OP(*((uint64_t*)block), AV_RN64(pixels));\ |
385 | 705 pixels+=line_size;\ |
706 block +=line_size;\ | |
707 }\ | |
708 }\ | |
709 \ | |
859 | 710 static void OPNAME ## _no_rnd_pixels_x2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h)\ |
385 | 711 {\ |
712 int i;\ | |
713 for(i=0; i<h; i++){\ | |
5520
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
714 const uint64_t a= AV_RN64(pixels );\ |
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
715 const uint64_t b= AV_RN64(pixels+1);\ |
385 | 716 OP(*((uint64_t*)block), (a&b) + (((a^b)&0xFEFEFEFEFEFEFEFEULL)>>1));\ |
717 pixels+=line_size;\ | |
718 block +=line_size;\ | |
719 }\ | |
720 }\ | |
721 \ | |
859 | 722 static void OPNAME ## _pixels_x2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h)\ |
385 | 723 {\ |
724 int i;\ | |
725 for(i=0; i<h; i++){\ | |
5520
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
726 const uint64_t a= AV_RN64(pixels );\ |
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
727 const uint64_t b= AV_RN64(pixels+1);\ |
385 | 728 OP(*((uint64_t*)block), (a|b) - (((a^b)&0xFEFEFEFEFEFEFEFEULL)>>1));\ |
729 pixels+=line_size;\ | |
730 block +=line_size;\ | |
731 }\ | |
732 }\ | |
733 \ | |
859 | 734 static void OPNAME ## _no_rnd_pixels_y2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h)\ |
385 | 735 {\ |
736 int i;\ | |
737 for(i=0; i<h; i++){\ | |
5520
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
738 const uint64_t a= AV_RN64(pixels );\ |
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
739 const uint64_t b= AV_RN64(pixels+line_size);\ |
385 | 740 OP(*((uint64_t*)block), (a&b) + (((a^b)&0xFEFEFEFEFEFEFEFEULL)>>1));\ |
741 pixels+=line_size;\ | |
742 block +=line_size;\ | |
743 }\ | |
744 }\ | |
745 \ | |
859 | 746 static void OPNAME ## _pixels_y2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h)\ |
385 | 747 {\ |
748 int i;\ | |
749 for(i=0; i<h; i++){\ | |
5520
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
750 const uint64_t a= AV_RN64(pixels );\ |
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
751 const uint64_t b= AV_RN64(pixels+line_size);\ |
385 | 752 OP(*((uint64_t*)block), (a|b) - (((a^b)&0xFEFEFEFEFEFEFEFEULL)>>1));\ |
753 pixels+=line_size;\ | |
754 block +=line_size;\ | |
755 }\ | |
756 }\ | |
757 \ | |
859 | 758 static void OPNAME ## _pixels_xy2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h)\ |
385 | 759 {\ |
760 int i;\ | |
5520
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
761 const uint64_t a= AV_RN64(pixels );\ |
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
762 const uint64_t b= AV_RN64(pixels+1);\ |
385 | 763 uint64_t l0= (a&0x0303030303030303ULL)\ |
764 + (b&0x0303030303030303ULL)\ | |
765 + 0x0202020202020202ULL;\ | |
766 uint64_t h0= ((a&0xFCFCFCFCFCFCFCFCULL)>>2)\ | |
767 + ((b&0xFCFCFCFCFCFCFCFCULL)>>2);\ | |
768 uint64_t l1,h1;\ | |
769 \ | |
770 pixels+=line_size;\ | |
771 for(i=0; i<h; i+=2){\ | |
5520
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
772 uint64_t a= AV_RN64(pixels );\ |
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
773 uint64_t b= AV_RN64(pixels+1);\ |
385 | 774 l1= (a&0x0303030303030303ULL)\ |
775 + (b&0x0303030303030303ULL);\ | |
776 h1= ((a&0xFCFCFCFCFCFCFCFCULL)>>2)\ | |
777 + ((b&0xFCFCFCFCFCFCFCFCULL)>>2);\ | |
778 OP(*((uint64_t*)block), h0+h1+(((l0+l1)>>2)&0x0F0F0F0F0F0F0F0FULL));\ | |
779 pixels+=line_size;\ | |
780 block +=line_size;\ | |
5520
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
781 a= AV_RN64(pixels );\ |
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
782 b= AV_RN64(pixels+1);\ |
385 | 783 l0= (a&0x0303030303030303ULL)\ |
784 + (b&0x0303030303030303ULL)\ | |
785 + 0x0202020202020202ULL;\ | |
786 h0= ((a&0xFCFCFCFCFCFCFCFCULL)>>2)\ | |
787 + ((b&0xFCFCFCFCFCFCFCFCULL)>>2);\ | |
788 OP(*((uint64_t*)block), h0+h1+(((l0+l1)>>2)&0x0F0F0F0F0F0F0F0FULL));\ | |
789 pixels+=line_size;\ | |
790 block +=line_size;\ | |
791 }\ | |
792 }\ | |
793 \ | |
859 | 794 static void OPNAME ## _no_rnd_pixels_xy2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h)\ |
385 | 795 {\ |
796 int i;\ | |
5520
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
797 const uint64_t a= AV_RN64(pixels );\ |
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
798 const uint64_t b= AV_RN64(pixels+1);\ |
385 | 799 uint64_t l0= (a&0x0303030303030303ULL)\ |
800 + (b&0x0303030303030303ULL)\ | |
801 + 0x0101010101010101ULL;\ | |
802 uint64_t h0= ((a&0xFCFCFCFCFCFCFCFCULL)>>2)\ | |
803 + ((b&0xFCFCFCFCFCFCFCFCULL)>>2);\ | |
804 uint64_t l1,h1;\ | |
805 \ | |
806 pixels+=line_size;\ | |
807 for(i=0; i<h; i+=2){\ | |
5520
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
808 uint64_t a= AV_RN64(pixels );\ |
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
809 uint64_t b= AV_RN64(pixels+1);\ |
385 | 810 l1= (a&0x0303030303030303ULL)\ |
811 + (b&0x0303030303030303ULL);\ | |
812 h1= ((a&0xFCFCFCFCFCFCFCFCULL)>>2)\ | |
813 + ((b&0xFCFCFCFCFCFCFCFCULL)>>2);\ | |
814 OP(*((uint64_t*)block), h0+h1+(((l0+l1)>>2)&0x0F0F0F0F0F0F0F0FULL));\ | |
815 pixels+=line_size;\ | |
816 block +=line_size;\ | |
5520
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
817 a= AV_RN64(pixels );\ |
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
818 b= AV_RN64(pixels+1);\ |
385 | 819 l0= (a&0x0303030303030303ULL)\ |
820 + (b&0x0303030303030303ULL)\ | |
821 + 0x0101010101010101ULL;\ | |
822 h0= ((a&0xFCFCFCFCFCFCFCFCULL)>>2)\ | |
823 + ((b&0xFCFCFCFCFCFCFCFCULL)>>2);\ | |
824 OP(*((uint64_t*)block), h0+h1+(((l0+l1)>>2)&0x0F0F0F0F0F0F0F0FULL));\ | |
825 pixels+=line_size;\ | |
826 block +=line_size;\ | |
827 }\ | |
828 }\ | |
829 \ | |
859 | 830 CALL_2X_PIXELS(OPNAME ## _pixels16_c , OPNAME ## _pixels_c , 8)\ |
831 CALL_2X_PIXELS(OPNAME ## _pixels16_x2_c , OPNAME ## _pixels_x2_c , 8)\ | |
832 CALL_2X_PIXELS(OPNAME ## _pixels16_y2_c , OPNAME ## _pixels_y2_c , 8)\ | |
833 CALL_2X_PIXELS(OPNAME ## _pixels16_xy2_c, OPNAME ## _pixels_xy2_c, 8)\ | |
834 CALL_2X_PIXELS(OPNAME ## _no_rnd_pixels16_x2_c , OPNAME ## _no_rnd_pixels_x2_c , 8)\ | |
835 CALL_2X_PIXELS(OPNAME ## _no_rnd_pixels16_y2_c , OPNAME ## _no_rnd_pixels_y2_c , 8)\ | |
836 CALL_2X_PIXELS(OPNAME ## _no_rnd_pixels16_xy2_c, OPNAME ## _no_rnd_pixels_xy2_c, 8) | |
385 | 837 |
838 #define op_avg(a, b) a = ( ((a)|(b)) - ((((a)^(b))&0xFEFEFEFEFEFEFEFEULL)>>1) ) | |
839 #else // 64 bit variant | |
840 | |
841 #define PIXOP2(OPNAME, OP) \ | |
1267
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
842 static void OPNAME ## _pixels2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h){\ |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
843 int i;\ |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
844 for(i=0; i<h; i++){\ |
5520
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
845 OP(*((uint16_t*)(block )), AV_RN16(pixels ));\ |
1267
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
846 pixels+=line_size;\ |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
847 block +=line_size;\ |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
848 }\ |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
849 }\ |
1168 | 850 static void OPNAME ## _pixels4_c(uint8_t *block, const uint8_t *pixels, int line_size, int h){\ |
851 int i;\ | |
852 for(i=0; i<h; i++){\ | |
5520
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
853 OP(*((uint32_t*)(block )), AV_RN32(pixels ));\ |
1168 | 854 pixels+=line_size;\ |
855 block +=line_size;\ | |
856 }\ | |
857 }\ | |
859 | 858 static void OPNAME ## _pixels8_c(uint8_t *block, const uint8_t *pixels, int line_size, int h){\ |
385 | 859 int i;\ |
860 for(i=0; i<h; i++){\ | |
5520
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
861 OP(*((uint32_t*)(block )), AV_RN32(pixels ));\ |
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
862 OP(*((uint32_t*)(block+4)), AV_RN32(pixels+4));\ |
385 | 863 pixels+=line_size;\ |
864 block +=line_size;\ | |
865 }\ | |
866 }\ | |
859 | 867 static inline void OPNAME ## _no_rnd_pixels8_c(uint8_t *block, const uint8_t *pixels, int line_size, int h){\ |
868 OPNAME ## _pixels8_c(block, pixels, line_size, h);\ | |
651 | 869 }\ |
385 | 870 \ |
651 | 871 static inline void OPNAME ## _no_rnd_pixels8_l2(uint8_t *dst, const uint8_t *src1, const uint8_t *src2, int dst_stride, \ |
872 int src_stride1, int src_stride2, int h){\ | |
385 | 873 int i;\ |
874 for(i=0; i<h; i++){\ | |
651 | 875 uint32_t a,b;\ |
5520
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
876 a= AV_RN32(&src1[i*src_stride1 ]);\ |
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
877 b= AV_RN32(&src2[i*src_stride2 ]);\ |
1264 | 878 OP(*((uint32_t*)&dst[i*dst_stride ]), no_rnd_avg32(a, b));\ |
5520
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
879 a= AV_RN32(&src1[i*src_stride1+4]);\ |
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
880 b= AV_RN32(&src2[i*src_stride2+4]);\ |
1264 | 881 OP(*((uint32_t*)&dst[i*dst_stride+4]), no_rnd_avg32(a, b));\ |
385 | 882 }\ |
883 }\ | |
884 \ | |
651 | 885 static inline void OPNAME ## _pixels8_l2(uint8_t *dst, const uint8_t *src1, const uint8_t *src2, int dst_stride, \ |
886 int src_stride1, int src_stride2, int h){\ | |
385 | 887 int i;\ |
888 for(i=0; i<h; i++){\ | |
651 | 889 uint32_t a,b;\ |
5520
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
890 a= AV_RN32(&src1[i*src_stride1 ]);\ |
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
891 b= AV_RN32(&src2[i*src_stride2 ]);\ |
1264 | 892 OP(*((uint32_t*)&dst[i*dst_stride ]), rnd_avg32(a, b));\ |
5520
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
893 a= AV_RN32(&src1[i*src_stride1+4]);\ |
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
894 b= AV_RN32(&src2[i*src_stride2+4]);\ |
1264 | 895 OP(*((uint32_t*)&dst[i*dst_stride+4]), rnd_avg32(a, b));\ |
385 | 896 }\ |
897 }\ | |
898 \ | |
1168 | 899 static inline void OPNAME ## _pixels4_l2(uint8_t *dst, const uint8_t *src1, const uint8_t *src2, int dst_stride, \ |
900 int src_stride1, int src_stride2, int h){\ | |
901 int i;\ | |
902 for(i=0; i<h; i++){\ | |
903 uint32_t a,b;\ | |
5520
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
904 a= AV_RN32(&src1[i*src_stride1 ]);\ |
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
905 b= AV_RN32(&src2[i*src_stride2 ]);\ |
1264 | 906 OP(*((uint32_t*)&dst[i*dst_stride ]), rnd_avg32(a, b));\ |
1168 | 907 }\ |
908 }\ | |
909 \ | |
1267
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
910 static inline void OPNAME ## _pixels2_l2(uint8_t *dst, const uint8_t *src1, const uint8_t *src2, int dst_stride, \ |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
911 int src_stride1, int src_stride2, int h){\ |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
912 int i;\ |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
913 for(i=0; i<h; i++){\ |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
914 uint32_t a,b;\ |
5520
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
915 a= AV_RN16(&src1[i*src_stride1 ]);\ |
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
916 b= AV_RN16(&src2[i*src_stride2 ]);\ |
1267
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
917 OP(*((uint16_t*)&dst[i*dst_stride ]), rnd_avg32(a, b));\ |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
918 }\ |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
919 }\ |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
920 \ |
651 | 921 static inline void OPNAME ## _pixels16_l2(uint8_t *dst, const uint8_t *src1, const uint8_t *src2, int dst_stride, \ |
922 int src_stride1, int src_stride2, int h){\ | |
923 OPNAME ## _pixels8_l2(dst , src1 , src2 , dst_stride, src_stride1, src_stride2, h);\ | |
924 OPNAME ## _pixels8_l2(dst+8, src1+8, src2+8, dst_stride, src_stride1, src_stride2, h);\ | |
925 }\ | |
926 \ | |
927 static inline void OPNAME ## _no_rnd_pixels16_l2(uint8_t *dst, const uint8_t *src1, const uint8_t *src2, int dst_stride, \ | |
928 int src_stride1, int src_stride2, int h){\ | |
929 OPNAME ## _no_rnd_pixels8_l2(dst , src1 , src2 , dst_stride, src_stride1, src_stride2, h);\ | |
930 OPNAME ## _no_rnd_pixels8_l2(dst+8, src1+8, src2+8, dst_stride, src_stride1, src_stride2, h);\ | |
931 }\ | |
932 \ | |
859 | 933 static inline void OPNAME ## _no_rnd_pixels8_x2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h){\ |
651 | 934 OPNAME ## _no_rnd_pixels8_l2(block, pixels, pixels+1, line_size, line_size, line_size, h);\ |
935 }\ | |
936 \ | |
859 | 937 static inline void OPNAME ## _pixels8_x2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h){\ |
651 | 938 OPNAME ## _pixels8_l2(block, pixels, pixels+1, line_size, line_size, line_size, h);\ |
939 }\ | |
940 \ | |
859 | 941 static inline void OPNAME ## _no_rnd_pixels8_y2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h){\ |
651 | 942 OPNAME ## _no_rnd_pixels8_l2(block, pixels, pixels+line_size, line_size, line_size, line_size, h);\ |
943 }\ | |
944 \ | |
859 | 945 static inline void OPNAME ## _pixels8_y2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h){\ |
651 | 946 OPNAME ## _pixels8_l2(block, pixels, pixels+line_size, line_size, line_size, line_size, h);\ |
385 | 947 }\ |
948 \ | |
11783 | 949 static inline void OPNAME ## _pixels8_l4(uint8_t *dst, const uint8_t *src1, const uint8_t *src2, const uint8_t *src3, const uint8_t *src4,\ |
651 | 950 int dst_stride, int src_stride1, int src_stride2,int src_stride3,int src_stride4, int h){\ |
951 int i;\ | |
952 for(i=0; i<h; i++){\ | |
953 uint32_t a, b, c, d, l0, l1, h0, h1;\ | |
5520
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
954 a= AV_RN32(&src1[i*src_stride1]);\ |
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
955 b= AV_RN32(&src2[i*src_stride2]);\ |
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
956 c= AV_RN32(&src3[i*src_stride3]);\ |
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
957 d= AV_RN32(&src4[i*src_stride4]);\ |
651 | 958 l0= (a&0x03030303UL)\ |
959 + (b&0x03030303UL)\ | |
960 + 0x02020202UL;\ | |
961 h0= ((a&0xFCFCFCFCUL)>>2)\ | |
962 + ((b&0xFCFCFCFCUL)>>2);\ | |
963 l1= (c&0x03030303UL)\ | |
964 + (d&0x03030303UL);\ | |
965 h1= ((c&0xFCFCFCFCUL)>>2)\ | |
966 + ((d&0xFCFCFCFCUL)>>2);\ | |
967 OP(*((uint32_t*)&dst[i*dst_stride]), h0+h1+(((l0+l1)>>2)&0x0F0F0F0FUL));\ | |
5520
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
968 a= AV_RN32(&src1[i*src_stride1+4]);\ |
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
969 b= AV_RN32(&src2[i*src_stride2+4]);\ |
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
970 c= AV_RN32(&src3[i*src_stride3+4]);\ |
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
971 d= AV_RN32(&src4[i*src_stride4+4]);\ |
651 | 972 l0= (a&0x03030303UL)\ |
973 + (b&0x03030303UL)\ | |
974 + 0x02020202UL;\ | |
975 h0= ((a&0xFCFCFCFCUL)>>2)\ | |
976 + ((b&0xFCFCFCFCUL)>>2);\ | |
977 l1= (c&0x03030303UL)\ | |
978 + (d&0x03030303UL);\ | |
979 h1= ((c&0xFCFCFCFCUL)>>2)\ | |
980 + ((d&0xFCFCFCFCUL)>>2);\ | |
981 OP(*((uint32_t*)&dst[i*dst_stride+4]), h0+h1+(((l0+l1)>>2)&0x0F0F0F0FUL));\ | |
982 }\ | |
983 }\ | |
1267
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
984 \ |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
985 static inline void OPNAME ## _pixels4_x2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h){\ |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
986 OPNAME ## _pixels4_l2(block, pixels, pixels+1, line_size, line_size, line_size, h);\ |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
987 }\ |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
988 \ |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
989 static inline void OPNAME ## _pixels4_y2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h){\ |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
990 OPNAME ## _pixels4_l2(block, pixels, pixels+line_size, line_size, line_size, line_size, h);\ |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
991 }\ |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
992 \ |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
993 static inline void OPNAME ## _pixels2_x2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h){\ |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
994 OPNAME ## _pixels2_l2(block, pixels, pixels+1, line_size, line_size, line_size, h);\ |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
995 }\ |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
996 \ |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
997 static inline void OPNAME ## _pixels2_y2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h){\ |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
998 OPNAME ## _pixels2_l2(block, pixels, pixels+line_size, line_size, line_size, line_size, h);\ |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
999 }\ |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
1000 \ |
11783 | 1001 static inline void OPNAME ## _no_rnd_pixels8_l4(uint8_t *dst, const uint8_t *src1, const uint8_t *src2, const uint8_t *src3, const uint8_t *src4,\ |
651 | 1002 int dst_stride, int src_stride1, int src_stride2,int src_stride3,int src_stride4, int h){\ |
385 | 1003 int i;\ |
1004 for(i=0; i<h; i++){\ | |
651 | 1005 uint32_t a, b, c, d, l0, l1, h0, h1;\ |
5520
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
1006 a= AV_RN32(&src1[i*src_stride1]);\ |
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
1007 b= AV_RN32(&src2[i*src_stride2]);\ |
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
1008 c= AV_RN32(&src3[i*src_stride3]);\ |
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
1009 d= AV_RN32(&src4[i*src_stride4]);\ |
651 | 1010 l0= (a&0x03030303UL)\ |
1011 + (b&0x03030303UL)\ | |
1012 + 0x01010101UL;\ | |
1013 h0= ((a&0xFCFCFCFCUL)>>2)\ | |
1014 + ((b&0xFCFCFCFCUL)>>2);\ | |
1015 l1= (c&0x03030303UL)\ | |
1016 + (d&0x03030303UL);\ | |
1017 h1= ((c&0xFCFCFCFCUL)>>2)\ | |
1018 + ((d&0xFCFCFCFCUL)>>2);\ | |
1019 OP(*((uint32_t*)&dst[i*dst_stride]), h0+h1+(((l0+l1)>>2)&0x0F0F0F0FUL));\ | |
5520
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
1020 a= AV_RN32(&src1[i*src_stride1+4]);\ |
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
1021 b= AV_RN32(&src2[i*src_stride2+4]);\ |
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
1022 c= AV_RN32(&src3[i*src_stride3+4]);\ |
c16a59ef6a86
* renaming (ST|LD)(16|32|64) -> AV_(R|W)N(16|32|64)
romansh
parents:
5411
diff
changeset
|
1023 d= AV_RN32(&src4[i*src_stride4+4]);\ |
651 | 1024 l0= (a&0x03030303UL)\ |
1025 + (b&0x03030303UL)\ | |
1026 + 0x01010101UL;\ | |
1027 h0= ((a&0xFCFCFCFCUL)>>2)\ | |
1028 + ((b&0xFCFCFCFCUL)>>2);\ | |
1029 l1= (c&0x03030303UL)\ | |
1030 + (d&0x03030303UL);\ | |
1031 h1= ((c&0xFCFCFCFCUL)>>2)\ | |
1032 + ((d&0xFCFCFCFCUL)>>2);\ | |
1033 OP(*((uint32_t*)&dst[i*dst_stride+4]), h0+h1+(((l0+l1)>>2)&0x0F0F0F0FUL));\ | |
385 | 1034 }\ |
1035 }\ | |
11783 | 1036 static inline void OPNAME ## _pixels16_l4(uint8_t *dst, const uint8_t *src1, const uint8_t *src2, const uint8_t *src3, const uint8_t *src4,\ |
651 | 1037 int dst_stride, int src_stride1, int src_stride2,int src_stride3,int src_stride4, int h){\ |
1038 OPNAME ## _pixels8_l4(dst , src1 , src2 , src3 , src4 , dst_stride, src_stride1, src_stride2, src_stride3, src_stride4, h);\ | |
1039 OPNAME ## _pixels8_l4(dst+8, src1+8, src2+8, src3+8, src4+8, dst_stride, src_stride1, src_stride2, src_stride3, src_stride4, h);\ | |
1040 }\ | |
11783 | 1041 static inline void OPNAME ## _no_rnd_pixels16_l4(uint8_t *dst, const uint8_t *src1, const uint8_t *src2, const uint8_t *src3, const uint8_t *src4,\ |
651 | 1042 int dst_stride, int src_stride1, int src_stride2,int src_stride3,int src_stride4, int h){\ |
1043 OPNAME ## _no_rnd_pixels8_l4(dst , src1 , src2 , src3 , src4 , dst_stride, src_stride1, src_stride2, src_stride3, src_stride4, h);\ | |
1044 OPNAME ## _no_rnd_pixels8_l4(dst+8, src1+8, src2+8, src3+8, src4+8, dst_stride, src_stride1, src_stride2, src_stride3, src_stride4, h);\ | |
1045 }\ | |
385 | 1046 \ |
1267
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
/*
 * OPNAME ## _pixels2_xy2_c(): 2-pixel-wide half-pel interpolation in both
 * x and y.  Each output is OP'd with
 *     (p[x] + p[x+1] + p[x+line_size] + p[x+line_size+1] + 2) >> 2.
 * The loop handles two rows per iteration so the horizontal pair sums of
 * the shared middle row (a0/b0 vs a1/b1) are reused rather than reloaded.
 * NOTE(review): the "+ 2" rounding bias lives only in the a0/b0 pair, so
 * it is applied exactly once per output pixel.
 */\
static inline void OPNAME ## _pixels2_xy2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h)\
{\
        int i, a0, b0, a1, b1;\
        a0= pixels[0];\
        b0= pixels[1] + 2; /* carries the rounding bias */\
        a0 += b0;\
        b0 += pixels[2];\
\
        pixels+=line_size;\
        for(i=0; i<h; i+=2){\
            a1= pixels[0];\
            b1= pixels[1];\
            a1 += b1;\
            b1 += pixels[2];\
\
            block[0]= (a1+a0)>>2; /* FIXME non put */\
            block[1]= (b1+b0)>>2;\
\
            pixels+=line_size;\
            block +=line_size;\
\
            a0= pixels[0];\
            b0= pixels[1] + 2;\
            a0 += b0;\
            b0 += pixels[2];\
\
            block[0]= (a1+a0)>>2;\
            block[1]= (b1+b0)>>2;\
            pixels+=line_size;\
            block +=line_size;\
        }\
}\
\
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
/*
 * OPNAME ## _pixels4_xy2_c(): 4-pixel-wide half-pel interpolation in both
 * directions, processing 4 bytes at a time in one 32-bit word.
 * Each byte's low 2 bits (l0/l1) and high 6 bits (h0/h1) are summed
 * separately so per-byte carries cannot cross into the neighbour byte;
 * the 0x02020202 term is the per-byte rounding bias.  Two rows are
 * produced per iteration so the shared row sums are computed once.
 */\
static inline void OPNAME ## _pixels4_xy2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h)\
{\
        int i;\
        const uint32_t a= AV_RN32(pixels  );\
        const uint32_t b= AV_RN32(pixels+1);\
        uint32_t l0=  (a&0x03030303UL)\
                    + (b&0x03030303UL)\
                    + 0x02020202UL;\
        uint32_t h0= ((a&0xFCFCFCFCUL)>>2)\
                   + ((b&0xFCFCFCFCUL)>>2);\
        uint32_t l1,h1;\
\
        pixels+=line_size;\
        for(i=0; i<h; i+=2){\
            uint32_t a= AV_RN32(pixels  );\
            uint32_t b= AV_RN32(pixels+1);\
            l1=  (a&0x03030303UL)\
               + (b&0x03030303UL);\
            h1= ((a&0xFCFCFCFCUL)>>2)\
              + ((b&0xFCFCFCFCUL)>>2);\
            OP(*((uint32_t*)block), h0+h1+(((l0+l1)>>2)&0x0F0F0F0FUL));\
            pixels+=line_size;\
            block +=line_size;\
            a= AV_RN32(pixels  );\
            b= AV_RN32(pixels+1);\
            l0=  (a&0x03030303UL)\
               + (b&0x03030303UL)\
               + 0x02020202UL;\
            h0= ((a&0xFCFCFCFCUL)>>2)\
              + ((b&0xFCFCFCFCUL)>>2);\
            OP(*((uint32_t*)block), h0+h1+(((l0+l1)>>2)&0x0F0F0F0FUL));\
            pixels+=line_size;\
            block +=line_size;\
        }\
}\
\
/*
 * OPNAME ## _pixels8_xy2_c(): 8-pixel-wide half-pel x/y interpolation,
 * done as two independent 4-byte columns (j loop).  Same low-bits /
 * high-bits split as the 4-wide variant; 0x02020202 is the per-byte
 * rounding bias.  After each column the pointers are rewound to the top
 * and advanced 4 bytes right: pixels+=4-line_size*(h+1) undoes h+1 row
 * steps (the extra one from the priming load before the loop), while
 * block only stepped h rows.
 */\
static inline void OPNAME ## _pixels8_xy2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h)\
{\
    int j;\
    for(j=0; j<2; j++){\
        int i;\
        const uint32_t a= AV_RN32(pixels  );\
        const uint32_t b= AV_RN32(pixels+1);\
        uint32_t l0=  (a&0x03030303UL)\
                    + (b&0x03030303UL)\
                    + 0x02020202UL;\
        uint32_t h0= ((a&0xFCFCFCFCUL)>>2)\
                   + ((b&0xFCFCFCFCUL)>>2);\
        uint32_t l1,h1;\
\
        pixels+=line_size;\
        for(i=0; i<h; i+=2){\
            uint32_t a= AV_RN32(pixels  );\
            uint32_t b= AV_RN32(pixels+1);\
            l1=  (a&0x03030303UL)\
               + (b&0x03030303UL);\
            h1= ((a&0xFCFCFCFCUL)>>2)\
              + ((b&0xFCFCFCFCUL)>>2);\
            OP(*((uint32_t*)block), h0+h1+(((l0+l1)>>2)&0x0F0F0F0FUL));\
            pixels+=line_size;\
            block +=line_size;\
            a= AV_RN32(pixels  );\
            b= AV_RN32(pixels+1);\
            l0=  (a&0x03030303UL)\
               + (b&0x03030303UL)\
               + 0x02020202UL;\
            h0= ((a&0xFCFCFCFCUL)>>2)\
              + ((b&0xFCFCFCFCUL)>>2);\
            OP(*((uint32_t*)block), h0+h1+(((l0+l1)>>2)&0x0F0F0F0FUL));\
            pixels+=line_size;\
            block +=line_size;\
        }\
        pixels+=4-line_size*(h+1);\
        block +=4-line_size*h;\
    }\
}\
\
/*
 * OPNAME ## _no_rnd_pixels8_xy2_c(): identical structure to
 * OPNAME ## _pixels8_xy2_c, but with the "no rounding" bias 0x01010101
 * instead of 0x02020202, i.e. (a+b+c+d+1)>>2 per pixel as required by
 * the no_rnd motion-compensation variants.
 */\
static inline void OPNAME ## _no_rnd_pixels8_xy2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h)\
{\
    int j;\
    for(j=0; j<2; j++){\
        int i;\
        const uint32_t a= AV_RN32(pixels  );\
        const uint32_t b= AV_RN32(pixels+1);\
        uint32_t l0=  (a&0x03030303UL)\
                    + (b&0x03030303UL)\
                    + 0x01010101UL;\
        uint32_t h0= ((a&0xFCFCFCFCUL)>>2)\
                   + ((b&0xFCFCFCFCUL)>>2);\
        uint32_t l1,h1;\
\
        pixels+=line_size;\
        for(i=0; i<h; i+=2){\
            uint32_t a= AV_RN32(pixels  );\
            uint32_t b= AV_RN32(pixels+1);\
            l1=  (a&0x03030303UL)\
               + (b&0x03030303UL);\
            h1= ((a&0xFCFCFCFCUL)>>2)\
              + ((b&0xFCFCFCFCUL)>>2);\
            OP(*((uint32_t*)block), h0+h1+(((l0+l1)>>2)&0x0F0F0F0FUL));\
            pixels+=line_size;\
            block +=line_size;\
            a= AV_RN32(pixels  );\
            b= AV_RN32(pixels+1);\
            l0=  (a&0x03030303UL)\
               + (b&0x03030303UL)\
               + 0x01010101UL;\
            h0= ((a&0xFCFCFCFCUL)>>2)\
              + ((b&0xFCFCFCFCUL)>>2);\
            OP(*((uint32_t*)block), h0+h1+(((l0+l1)>>2)&0x0F0F0F0FUL));\
            pixels+=line_size;\
            block +=line_size;\
        }\
        pixels+=4-line_size*(h+1);\
        block +=4-line_size*h;\
    }\
}\
\
/* 16-pixel-wide variants: run the 8-wide kernel on both halves. */\
CALL_2X_PIXELS(OPNAME ## _pixels16_c  , OPNAME ## _pixels8_c  , 8)\
CALL_2X_PIXELS(OPNAME ## _pixels16_x2_c , OPNAME ## _pixels8_x2_c , 8)\
CALL_2X_PIXELS(OPNAME ## _pixels16_y2_c , OPNAME ## _pixels8_y2_c , 8)\
CALL_2X_PIXELS(OPNAME ## _pixels16_xy2_c, OPNAME ## _pixels8_xy2_c, 8)\
CALL_2X_PIXELS(OPNAME ## _no_rnd_pixels16_c  , OPNAME ## _pixels8_c  , 8)\
CALL_2X_PIXELS(OPNAME ## _no_rnd_pixels16_x2_c , OPNAME ## _no_rnd_pixels8_x2_c , 8)\
CALL_2X_PIXELS(OPNAME ## _no_rnd_pixels16_y2_c , OPNAME ## _no_rnd_pixels8_y2_c , 8)\
CALL_2X_PIXELS(OPNAME ## _no_rnd_pixels16_xy2_c, OPNAME ## _no_rnd_pixels8_xy2_c, 8)\

#define op_avg(a, b) a = rnd_avg32(a, b)
/* NOTE(review): this #endif closes a conditional opened before this chunk
 * (32/64-bit word-size selection) -- confirm against the full file. */
#endif
#define op_put(a, b) a = b

/* Instantiate the whole PIXOP2 family for averaging and plain stores. */
PIXOP2(avg, op_avg)
PIXOP2(put, op_put)
#undef op_avg
#undef op_put

/* Rounding scalar averages used by the pel-interpolation helpers below. */
#define avg2(a,b) ((a+b+1)>>1)
#define avg4(a,b,c,d) ((a+b+c+d+2)>>2)
1218 | |
/* 16-wide no-rounding average of two sources into dst; thin wrapper that
 * uses the same stride for dst and both inputs. */
static void put_no_rnd_pixels16_l2_c(uint8_t *dst, const uint8_t *a, const uint8_t *b, int stride, int h){
    put_no_rnd_pixels16_l2(dst, a, b, stride, stride, stride, h);
}
1222 | |
/* 8-wide no-rounding average of two sources into dst; thin wrapper that
 * uses the same stride for dst and both inputs. */
static void put_no_rnd_pixels8_l2_c(uint8_t *dst, const uint8_t *a, const uint8_t *b, int stride, int h){
    put_no_rnd_pixels8_l2(dst, a, b, stride, stride, stride, h);
}
753 | 1226 |
/*
 * One-point global motion compensation (1/16-pel bilinear) over an
 * 8-pixel-wide block of height h.
 *
 * x16/y16 are the fractional positions in 1/16ths; the four corner
 * weights A..D sum to 256, so the weighted sum is renormalised with >>8
 * after adding the caller-supplied rounder.
 */
static void gmc1_c(uint8_t *dst, uint8_t *src, int stride, int h, int x16, int y16, int rounder)
{
    const int A = (16 - x16) * (16 - y16);
    const int B = (     x16) * (16 - y16);
    const int C = (16 - x16) * (     y16);
    const int D = (     x16) * (     y16);
    int y;

    for (y = 0; y < h; y++) {
        int x;
        /* bilinear blend of the 2x2 neighbourhood around each pixel */
        for (x = 0; x < 8; x++)
            dst[x] = (A * src[x]          + B * src[x + 1]
                    + C * src[stride + x] + D * src[stride + x + 1]
                    + rounder) >> 8;
        dst += stride;
        src += stride;
    }
}
1249 | |
3248
7aa9f80e7954
mmx implementation of 3-point GMC. (5x faster than C)
lorenm
parents:
3245
diff
changeset
|
/*
 * Affine global motion compensation for one 8-pixel-wide row band.
 *
 * (ox,oy) is the fixed-point source position of the first pixel and
 * (dxx,dxy,dyx,dyy) the per-pixel / per-row increments of the affine
 * transform; shift selects the sub-pel precision (s = 1<<shift steps),
 * r is the rounding constant, and width/height bound the valid source
 * area (pixels sampled outside are clamped to the edge via av_clip,
 * dropping the interpolation in the clamped direction).
 *
 * NOTE(review): frac_x/frac_y are extracted from vx>>16 / vy>>16 BEFORE
 * the >>shift, i.e. the low `shift` bits of that value -- this is the
 * historical fixed-point layout of the GMC vectors; do not "fix".
 */
void ff_gmc_c(uint8_t *dst, uint8_t *src, int stride, int h, int ox, int oy,
              int dxx, int dxy, int dyx, int dyy, int shift, int r, int width, int height)
{
    int y, vx, vy;
    const int s= 1<<shift;

    width--;   /* from now on width/height are the last valid coordinates */
    height--;

    for(y=0; y<h; y++){
        int x;

        vx= ox;
        vy= oy;
        for(x=0; x<8; x++){ //XXX FIXME optimize
            int src_x, src_y, frac_x, frac_y, index;

            src_x= vx>>16;
            src_y= vy>>16;
            frac_x= src_x&(s-1);
            frac_y= src_y&(s-1);
            src_x>>=shift;
            src_y>>=shift;

            /* unsigned compare doubles as a "0 <= v < bound" test */
            if((unsigned)src_x < width){
                if((unsigned)src_y < height){
                    /* fully inside: 2-D bilinear interpolation */
                    index= src_x + src_y*stride;
                    dst[y*stride + x]= ( (  src[index         ]*(s-frac_x)
                                          + src[index       +1]*   frac_x )*(s-frac_y)
                                       + (  src[index+stride  ]*(s-frac_x)
                                          + src[index+stride+1]*   frac_x )*   frac_y
                                       + r)>>(shift*2);
                }else{
                    /* vertically outside: clamp y, interpolate in x only */
                    index= src_x + av_clip(src_y, 0, height)*stride;
                    dst[y*stride + x]= ( (  src[index         ]*(s-frac_x)
                                          + src[index       +1]*   frac_x )*s
                                       + r)>>(shift*2);
                }
            }else{
                if((unsigned)src_y < height){
                    /* horizontally outside: clamp x, interpolate in y only */
                    index= av_clip(src_x, 0, width) + src_y*stride;
                    dst[y*stride + x]= ( (  src[index         ]*(s-frac_y)
                                          + src[index+stride  ]*   frac_y )*s
                                       + r)>>(shift*2);
                }else{
                    /* outside in both directions: nearest edge pixel */
                    index= av_clip(src_x, 0, width) + av_clip(src_y, 0, height)*stride;
                    dst[y*stride + x]=    src[index         ];
                }
            }

            vx+= dxx;
            vy+= dyx;
        }
        ox += dxy;
        oy += dyy;
    }
}
1267
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
1307 |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
/*
 * Thirdpel motion compensation, full-pel case (no interpolation):
 * a plain block copy dispatched to the helper matching `width`.
 * Widths other than 2/4/8/16 are silently ignored, as before.
 */
static inline void put_tpel_pixels_mc00_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
    if      (width ==  2) put_pixels2_c (dst, src, stride, height);
    else if (width ==  4) put_pixels4_c (dst, src, stride, height);
    else if (width ==  8) put_pixels8_c (dst, src, stride, height);
    else if (width == 16) put_pixels16_c(dst, src, stride, height);
}
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
1316 |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
/*
 * Thirdpel interpolation, horizontal phase 1/3:
 * out = round((2*cur + right) / 3), computed in fixed point as
 * (683*(2*cur + right + 1)) >> 11 (683/2048 approximates 1/3).
 */
static inline void put_tpel_pixels_mc10_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
    int y, x;
    for (y = 0; y < height; y++) {
        for (x = 0; x < width; x++) {
            dst[x] = (683*(2*src[x] + src[x+1] + 1)) >> 11;
        }
        src += stride;
        dst += stride;
    }
}
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
1327 |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
/*
 * Thirdpel interpolation, horizontal phase 2/3:
 * out = round((cur + 2*right) / 3), computed in fixed point as
 * (683*(cur + 2*right + 1)) >> 11 (683/2048 approximates 1/3).
 */
static inline void put_tpel_pixels_mc20_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
    int y, x;
    for (y = 0; y < height; y++) {
        for (x = 0; x < width; x++) {
            dst[x] = (683*(src[x] + 2*src[x+1] + 1)) >> 11;
        }
        src += stride;
        dst += stride;
    }
}
2967 | 1338 |
1267
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
/*
 * Thirdpel interpolation, vertical phase 1/3:
 * out = round((2*cur + below) / 3), computed in fixed point as
 * (683*(2*cur + below + 1)) >> 11 (683/2048 approximates 1/3).
 */
static inline void put_tpel_pixels_mc01_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
    int y, x;
    for (y = 0; y < height; y++) {
        for (x = 0; x < width; x++) {
            dst[x] = (683*(2*src[x] + src[x+stride] + 1)) >> 11;
        }
        src += stride;
        dst += stride;
    }
}
2967 | 1349 |
1267
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
/*
 * Thirdpel interpolation, diagonal phase (1/3, 1/3): weighted blend of
 * the 2x2 neighbourhood with weights 4/3/3/2 (sum 12), computed in
 * fixed point as (2731*(sum + 6)) >> 15 (2731/32768 approximates 1/12).
 */
static inline void put_tpel_pixels_mc11_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
    int y, x;
    for (y = 0; y < height; y++) {
        for (x = 0; x < width; x++) {
            dst[x] = (2731*(4*src[x] + 3*src[x+1] + 3*src[x+stride] + 2*src[x+stride+1] + 6)) >> 15;
        }
        src += stride;
        dst += stride;
    }
}
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
1360 |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
/*
 * Thirdpel interpolation, diagonal phase (1/3, 2/3): weighted blend of
 * the 2x2 neighbourhood with weights 3/2/4/3 (sum 12), computed in
 * fixed point as (2731*(sum + 6)) >> 15 (2731/32768 approximates 1/12).
 */
static inline void put_tpel_pixels_mc12_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
    int y, x;
    for (y = 0; y < height; y++) {
        for (x = 0; x < width; x++) {
            dst[x] = (2731*(3*src[x] + 2*src[x+1] + 4*src[x+stride] + 3*src[x+stride+1] + 6)) >> 15;
        }
        src += stride;
        dst += stride;
    }
}
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
1371 |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
/* Thirdpel motion compensation, sub-pel position (0,2): vertical-only blend
 * with weights 1/2 (sum 3); 683 ~= 2^11/3, so multiply+shift approximates a
 * rounded division by 3 (the +1 term is the rounding bias). */
static inline void put_tpel_pixels_mc02_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
    int i,j;
    for (i=0; i < height; i++) {
        for (j=0; j < width; j++) {
            dst[j] = (683*(src[j] + 2*src[j+stride] + 1)) >> 11;
        }
        src += stride;
        dst += stride;
    }
}
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
1382 |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
/* Thirdpel motion compensation, sub-pel position (2,1): bilinear blend of the
 * 2x2 neighbourhood with weights 3/4/2/3 (sum 12); 2731 ~= 2^15/12 makes the
 * multiply+shift a rounded division by 12 (+6 rounding bias). */
static inline void put_tpel_pixels_mc21_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
    int i,j;
    for (i=0; i < height; i++) {
        for (j=0; j < width; j++) {
            dst[j] = (2731*(3*src[j] + 4*src[j+1] + 2*src[j+stride] + 3*src[j+stride+1] + 6)) >> 15;
        }
        src += stride;
        dst += stride;
    }
}
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
1393 |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
/* Thirdpel motion compensation, sub-pel position (2,2): bilinear blend of the
 * 2x2 neighbourhood with weights 2/3/3/4 (sum 12); 2731 ~= 2^15/12 makes the
 * multiply+shift a rounded division by 12 (+6 rounding bias). */
static inline void put_tpel_pixels_mc22_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
    int i,j;
    for (i=0; i < height; i++) {
        for (j=0; j < width; j++) {
            dst[j] = (2731*(2*src[j] + 3*src[j+1] + 3*src[j+stride] + 4*src[j+stride+1] + 6)) >> 15;
        }
        src += stride;
        dst += stride;
    }
}
1319 | 1404 |
/* Thirdpel MC, integer position (0,0) with rounding average into dst:
 * dispatches by block width to the fixed-width avg_pixels*_c helpers
 * defined earlier in this file. Unsupported widths are silently ignored. */
static inline void avg_tpel_pixels_mc00_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
    switch(width){
    case 2: avg_pixels2_c (dst, src, stride, height); break;
    case 4: avg_pixels4_c (dst, src, stride, height); break;
    case 8: avg_pixels8_c (dst, src, stride, height); break;
    case 16:avg_pixels16_c(dst, src, stride, height); break;
    }
}
1413 | |
/* Thirdpel MC, sub-pel position (1,0), averaged into dst: horizontal blend
 * with weights 2/1 (683 ~= 2^11/3, rounded divide by 3), then a rounding
 * average with the existing destination pixel. */
static inline void avg_tpel_pixels_mc10_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
    int i,j;
    for (i=0; i < height; i++) {
        for (j=0; j < width; j++) {
            dst[j] = (dst[j] + ((683*(2*src[j] + src[j+1] + 1)) >> 11) + 1) >> 1;
        }
        src += stride;
        dst += stride;
    }
}
1424 | |
/* Thirdpel MC, sub-pel position (2,0), averaged into dst: horizontal blend
 * with weights 1/2 (683 ~= 2^11/3, rounded divide by 3), then a rounding
 * average with the existing destination pixel. */
static inline void avg_tpel_pixels_mc20_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
    int i,j;
    for (i=0; i < height; i++) {
        for (j=0; j < width; j++) {
            dst[j] = (dst[j] + ((683*(src[j] + 2*src[j+1] + 1)) >> 11) + 1) >> 1;
        }
        src += stride;
        dst += stride;
    }
}
2967 | 1435 |
/* Thirdpel MC, sub-pel position (0,1), averaged into dst: vertical blend
 * with weights 2/1 (683 ~= 2^11/3, rounded divide by 3), then a rounding
 * average with the existing destination pixel. */
static inline void avg_tpel_pixels_mc01_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
    int i,j;
    for (i=0; i < height; i++) {
        for (j=0; j < width; j++) {
            dst[j] = (dst[j] + ((683*(2*src[j] + src[j+stride] + 1)) >> 11) + 1) >> 1;
        }
        src += stride;
        dst += stride;
    }
}
2967 | 1446 |
/* Thirdpel MC, sub-pel position (1,1), averaged into dst: bilinear blend of
 * the 2x2 neighbourhood with weights 4/3/3/2 (sum 12; 2731 ~= 2^15/12),
 * then a rounding average with the existing destination pixel. */
static inline void avg_tpel_pixels_mc11_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
    int i,j;
    for (i=0; i < height; i++) {
        for (j=0; j < width; j++) {
            dst[j] = (dst[j] + ((2731*(4*src[j] + 3*src[j+1] + 3*src[j+stride] + 2*src[j+stride+1] + 6)) >> 15) + 1) >> 1;
        }
        src += stride;
        dst += stride;
    }
}
1457 | |
/* Thirdpel MC, sub-pel position (1,2), averaged into dst: bilinear blend of
 * the 2x2 neighbourhood with weights 3/2/4/3 (sum 12; 2731 ~= 2^15/12),
 * then a rounding average with the existing destination pixel. */
static inline void avg_tpel_pixels_mc12_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
    int i,j;
    for (i=0; i < height; i++) {
        for (j=0; j < width; j++) {
            dst[j] = (dst[j] + ((2731*(3*src[j] + 2*src[j+1] + 4*src[j+stride] + 3*src[j+stride+1] + 6)) >> 15) + 1) >> 1;
        }
        src += stride;
        dst += stride;
    }
}
1468 | |
/* Thirdpel MC, sub-pel position (0,2), averaged into dst: vertical blend
 * with weights 1/2 (683 ~= 2^11/3, rounded divide by 3), then a rounding
 * average with the existing destination pixel. */
static inline void avg_tpel_pixels_mc02_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
    int i,j;
    for (i=0; i < height; i++) {
        for (j=0; j < width; j++) {
            dst[j] = (dst[j] + ((683*(src[j] + 2*src[j+stride] + 1)) >> 11) + 1) >> 1;
        }
        src += stride;
        dst += stride;
    }
}
1479 | |
/* Thirdpel MC, sub-pel position (2,1), averaged into dst: bilinear blend of
 * the 2x2 neighbourhood with weights 3/4/2/3 (sum 12; 2731 ~= 2^15/12),
 * then a rounding average with the existing destination pixel. */
static inline void avg_tpel_pixels_mc21_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
    int i,j;
    for (i=0; i < height; i++) {
        for (j=0; j < width; j++) {
            dst[j] = (dst[j] + ((2731*(3*src[j] + 4*src[j+1] + 2*src[j+stride] + 3*src[j+stride+1] + 6)) >> 15) + 1) >> 1;
        }
        src += stride;
        dst += stride;
    }
}
1490 | |
/* Thirdpel MC, sub-pel position (2,2), averaged into dst: bilinear blend of
 * the 2x2 neighbourhood with weights 2/3/3/4 (sum 12; 2731 ~= 2^15/12),
 * then a rounding average with the existing destination pixel. */
static inline void avg_tpel_pixels_mc22_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
    int i,j;
    for (i=0; i < height; i++) {
        for (j=0; j < width; j++) {
            dst[j] = (dst[j] + ((2731*(2*src[j] + 3*src[j+1] + 3*src[j+stride] + 4*src[j+stride+1] + 6)) >> 15) + 1) >> 1;
        }
        src += stride;
        dst += stride;
    }
}
1267
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
#if 0
/* Disabled generator for fixed-width thirdpel wrappers around the generic
 * put_tpel_pixels_mc* functions above.
 * NOTE(review): the wrapper bodies are not valid C (a "void" keyword precedes
 * each call), so this block has clearly never been compiled; it is preserved
 * as-is inside #if 0. */
#define TPEL_WIDTH(width)\
static void put_tpel_pixels ## width ## _mc00_c(uint8_t *dst, const uint8_t *src, int stride, int height){\
    void put_tpel_pixels_mc00_c(dst, src, stride, width, height);}\
static void put_tpel_pixels ## width ## _mc10_c(uint8_t *dst, const uint8_t *src, int stride, int height){\
    void put_tpel_pixels_mc10_c(dst, src, stride, width, height);}\
static void put_tpel_pixels ## width ## _mc20_c(uint8_t *dst, const uint8_t *src, int stride, int height){\
    void put_tpel_pixels_mc20_c(dst, src, stride, width, height);}\
static void put_tpel_pixels ## width ## _mc01_c(uint8_t *dst, const uint8_t *src, int stride, int height){\
    void put_tpel_pixels_mc01_c(dst, src, stride, width, height);}\
static void put_tpel_pixels ## width ## _mc11_c(uint8_t *dst, const uint8_t *src, int stride, int height){\
    void put_tpel_pixels_mc11_c(dst, src, stride, width, height);}\
static void put_tpel_pixels ## width ## _mc21_c(uint8_t *dst, const uint8_t *src, int stride, int height){\
    void put_tpel_pixels_mc21_c(dst, src, stride, width, height);}\
static void put_tpel_pixels ## width ## _mc02_c(uint8_t *dst, const uint8_t *src, int stride, int height){\
    void put_tpel_pixels_mc02_c(dst, src, stride, width, height);}\
static void put_tpel_pixels ## width ## _mc12_c(uint8_t *dst, const uint8_t *src, int stride, int height){\
    void put_tpel_pixels_mc12_c(dst, src, stride, width, height);}\
static void put_tpel_pixels ## width ## _mc22_c(uint8_t *dst, const uint8_t *src, int stride, int height){\
    void put_tpel_pixels_mc22_c(dst, src, stride, width, height);}
#endif
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
1522 |
/* H.264-style 1/8-pel bilinear chroma motion compensation for 2-, 4- and
 * 8-pixel-wide blocks. (x,y) are the eighth-pel fractional offsets (0..7);
 * A/B/C/D are the standard bilinear weights summing to 64. Per the history
 * notes in this file, the D==0 fast path (pure horizontal or vertical blend,
 * or plain copy) also prevents reads past the needed source area. OP is
 * either op_put (round and shift by 6) or op_avg (additionally average with
 * the existing destination pixel). */
#define H264_CHROMA_MC(OPNAME, OP)\
static void OPNAME ## h264_chroma_mc2_c(uint8_t *dst/*align 8*/, uint8_t *src/*align 1*/, int stride, int h, int x, int y){\
    const int A=(8-x)*(8-y);\
    const int B=(  x)*(8-y);\
    const int C=(8-x)*(  y);\
    const int D=(  x)*(  y);\
    int i;\
    \
    assert(x<8 && y<8 && x>=0 && y>=0);\
    \
    if(D){\
        for(i=0; i<h; i++){\
            OP(dst[0], (A*src[0] + B*src[1] + C*src[stride+0] + D*src[stride+1]));\
            OP(dst[1], (A*src[1] + B*src[2] + C*src[stride+1] + D*src[stride+2]));\
            dst+= stride;\
            src+= stride;\
        }\
    }else{\
        const int E= B+C;\
        const int step= C ? stride : 1;\
        for(i=0; i<h; i++){\
            OP(dst[0], (A*src[0] + E*src[step+0]));\
            OP(dst[1], (A*src[1] + E*src[step+1]));\
            dst+= stride;\
            src+= stride;\
        }\
    }\
}\
\
static void OPNAME ## h264_chroma_mc4_c(uint8_t *dst/*align 8*/, uint8_t *src/*align 1*/, int stride, int h, int x, int y){\
    const int A=(8-x)*(8-y);\
    const int B=(  x)*(8-y);\
    const int C=(8-x)*(  y);\
    const int D=(  x)*(  y);\
    int i;\
    \
    assert(x<8 && y<8 && x>=0 && y>=0);\
    \
    if(D){\
        for(i=0; i<h; i++){\
            OP(dst[0], (A*src[0] + B*src[1] + C*src[stride+0] + D*src[stride+1]));\
            OP(dst[1], (A*src[1] + B*src[2] + C*src[stride+1] + D*src[stride+2]));\
            OP(dst[2], (A*src[2] + B*src[3] + C*src[stride+2] + D*src[stride+3]));\
            OP(dst[3], (A*src[3] + B*src[4] + C*src[stride+3] + D*src[stride+4]));\
            dst+= stride;\
            src+= stride;\
        }\
    }else{\
        const int E= B+C;\
        const int step= C ? stride : 1;\
        for(i=0; i<h; i++){\
            OP(dst[0], (A*src[0] + E*src[step+0]));\
            OP(dst[1], (A*src[1] + E*src[step+1]));\
            OP(dst[2], (A*src[2] + E*src[step+2]));\
            OP(dst[3], (A*src[3] + E*src[step+3]));\
            dst+= stride;\
            src+= stride;\
        }\
    }\
}\
\
static void OPNAME ## h264_chroma_mc8_c(uint8_t *dst/*align 8*/, uint8_t *src/*align 1*/, int stride, int h, int x, int y){\
    const int A=(8-x)*(8-y);\
    const int B=(  x)*(8-y);\
    const int C=(8-x)*(  y);\
    const int D=(  x)*(  y);\
    int i;\
    \
    assert(x<8 && y<8 && x>=0 && y>=0);\
    \
    if(D){\
        for(i=0; i<h; i++){\
            OP(dst[0], (A*src[0] + B*src[1] + C*src[stride+0] + D*src[stride+1]));\
            OP(dst[1], (A*src[1] + B*src[2] + C*src[stride+1] + D*src[stride+2]));\
            OP(dst[2], (A*src[2] + B*src[3] + C*src[stride+2] + D*src[stride+3]));\
            OP(dst[3], (A*src[3] + B*src[4] + C*src[stride+3] + D*src[stride+4]));\
            OP(dst[4], (A*src[4] + B*src[5] + C*src[stride+4] + D*src[stride+5]));\
            OP(dst[5], (A*src[5] + B*src[6] + C*src[stride+5] + D*src[stride+6]));\
            OP(dst[6], (A*src[6] + B*src[7] + C*src[stride+6] + D*src[stride+7]));\
            OP(dst[7], (A*src[7] + B*src[8] + C*src[stride+7] + D*src[stride+8]));\
            dst+= stride;\
            src+= stride;\
        }\
    }else{\
        const int E= B+C;\
        const int step= C ? stride : 1;\
        for(i=0; i<h; i++){\
            OP(dst[0], (A*src[0] + E*src[step+0]));\
            OP(dst[1], (A*src[1] + E*src[step+1]));\
            OP(dst[2], (A*src[2] + E*src[step+2]));\
            OP(dst[3], (A*src[3] + E*src[step+3]));\
            OP(dst[4], (A*src[4] + E*src[step+4]));\
            OP(dst[5], (A*src[5] + E*src[step+5]));\
            OP(dst[6], (A*src[6] + E*src[step+6]));\
            OP(dst[7], (A*src[7] + E*src[step+7]));\
            dst+= stride;\
            src+= stride;\
        }\
    }\
}

/* op_put: round (+32) and normalize (>>6). op_avg: additionally take a
 * rounding average with the existing destination pixel. */
#define op_avg(a, b) a = (((a)+(((b) + 32)>>6)+1)>>1)
#define op_put(a, b) a = (((b) + 32)>>6)

H264_CHROMA_MC(put_ , op_put)
H264_CHROMA_MC(avg_ , op_avg)
#undef op_avg
#undef op_put
1631 | |
9439
ef3a7b711cc0
Rename put_no_rnd_h264_chroma* to reflect its usage in VC1 only
conrad
parents:
9437
diff
changeset
|
/* VC-1 bilinear chroma MC, 8 pixels wide, "no-rnd" variant (per the history
 * note: renamed from put_no_rnd_h264_chroma* to reflect its VC-1-only use).
 * Same A/B/C/D weights as the H.264 chroma MC above, but with a reduced
 * rounding bias of 32-4 = 28 before the >>6 normalization. */
static void put_no_rnd_vc1_chroma_mc8_c(uint8_t *dst/*align 8*/, uint8_t *src/*align 1*/, int stride, int h, int x, int y){
    const int A=(8-x)*(8-y);
    const int B=(  x)*(8-y);
    const int C=(8-x)*(  y);
    const int D=(  x)*(  y);
    int i;

    assert(x<8 && y<8 && x>=0 && y>=0);

    for(i=0; i<h; i++)
    {
        dst[0] = (A*src[0] + B*src[1] + C*src[stride+0] + D*src[stride+1] + 32 - 4) >> 6;
        dst[1] = (A*src[1] + B*src[2] + C*src[stride+1] + D*src[stride+2] + 32 - 4) >> 6;
        dst[2] = (A*src[2] + B*src[3] + C*src[stride+2] + D*src[stride+3] + 32 - 4) >> 6;
        dst[3] = (A*src[3] + B*src[4] + C*src[stride+3] + D*src[stride+4] + 32 - 4) >> 6;
        dst[4] = (A*src[4] + B*src[5] + C*src[stride+4] + D*src[stride+5] + 32 - 4) >> 6;
        dst[5] = (A*src[5] + B*src[6] + C*src[stride+5] + D*src[stride+6] + 32 - 4) >> 6;
        dst[6] = (A*src[6] + B*src[7] + C*src[stride+6] + D*src[stride+7] + 32 - 4) >> 6;
        dst[7] = (A*src[7] + B*src[8] + C*src[stride+7] + D*src[stride+8] + 32 - 4) >> 6;
        dst+= stride;
        src+= stride;
    }
}
1655 | |
/* VC-1 bilinear chroma MC, 8 pixels wide, "no-rnd" averaging variant:
 * computes the same reduced-bias (32-4) bilinear value as the put_ version
 * above, then blends it with the existing destination pixel via avg2
 * (a rounding-average helper defined elsewhere in this file). */
static void avg_no_rnd_vc1_chroma_mc8_c(uint8_t *dst/*align 8*/, uint8_t *src/*align 1*/, int stride, int h, int x, int y){
    const int A=(8-x)*(8-y);
    const int B=(  x)*(8-y);
    const int C=(8-x)*(  y);
    const int D=(  x)*(  y);
    int i;

    assert(x<8 && y<8 && x>=0 && y>=0);

    for(i=0; i<h; i++)
    {
        dst[0] = avg2(dst[0], ((A*src[0] + B*src[1] + C*src[stride+0] + D*src[stride+1] + 32 - 4) >> 6));
        dst[1] = avg2(dst[1], ((A*src[1] + B*src[2] + C*src[stride+1] + D*src[stride+2] + 32 - 4) >> 6));
        dst[2] = avg2(dst[2], ((A*src[2] + B*src[3] + C*src[stride+2] + D*src[stride+3] + 32 - 4) >> 6));
        dst[3] = avg2(dst[3], ((A*src[3] + B*src[4] + C*src[stride+3] + D*src[stride+4] + 32 - 4) >> 6));
        dst[4] = avg2(dst[4], ((A*src[4] + B*src[5] + C*src[stride+4] + D*src[stride+5] + 32 - 4) >> 6));
        dst[5] = avg2(dst[5], ((A*src[5] + B*src[6] + C*src[stride+5] + D*src[stride+6] + 32 - 4) >> 6));
        dst[6] = avg2(dst[6], ((A*src[6] + B*src[7] + C*src[stride+6] + D*src[stride+7] + 32 - 4) >> 6));
        dst[7] = avg2(dst[7], ((A*src[7] + B*src[8] + C*src[stride+7] + D*src[stride+8] + 32 - 4) >> 6));
        dst+= stride;
        src+= stride;
    }
}
1679 | |
651 | 1680 #define QPEL_MC(r, OPNAME, RND, OP) \ |
1064 | 1681 static void OPNAME ## mpeg4_qpel8_h_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride, int h){\ |
4176 | 1682 uint8_t *cm = ff_cropTbl + MAX_NEG_CROP;\ |
651 | 1683 int i;\ |
1684 for(i=0; i<h; i++)\ | |
1685 {\ | |
1686 OP(dst[0], (src[0]+src[1])*20 - (src[0]+src[2])*6 + (src[1]+src[3])*3 - (src[2]+src[4]));\ | |
1687 OP(dst[1], (src[1]+src[2])*20 - (src[0]+src[3])*6 + (src[0]+src[4])*3 - (src[1]+src[5]));\ | |
1688 OP(dst[2], (src[2]+src[3])*20 - (src[1]+src[4])*6 + (src[0]+src[5])*3 - (src[0]+src[6]));\ | |
1689 OP(dst[3], (src[3]+src[4])*20 - (src[2]+src[5])*6 + (src[1]+src[6])*3 - (src[0]+src[7]));\ | |
1690 OP(dst[4], (src[4]+src[5])*20 - (src[3]+src[6])*6 + (src[2]+src[7])*3 - (src[1]+src[8]));\ | |
1691 OP(dst[5], (src[5]+src[6])*20 - (src[4]+src[7])*6 + (src[3]+src[8])*3 - (src[2]+src[8]));\ | |
1692 OP(dst[6], (src[6]+src[7])*20 - (src[5]+src[8])*6 + (src[4]+src[8])*3 - (src[3]+src[7]));\ | |
1693 OP(dst[7], (src[7]+src[8])*20 - (src[6]+src[8])*6 + (src[5]+src[7])*3 - (src[4]+src[6]));\ | |
1694 dst+=dstStride;\ | |
1695 src+=srcStride;\ | |
1696 }\ | |
1697 }\ | |
1698 \ | |
1064 | 1699 static void OPNAME ## mpeg4_qpel8_v_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride){\ |
984 | 1700 const int w=8;\ |
4176 | 1701 uint8_t *cm = ff_cropTbl + MAX_NEG_CROP;\ |
651 | 1702 int i;\ |
1703 for(i=0; i<w; i++)\ | |
1704 {\ | |
1705 const int src0= src[0*srcStride];\ | |
1706 const int src1= src[1*srcStride];\ | |
1707 const int src2= src[2*srcStride];\ | |
1708 const int src3= src[3*srcStride];\ | |
1709 const int src4= src[4*srcStride];\ | |
1710 const int src5= src[5*srcStride];\ | |
1711 const int src6= src[6*srcStride];\ | |
1712 const int src7= src[7*srcStride];\ | |
1713 const int src8= src[8*srcStride];\ | |
1714 OP(dst[0*dstStride], (src0+src1)*20 - (src0+src2)*6 + (src1+src3)*3 - (src2+src4));\ | |
1715 OP(dst[1*dstStride], (src1+src2)*20 - (src0+src3)*6 + (src0+src4)*3 - (src1+src5));\ | |
1716 OP(dst[2*dstStride], (src2+src3)*20 - (src1+src4)*6 + (src0+src5)*3 - (src0+src6));\ | |
1717 OP(dst[3*dstStride], (src3+src4)*20 - (src2+src5)*6 + (src1+src6)*3 - (src0+src7));\ | |
1718 OP(dst[4*dstStride], (src4+src5)*20 - (src3+src6)*6 + (src2+src7)*3 - (src1+src8));\ | |
1719 OP(dst[5*dstStride], (src5+src6)*20 - (src4+src7)*6 + (src3+src8)*3 - (src2+src8));\ | |
1720 OP(dst[6*dstStride], (src6+src7)*20 - (src5+src8)*6 + (src4+src8)*3 - (src3+src7));\ | |
1721 OP(dst[7*dstStride], (src7+src8)*20 - (src6+src8)*6 + (src5+src7)*3 - (src4+src6));\ | |
1722 dst++;\ | |
1723 src++;\ | |
1724 }\ | |
1725 }\ | |
1726 \ | |
/* Horizontal MPEG-4 quarter-pel 8-tap lowpass over a 16-pixel-wide row.   */\
/* Expanded once per OPNAME/OP pair by QPEL_MC; OP() (see op_put/op_avg    */\
/* further down) adds the rounding bias and shifts right by 5, matching    */\
/* the tap sum 2*(20-6+3-1) = 32.  Taps that would index outside the 17    */\
/* available samples src[0..16] are folded back onto an in-range sample    */\
/* (e.g. row 0 reuses src[0..4]), so no out-of-bounds reads occur.        */\
1064 | 1727 static void OPNAME ## mpeg4_qpel16_h_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride, int h){\
/* cm points at the clip-to-0..255 table; cm[x] == av_clip_uint8(x). */\
4176 | 1728 uint8_t *cm = ff_cropTbl + MAX_NEG_CROP;\
651 | 1729 int i;\
954 | 1730 \
651 | 1731 for(i=0; i<h; i++)\
1732 {\
1733 OP(dst[ 0], (src[ 0]+src[ 1])*20 - (src[ 0]+src[ 2])*6 + (src[ 1]+src[ 3])*3 - (src[ 2]+src[ 4]));\
1734 OP(dst[ 1], (src[ 1]+src[ 2])*20 - (src[ 0]+src[ 3])*6 + (src[ 0]+src[ 4])*3 - (src[ 1]+src[ 5]));\
1735 OP(dst[ 2], (src[ 2]+src[ 3])*20 - (src[ 1]+src[ 4])*6 + (src[ 0]+src[ 5])*3 - (src[ 0]+src[ 6]));\
1736 OP(dst[ 3], (src[ 3]+src[ 4])*20 - (src[ 2]+src[ 5])*6 + (src[ 1]+src[ 6])*3 - (src[ 0]+src[ 7]));\
1737 OP(dst[ 4], (src[ 4]+src[ 5])*20 - (src[ 3]+src[ 6])*6 + (src[ 2]+src[ 7])*3 - (src[ 1]+src[ 8]));\
1738 OP(dst[ 5], (src[ 5]+src[ 6])*20 - (src[ 4]+src[ 7])*6 + (src[ 3]+src[ 8])*3 - (src[ 2]+src[ 9]));\
1739 OP(dst[ 6], (src[ 6]+src[ 7])*20 - (src[ 5]+src[ 8])*6 + (src[ 4]+src[ 9])*3 - (src[ 3]+src[10]));\
1740 OP(dst[ 7], (src[ 7]+src[ 8])*20 - (src[ 6]+src[ 9])*6 + (src[ 5]+src[10])*3 - (src[ 4]+src[11]));\
1741 OP(dst[ 8], (src[ 8]+src[ 9])*20 - (src[ 7]+src[10])*6 + (src[ 6]+src[11])*3 - (src[ 5]+src[12]));\
1742 OP(dst[ 9], (src[ 9]+src[10])*20 - (src[ 8]+src[11])*6 + (src[ 7]+src[12])*3 - (src[ 6]+src[13]));\
1743 OP(dst[10], (src[10]+src[11])*20 - (src[ 9]+src[12])*6 + (src[ 8]+src[13])*3 - (src[ 7]+src[14]));\
1744 OP(dst[11], (src[11]+src[12])*20 - (src[10]+src[13])*6 + (src[ 9]+src[14])*3 - (src[ 8]+src[15]));\
1745 OP(dst[12], (src[12]+src[13])*20 - (src[11]+src[14])*6 + (src[10]+src[15])*3 - (src[ 9]+src[16]));\
/* Rows 13-15: right-edge taps are folded back (src[17]->16, src[18]->15). */\
1746 OP(dst[13], (src[13]+src[14])*20 - (src[12]+src[15])*6 + (src[11]+src[16])*3 - (src[10]+src[16]));\
1747 OP(dst[14], (src[14]+src[15])*20 - (src[13]+src[16])*6 + (src[12]+src[16])*3 - (src[11]+src[15]));\
1748 OP(dst[15], (src[15]+src[16])*20 - (src[14]+src[16])*6 + (src[13]+src[15])*3 - (src[12]+src[14]));\
1749 dst+=dstStride;\
1750 src+=srcStride;\
1751 }\
255 | 1752 }\
1753 \ | |
/* Vertical counterpart of mpeg4_qpel16_h_lowpass: the same 8-tap filter   */\
/* applied down each of the 16 columns.  Reads 17 source rows              */\
/* (src[0..16*srcStride]) and writes 16 destination rows per column;       */\
/* out-of-range row taps are folded back in-range just as in the           */\
/* horizontal version.                                                     */\
1064 | 1754 static void OPNAME ## mpeg4_qpel16_v_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride){\
4176 | 1755 uint8_t *cm = ff_cropTbl + MAX_NEG_CROP;\
651 | 1756 int i;\
954 | 1757 const int w=16;\
651 | 1758 for(i=0; i<w; i++)\
1759 {\
/* Load the whole 17-sample column once so the unrolled taps below are scalar. */\
1760 const int src0= src[0*srcStride];\
1761 const int src1= src[1*srcStride];\
1762 const int src2= src[2*srcStride];\
1763 const int src3= src[3*srcStride];\
1764 const int src4= src[4*srcStride];\
1765 const int src5= src[5*srcStride];\
1766 const int src6= src[6*srcStride];\
1767 const int src7= src[7*srcStride];\
1768 const int src8= src[8*srcStride];\
1769 const int src9= src[9*srcStride];\
1770 const int src10= src[10*srcStride];\
1771 const int src11= src[11*srcStride];\
1772 const int src12= src[12*srcStride];\
1773 const int src13= src[13*srcStride];\
1774 const int src14= src[14*srcStride];\
1775 const int src15= src[15*srcStride];\
1776 const int src16= src[16*srcStride];\
1777 OP(dst[ 0*dstStride], (src0 +src1 )*20 - (src0 +src2 )*6 + (src1 +src3 )*3 - (src2 +src4 ));\
1778 OP(dst[ 1*dstStride], (src1 +src2 )*20 - (src0 +src3 )*6 + (src0 +src4 )*3 - (src1 +src5 ));\
1779 OP(dst[ 2*dstStride], (src2 +src3 )*20 - (src1 +src4 )*6 + (src0 +src5 )*3 - (src0 +src6 ));\
1780 OP(dst[ 3*dstStride], (src3 +src4 )*20 - (src2 +src5 )*6 + (src1 +src6 )*3 - (src0 +src7 ));\
1781 OP(dst[ 4*dstStride], (src4 +src5 )*20 - (src3 +src6 )*6 + (src2 +src7 )*3 - (src1 +src8 ));\
1782 OP(dst[ 5*dstStride], (src5 +src6 )*20 - (src4 +src7 )*6 + (src3 +src8 )*3 - (src2 +src9 ));\
1783 OP(dst[ 6*dstStride], (src6 +src7 )*20 - (src5 +src8 )*6 + (src4 +src9 )*3 - (src3 +src10));\
1784 OP(dst[ 7*dstStride], (src7 +src8 )*20 - (src6 +src9 )*6 + (src5 +src10)*3 - (src4 +src11));\
1785 OP(dst[ 8*dstStride], (src8 +src9 )*20 - (src7 +src10)*6 + (src6 +src11)*3 - (src5 +src12));\
1786 OP(dst[ 9*dstStride], (src9 +src10)*20 - (src8 +src11)*6 + (src7 +src12)*3 - (src6 +src13));\
1787 OP(dst[10*dstStride], (src10+src11)*20 - (src9 +src12)*6 + (src8 +src13)*3 - (src7 +src14));\
1788 OP(dst[11*dstStride], (src11+src12)*20 - (src10+src13)*6 + (src9 +src14)*3 - (src8 +src15));\
1789 OP(dst[12*dstStride], (src12+src13)*20 - (src11+src14)*6 + (src10+src15)*3 - (src9 +src16));\
1790 OP(dst[13*dstStride], (src13+src14)*20 - (src12+src15)*6 + (src11+src16)*3 - (src10+src16));\
1791 OP(dst[14*dstStride], (src14+src15)*20 - (src13+src16)*6 + (src12+src16)*3 - (src11+src15));\
1792 OP(dst[15*dstStride], (src15+src16)*20 - (src14+src16)*6 + (src13+src15)*3 - (src12+src14));\
1793 dst++;\
1794 src++;\
1795 }\
255 | 1796 }\
1797 \ | |
/* Quarter-pel motion-compensation entry points for 8x8 blocks.            */\
/* qpel8_mcXY: X = horizontal, Y = vertical quarter-sample offset (0..3).  */\
/* mc00 is a plain block copy; mc20/mc02 are the half-pel filter output;   */\
/* mc10/mc30 (and mc01/mc03) average the filtered plane with the nearest   */\
/* integer-pel column (row) via pixels8_l2() to reach the quarter          */\
/* positions.                                                              */\
1064 | 1798 static void OPNAME ## qpel8_mc00_c (uint8_t *dst, uint8_t *src, int stride){\
859 | 1799 OPNAME ## pixels8_c(dst, src, stride, 8);\
255 | 1800 }\
1801 \
1064 | 1802 static void OPNAME ## qpel8_mc10_c(uint8_t *dst, uint8_t *src, int stride){\
1803 uint8_t half[64];\
651 | 1804 put ## RND ## mpeg4_qpel8_h_lowpass(half, src, 8, stride, 8);\
1805 OPNAME ## pixels8_l2(dst, src, half, stride, stride, 8, 8);\
1806 }\
1807 \
1064 | 1808 static void OPNAME ## qpel8_mc20_c(uint8_t *dst, uint8_t *src, int stride){\
651 | 1809 OPNAME ## mpeg4_qpel8_h_lowpass(dst, src, stride, stride, 8);\
255 | 1810 }\
1811 \
1064 | 1812 static void OPNAME ## qpel8_mc30_c(uint8_t *dst, uint8_t *src, int stride){\
1813 uint8_t half[64];\
651 | 1814 put ## RND ## mpeg4_qpel8_h_lowpass(half, src, 8, stride, 8);\
1815 OPNAME ## pixels8_l2(dst, src+1, half, stride, stride, 8, 8);\
1816 }\
1817 \
1064 | 1818 static void OPNAME ## qpel8_mc01_c(uint8_t *dst, uint8_t *src, int stride){\
1819 uint8_t full[16*9];\
1820 uint8_t half[64];\
/* Copy 9 source rows (8 + 1 extra for the vertical filter) into a stride-16 scratch. */\
651 | 1821 copy_block9(full, src, 16, stride, 9);\
984 | 1822 put ## RND ## mpeg4_qpel8_v_lowpass(half, full, 8, 16);\
651 | 1823 OPNAME ## pixels8_l2(dst, full, half, stride, 16, 8, 8);\
1824 }\
1825 \
1064 | 1826 static void OPNAME ## qpel8_mc02_c(uint8_t *dst, uint8_t *src, int stride){\
1827 uint8_t full[16*9];\
651 | 1828 copy_block9(full, src, 16, stride, 9);\
984 | 1829 OPNAME ## mpeg4_qpel8_v_lowpass(dst, full, stride, 16);\
255 | 1830 }\
1831 \
1064 | 1832 static void OPNAME ## qpel8_mc03_c(uint8_t *dst, uint8_t *src, int stride){\
1833 uint8_t full[16*9];\
1834 uint8_t half[64];\
651 | 1835 copy_block9(full, src, 16, stride, 9);\
984 | 1836 put ## RND ## mpeg4_qpel8_v_lowpass(half, full, 8, 16);\
/* full+16 == start of the second scratch row, i.e. the rounded-down pel one row below. */\
651 | 1837 OPNAME ## pixels8_l2(dst, full+16, half, stride, 16, 8, 8);\
1838 }\
/* 2-D (diagonal / centre) quarter-pel cases for 8x8 blocks.  The          */\
/* ff_*_old_c variants blend four planes (integer, half-H, half-V,         */\
/* half-HV) with pixels8_l4(); the current mcXY_c variants instead blend   */\
/* two planes after pre-averaging halfH with the integer pels.             */\
/* NOTE(review): the two families round differently by construction --     */\
/* which one a given codec path uses is decided outside this file.         */\
1064 | 1839 void ff_ ## OPNAME ## qpel8_mc11_old_c(uint8_t *dst, uint8_t *src, int stride){\
1840 uint8_t full[16*9];\
1841 uint8_t halfH[72];\
1842 uint8_t halfV[64];\
1843 uint8_t halfHV[64];\
651 | 1844 copy_block9(full, src, 16, stride, 9);\
1845 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9);\
984 | 1846 put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full, 8, 16);\
1847 put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8);\
651 | 1848 OPNAME ## pixels8_l4(dst, full, halfH, halfV, halfHV, stride, 16, 8, 8, 8, 8);\
255 | 1849 }\
1064 | 1850 static void OPNAME ## qpel8_mc11_c(uint8_t *dst, uint8_t *src, int stride){\
1851 uint8_t full[16*9];\
1852 uint8_t halfH[72];\
1853 uint8_t halfHV[64];\
984 | 1854 copy_block9(full, src, 16, stride, 9);\
1855 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9);\
/* Fold the integer pels into halfH, then filter vertically for the HV plane. */\
1856 put ## RND ## pixels8_l2(halfH, halfH, full, 8, 8, 16, 9);\
1857 put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8);\
1858 OPNAME ## pixels8_l2(dst, halfH, halfHV, stride, 8, 8, 8);\
1859 }\
1064 | 1860 void ff_ ## OPNAME ## qpel8_mc31_old_c(uint8_t *dst, uint8_t *src, int stride){\
1861 uint8_t full[16*9];\
1862 uint8_t halfH[72];\
1863 uint8_t halfV[64];\
1864 uint8_t halfHV[64];\
651 | 1865 copy_block9(full, src, 16, stride, 9);\
1866 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9);\
984 | 1867 put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full+1, 8, 16);\
1868 put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8);\
651 | 1869 OPNAME ## pixels8_l4(dst, full+1, halfH, halfV, halfHV, stride, 16, 8, 8, 8, 8);\
255 | 1870 }\
1064 | 1871 static void OPNAME ## qpel8_mc31_c(uint8_t *dst, uint8_t *src, int stride){\
1872 uint8_t full[16*9];\
1873 uint8_t halfH[72];\
1874 uint8_t halfHV[64];\
984 | 1875 copy_block9(full, src, 16, stride, 9);\
1876 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9);\
/* full+1: blend against the right-hand integer pel for the x=3/4 column. */\
1877 put ## RND ## pixels8_l2(halfH, halfH, full+1, 8, 8, 16, 9);\
1878 put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8);\
1879 OPNAME ## pixels8_l2(dst, halfH, halfHV, stride, 8, 8, 8);\
1880 }\
1064 | 1881 void ff_ ## OPNAME ## qpel8_mc13_old_c(uint8_t *dst, uint8_t *src, int stride){\
1882 uint8_t full[16*9];\
1883 uint8_t halfH[72];\
1884 uint8_t halfV[64];\
1885 uint8_t halfHV[64];\
651 | 1886 copy_block9(full, src, 16, stride, 9);\
1887 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9);\
984 | 1888 put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full, 8, 16);\
1889 put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8);\
1890 OPNAME ## pixels8_l4(dst, full+16, halfH+8, halfV, halfHV, stride, 16, 8, 8, 8, 8);\
1891 }\
1064 | 1892 static void OPNAME ## qpel8_mc13_c(uint8_t *dst, uint8_t *src, int stride){\
1893 uint8_t full[16*9];\
1894 uint8_t halfH[72];\
1895 uint8_t halfHV[64];\
984 | 1896 copy_block9(full, src, 16, stride, 9);\
1897 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9);\
1898 put ## RND ## pixels8_l2(halfH, halfH, full, 8, 8, 16, 9);\
1899 put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8);\
/* halfH+8: skip one filtered row, i.e. use the row below for y=3/4. */\
1900 OPNAME ## pixels8_l2(dst, halfH+8, halfHV, stride, 8, 8, 8);\
1901 }\
1064 | 1902 void ff_ ## OPNAME ## qpel8_mc33_old_c(uint8_t *dst, uint8_t *src, int stride){\
1903 uint8_t full[16*9];\
1904 uint8_t halfH[72];\
1905 uint8_t halfV[64];\
1906 uint8_t halfHV[64];\
651 | 1907 copy_block9(full, src, 16, stride, 9);\
1908 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full , 8, 16, 9);\
984 | 1909 put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full+1, 8, 16);\
1910 put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8);\
1911 OPNAME ## pixels8_l4(dst, full+17, halfH+8, halfV, halfHV, stride, 16, 8, 8, 8, 8);\
255 | 1912 }\
1064 | 1913 static void OPNAME ## qpel8_mc33_c(uint8_t *dst, uint8_t *src, int stride){\
1914 uint8_t full[16*9];\
1915 uint8_t halfH[72];\
1916 uint8_t halfHV[64];\
984 | 1917 copy_block9(full, src, 16, stride, 9);\
1918 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9);\
1919 put ## RND ## pixels8_l2(halfH, halfH, full+1, 8, 8, 16, 9);\
1920 put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8);\
1921 OPNAME ## pixels8_l2(dst, halfH+8, halfHV, stride, 8, 8, 8);\
1922 }\
/* mc21/mc23: horizontal half-pel column, vertical quarter offsets. */\
1064 | 1923 static void OPNAME ## qpel8_mc21_c(uint8_t *dst, uint8_t *src, int stride){\
1924 uint8_t halfH[72];\
1925 uint8_t halfHV[64];\
651 | 1926 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, src, 8, stride, 9);\
984 | 1927 put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8);\
651 | 1928 OPNAME ## pixels8_l2(dst, halfH, halfHV, stride, 8, 8, 8);\
1929 }\
1064 | 1930 static void OPNAME ## qpel8_mc23_c(uint8_t *dst, uint8_t *src, int stride){\
1931 uint8_t halfH[72];\
1932 uint8_t halfHV[64];\
651 | 1933 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, src, 8, stride, 9);\
984 | 1934 put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8);\
651 | 1935 OPNAME ## pixels8_l2(dst, halfH+8, halfHV, stride, 8, 8, 8);\
1936 }\
/* mc12/mc32: vertical half-pel row, horizontal quarter offsets. */\
1064 | 1937 void ff_ ## OPNAME ## qpel8_mc12_old_c(uint8_t *dst, uint8_t *src, int stride){\
1938 uint8_t full[16*9];\
1939 uint8_t halfH[72];\
1940 uint8_t halfV[64];\
1941 uint8_t halfHV[64];\
651 | 1942 copy_block9(full, src, 16, stride, 9);\
1943 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9);\
984 | 1944 put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full, 8, 16);\
1945 put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8);\
651 | 1946 OPNAME ## pixels8_l2(dst, halfV, halfHV, stride, 8, 8, 8);\
255 | 1947 }\
1064 | 1948 static void OPNAME ## qpel8_mc12_c(uint8_t *dst, uint8_t *src, int stride){\
1949 uint8_t full[16*9];\
1950 uint8_t halfH[72];\
984 | 1951 copy_block9(full, src, 16, stride, 9);\
1952 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9);\
1953 put ## RND ## pixels8_l2(halfH, halfH, full, 8, 8, 16, 9);\
1954 OPNAME ## mpeg4_qpel8_v_lowpass(dst, halfH, stride, 8);\
1955 }\
1064 | 1956 void ff_ ## OPNAME ## qpel8_mc32_old_c(uint8_t *dst, uint8_t *src, int stride){\
1957 uint8_t full[16*9];\
1958 uint8_t halfH[72];\
1959 uint8_t halfV[64];\
1960 uint8_t halfHV[64];\
651 | 1961 copy_block9(full, src, 16, stride, 9);\
1962 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9);\
984 | 1963 put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full+1, 8, 16);\
1964 put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8);\
651 | 1965 OPNAME ## pixels8_l2(dst, halfV, halfHV, stride, 8, 8, 8);\
1966 }\
1064 | 1967 static void OPNAME ## qpel8_mc32_c(uint8_t *dst, uint8_t *src, int stride){\
1968 uint8_t full[16*9];\
1969 uint8_t halfH[72];\
984 | 1970 copy_block9(full, src, 16, stride, 9);\
1971 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9);\
1972 put ## RND ## pixels8_l2(halfH, halfH, full+1, 8, 8, 16, 9);\
1973 OPNAME ## mpeg4_qpel8_v_lowpass(dst, halfH, stride, 8);\
1974 }\
/* mc22: centre half-pel position -- H filter then V filter, no blending. */\
1064 | 1975 static void OPNAME ## qpel8_mc22_c(uint8_t *dst, uint8_t *src, int stride){\
1976 uint8_t halfH[72];\
651 | 1977 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, src, 8, stride, 9);\
984 | 1978 OPNAME ## mpeg4_qpel8_v_lowpass(dst, halfH, stride, 8);\
651 | 1979 }\
/* Quarter-pel entry points for 16x16 blocks -- same layout as the 8x8     */\
/* qpel8_mcXY family above, with a 24-stride 24x17 scratch buffer          */\
/* (copy_block17: 17 rows = 16 + 1 extra for the vertical filter).         */\
1064 | 1980 static void OPNAME ## qpel16_mc00_c (uint8_t *dst, uint8_t *src, int stride){\
859 | 1981 OPNAME ## pixels16_c(dst, src, stride, 16);\
255 | 1982 }\
651 | 1983 \
1064 | 1984 static void OPNAME ## qpel16_mc10_c(uint8_t *dst, uint8_t *src, int stride){\
1985 uint8_t half[256];\
651 | 1986 put ## RND ## mpeg4_qpel16_h_lowpass(half, src, 16, stride, 16);\
1987 OPNAME ## pixels16_l2(dst, src, half, stride, stride, 16, 16);\
1988 }\
1989 \
1064 | 1990 static void OPNAME ## qpel16_mc20_c(uint8_t *dst, uint8_t *src, int stride){\
651 | 1991 OPNAME ## mpeg4_qpel16_h_lowpass(dst, src, stride, stride, 16);\
1992 }\
1993 \
1064 | 1994 static void OPNAME ## qpel16_mc30_c(uint8_t *dst, uint8_t *src, int stride){\
1995 uint8_t half[256];\
651 | 1996 put ## RND ## mpeg4_qpel16_h_lowpass(half, src, 16, stride, 16);\
1997 OPNAME ## pixels16_l2(dst, src+1, half, stride, stride, 16, 16);\
1998 }\
1999 \
1064 | 2000 static void OPNAME ## qpel16_mc01_c(uint8_t *dst, uint8_t *src, int stride){\
2001 uint8_t full[24*17];\
2002 uint8_t half[256];\
651 | 2003 copy_block17(full, src, 24, stride, 17);\
954 | 2004 put ## RND ## mpeg4_qpel16_v_lowpass(half, full, 16, 24);\
651 | 2005 OPNAME ## pixels16_l2(dst, full, half, stride, 24, 16, 16);\
255 | 2006 }\
651 | 2007 \
1064 | 2008 static void OPNAME ## qpel16_mc02_c(uint8_t *dst, uint8_t *src, int stride){\
2009 uint8_t full[24*17];\
651 | 2010 copy_block17(full, src, 24, stride, 17);\
954 | 2011 OPNAME ## mpeg4_qpel16_v_lowpass(dst, full, stride, 24);\
651 | 2012 }\
2013 \
1064 | 2014 static void OPNAME ## qpel16_mc03_c(uint8_t *dst, uint8_t *src, int stride){\
2015 uint8_t full[24*17];\
2016 uint8_t half[256];\
651 | 2017 copy_block17(full, src, 24, stride, 17);\
954 | 2018 put ## RND ## mpeg4_qpel16_v_lowpass(half, full, 16, 24);\
/* full+24: second scratch row == integer pel one row below. */\
651 | 2019 OPNAME ## pixels16_l2(dst, full+24, half, stride, 24, 16, 16);\
255 | 2020 }\
/* 2-D quarter-pel cases for 16x16 blocks: same structure as the qpel8     */\
/* family above (ff_*_old_c = four-plane pixels16_l4 blend; mcXY_c =       */\
/* two-plane blend with halfH pre-averaged against the integer pels),      */\
/* scaled to a 24x17 scratch buffer and 16-wide intermediate planes.       */\
1064 | 2021 void ff_ ## OPNAME ## qpel16_mc11_old_c(uint8_t *dst, uint8_t *src, int stride){\
2022 uint8_t full[24*17];\
2023 uint8_t halfH[272];\
2024 uint8_t halfV[256];\
2025 uint8_t halfHV[256];\
651 | 2026 copy_block17(full, src, 24, stride, 17);\
2027 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17);\
954 | 2028 put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full, 16, 24);\
2029 put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16);\
651 | 2030 OPNAME ## pixels16_l4(dst, full, halfH, halfV, halfHV, stride, 24, 16, 16, 16, 16);\
2031 }\
1064 | 2032 static void OPNAME ## qpel16_mc11_c(uint8_t *dst, uint8_t *src, int stride){\
2033 uint8_t full[24*17];\
2034 uint8_t halfH[272];\
2035 uint8_t halfHV[256];\
984 | 2036 copy_block17(full, src, 24, stride, 17);\
2037 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17);\
2038 put ## RND ## pixels16_l2(halfH, halfH, full, 16, 16, 24, 17);\
2039 put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16);\
2040 OPNAME ## pixels16_l2(dst, halfH, halfHV, stride, 16, 16, 16);\
2041 }\
1064 | 2042 void ff_ ## OPNAME ## qpel16_mc31_old_c(uint8_t *dst, uint8_t *src, int stride){\
2043 uint8_t full[24*17];\
2044 uint8_t halfH[272];\
2045 uint8_t halfV[256];\
2046 uint8_t halfHV[256];\
651 | 2047 copy_block17(full, src, 24, stride, 17);\
2048 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17);\
954 | 2049 put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full+1, 16, 24);\
2050 put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16);\
651 | 2051 OPNAME ## pixels16_l4(dst, full+1, halfH, halfV, halfHV, stride, 24, 16, 16, 16, 16);\
2052 }\
1064 | 2053 static void OPNAME ## qpel16_mc31_c(uint8_t *dst, uint8_t *src, int stride){\
2054 uint8_t full[24*17];\
2055 uint8_t halfH[272];\
2056 uint8_t halfHV[256];\
984 | 2057 copy_block17(full, src, 24, stride, 17);\
2058 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17);\
/* full+1: blend against the right-hand integer pel for the x=3/4 column. */\
2059 put ## RND ## pixels16_l2(halfH, halfH, full+1, 16, 16, 24, 17);\
2060 put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16);\
2061 OPNAME ## pixels16_l2(dst, halfH, halfHV, stride, 16, 16, 16);\
2062 }\
1064 | 2063 void ff_ ## OPNAME ## qpel16_mc13_old_c(uint8_t *dst, uint8_t *src, int stride){\
2064 uint8_t full[24*17];\
2065 uint8_t halfH[272];\
2066 uint8_t halfV[256];\
2067 uint8_t halfHV[256];\
651 | 2068 copy_block17(full, src, 24, stride, 17);\
2069 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17);\
954 | 2070 put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full, 16, 24);\
2071 put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16);\
651 | 2072 OPNAME ## pixels16_l4(dst, full+24, halfH+16, halfV, halfHV, stride, 24, 16, 16, 16, 16);\
255 | 2073 }\
1064 | 2074 static void OPNAME ## qpel16_mc13_c(uint8_t *dst, uint8_t *src, int stride){\
2075 uint8_t full[24*17];\
2076 uint8_t halfH[272];\
2077 uint8_t halfHV[256];\
984 | 2078 copy_block17(full, src, 24, stride, 17);\
2079 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17);\
2080 put ## RND ## pixels16_l2(halfH, halfH, full, 16, 16, 24, 17);\
2081 put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16);\
/* halfH+16: use the filtered row below for the y=3/4 offset. */\
2082 OPNAME ## pixels16_l2(dst, halfH+16, halfHV, stride, 16, 16, 16);\
2083 }\
1064 | 2084 void ff_ ## OPNAME ## qpel16_mc33_old_c(uint8_t *dst, uint8_t *src, int stride){\
2085 uint8_t full[24*17];\
2086 uint8_t halfH[272];\
2087 uint8_t halfV[256];\
2088 uint8_t halfHV[256];\
651 | 2089 copy_block17(full, src, 24, stride, 17);\
2090 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full , 16, 24, 17);\
954 | 2091 put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full+1, 16, 24);\
2092 put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16);\
651 | 2093 OPNAME ## pixels16_l4(dst, full+25, halfH+16, halfV, halfHV, stride, 24, 16, 16, 16, 16);\
2094 }\
1064 | 2095 static void OPNAME ## qpel16_mc33_c(uint8_t *dst, uint8_t *src, int stride){\
2096 uint8_t full[24*17];\
2097 uint8_t halfH[272];\
2098 uint8_t halfHV[256];\
984 | 2099 copy_block17(full, src, 24, stride, 17);\
2100 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17);\
2101 put ## RND ## pixels16_l2(halfH, halfH, full+1, 16, 16, 24, 17);\
2102 put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16);\
2103 OPNAME ## pixels16_l2(dst, halfH+16, halfHV, stride, 16, 16, 16);\
2104 }\
/* mc21/mc23: horizontal half-pel, vertical quarter offsets. */\
1064 | 2105 static void OPNAME ## qpel16_mc21_c(uint8_t *dst, uint8_t *src, int stride){\
2106 uint8_t halfH[272];\
2107 uint8_t halfHV[256];\
651 | 2108 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, src, 16, stride, 17);\
954 | 2109 put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16);\
651 | 2110 OPNAME ## pixels16_l2(dst, halfH, halfHV, stride, 16, 16, 16);\
255 | 2111 }\
1064 | 2112 static void OPNAME ## qpel16_mc23_c(uint8_t *dst, uint8_t *src, int stride){\
2113 uint8_t halfH[272];\
2114 uint8_t halfHV[256];\
651 | 2115 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, src, 16, stride, 17);\
954 | 2116 put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16);\
651 | 2117 OPNAME ## pixels16_l2(dst, halfH+16, halfHV, stride, 16, 16, 16);\
2118 }\
/* mc12/mc32: vertical half-pel, horizontal quarter offsets. */\
1064 | 2119 void ff_ ## OPNAME ## qpel16_mc12_old_c(uint8_t *dst, uint8_t *src, int stride){\
2120 uint8_t full[24*17];\
2121 uint8_t halfH[272];\
2122 uint8_t halfV[256];\
2123 uint8_t halfHV[256];\
651 | 2124 copy_block17(full, src, 24, stride, 17);\
2125 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17);\
954 | 2126 put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full, 16, 24);\
2127 put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16);\
651 | 2128 OPNAME ## pixels16_l2(dst, halfV, halfHV, stride, 16, 16, 16);\
255 | 2129 }\
1064 | 2130 static void OPNAME ## qpel16_mc12_c(uint8_t *dst, uint8_t *src, int stride){\
2131 uint8_t full[24*17];\
2132 uint8_t halfH[272];\
984 | 2133 copy_block17(full, src, 24, stride, 17);\
2134 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17);\
2135 put ## RND ## pixels16_l2(halfH, halfH, full, 16, 16, 24, 17);\
2136 OPNAME ## mpeg4_qpel16_v_lowpass(dst, halfH, stride, 16);\
2137 }\
1064 | 2138 void ff_ ## OPNAME ## qpel16_mc32_old_c(uint8_t *dst, uint8_t *src, int stride){\
2139 uint8_t full[24*17];\
2140 uint8_t halfH[272];\
2141 uint8_t halfV[256];\
2142 uint8_t halfHV[256];\
651 | 2143 copy_block17(full, src, 24, stride, 17);\
2144 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17);\
954 | 2145 put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full+1, 16, 24);\
2146 put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16);\
651 | 2147 OPNAME ## pixels16_l2(dst, halfV, halfHV, stride, 16, 16, 16);\
2148 }\
1064 | 2149 static void OPNAME ## qpel16_mc32_c(uint8_t *dst, uint8_t *src, int stride){\
2150 uint8_t full[24*17];\
2151 uint8_t halfH[272];\
984 | 2152 copy_block17(full, src, 24, stride, 17);\
2153 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17);\
2154 put ## RND ## pixels16_l2(halfH, halfH, full+1, 16, 16, 24, 17);\
2155 OPNAME ## mpeg4_qpel16_v_lowpass(dst, halfH, stride, 16);\
2156 }\
/* mc22: centre half-pel position; last function of the QPEL_MC macro body. */\
1064 | 2157 static void OPNAME ## qpel16_mc22_c(uint8_t *dst, uint8_t *src, int stride){\
2158 uint8_t halfH[272];\
651 | 2159 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, src, 16, stride, 17);\
954 | 2160 OPNAME ## mpeg4_qpel16_v_lowpass(dst, halfH, stride, 16);\
859 | 2161 }
255 | 2162 |
/* Store kernels plugged into QPEL_MC() as its OP parameter: 'b' is the
 * raw filter accumulator, cm[] clips to 0..255 after the +16 (rounding)
 * or +15 (no-round) bias and the >>5 normalisation (tap sum is 32); the
 * avg variants additionally average with the value already in dst. */
651 | 2163 #define op_avg(a, b) a = (((a)+cm[((b) + 16)>>5]+1)>>1)
2164 #define op_avg_no_rnd(a, b) a = (((a)+cm[((b) + 15)>>5])>>1)
2165 #define op_put(a, b) a = cm[((b) + 16)>>5]
2166 #define op_put_no_rnd(a, b) a = cm[((b) + 15)>>5]
2167
/* Instantiate the whole qpel function family three times:
 * put_*, put_no_rnd_* and avg_* variants. */
2168 QPEL_MC(0, put_ , _ , op_put)
2169 QPEL_MC(1, put_no_rnd_, _no_rnd_, op_put_no_rnd)
2170 QPEL_MC(0, avg_ , _ , op_avg)
/* NOTE(review): the avg_no_rnd expansion is deliberately left disabled
 * upstream -- confirm before re-enabling. */
2171 //QPEL_MC(1, avg_no_rnd , _ , op_avg)
/* Undefine the store kernels so later macro blocks can redefine OP(). */
2172 #undef op_avg
2173 #undef op_avg_no_rnd
2174 #undef op_put
2175 #undef op_put_no_rnd
255 | 2176
1168 | 2177 #if 1 |
2178 #define H264_LOWPASS(OPNAME, OP, OP2) \ | |
5151 | 2179 static av_unused void OPNAME ## h264_qpel2_h_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride){\ |
3020
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2180 const int h=2;\ |
4176 | 2181 uint8_t *cm = ff_cropTbl + MAX_NEG_CROP;\ |
3020
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2182 int i;\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2183 for(i=0; i<h; i++)\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2184 {\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2185 OP(dst[0], (src[0]+src[1])*20 - (src[-1]+src[2])*5 + (src[-2]+src[3]));\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2186 OP(dst[1], (src[1]+src[2])*20 - (src[0 ]+src[3])*5 + (src[-1]+src[4]));\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2187 dst+=dstStride;\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2188 src+=srcStride;\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2189 }\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2190 }\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2191 \ |
5151 | 2192 static av_unused void OPNAME ## h264_qpel2_v_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride){\ |
3020
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2193 const int w=2;\ |
4176 | 2194 uint8_t *cm = ff_cropTbl + MAX_NEG_CROP;\ |
3020
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2195 int i;\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2196 for(i=0; i<w; i++)\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2197 {\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2198 const int srcB= src[-2*srcStride];\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2199 const int srcA= src[-1*srcStride];\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2200 const int src0= src[0 *srcStride];\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2201 const int src1= src[1 *srcStride];\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2202 const int src2= src[2 *srcStride];\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2203 const int src3= src[3 *srcStride];\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2204 const int src4= src[4 *srcStride];\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2205 OP(dst[0*dstStride], (src0+src1)*20 - (srcA+src2)*5 + (srcB+src3));\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2206 OP(dst[1*dstStride], (src1+src2)*20 - (src0+src3)*5 + (srcA+src4));\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2207 dst++;\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2208 src++;\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2209 }\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2210 }\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2211 \ |
5151 | 2212 static av_unused void OPNAME ## h264_qpel2_hv_lowpass(uint8_t *dst, int16_t *tmp, uint8_t *src, int dstStride, int tmpStride, int srcStride){\ |
3020
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2213 const int h=2;\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2214 const int w=2;\ |
4176 | 2215 uint8_t *cm = ff_cropTbl + MAX_NEG_CROP;\ |
3020
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2216 int i;\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2217 src -= 2*srcStride;\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2218 for(i=0; i<h+5; i++)\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2219 {\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2220 tmp[0]= (src[0]+src[1])*20 - (src[-1]+src[2])*5 + (src[-2]+src[3]);\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2221 tmp[1]= (src[1]+src[2])*20 - (src[0 ]+src[3])*5 + (src[-1]+src[4]);\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2222 tmp+=tmpStride;\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2223 src+=srcStride;\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2224 }\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2225 tmp -= tmpStride*(h+5-2);\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2226 for(i=0; i<w; i++)\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2227 {\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2228 const int tmpB= tmp[-2*tmpStride];\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2229 const int tmpA= tmp[-1*tmpStride];\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2230 const int tmp0= tmp[0 *tmpStride];\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2231 const int tmp1= tmp[1 *tmpStride];\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2232 const int tmp2= tmp[2 *tmpStride];\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2233 const int tmp3= tmp[3 *tmpStride];\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2234 const int tmp4= tmp[4 *tmpStride];\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2235 OP2(dst[0*dstStride], (tmp0+tmp1)*20 - (tmpA+tmp2)*5 + (tmpB+tmp3));\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2236 OP2(dst[1*dstStride], (tmp1+tmp2)*20 - (tmp0+tmp3)*5 + (tmpA+tmp4));\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2237 dst++;\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2238 tmp++;\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2239 }\ |
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2240 }\ |
1168 | 2241 static void OPNAME ## h264_qpel4_h_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride){\ |
2242 const int h=4;\ | |
4176 | 2243 uint8_t *cm = ff_cropTbl + MAX_NEG_CROP;\ |
1168 | 2244 int i;\ |
2245 for(i=0; i<h; i++)\ | |
2246 {\ | |
2247 OP(dst[0], (src[0]+src[1])*20 - (src[-1]+src[2])*5 + (src[-2]+src[3]));\ | |
2248 OP(dst[1], (src[1]+src[2])*20 - (src[0 ]+src[3])*5 + (src[-1]+src[4]));\ | |
2249 OP(dst[2], (src[2]+src[3])*20 - (src[1 ]+src[4])*5 + (src[0 ]+src[5]));\ | |
2250 OP(dst[3], (src[3]+src[4])*20 - (src[2 ]+src[5])*5 + (src[1 ]+src[6]));\ | |
2251 dst+=dstStride;\ | |
2252 src+=srcStride;\ | |
2253 }\ | |
2254 }\ | |
2255 \ | |
2256 static void OPNAME ## h264_qpel4_v_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride){\ | |
2257 const int w=4;\ | |
4176 | 2258 uint8_t *cm = ff_cropTbl + MAX_NEG_CROP;\ |
1168 | 2259 int i;\ |
2260 for(i=0; i<w; i++)\ | |
2261 {\ | |
2262 const int srcB= src[-2*srcStride];\ | |
2263 const int srcA= src[-1*srcStride];\ | |
2264 const int src0= src[0 *srcStride];\ | |
2265 const int src1= src[1 *srcStride];\ | |
2266 const int src2= src[2 *srcStride];\ | |
2267 const int src3= src[3 *srcStride];\ | |
2268 const int src4= src[4 *srcStride];\ | |
2269 const int src5= src[5 *srcStride];\ | |
2270 const int src6= src[6 *srcStride];\ | |
2271 OP(dst[0*dstStride], (src0+src1)*20 - (srcA+src2)*5 + (srcB+src3));\ | |
2272 OP(dst[1*dstStride], (src1+src2)*20 - (src0+src3)*5 + (srcA+src4));\ | |
2273 OP(dst[2*dstStride], (src2+src3)*20 - (src1+src4)*5 + (src0+src5));\ | |
2274 OP(dst[3*dstStride], (src3+src4)*20 - (src2+src5)*5 + (src1+src6));\ | |
2275 dst++;\ | |
2276 src++;\ | |
2277 }\ | |
2278 }\ | |
2279 \ | |
2280 static void OPNAME ## h264_qpel4_hv_lowpass(uint8_t *dst, int16_t *tmp, uint8_t *src, int dstStride, int tmpStride, int srcStride){\ | |
2281 const int h=4;\ | |
2282 const int w=4;\ | |
4176 | 2283 uint8_t *cm = ff_cropTbl + MAX_NEG_CROP;\ |
1168 | 2284 int i;\ |
2285 src -= 2*srcStride;\ | |
2286 for(i=0; i<h+5; i++)\ | |
2287 {\ | |
2288 tmp[0]= (src[0]+src[1])*20 - (src[-1]+src[2])*5 + (src[-2]+src[3]);\ | |
2289 tmp[1]= (src[1]+src[2])*20 - (src[0 ]+src[3])*5 + (src[-1]+src[4]);\ | |
2290 tmp[2]= (src[2]+src[3])*20 - (src[1 ]+src[4])*5 + (src[0 ]+src[5]);\ | |
2291 tmp[3]= (src[3]+src[4])*20 - (src[2 ]+src[5])*5 + (src[1 ]+src[6]);\ | |
2292 tmp+=tmpStride;\ | |
2293 src+=srcStride;\ | |
2294 }\ | |
2295 tmp -= tmpStride*(h+5-2);\ | |
2296 for(i=0; i<w; i++)\ | |
2297 {\ | |
2298 const int tmpB= tmp[-2*tmpStride];\ | |
2299 const int tmpA= tmp[-1*tmpStride];\ | |
2300 const int tmp0= tmp[0 *tmpStride];\ | |
2301 const int tmp1= tmp[1 *tmpStride];\ | |
2302 const int tmp2= tmp[2 *tmpStride];\ | |
2303 const int tmp3= tmp[3 *tmpStride];\ | |
2304 const int tmp4= tmp[4 *tmpStride];\ | |
2305 const int tmp5= tmp[5 *tmpStride];\ | |
2306 const int tmp6= tmp[6 *tmpStride];\ | |
2307 OP2(dst[0*dstStride], (tmp0+tmp1)*20 - (tmpA+tmp2)*5 + (tmpB+tmp3));\ | |
2308 OP2(dst[1*dstStride], (tmp1+tmp2)*20 - (tmp0+tmp3)*5 + (tmpA+tmp4));\ | |
2309 OP2(dst[2*dstStride], (tmp2+tmp3)*20 - (tmp1+tmp4)*5 + (tmp0+tmp5));\ | |
2310 OP2(dst[3*dstStride], (tmp3+tmp4)*20 - (tmp2+tmp5)*5 + (tmp1+tmp6));\ | |
2311 dst++;\ | |
2312 tmp++;\ | |
2313 }\ | |
2314 }\ | |
2315 \ | |
2316 static void OPNAME ## h264_qpel8_h_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride){\ | |
2317 const int h=8;\ | |
4176 | 2318 uint8_t *cm = ff_cropTbl + MAX_NEG_CROP;\ |
1168 | 2319 int i;\ |
2320 for(i=0; i<h; i++)\ | |
2321 {\ | |
2322 OP(dst[0], (src[0]+src[1])*20 - (src[-1]+src[2])*5 + (src[-2]+src[3 ]));\ | |
2323 OP(dst[1], (src[1]+src[2])*20 - (src[0 ]+src[3])*5 + (src[-1]+src[4 ]));\ | |
2324 OP(dst[2], (src[2]+src[3])*20 - (src[1 ]+src[4])*5 + (src[0 ]+src[5 ]));\ | |
2325 OP(dst[3], (src[3]+src[4])*20 - (src[2 ]+src[5])*5 + (src[1 ]+src[6 ]));\ | |
2326 OP(dst[4], (src[4]+src[5])*20 - (src[3 ]+src[6])*5 + (src[2 ]+src[7 ]));\ | |
2327 OP(dst[5], (src[5]+src[6])*20 - (src[4 ]+src[7])*5 + (src[3 ]+src[8 ]));\ | |
2328 OP(dst[6], (src[6]+src[7])*20 - (src[5 ]+src[8])*5 + (src[4 ]+src[9 ]));\ | |
2329 OP(dst[7], (src[7]+src[8])*20 - (src[6 ]+src[9])*5 + (src[5 ]+src[10]));\ | |
2330 dst+=dstStride;\ | |
2331 src+=srcStride;\ | |
2332 }\ | |
2333 }\ | |
2334 \ | |
2335 static void OPNAME ## h264_qpel8_v_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride){\ | |
2336 const int w=8;\ | |
4176 | 2337 uint8_t *cm = ff_cropTbl + MAX_NEG_CROP;\ |
1168 | 2338 int i;\ |
2339 for(i=0; i<w; i++)\ | |
2340 {\ | |
2341 const int srcB= src[-2*srcStride];\ | |
2342 const int srcA= src[-1*srcStride];\ | |
2343 const int src0= src[0 *srcStride];\ | |
2344 const int src1= src[1 *srcStride];\ | |
2345 const int src2= src[2 *srcStride];\ | |
2346 const int src3= src[3 *srcStride];\ | |
2347 const int src4= src[4 *srcStride];\ | |
2348 const int src5= src[5 *srcStride];\ | |
2349 const int src6= src[6 *srcStride];\ | |
2350 const int src7= src[7 *srcStride];\ | |
2351 const int src8= src[8 *srcStride];\ | |
2352 const int src9= src[9 *srcStride];\ | |
2353 const int src10=src[10*srcStride];\ | |
2354 OP(dst[0*dstStride], (src0+src1)*20 - (srcA+src2)*5 + (srcB+src3));\ | |
2355 OP(dst[1*dstStride], (src1+src2)*20 - (src0+src3)*5 + (srcA+src4));\ | |
2356 OP(dst[2*dstStride], (src2+src3)*20 - (src1+src4)*5 + (src0+src5));\ | |
2357 OP(dst[3*dstStride], (src3+src4)*20 - (src2+src5)*5 + (src1+src6));\ | |
2358 OP(dst[4*dstStride], (src4+src5)*20 - (src3+src6)*5 + (src2+src7));\ | |
2359 OP(dst[5*dstStride], (src5+src6)*20 - (src4+src7)*5 + (src3+src8));\ | |
2360 OP(dst[6*dstStride], (src6+src7)*20 - (src5+src8)*5 + (src4+src9));\ | |
2361 OP(dst[7*dstStride], (src7+src8)*20 - (src6+src9)*5 + (src5+src10));\ | |
2362 dst++;\ | |
2363 src++;\ | |
2364 }\ | |
2365 }\ | |
2366 \ | |
2367 static void OPNAME ## h264_qpel8_hv_lowpass(uint8_t *dst, int16_t *tmp, uint8_t *src, int dstStride, int tmpStride, int srcStride){\ | |
2368 const int h=8;\ | |
2369 const int w=8;\ | |
4176 | 2370 uint8_t *cm = ff_cropTbl + MAX_NEG_CROP;\ |
1168 | 2371 int i;\ |
2372 src -= 2*srcStride;\ | |
2373 for(i=0; i<h+5; i++)\ | |
2374 {\ | |
2375 tmp[0]= (src[0]+src[1])*20 - (src[-1]+src[2])*5 + (src[-2]+src[3 ]);\ | |
2376 tmp[1]= (src[1]+src[2])*20 - (src[0 ]+src[3])*5 + (src[-1]+src[4 ]);\ | |
2377 tmp[2]= (src[2]+src[3])*20 - (src[1 ]+src[4])*5 + (src[0 ]+src[5 ]);\ | |
2378 tmp[3]= (src[3]+src[4])*20 - (src[2 ]+src[5])*5 + (src[1 ]+src[6 ]);\ | |
2379 tmp[4]= (src[4]+src[5])*20 - (src[3 ]+src[6])*5 + (src[2 ]+src[7 ]);\ | |
2380 tmp[5]= (src[5]+src[6])*20 - (src[4 ]+src[7])*5 + (src[3 ]+src[8 ]);\ | |
2381 tmp[6]= (src[6]+src[7])*20 - (src[5 ]+src[8])*5 + (src[4 ]+src[9 ]);\ | |
2382 tmp[7]= (src[7]+src[8])*20 - (src[6 ]+src[9])*5 + (src[5 ]+src[10]);\ | |
2383 tmp+=tmpStride;\ | |
2384 src+=srcStride;\ | |
2385 }\ | |
2386 tmp -= tmpStride*(h+5-2);\ | |
2387 for(i=0; i<w; i++)\ | |
2388 {\ | |
2389 const int tmpB= tmp[-2*tmpStride];\ | |
2390 const int tmpA= tmp[-1*tmpStride];\ | |
2391 const int tmp0= tmp[0 *tmpStride];\ | |
2392 const int tmp1= tmp[1 *tmpStride];\ | |
2393 const int tmp2= tmp[2 *tmpStride];\ | |
2394 const int tmp3= tmp[3 *tmpStride];\ | |
2395 const int tmp4= tmp[4 *tmpStride];\ | |
2396 const int tmp5= tmp[5 *tmpStride];\ | |
2397 const int tmp6= tmp[6 *tmpStride];\ | |
2398 const int tmp7= tmp[7 *tmpStride];\ | |
2399 const int tmp8= tmp[8 *tmpStride];\ | |
2400 const int tmp9= tmp[9 *tmpStride];\ | |
2401 const int tmp10=tmp[10*tmpStride];\ | |
2402 OP2(dst[0*dstStride], (tmp0+tmp1)*20 - (tmpA+tmp2)*5 + (tmpB+tmp3));\ | |
2403 OP2(dst[1*dstStride], (tmp1+tmp2)*20 - (tmp0+tmp3)*5 + (tmpA+tmp4));\ | |
2404 OP2(dst[2*dstStride], (tmp2+tmp3)*20 - (tmp1+tmp4)*5 + (tmp0+tmp5));\ | |
2405 OP2(dst[3*dstStride], (tmp3+tmp4)*20 - (tmp2+tmp5)*5 + (tmp1+tmp6));\ | |
2406 OP2(dst[4*dstStride], (tmp4+tmp5)*20 - (tmp3+tmp6)*5 + (tmp2+tmp7));\ | |
2407 OP2(dst[5*dstStride], (tmp5+tmp6)*20 - (tmp4+tmp7)*5 + (tmp3+tmp8));\ | |
2408 OP2(dst[6*dstStride], (tmp6+tmp7)*20 - (tmp5+tmp8)*5 + (tmp4+tmp9));\ | |
2409 OP2(dst[7*dstStride], (tmp7+tmp8)*20 - (tmp6+tmp9)*5 + (tmp5+tmp10));\ | |
2410 dst++;\ | |
2411 tmp++;\ | |
2412 }\ | |
2413 }\ | |
2414 \ | |
2415 static void OPNAME ## h264_qpel16_v_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride){\ | |
2416 OPNAME ## h264_qpel8_v_lowpass(dst , src , dstStride, srcStride);\ | |
2417 OPNAME ## h264_qpel8_v_lowpass(dst+8, src+8, dstStride, srcStride);\ | |
2418 src += 8*srcStride;\ | |
2419 dst += 8*dstStride;\ | |
2420 OPNAME ## h264_qpel8_v_lowpass(dst , src , dstStride, srcStride);\ | |
2421 OPNAME ## h264_qpel8_v_lowpass(dst+8, src+8, dstStride, srcStride);\ | |
2422 }\ | |
2423 \ | |
2424 static void OPNAME ## h264_qpel16_h_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride){\ | |
2425 OPNAME ## h264_qpel8_h_lowpass(dst , src , dstStride, srcStride);\ | |
2426 OPNAME ## h264_qpel8_h_lowpass(dst+8, src+8, dstStride, srcStride);\ | |
2427 src += 8*srcStride;\ | |
2428 dst += 8*dstStride;\ | |
2429 OPNAME ## h264_qpel8_h_lowpass(dst , src , dstStride, srcStride);\ | |
2430 OPNAME ## h264_qpel8_h_lowpass(dst+8, src+8, dstStride, srcStride);\ | |
2431 }\ | |
2432 \ | |
2433 static void OPNAME ## h264_qpel16_hv_lowpass(uint8_t *dst, int16_t *tmp, uint8_t *src, int dstStride, int tmpStride, int srcStride){\ | |
2434 OPNAME ## h264_qpel8_hv_lowpass(dst , tmp , src , dstStride, tmpStride, srcStride);\ | |
2435 OPNAME ## h264_qpel8_hv_lowpass(dst+8, tmp+8, src+8, dstStride, tmpStride, srcStride);\ | |
2436 src += 8*srcStride;\ | |
2437 dst += 8*dstStride;\ | |
2438 OPNAME ## h264_qpel8_hv_lowpass(dst , tmp , src , dstStride, tmpStride, srcStride);\ | |
2439 OPNAME ## h264_qpel8_hv_lowpass(dst+8, tmp+8, src+8, dstStride, tmpStride, srcStride);\ | |
2440 }\ | |
2441 | |
/**
 * H264_MC(OPNAME, SIZE): instantiates the 16 quarter-pel motion-compensation
 * functions (_mcXY_c, X/Y in {0..3} = horizontal/vertical quarter-pel phase)
 * for one block size, built from the _h/_v/_hv 6-tap lowpass primitives and
 * pixel-averaging helpers. Restored from hg-annotate residue; tokens are
 * byte-identical to the original macro.
 */
#define H264_MC(OPNAME, SIZE) \
static void OPNAME ## h264_qpel ## SIZE ## _mc00_c (uint8_t *dst, uint8_t *src, int stride){\
    OPNAME ## pixels ## SIZE ## _c(dst, src, stride, SIZE);\
}\
\
static void OPNAME ## h264_qpel ## SIZE ## _mc10_c(uint8_t *dst, uint8_t *src, int stride){\
    uint8_t half[SIZE*SIZE];\
    put_h264_qpel ## SIZE ## _h_lowpass(half, src, SIZE, stride);\
    OPNAME ## pixels ## SIZE ## _l2(dst, src, half, stride, stride, SIZE, SIZE);\
}\
\
static void OPNAME ## h264_qpel ## SIZE ## _mc20_c(uint8_t *dst, uint8_t *src, int stride){\
    OPNAME ## h264_qpel ## SIZE ## _h_lowpass(dst, src, stride, stride);\
}\
\
static void OPNAME ## h264_qpel ## SIZE ## _mc30_c(uint8_t *dst, uint8_t *src, int stride){\
    uint8_t half[SIZE*SIZE];\
    put_h264_qpel ## SIZE ## _h_lowpass(half, src, SIZE, stride);\
    OPNAME ## pixels ## SIZE ## _l2(dst, src+1, half, stride, stride, SIZE, SIZE);\
}\
\
static void OPNAME ## h264_qpel ## SIZE ## _mc01_c(uint8_t *dst, uint8_t *src, int stride){\
    uint8_t full[SIZE*(SIZE+5)];\
    uint8_t * const full_mid= full + SIZE*2;\
    uint8_t half[SIZE*SIZE];\
    copy_block ## SIZE (full, src - stride*2, SIZE,  stride, SIZE + 5);\
    put_h264_qpel ## SIZE ## _v_lowpass(half, full_mid, SIZE, SIZE);\
    OPNAME ## pixels ## SIZE ## _l2(dst, full_mid, half, stride, SIZE, SIZE, SIZE);\
}\
\
static void OPNAME ## h264_qpel ## SIZE ## _mc02_c(uint8_t *dst, uint8_t *src, int stride){\
    uint8_t full[SIZE*(SIZE+5)];\
    uint8_t * const full_mid= full + SIZE*2;\
    copy_block ## SIZE (full, src - stride*2, SIZE,  stride, SIZE + 5);\
    OPNAME ## h264_qpel ## SIZE ## _v_lowpass(dst, full_mid, stride, SIZE);\
}\
\
static void OPNAME ## h264_qpel ## SIZE ## _mc03_c(uint8_t *dst, uint8_t *src, int stride){\
    uint8_t full[SIZE*(SIZE+5)];\
    uint8_t * const full_mid= full + SIZE*2;\
    uint8_t half[SIZE*SIZE];\
    copy_block ## SIZE (full, src - stride*2, SIZE,  stride, SIZE + 5);\
    put_h264_qpel ## SIZE ## _v_lowpass(half, full_mid, SIZE, SIZE);\
    OPNAME ## pixels ## SIZE ## _l2(dst, full_mid+SIZE, half, stride, SIZE, SIZE, SIZE);\
}\
\
static void OPNAME ## h264_qpel ## SIZE ## _mc11_c(uint8_t *dst, uint8_t *src, int stride){\
    uint8_t full[SIZE*(SIZE+5)];\
    uint8_t * const full_mid= full + SIZE*2;\
    uint8_t halfH[SIZE*SIZE];\
    uint8_t halfV[SIZE*SIZE];\
    put_h264_qpel ## SIZE ## _h_lowpass(halfH, src, SIZE, stride);\
    copy_block ## SIZE (full, src - stride*2, SIZE,  stride, SIZE + 5);\
    put_h264_qpel ## SIZE ## _v_lowpass(halfV, full_mid, SIZE, SIZE);\
    OPNAME ## pixels ## SIZE ## _l2(dst, halfH, halfV, stride, SIZE, SIZE, SIZE);\
}\
\
static void OPNAME ## h264_qpel ## SIZE ## _mc31_c(uint8_t *dst, uint8_t *src, int stride){\
    uint8_t full[SIZE*(SIZE+5)];\
    uint8_t * const full_mid= full + SIZE*2;\
    uint8_t halfH[SIZE*SIZE];\
    uint8_t halfV[SIZE*SIZE];\
    put_h264_qpel ## SIZE ## _h_lowpass(halfH, src, SIZE, stride);\
    copy_block ## SIZE (full, src - stride*2 + 1, SIZE,  stride, SIZE + 5);\
    put_h264_qpel ## SIZE ## _v_lowpass(halfV, full_mid, SIZE, SIZE);\
    OPNAME ## pixels ## SIZE ## _l2(dst, halfH, halfV, stride, SIZE, SIZE, SIZE);\
}\
\
static void OPNAME ## h264_qpel ## SIZE ## _mc13_c(uint8_t *dst, uint8_t *src, int stride){\
    uint8_t full[SIZE*(SIZE+5)];\
    uint8_t * const full_mid= full + SIZE*2;\
    uint8_t halfH[SIZE*SIZE];\
    uint8_t halfV[SIZE*SIZE];\
    put_h264_qpel ## SIZE ## _h_lowpass(halfH, src + stride, SIZE, stride);\
    copy_block ## SIZE (full, src - stride*2, SIZE,  stride, SIZE + 5);\
    put_h264_qpel ## SIZE ## _v_lowpass(halfV, full_mid, SIZE, SIZE);\
    OPNAME ## pixels ## SIZE ## _l2(dst, halfH, halfV, stride, SIZE, SIZE, SIZE);\
}\
\
static void OPNAME ## h264_qpel ## SIZE ## _mc33_c(uint8_t *dst, uint8_t *src, int stride){\
    uint8_t full[SIZE*(SIZE+5)];\
    uint8_t * const full_mid= full + SIZE*2;\
    uint8_t halfH[SIZE*SIZE];\
    uint8_t halfV[SIZE*SIZE];\
    put_h264_qpel ## SIZE ## _h_lowpass(halfH, src + stride, SIZE, stride);\
    copy_block ## SIZE (full, src - stride*2 + 1, SIZE,  stride, SIZE + 5);\
    put_h264_qpel ## SIZE ## _v_lowpass(halfV, full_mid, SIZE, SIZE);\
    OPNAME ## pixels ## SIZE ## _l2(dst, halfH, halfV, stride, SIZE, SIZE, SIZE);\
}\
\
static void OPNAME ## h264_qpel ## SIZE ## _mc22_c(uint8_t *dst, uint8_t *src, int stride){\
    int16_t tmp[SIZE*(SIZE+5)];\
    OPNAME ## h264_qpel ## SIZE ## _hv_lowpass(dst, tmp, src, stride, SIZE, stride);\
}\
\
static void OPNAME ## h264_qpel ## SIZE ## _mc21_c(uint8_t *dst, uint8_t *src, int stride){\
    int16_t tmp[SIZE*(SIZE+5)];\
    uint8_t halfH[SIZE*SIZE];\
    uint8_t halfHV[SIZE*SIZE];\
    put_h264_qpel ## SIZE ## _h_lowpass(halfH, src, SIZE, stride);\
    put_h264_qpel ## SIZE ## _hv_lowpass(halfHV, tmp, src, SIZE, SIZE, stride);\
    OPNAME ## pixels ## SIZE ## _l2(dst, halfH, halfHV, stride, SIZE, SIZE, SIZE);\
}\
\
static void OPNAME ## h264_qpel ## SIZE ## _mc23_c(uint8_t *dst, uint8_t *src, int stride){\
    int16_t tmp[SIZE*(SIZE+5)];\
    uint8_t halfH[SIZE*SIZE];\
    uint8_t halfHV[SIZE*SIZE];\
    put_h264_qpel ## SIZE ## _h_lowpass(halfH, src + stride, SIZE, stride);\
    put_h264_qpel ## SIZE ## _hv_lowpass(halfHV, tmp, src, SIZE, SIZE, stride);\
    OPNAME ## pixels ## SIZE ## _l2(dst, halfH, halfHV, stride, SIZE, SIZE, SIZE);\
}\
\
static void OPNAME ## h264_qpel ## SIZE ## _mc12_c(uint8_t *dst, uint8_t *src, int stride){\
    uint8_t full[SIZE*(SIZE+5)];\
    uint8_t * const full_mid= full + SIZE*2;\
    int16_t tmp[SIZE*(SIZE+5)];\
    uint8_t halfV[SIZE*SIZE];\
    uint8_t halfHV[SIZE*SIZE];\
    copy_block ## SIZE (full, src - stride*2, SIZE,  stride, SIZE + 5);\
    put_h264_qpel ## SIZE ## _v_lowpass(halfV, full_mid, SIZE, SIZE);\
    put_h264_qpel ## SIZE ## _hv_lowpass(halfHV, tmp, src, SIZE, SIZE, stride);\
    OPNAME ## pixels ## SIZE ## _l2(dst, halfV, halfHV, stride, SIZE, SIZE, SIZE);\
}\
\
static void OPNAME ## h264_qpel ## SIZE ## _mc32_c(uint8_t *dst, uint8_t *src, int stride){\
    uint8_t full[SIZE*(SIZE+5)];\
    uint8_t * const full_mid= full + SIZE*2;\
    int16_t tmp[SIZE*(SIZE+5)];\
    uint8_t halfV[SIZE*SIZE];\
    uint8_t halfHV[SIZE*SIZE];\
    copy_block ## SIZE (full, src - stride*2 + 1, SIZE,  stride, SIZE + 5);\
    put_h264_qpel ## SIZE ## _v_lowpass(halfV, full_mid, SIZE, SIZE);\
    put_h264_qpel ## SIZE ## _hv_lowpass(halfHV, tmp, src, SIZE, SIZE, stride);\
    OPNAME ## pixels ## SIZE ## _l2(dst, halfV, halfHV, stride, SIZE, SIZE, SIZE);\
}\

2579 #define op_avg(a, b) a = (((a)+cm[((b) + 16)>>5]+1)>>1) | |
2580 //#define op_avg2(a, b) a = (((a)*w1+cm[((b) + 16)>>5]*w2 + o + 64)>>7) | |
2581 #define op_put(a, b) a = cm[((b) + 16)>>5] | |
2582 #define op2_avg(a, b) a = (((a)+cm[((b) + 512)>>10]+1)>>1) | |
2583 #define op2_put(a, b) a = cm[((b) + 512)>>10] | |
2584 | |
2585 H264_LOWPASS(put_ , op_put, op2_put) | |
2586 H264_LOWPASS(avg_ , op_avg, op2_avg) | |
3020
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
2587 H264_MC(put_, 2) |
1168 | 2588 H264_MC(put_, 4) |
2589 H264_MC(put_, 8) | |
2590 H264_MC(put_, 16) | |
2591 H264_MC(avg_, 4) | |
2592 H264_MC(avg_, 8) | |
2593 H264_MC(avg_, 16) | |
2594 | |
2595 #undef op_avg | |
2596 #undef op_put | |
2597 #undef op2_avg | |
2598 #undef op2_put | |
2599 #endif | |
2600 | |
936 | 2601 static void wmv2_mspel8_h_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride, int h){ |
4176 | 2602 uint8_t *cm = ff_cropTbl + MAX_NEG_CROP; |
936 | 2603 int i; |
2604 | |
2605 for(i=0; i<h; i++){ | |
2606 dst[0]= cm[(9*(src[0] + src[1]) - (src[-1] + src[2]) + 8)>>4]; | |
2607 dst[1]= cm[(9*(src[1] + src[2]) - (src[ 0] + src[3]) + 8)>>4]; | |
2608 dst[2]= cm[(9*(src[2] + src[3]) - (src[ 1] + src[4]) + 8)>>4]; | |
2609 dst[3]= cm[(9*(src[3] + src[4]) - (src[ 2] + src[5]) + 8)>>4]; | |
2610 dst[4]= cm[(9*(src[4] + src[5]) - (src[ 3] + src[6]) + 8)>>4]; | |
2611 dst[5]= cm[(9*(src[5] + src[6]) - (src[ 4] + src[7]) + 8)>>4]; | |
2612 dst[6]= cm[(9*(src[6] + src[7]) - (src[ 5] + src[8]) + 8)>>4]; | |
2613 dst[7]= cm[(9*(src[7] + src[8]) - (src[ 6] + src[9]) + 8)>>4]; | |
2614 dst+=dstStride; | |
2967 | 2615 src+=srcStride; |
936 | 2616 } |
2617 } | |
2618 | |
#if CONFIG_CAVS_DECODER
/* AVS specific: full-pel (mc00) copy/average wrappers exported to the
 * CAVS decoder; they simply forward to the generic pixel helpers. */
void ff_put_cavs_qpel8_mc00_c(uint8_t *dst, uint8_t *src, int stride) {
    put_pixels8_c(dst, src, stride, 8);
}
void ff_avg_cavs_qpel8_mc00_c(uint8_t *dst, uint8_t *src, int stride) {
    avg_pixels8_c(dst, src, stride, 8);
}
void ff_put_cavs_qpel16_mc00_c(uint8_t *dst, uint8_t *src, int stride) {
    put_pixels16_c(dst, src, stride, 16);
}
void ff_avg_cavs_qpel16_mc00_c(uint8_t *dst, uint8_t *src, int stride) {
    avg_pixels16_c(dst, src, stride, 16);
}
#endif /* CONFIG_CAVS_DECODER */
3395
adccbf4a1040
CAVS decoder by (Stefan Gehrer stefan.gehrer gmx.de)
michael
parents:
3373
diff
changeset
|
2634 |
9995
3141f69e3905
Do not check for both CONFIG_VC1_DECODER and CONFIG_WMV3_DECODER,
diego
parents:
9975
diff
changeset
|
#if CONFIG_VC1_DECODER
/* VC-1 specific: full-pel (mc00) copy/average wrappers; rnd is unused
 * for the integer-pel case. */
void ff_put_vc1_mspel_mc00_c(uint8_t *dst, const uint8_t *src, int stride, int rnd) {
    put_pixels8_c(dst, src, stride, 8);
}
void ff_avg_vc1_mspel_mc00_c(uint8_t *dst, const uint8_t *src, int stride, int rnd) {
    avg_pixels8_c(dst, src, stride, 8);
}
#endif /* CONFIG_VC1_DECODER */
3526 | 2644 |
#if CONFIG_RV40_DECODER
/* RV40 (3,3) quarter-pel position maps onto the plain xy2 half-pel
 * averaging helpers. */
static void put_rv40_qpel16_mc33_c(uint8_t *dst, uint8_t *src, int stride){
    put_pixels16_xy2_c(dst, src, stride, 16);
}
static void avg_rv40_qpel16_mc33_c(uint8_t *dst, uint8_t *src, int stride){
    avg_pixels16_xy2_c(dst, src, stride, 16);
}
static void put_rv40_qpel8_mc33_c(uint8_t *dst, uint8_t *src, int stride){
    put_pixels8_xy2_c(dst, src, stride, 8);
}
static void avg_rv40_qpel8_mc33_c(uint8_t *dst, uint8_t *src, int stride){
    avg_pixels8_xy2_c(dst, src, stride, 8);
}
#endif /* CONFIG_RV40_DECODER */
2659 | |
936 | 2660 static void wmv2_mspel8_v_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride, int w){ |
4176 | 2661 uint8_t *cm = ff_cropTbl + MAX_NEG_CROP; |
936 | 2662 int i; |
2663 | |
2664 for(i=0; i<w; i++){ | |
2665 const int src_1= src[ -srcStride]; | |
2666 const int src0 = src[0 ]; | |
2667 const int src1 = src[ srcStride]; | |
2668 const int src2 = src[2*srcStride]; | |
2669 const int src3 = src[3*srcStride]; | |
2670 const int src4 = src[4*srcStride]; | |
2671 const int src5 = src[5*srcStride]; | |
2672 const int src6 = src[6*srcStride]; | |
2673 const int src7 = src[7*srcStride]; | |
2674 const int src8 = src[8*srcStride]; | |
2675 const int src9 = src[9*srcStride]; | |
2676 dst[0*dstStride]= cm[(9*(src0 + src1) - (src_1 + src2) + 8)>>4]; | |
2677 dst[1*dstStride]= cm[(9*(src1 + src2) - (src0 + src3) + 8)>>4]; | |
2678 dst[2*dstStride]= cm[(9*(src2 + src3) - (src1 + src4) + 8)>>4]; | |
2679 dst[3*dstStride]= cm[(9*(src3 + src4) - (src2 + src5) + 8)>>4]; | |
2680 dst[4*dstStride]= cm[(9*(src4 + src5) - (src3 + src6) + 8)>>4]; | |
2681 dst[5*dstStride]= cm[(9*(src5 + src6) - (src4 + src7) + 8)>>4]; | |
2682 dst[6*dstStride]= cm[(9*(src6 + src7) - (src5 + src8) + 8)>>4]; | |
2683 dst[7*dstStride]= cm[(9*(src7 + src8) - (src6 + src9) + 8)>>4]; | |
2684 src++; | |
2685 dst++; | |
2686 } | |
2687 } | |
2688 | |
/* WMV2 mspel motion-compensation wrappers: _mcXY_c selects horizontal
 * phase X and vertical phase Y; half-pel planes are built with the
 * wmv2_mspel8 lowpass filters and averaged with put_pixels8_l2. */
static void put_mspel8_mc00_c (uint8_t *dst, uint8_t *src, int stride){
    put_pixels8_c(dst, src, stride, 8);
}

static void put_mspel8_mc10_c(uint8_t *dst, uint8_t *src, int stride){
    uint8_t half[64];
    wmv2_mspel8_h_lowpass(half, src, 8, stride, 8);
    put_pixels8_l2(dst, src, half, stride, stride, 8, 8);
}

static void put_mspel8_mc20_c(uint8_t *dst, uint8_t *src, int stride){
    wmv2_mspel8_h_lowpass(dst, src, stride, stride, 8);
}

static void put_mspel8_mc30_c(uint8_t *dst, uint8_t *src, int stride){
    uint8_t half[64];
    wmv2_mspel8_h_lowpass(half, src, 8, stride, 8);
    put_pixels8_l2(dst, src+1, half, stride, stride, 8, 8);
}

static void put_mspel8_mc02_c(uint8_t *dst, uint8_t *src, int stride){
    wmv2_mspel8_v_lowpass(dst, src, stride, stride, 8);
}

static void put_mspel8_mc12_c(uint8_t *dst, uint8_t *src, int stride){
    uint8_t halfH[88];   /* 8x11: one extra row above + two below for the v filter */
    uint8_t halfV[64];
    uint8_t halfHV[64];
    wmv2_mspel8_h_lowpass(halfH, src-stride, 8, stride, 11);
    wmv2_mspel8_v_lowpass(halfV, src, 8, stride, 8);
    wmv2_mspel8_v_lowpass(halfHV, halfH+8, 8, 8, 8);
    put_pixels8_l2(dst, halfV, halfHV, stride, 8, 8, 8);
}
static void put_mspel8_mc32_c(uint8_t *dst, uint8_t *src, int stride){
    uint8_t halfH[88];
    uint8_t halfV[64];
    uint8_t halfHV[64];
    wmv2_mspel8_h_lowpass(halfH, src-stride, 8, stride, 11);
    wmv2_mspel8_v_lowpass(halfV, src+1, 8, stride, 8);
    wmv2_mspel8_v_lowpass(halfHV, halfH+8, 8, 8, 8);
    put_pixels8_l2(dst, halfV, halfHV, stride, 8, 8, 8);
}
static void put_mspel8_mc22_c(uint8_t *dst, uint8_t *src, int stride){
    uint8_t halfH[88];
    wmv2_mspel8_h_lowpass(halfH, src-stride, 8, stride, 11);
    wmv2_mspel8_v_lowpass(dst, halfH+8, stride, 8, 8);
}
2736 | |
1644 | 2737 static void h263_v_loop_filter_c(uint8_t *src, int stride, int qscale){ |
10749
5cca4b6c459d
Get rid of pointless CONFIG_ANY_H263 preprocessor definition.
diego
parents:
10748
diff
changeset
|
2738 if(CONFIG_H263_DECODER || CONFIG_H263_ENCODER) { |
1644 | 2739 int x; |
2740 const int strength= ff_h263_loop_filter_strength[qscale]; | |
2967 | 2741 |
1644 | 2742 for(x=0; x<8; x++){ |
2743 int d1, d2, ad1; | |
2744 int p0= src[x-2*stride]; | |
2745 int p1= src[x-1*stride]; | |
2746 int p2= src[x+0*stride]; | |
2747 int p3= src[x+1*stride]; | |
2748 int d = (p0 - p3 + 4*(p2 - p1)) / 8; | |
2749 | |
2750 if (d<-2*strength) d1= 0; | |
2751 else if(d<- strength) d1=-2*strength - d; | |
2752 else if(d< strength) d1= d; | |
2753 else if(d< 2*strength) d1= 2*strength - d; | |
2754 else d1= 0; | |
2967 | 2755 |
1644 | 2756 p1 += d1; |
2757 p2 -= d1; | |
2758 if(p1&256) p1= ~(p1>>31); | |
2759 if(p2&256) p2= ~(p2>>31); | |
2967 | 2760 |
1644 | 2761 src[x-1*stride] = p1; |
2762 src[x+0*stride] = p2; | |
2763 | |
4001 | 2764 ad1= FFABS(d1)>>1; |
2967 | 2765 |
4594 | 2766 d2= av_clip((p0-p3)/4, -ad1, ad1); |
2967 | 2767 |
1644 | 2768 src[x-2*stride] = p0 - d2; |
2769 src[x+ stride] = p3 + d2; | |
2770 } | |
5394
e9a6215f4e3a
help some gcc version to optimize out those functions
aurel
parents:
5291
diff
changeset
|
2771 } |
1644 | 2772 } |
2773 | |
2774 static void h263_h_loop_filter_c(uint8_t *src, int stride, int qscale){ | |
10749
5cca4b6c459d
Get rid of pointless CONFIG_ANY_H263 preprocessor definition.
diego
parents:
10748
diff
changeset
|
2775 if(CONFIG_H263_DECODER || CONFIG_H263_ENCODER) { |
1644 | 2776 int y; |
2777 const int strength= ff_h263_loop_filter_strength[qscale]; | |
2967 | 2778 |
1644 | 2779 for(y=0; y<8; y++){ |
2780 int d1, d2, ad1; | |
2781 int p0= src[y*stride-2]; | |
2782 int p1= src[y*stride-1]; | |
2783 int p2= src[y*stride+0]; | |
2784 int p3= src[y*stride+1]; | |
2785 int d = (p0 - p3 + 4*(p2 - p1)) / 8; | |
2786 | |
2787 if (d<-2*strength) d1= 0; | |
2788 else if(d<- strength) d1=-2*strength - d; | |
2789 else if(d< strength) d1= d; | |
2790 else if(d< 2*strength) d1= 2*strength - d; | |
2791 else d1= 0; | |
2967 | 2792 |
1644 | 2793 p1 += d1; |
2794 p2 -= d1; | |
2795 if(p1&256) p1= ~(p1>>31); | |
2796 if(p2&256) p2= ~(p2>>31); | |
2967 | 2797 |
1644 | 2798 src[y*stride-1] = p1; |
2799 src[y*stride+0] = p2; | |
2800 | |
4001 | 2801 ad1= FFABS(d1)>>1; |
2967 | 2802 |
4594 | 2803 d2= av_clip((p0-p3)/4, -ad1, ad1); |
2967 | 2804 |
1644 | 2805 src[y*stride-2] = p0 - d2; |
2806 src[y*stride+1] = p3 + d2; | |
2807 } | |
5394
e9a6215f4e3a
help some gcc version to optimize out those functions
aurel
parents:
5291
diff
changeset
|
2808 } |
1644 | 2809 } |
936 | 2810 |
/**
 * H.261 in-loop filter: separable (1,2,1)/4 smoothing of an 8x8 block.
 * First pass builds a vertically filtered intermediate in temp[] (edge
 * rows 0 and 7 are just scaled by 4, i.e. unfiltered), second pass
 * filters horizontally and writes back with rounding (edge columns 0
 * and 7 only undo the x4 scale).
 */
static void h261_loop_filter_c(uint8_t *src, int stride){
    int x,y,xy,yz;
    int temp[64];

    /* vertical (1,2,1) pass into temp, values scaled by 4 */
    for(x=0; x<8; x++){
        temp[x      ] = 4*src[x           ];
        temp[x + 7*8] = 4*src[x + 7*stride];
    }
    for(y=1; y<7; y++){
        for(x=0; x<8; x++){
            xy = y * stride + x;
            yz = y * 8 + x;
            temp[yz] = src[xy - stride] + 2*src[xy] + src[xy + stride];
        }
    }

    /* horizontal (1,2,1) pass with rounding, written back in place */
    for(y=0; y<8; y++){
        src[  y*stride] = (temp[  y*8] + 2)>>2;
        src[7+y*stride] = (temp[7+y*8] + 2)>>2;
        for(x=1; x<7; x++){
            xy = y * stride + x;
            yz = y * 8 + x;
            src[xy] = (temp[yz-1] + 2*temp[yz] + temp[yz+1] + 8)>>4;
        }
    }
}
/**
 * Sum of absolute differences over a 16-wide block, h rows.
 * v is an unused context pointer kept for the me_cmp function-pointer
 * signature. Returns the SAD (fits in int for h <= 16: max 16*16*255).
 */
static inline int pix_abs16_c(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
{
    int s, i;

    s = 0;
    for(i=0;i<h;i++) {
        s += abs(pix1[0] - pix2[0]);
        s += abs(pix1[1] - pix2[1]);
        s += abs(pix1[2] - pix2[2]);
        s += abs(pix1[3] - pix2[3]);
        s += abs(pix1[4] - pix2[4]);
        s += abs(pix1[5] - pix2[5]);
        s += abs(pix1[6] - pix2[6]);
        s += abs(pix1[7] - pix2[7]);
        s += abs(pix1[8] - pix2[8]);
        s += abs(pix1[9] - pix2[9]);
        s += abs(pix1[10] - pix2[10]);
        s += abs(pix1[11] - pix2[11]);
        s += abs(pix1[12] - pix2[12]);
        s += abs(pix1[13] - pix2[13]);
        s += abs(pix1[14] - pix2[14]);
        s += abs(pix1[15] - pix2[15]);
        pix1 += line_size;
        pix2 += line_size;
    }
    return s;
}
2864 } | |
2865 | |
/**
 * SAD against the horizontal half-pel interpolation of pix2
 * (avg2 of each pixel and its right neighbour); reads pix2[0..16]
 * per row. Signature matches the me_cmp function-pointer type.
 */
static int pix_abs16_x2_c(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
{
    int s, i;

    s = 0;
    for(i=0;i<h;i++) {
        s += abs(pix1[0] - avg2(pix2[0], pix2[1]));
        s += abs(pix1[1] - avg2(pix2[1], pix2[2]));
        s += abs(pix1[2] - avg2(pix2[2], pix2[3]));
        s += abs(pix1[3] - avg2(pix2[3], pix2[4]));
        s += abs(pix1[4] - avg2(pix2[4], pix2[5]));
        s += abs(pix1[5] - avg2(pix2[5], pix2[6]));
        s += abs(pix1[6] - avg2(pix2[6], pix2[7]));
        s += abs(pix1[7] - avg2(pix2[7], pix2[8]));
        s += abs(pix1[8] - avg2(pix2[8], pix2[9]));
        s += abs(pix1[9] - avg2(pix2[9], pix2[10]));
        s += abs(pix1[10] - avg2(pix2[10], pix2[11]));
        s += abs(pix1[11] - avg2(pix2[11], pix2[12]));
        s += abs(pix1[12] - avg2(pix2[12], pix2[13]));
        s += abs(pix1[13] - avg2(pix2[13], pix2[14]));
        s += abs(pix1[14] - avg2(pix2[14], pix2[15]));
        s += abs(pix1[15] - avg2(pix2[15], pix2[16]));
        pix1 += line_size;
        pix2 += line_size;
    }
    return s;
}
2893 | |
/**
 * SAD of a 16-wide block against a vertically half-pel interpolated
 * reference (average of each pixel and the pixel one row below).
 */
static int pix_abs16_y2_c(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
{
    uint8_t *below = pix2 + line_size;  /* next reference row */
    int sum = 0;
    int row, col;

    for (row = 0; row < h; row++) {
        for (col = 0; col < 16; col++)
            sum += abs(pix1[col] - avg2(pix2[col], below[col]));
        pix1  += line_size;
        pix2  += line_size;
        below += line_size;
    }
    return sum;
}
2923 | |
/**
 * SAD of a 16-wide block against a reference interpolated at the
 * half-pel position in both directions (4-tap average).
 * Note: reads pix2[16] and the row below it.
 */
static int pix_abs16_xy2_c(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
{
    uint8_t *below = pix2 + line_size;  /* next reference row */
    int sum = 0;
    int row, col;

    for (row = 0; row < h; row++) {
        for (col = 0; col < 16; col++)
            sum += abs(pix1[col] - avg4(pix2[col], pix2[col + 1],
                                        below[col], below[col + 1]));
        pix1  += line_size;
        pix2  += line_size;
        below += line_size;
    }
    return sum;
}
2953 | |
/**
 * Sum of absolute differences (SAD) over an 8-pixel-wide block.
 * Same contract as pix_abs16_c but for 8 columns per row.
 */
static inline int pix_abs8_c(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
{
    int sum = 0;
    int row, col;

    for (row = 0; row < h; row++) {
        for (col = 0; col < 8; col++)
            sum += abs(pix1[col] - pix2[col]);
        pix1 += line_size;
        pix2 += line_size;
    }
    return sum;
}
2973 | |
/**
 * SAD of an 8-wide block against a horizontally half-pel interpolated
 * reference. Note: reads pix2[8], i.e. 9 reference pixels per row.
 */
static int pix_abs8_x2_c(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
{
    int sum = 0;
    int row, col;

    for (row = 0; row < h; row++) {
        for (col = 0; col < 8; col++)
            sum += abs(pix1[col] - avg2(pix2[col], pix2[col + 1]));
        pix1 += line_size;
        pix2 += line_size;
    }
    return sum;
}
2993 | |
/**
 * SAD of an 8-wide block against a vertically half-pel interpolated
 * reference (average of each pixel and the pixel one row below).
 */
static int pix_abs8_y2_c(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
{
    uint8_t *below = pix2 + line_size;  /* next reference row */
    int sum = 0;
    int row, col;

    for (row = 0; row < h; row++) {
        for (col = 0; col < 8; col++)
            sum += abs(pix1[col] - avg2(pix2[col], below[col]));
        pix1  += line_size;
        pix2  += line_size;
        below += line_size;
    }
    return sum;
}
3015 | |
/**
 * SAD of an 8-wide block against a reference interpolated at the
 * half-pel position in both directions (4-tap average).
 * Note: reads pix2[8] and the row below it.
 */
static int pix_abs8_xy2_c(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
{
    uint8_t *below = pix2 + line_size;  /* next reference row */
    int sum = 0;
    int row, col;

    for (row = 0; row < h; row++) {
        for (col = 0; col < 8; col++)
            sum += abs(pix1[col] - avg4(pix2[col], pix2[col + 1],
                                        below[col], below[col + 1]));
        pix1  += line_size;
        pix2  += line_size;
        below += line_size;
    }
    return sum;
}
3037 | |
/**
 * Noise-preserving sum-of-squares comparison over a 16-wide block.
 * score1 is the plain SSE; score2 accumulates the difference in local
 * 2x2 gradient structure between the two blocks, so blocks that keep the
 * same "texture"/noise pattern are penalized less.
 * @param v   MpegEncContext* (may be NULL; then a fixed weight of 8 is used)
 * @param s1,s2 blocks to compare, @param stride row stride, @param h rows
 */
static int nsse16_c(void *v, uint8_t *s1, uint8_t *s2, int stride, int h){
    MpegEncContext *c = v;
    int score1=0;
    int score2=0;
    int x,y;

    for(y=0; y<h; y++){
        for(x=0; x<16; x++){
            score1+= (s1[x  ] - s2[x ])*(s1[x ] - s2[x ]);
        }
        if(y+1<h){ /* gradient term needs the next row; skip on the last one */
            for(x=0; x<15; x++){
                /* difference of the 2x2 "diagonal second derivative" of each block */
                score2+= FFABS(  s1[x  ] - s1[x  +stride]
                             - s1[x+1] + s1[x+1+stride])
                        -FFABS(  s2[x  ] - s2[x  +stride]
                             - s2[x+1] + s2[x+1+stride]);
            }
        }
        s1+= stride;
        s2+= stride;
    }

    /* nsse_weight scales how strongly structure mismatch is punished */
    if(c) return score1 + FFABS(score2)*c->avctx->nsse_weight;
    else  return score1 + FFABS(score2)*8;
}
9e4bebc39ade
noise preserving sum of squares comparission function
michael
parents:
2045
diff
changeset
|
3063 |
/**
 * Noise-preserving sum-of-squares comparison over an 8-wide block.
 * Identical algorithm to nsse16_c but for 8 columns (7 gradient pairs).
 * @param v MpegEncContext* (may be NULL; then a fixed weight of 8 is used)
 */
static int nsse8_c(void *v, uint8_t *s1, uint8_t *s2, int stride, int h){
    MpegEncContext *c = v;
    int score1=0;
    int score2=0;
    int x,y;

    for(y=0; y<h; y++){
        for(x=0; x<8; x++){
            score1+= (s1[x  ] - s2[x ])*(s1[x ] - s2[x ]);
        }
        if(y+1<h){ /* gradient term needs the next row; skip on the last one */
            for(x=0; x<7; x++){
                score2+= FFABS(  s1[x  ] - s1[x  +stride]
                             - s1[x+1] + s1[x+1+stride])
                        -FFABS(  s2[x  ] - s2[x  +stride]
                             - s2[x+1] + s2[x+1+stride]);
            }
        }
        s1+= stride;
        s2+= stride;
    }

    if(c) return score1 + FFABS(score2)*c->avctx->nsse_weight;
    else  return score1 + FFABS(score2)*8;
}
9e4bebc39ade
noise preserving sum of squares comparission function
michael
parents:
2045
diff
changeset
|
3089 |
/**
 * Evaluate the weighted squared error of the residual after adding a
 * scaled basis function (used by the trellis/basis refinement in the
 * encoder). Fixed-point: basis values are in BASIS_SHIFT precision,
 * rem in RECON_SHIFT precision.
 * @return weighted sum of squares, scaled down by 4+2 bits
 */
static int try_8x8basis_c(int16_t rem[64], int16_t weight[64], int16_t basis[64], int scale){
    int i;
    unsigned int sum=0;

    for(i=0; i<8*8; i++){
        /* residual plus rounded, rescaled basis contribution */
        int b= rem[i] + ((basis[i]*scale + (1<<(BASIS_SHIFT - RECON_SHIFT-1)))>>(BASIS_SHIFT - RECON_SHIFT));
        int w= weight[i];
        b>>= RECON_SHIFT;
        assert(-512<b && b<512);

        sum += (w*b)*(w*b)>>4;
    }
    return sum>>2;
}
3104 | |
/**
 * Add a scaled basis function to the residual block in place.
 * Uses the same rounding/rescaling as try_8x8basis_c.
 */
static void add_8x8basis_c(int16_t rem[64], int16_t basis[64], int scale){
    int i;

    for(i=0; i<8*8; i++){
        rem[i] += (basis[i]*scale + (1<<(BASIS_SHIFT - RECON_SHIFT-1)))>>(BASIS_SHIFT - RECON_SHIFT);
    }
}
3112 | |
/**
 * Permutes an 8x8 block of DCT coefficients in place.
 * @param block the block which will be permuted according to the given permutation vector
 * @param permutation the permutation vector (maps natural index -> permuted index)
 * @param scantable the used scantable; only used to limit work to the
 *        nonzero coefficients, the block is not (inverse) permutated to scantable order!
 * @param last the last non zero coefficient in scantable order, used to speed the permutation up
 */
void ff_block_permute(DCTELEM *block, uint8_t *permutation, const uint8_t *scantable, int last)
{
    int i;
    DCTELEM temp[64];

    if(last<=0) return;
    //if(permutation[1]==1) return; //FIXME it is ok but not clean and might fail for some permutations

    /* First pass: save the nonzero coefficients and clear their slots,
     * so overlapping source/destination positions cannot clobber data. */
    for(i=0; i<=last; i++){
        const int j= scantable[i];
        temp[j]= block[j];
        block[j]=0;
    }

    /* Second pass: write each saved coefficient to its permuted position. */
    for(i=0; i<=last; i++){
        const int j= scantable[i];
        const int perm_j= permutation[j];
        block[perm_j]= temp[j];
    }
}
34 | 3141 |
/* Dummy comparison function for FF_CMP_ZERO: every candidate scores 0. */
static int zero_cmp(void *s, uint8_t *a, uint8_t *b, int stride, int h){
    return 0;
}
3145 | |
/**
 * Fill an array of 6 comparison-function pointers with the variants of
 * the metric selected by the low byte of 'type' (an FF_CMP_* value).
 * Slot i corresponds to the i-th block-size variant in DSPContext
 * (e.g. sad[0] is 16x16, sad[1] is 8x8, ...).
 */
void ff_set_cmp(DSPContext* c, me_cmp_func *cmp, int type){
    int i;

    memset(cmp, 0, sizeof(void*)*6);

    for(i=0; i<6; i++){
        switch(type&0xFF){ /* only the low byte selects the metric */
        case FF_CMP_SAD:
            cmp[i]= c->sad[i];
            break;
        case FF_CMP_SATD:
            cmp[i]= c->hadamard8_diff[i];
            break;
        case FF_CMP_SSE:
            cmp[i]= c->sse[i];
            break;
        case FF_CMP_DCT:
            cmp[i]= c->dct_sad[i];
            break;
        case FF_CMP_DCT264:
            cmp[i]= c->dct264_sad[i];
            break;
        case FF_CMP_DCTMAX:
            cmp[i]= c->dct_max[i];
            break;
        case FF_CMP_PSNR:
            cmp[i]= c->quant_psnr[i];
            break;
        case FF_CMP_BIT:
            cmp[i]= c->bit[i];
            break;
        case FF_CMP_RD:
            cmp[i]= c->rd[i];
            break;
        case FF_CMP_VSAD:
            cmp[i]= c->vsad[i];
            break;
        case FF_CMP_VSSE:
            cmp[i]= c->vsse[i];
            break;
        case FF_CMP_ZERO:
            cmp[i]= zero_cmp;
            break;
        case FF_CMP_NSSE:
            cmp[i]= c->nsse[i];
            break;
#if CONFIG_DWT
        /* wavelet metrics are only available when DWT support is built */
        case FF_CMP_W53:
            cmp[i]= c->w53[i];
            break;
        case FF_CMP_W97:
            cmp[i]= c->w97[i];
            break;
#endif
        default:
            av_log(NULL, AV_LOG_ERROR,"internal error in cmp function selection\n");
        }
    }
}
3205 | |
/* Zero a single 8x8 block of DCT coefficients. */
static void clear_block_c(DCTELEM *block)
{
    memset(block, 0, sizeof(DCTELEM)*64);
}
3210 | |
/**
 * memset(blocks, 0, sizeof(DCTELEM)*6*64)
 * Zero all six 8x8 blocks of a macroblock (4 luma + 2 chroma).
 */
static void clear_blocks_c(DCTELEM *blocks)
{
    memset(blocks, 0, sizeof(DCTELEM)*6*64);
}
3218 | |
/**
 * dst[i] += src[i] bytewise (modulo 256), for i in [0,w).
 * The main loop adds sizeof(long) bytes at a time using a SWAR trick:
 * low 7 bits of each byte are added carry-free, the top bit is fixed up
 * with XOR so carries never cross byte lanes. Assumes pb_7f / pb_80 are
 * the long-wide 0x7f..7f / 0x80..80 patterns (defined elsewhere in this
 * file). Tail bytes are handled one at a time.
 */
static void add_bytes_c(uint8_t *dst, uint8_t *src, int w){
    long i;
    for(i=0; i<=w-sizeof(long); i+=sizeof(long)){
        long a = *(long*)(src+i);
        long b = *(long*)(dst+i);
        *(long*)(dst+i) = ((a&pb_7f) + (b&pb_7f)) ^ ((a^b)&pb_80);
    }
    for(; i<w; i++)
        dst[i+0] += src[i+0];
}
3229 | |
/**
 * dst[i] = src1[i] + src2[i] bytewise (modulo 256), for i in [0,w).
 * Same carry-free SWAR addition as add_bytes_c, but writing to a third
 * buffer instead of accumulating in place.
 */
static void add_bytes_l2_c(uint8_t *dst, uint8_t *src1, uint8_t *src2, int w){
    long i;
    for(i=0; i<=w-sizeof(long); i+=sizeof(long)){
        long a = *(long*)(src1+i);
        long b = *(long*)(src2+i);
        *(long*)(dst+i) = ((a&pb_7f) + (b&pb_7f)) ^ ((a^b)&pb_80);
    }
    for(; i<w; i++)
        dst[i] = src1[i]+src2[i];
}
3240 | |
/**
 * dst[i] = src1[i] - src2[i] bytewise (modulo 256), for i in [0,w).
 * Uses a SWAR subtraction over sizeof(long) bytes at a time (borrow kept
 * inside each byte lane via the 0x80 mask fix-up). On targets without
 * fast unaligned loads, a plain unrolled byte loop is used instead when
 * src2 is misaligned.
 */
static void diff_bytes_c(uint8_t *dst, uint8_t *src1, uint8_t *src2, int w){
    long i;
#if !HAVE_FAST_UNALIGNED
    if((long)src2 & (sizeof(long)-1)){
        for(i=0; i+7<w; i+=8){
            dst[i+0] = src1[i+0]-src2[i+0];
            dst[i+1] = src1[i+1]-src2[i+1];
            dst[i+2] = src1[i+2]-src2[i+2];
            dst[i+3] = src1[i+3]-src2[i+3];
            dst[i+4] = src1[i+4]-src2[i+4];
            dst[i+5] = src1[i+5]-src2[i+5];
            dst[i+6] = src1[i+6]-src2[i+6];
            dst[i+7] = src1[i+7]-src2[i+7];
        }
    }else
#endif
    for(i=0; i<=w-sizeof(long); i+=sizeof(long)){
        long a = *(long*)(src1+i);
        long b = *(long*)(src2+i);
        *(long*)(dst+i) = ((a|pb_80) - (b&pb_7f)) ^ ((a^b^pb_80)&pb_80);
    }
    for(; i<w; i++)
        dst[i+0] = src1[i+0]-src2[i+0];
}
3265 | |
/**
 * HuffYUV median-prediction decoding: reconstruct a row of pixels from
 * the stored differences, using the median of (left, top, left+top-topleft)
 * as the predictor for each pixel.
 * @param dst      output pixels
 * @param src1     the row above (top predictors)
 * @param diff     decoded residuals
 * @param w        number of pixels
 * @param left     in/out: left-neighbour value carried across calls
 * @param left_top in/out: top-left-neighbour value carried across calls
 */
static void add_hfyu_median_prediction_c(uint8_t *dst, const uint8_t *src1, const uint8_t *diff, int w, int *left, int *left_top){
    int i;
    uint8_t cur  = *left;
    uint8_t topl = *left_top;

    for (i = 0; i < w; i++) {
        /* gradient predictor clamped via median, then add the residual */
        cur  = mid_pred(cur, src1[i], (cur + src1[i] - topl) & 0xFF) + diff[i];
        topl = src1[i];
        dst[i] = cur;
    }

    *left     = cur;
    *left_top = topl;
}
3282 | |
/**
 * HuffYUV median-prediction encoding: compute the residual row
 * dst[i] = src2[i] - median(left, top, left+top-topleft).
 * @param dst      output residuals
 * @param src1     the row above (top predictors)
 * @param src2     the row being encoded
 * @param w        number of pixels
 * @param left     in/out: left-neighbour value carried across calls
 * @param left_top in/out: top-left-neighbour value carried across calls
 */
static void sub_hfyu_median_prediction_c(uint8_t *dst, const uint8_t *src1, const uint8_t *src2, int w, int *left, int *left_top){
    int i;
    uint8_t prev = *left;
    uint8_t topl = *left_top;

    for (i = 0; i < w; i++) {
        const int pred = mid_pred(prev, src1[i], (prev + src1[i] - topl) & 0xFF);
        topl = src1[i];
        prev = src2[i];
        dst[i] = prev - pred;
    }

    *left     = prev;
    *left_top = topl;
}
3300 | |
10420
442ab0c41eae
Huffyuv: Add missing const to src pointers in dsputil functions.
astrange
parents:
10370
diff
changeset
|
/**
 * HuffYUV left-prediction decoding: running sum of the residuals.
 * dst[i] is the low byte of the accumulator after adding src[i].
 * @param acc starting accumulator (previous row's carry-over)
 * @return the accumulator after the last pixel
 */
static int add_hfyu_left_prediction_c(uint8_t *dst, const uint8_t *src, int w, int acc){
    int i;

    /* plain prefix sum; the original unroll-by-two computes the same values */
    for (i = 0; i < w; i++) {
        acc += src[i];
        dst[i] = acc;
    }

    return acc;
}
3319 | |
/* Byte offsets of the B/G/R/A components within a 32-bit BGRA pixel,
 * chosen so the same indexing works on both endiannesses. */
#if HAVE_BIGENDIAN
#define B 3
#define G 2
#define R 1
#define A 0
#else
#define B 0
#define G 1
#define R 2
#define A 3
#endif
/**
 * HuffYUV left-prediction decoding for BGR32 pixels: per-channel running
 * sums of the residuals, with the carry-over values passed in and out
 * through the red/green/blue/alpha pointers.
 */
static void add_hfyu_left_prediction_bgr32_c(uint8_t *dst, const uint8_t *src, int w, int *red, int *green, int *blue, int *alpha){
    int i;
    int r,g,b,a;
    r= *red;
    g= *green;
    b= *blue;
    a= *alpha;

    for(i=0; i<w; i++){
        b+= src[4*i+B];
        g+= src[4*i+G];
        r+= src[4*i+R];
        a+= src[4*i+A];

        /* stores truncate to the low byte of each accumulator */
        dst[4*i+B]= b;
        dst[4*i+G]= g;
        dst[4*i+R]= r;
        dst[4*i+A]= a;
    }

    *red= r;
    *green= g;
    *blue= b;
    *alpha= a;
}
#undef B
#undef G
#undef R
#undef A
10370 | 3360 |
/* Butterfly helpers for the 8x8 Hadamard transform below. */

/* Write sum and difference of two inputs into two outputs. */
#define BUTTERFLY2(o1,o2,i1,i2) \
    o1= (i1)+(i2);\
    o2= (i1)-(i2);

/* In-place butterfly: x,y <- x+y, x-y. */
#define BUTTERFLY1(x,y) \
{\
    int a,b;\
    a= x;\
    b= y;\
    x= a+b;\
    y= a-b;\
}

/* Final stage combined with absolute-value accumulation: |x+y| + |x-y|. */
#define BUTTERFLYA(x,y) (FFABS((x)+(y)) + FFABS((x)-(y)))
936 | 3375 |
/**
 * SATD: 8x8 Hadamard transform of the difference src-dst, summing the
 * absolute values of all transform coefficients. First the rows are
 * transformed (three butterfly stages), then the columns, with the last
 * column stage fused into the accumulation via BUTTERFLYA.
 * @param s unused context pointer, @param h must be 8
 */
static int hadamard8_diff8x8_c(/*MpegEncContext*/ void *s, uint8_t *dst, uint8_t *src, int stride, int h){
    int i;
    int temp[64];
    int sum=0;

    assert(h==8);

    for(i=0; i<8; i++){
        //FIXME try pointer walks
        /* stage 1 on the pixel differences of row i */
        BUTTERFLY2(temp[8*i+0], temp[8*i+1], src[stride*i+0]-dst[stride*i+0],src[stride*i+1]-dst[stride*i+1]);
        BUTTERFLY2(temp[8*i+2], temp[8*i+3], src[stride*i+2]-dst[stride*i+2],src[stride*i+3]-dst[stride*i+3]);
        BUTTERFLY2(temp[8*i+4], temp[8*i+5], src[stride*i+4]-dst[stride*i+4],src[stride*i+5]-dst[stride*i+5]);
        BUTTERFLY2(temp[8*i+6], temp[8*i+7], src[stride*i+6]-dst[stride*i+6],src[stride*i+7]-dst[stride*i+7]);

        BUTTERFLY1(temp[8*i+0], temp[8*i+2]);
        BUTTERFLY1(temp[8*i+1], temp[8*i+3]);
        BUTTERFLY1(temp[8*i+4], temp[8*i+6]);
        BUTTERFLY1(temp[8*i+5], temp[8*i+7]);

        BUTTERFLY1(temp[8*i+0], temp[8*i+4]);
        BUTTERFLY1(temp[8*i+1], temp[8*i+5]);
        BUTTERFLY1(temp[8*i+2], temp[8*i+6]);
        BUTTERFLY1(temp[8*i+3], temp[8*i+7]);
    }

    for(i=0; i<8; i++){
        /* column transform; last stage fused into the |.|+|.| accumulation */
        BUTTERFLY1(temp[8*0+i], temp[8*1+i]);
        BUTTERFLY1(temp[8*2+i], temp[8*3+i]);
        BUTTERFLY1(temp[8*4+i], temp[8*5+i]);
        BUTTERFLY1(temp[8*6+i], temp[8*7+i]);

        BUTTERFLY1(temp[8*0+i], temp[8*2+i]);
        BUTTERFLY1(temp[8*1+i], temp[8*3+i]);
        BUTTERFLY1(temp[8*4+i], temp[8*6+i]);
        BUTTERFLY1(temp[8*5+i], temp[8*7+i]);

        sum +=
             BUTTERFLYA(temp[8*0+i], temp[8*4+i])
            +BUTTERFLYA(temp[8*1+i], temp[8*5+i])
            +BUTTERFLYA(temp[8*2+i], temp[8*6+i])
            +BUTTERFLYA(temp[8*3+i], temp[8*7+i]);
    }
#if 0
static int maxi=0;
if(sum>maxi){
    maxi=sum;
    printf("MAX:%d\n", maxi);
}
#endif
    return sum;
}
3427 | |
/**
 * Intra SATD: 8x8 Hadamard transform of the source pixels themselves
 * (no reference block), summing absolute coefficient values and then
 * removing the DC term so the result measures AC energy only.
 * @param s unused context pointer, @param dummy unused, @param h must be 8
 */
static int hadamard8_intra8x8_c(/*MpegEncContext*/ void *s, uint8_t *src, uint8_t *dummy, int stride, int h){
    int i;
    int temp[64];
    int sum=0;

    assert(h==8);

    for(i=0; i<8; i++){
        //FIXME try pointer walks
        /* stage 1 directly on the source pixels of row i */
        BUTTERFLY2(temp[8*i+0], temp[8*i+1], src[stride*i+0],src[stride*i+1]);
        BUTTERFLY2(temp[8*i+2], temp[8*i+3], src[stride*i+2],src[stride*i+3]);
        BUTTERFLY2(temp[8*i+4], temp[8*i+5], src[stride*i+4],src[stride*i+5]);
        BUTTERFLY2(temp[8*i+6], temp[8*i+7], src[stride*i+6],src[stride*i+7]);

        BUTTERFLY1(temp[8*i+0], temp[8*i+2]);
        BUTTERFLY1(temp[8*i+1], temp[8*i+3]);
        BUTTERFLY1(temp[8*i+4], temp[8*i+6]);
        BUTTERFLY1(temp[8*i+5], temp[8*i+7]);

        BUTTERFLY1(temp[8*i+0], temp[8*i+4]);
        BUTTERFLY1(temp[8*i+1], temp[8*i+5]);
        BUTTERFLY1(temp[8*i+2], temp[8*i+6]);
        BUTTERFLY1(temp[8*i+3], temp[8*i+7]);
    }

    for(i=0; i<8; i++){
        BUTTERFLY1(temp[8*0+i], temp[8*1+i]);
        BUTTERFLY1(temp[8*2+i], temp[8*3+i]);
        BUTTERFLY1(temp[8*4+i], temp[8*5+i]);
        BUTTERFLY1(temp[8*6+i], temp[8*7+i]);

        BUTTERFLY1(temp[8*0+i], temp[8*2+i]);
        BUTTERFLY1(temp[8*1+i], temp[8*3+i]);
        BUTTERFLY1(temp[8*4+i], temp[8*6+i]);
        BUTTERFLY1(temp[8*5+i], temp[8*7+i]);

        sum +=
             BUTTERFLYA(temp[8*0+i], temp[8*4+i])
            +BUTTERFLYA(temp[8*1+i], temp[8*5+i])
            +BUTTERFLYA(temp[8*2+i], temp[8*6+i])
            +BUTTERFLYA(temp[8*3+i], temp[8*7+i]);
    }

    sum -= FFABS(temp[8*0] + temp[8*4]); // -mean

    return sum;
}
3475 | |
/**
 * DCT-domain SAD: forward-DCT the pixel difference of the two 8x8 blocks
 * and sum the absolute values of the coefficients. Uses the DSPContext
 * function pointers so SIMD versions of diff/fdct/sum are picked up.
 * @param c MpegEncContext* passed as void* to match me_cmp_func
 * @param h must be 8
 */
static int dct_sad8x8_c(/*MpegEncContext*/ void *c, uint8_t *src1, uint8_t *src2, int stride, int h){
    MpegEncContext * const s= (MpegEncContext *)c;
    LOCAL_ALIGNED_16(DCTELEM, temp, [64]); /* fdct implementations may require 16-byte alignment */

    assert(h==8);

    s->dsp.diff_pixels(temp, src1, src2, stride);
    s->dsp.fdct(temp);
    return s->dsp.sum_abs_dctelem(temp);
}
3486 | |
#if CONFIG_GPL
/* One-dimensional 8-point integer DCT as used by H.264/x264 (hence the
 * GPL guard). Reads via SRC(i) and writes via DST(i,v), so the caller
 * defines those macros to select row or column access. */
#define DCT8_1D {\
    const int s07 = SRC(0) + SRC(7);\
    const int s16 = SRC(1) + SRC(6);\
    const int s25 = SRC(2) + SRC(5);\
    const int s34 = SRC(3) + SRC(4);\
    const int a0 = s07 + s34;\
    const int a1 = s16 + s25;\
    const int a2 = s07 - s34;\
    const int a3 = s16 - s25;\
    const int d07 = SRC(0) - SRC(7);\
    const int d16 = SRC(1) - SRC(6);\
    const int d25 = SRC(2) - SRC(5);\
    const int d34 = SRC(3) - SRC(4);\
    const int a4 = d16 + d25 + (d07 + (d07>>1));\
    const int a5 = d07 - d34 - (d25 + (d25>>1));\
    const int a6 = d07 + d34 - (d16 + (d16>>1));\
    const int a7 = d16 - d25 + (d34 + (d34>>1));\
    DST(0,  a0 + a1     ) ;\
    DST(1,  a4 + (a7>>2)) ;\
    DST(2,  a2 + (a3>>1)) ;\
    DST(3,  a5 + (a6>>2)) ;\
    DST(4,  a0 - a1     ) ;\
    DST(5,  a6 - (a5>>2)) ;\
    DST(6, (a2>>1) - a3 ) ;\
    DST(7, (a4>>2) - a7 ) ;\
}
533c6386eca9
8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents:
2979
diff
changeset
|
3514 |
533c6386eca9
8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents:
2979
diff
changeset
|
3515 static int dct264_sad8x8_c(/*MpegEncContext*/ void *c, uint8_t *src1, uint8_t *src2, int stride, int h){ |
533c6386eca9
8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents:
2979
diff
changeset
|
3516 MpegEncContext * const s= (MpegEncContext *)c; |
5256 | 3517 DCTELEM dct[8][8]; |
3010
533c6386eca9
8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents:
2979
diff
changeset
|
3518 int i; |
533c6386eca9
8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents:
2979
diff
changeset
|
3519 int sum=0; |
533c6386eca9
8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents:
2979
diff
changeset
|
3520 |
5256 | 3521 s->dsp.diff_pixels(dct[0], src1, src2, stride); |
3010
533c6386eca9
8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents:
2979
diff
changeset
|
3522 |
533c6386eca9
8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents:
2979
diff
changeset
|
3523 #define SRC(x) dct[i][x] |
533c6386eca9
8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents:
2979
diff
changeset
|
3524 #define DST(x,v) dct[i][x]= v |
533c6386eca9
8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents:
2979
diff
changeset
|
3525 for( i = 0; i < 8; i++ ) |
533c6386eca9
8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents:
2979
diff
changeset
|
3526 DCT8_1D |
533c6386eca9
8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents:
2979
diff
changeset
|
3527 #undef SRC |
533c6386eca9
8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents:
2979
diff
changeset
|
3528 #undef DST |
533c6386eca9
8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents:
2979
diff
changeset
|
3529 |
533c6386eca9
8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents:
2979
diff
changeset
|
3530 #define SRC(x) dct[x][i] |
4001 | 3531 #define DST(x,v) sum += FFABS(v) |
3010
533c6386eca9
8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents:
2979
diff
changeset
|
3532 for( i = 0; i < 8; i++ ) |
533c6386eca9
8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents:
2979
diff
changeset
|
3533 DCT8_1D |
533c6386eca9
8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents:
2979
diff
changeset
|
3534 #undef SRC |
533c6386eca9
8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents:
2979
diff
changeset
|
3535 #undef DST |
533c6386eca9
8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents:
2979
diff
changeset
|
3536 return sum; |
533c6386eca9
8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents:
2979
diff
changeset
|
3537 } |
533c6386eca9
8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents:
2979
diff
changeset
|
3538 #endif |
533c6386eca9
8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents:
2979
diff
changeset
|
3539 |
2382 | 3540 static int dct_max8x8_c(/*MpegEncContext*/ void *c, uint8_t *src1, uint8_t *src2, int stride, int h){ |
3541 MpegEncContext * const s= (MpegEncContext *)c; | |
11195 | 3542 LOCAL_ALIGNED_16(DCTELEM, temp, [64]); |
2382 | 3543 int sum=0, i; |
2967 | 3544 |
2382 | 3545 assert(h==8); |
3546 | |
3547 s->dsp.diff_pixels(temp, src1, src2, stride); | |
3548 s->dsp.fdct(temp); | |
3549 | |
3550 for(i=0; i<64; i++) | |
4001 | 3551 sum= FFMAX(sum, FFABS(temp[i])); |
2967 | 3552 |
2382 | 3553 return sum; |
3554 } | |
3555 | |
1708 | 3556 static int quant_psnr8x8_c(/*MpegEncContext*/ void *c, uint8_t *src1, uint8_t *src2, int stride, int h){ |
936 | 3557 MpegEncContext * const s= (MpegEncContext *)c; |
11195 | 3558 LOCAL_ALIGNED_16(DCTELEM, temp, [64*2]); |
11193 | 3559 DCTELEM * const bak = temp+64; |
936 | 3560 int sum=0, i; |
3561 | |
1708 | 3562 assert(h==8); |
936 | 3563 s->mb_intra=0; |
2967 | 3564 |
936 | 3565 s->dsp.diff_pixels(temp, src1, src2, stride); |
2967 | 3566 |
936 | 3567 memcpy(bak, temp, 64*sizeof(DCTELEM)); |
2967 | 3568 |
1013 | 3569 s->block_last_index[0/*FIXME*/]= s->fast_dct_quantize(s, temp, 0/*FIXME*/, s->qscale, &i); |
1689 | 3570 s->dct_unquantize_inter(s, temp, 0, s->qscale); |
6001 | 3571 ff_simple_idct(temp); //FIXME |
2967 | 3572 |
936 | 3573 for(i=0; i<64; i++) |
3574 sum+= (temp[i]-bak[i])*(temp[i]-bak[i]); | |
2967 | 3575 |
936 | 3576 return sum; |
3577 } | |
3578 | |
1708 | 3579 static int rd8x8_c(/*MpegEncContext*/ void *c, uint8_t *src1, uint8_t *src2, int stride, int h){ |
1007 | 3580 MpegEncContext * const s= (MpegEncContext *)c; |
1064 | 3581 const uint8_t *scantable= s->intra_scantable.permutated; |
11195 | 3582 LOCAL_ALIGNED_16(DCTELEM, temp, [64]); |
3583 LOCAL_ALIGNED_16(uint8_t, lsrc1, [64]); | |
3584 LOCAL_ALIGNED_16(uint8_t, lsrc2, [64]); | |
6719 | 3585 int i, last, run, bits, level, distortion, start_i; |
1007 | 3586 const int esc_length= s->ac_esc_length; |
3587 uint8_t * length; | |
3588 uint8_t * last_length; | |
2967 | 3589 |
1708 | 3590 assert(h==8); |
3591 | |
10068 | 3592 copy_block8(lsrc1, src1, 8, stride, 8); |
3593 copy_block8(lsrc2, src2, 8, stride, 8); | |
3594 | |
3595 s->dsp.diff_pixels(temp, lsrc1, lsrc2, 8); | |
1007 | 3596 |
1013 | 3597 s->block_last_index[0/*FIXME*/]= last= s->fast_dct_quantize(s, temp, 0/*FIXME*/, s->qscale, &i); |
3598 | |
3599 bits=0; | |
2967 | 3600 |
1013 | 3601 if (s->mb_intra) { |
2967 | 3602 start_i = 1; |
1013 | 3603 length = s->intra_ac_vlc_length; |
3604 last_length= s->intra_ac_vlc_last_length; | |
3605 bits+= s->luma_dc_vlc_length[temp[0] + 256]; //FIXME chroma | |
3606 } else { | |
3607 start_i = 0; | |
3608 length = s->inter_ac_vlc_length; | |
3609 last_length= s->inter_ac_vlc_last_length; | |
3610 } | |
2967 | 3611 |
1013 | 3612 if(last>=start_i){ |
1007 | 3613 run=0; |
3614 for(i=start_i; i<last; i++){ | |
3615 int j= scantable[i]; | |
3616 level= temp[j]; | |
2967 | 3617 |
1007 | 3618 if(level){ |
3619 level+=64; | |
3620 if((level&(~127)) == 0){ | |
3621 bits+= length[UNI_AC_ENC_INDEX(run, level)]; | |
3622 }else | |
3623 bits+= esc_length; | |
3624 run=0; | |
3625 }else | |
3626 run++; | |
3627 } | |
3628 i= scantable[last]; | |
2967 | 3629 |
1011 | 3630 level= temp[i] + 64; |
3631 | |
3632 assert(level - 64); | |
2967 | 3633 |
1007 | 3634 if((level&(~127)) == 0){ |
3635 bits+= last_length[UNI_AC_ENC_INDEX(run, level)]; | |
3636 }else | |
3637 bits+= esc_length; | |
2967 | 3638 |
1013 | 3639 } |
3640 | |
3641 if(last>=0){ | |
1689 | 3642 if(s->mb_intra) |
3643 s->dct_unquantize_intra(s, temp, 0, s->qscale); | |
3644 else | |
3645 s->dct_unquantize_inter(s, temp, 0, s->qscale); | |
1007 | 3646 } |
2967 | 3647 |
10068 | 3648 s->dsp.idct_add(lsrc2, 8, temp); |
3649 | |
3650 distortion= s->dsp.sse[1](NULL, lsrc2, lsrc1, 8, 8); | |
6719 | 3651 |
3652 return distortion + ((bits*s->qscale*s->qscale*109 + 64)>>7); | |
1007 | 3653 } |
3654 | |
1708 | 3655 static int bit8x8_c(/*MpegEncContext*/ void *c, uint8_t *src1, uint8_t *src2, int stride, int h){ |
1007 | 3656 MpegEncContext * const s= (MpegEncContext *)c; |
1064 | 3657 const uint8_t *scantable= s->intra_scantable.permutated; |
11195 | 3658 LOCAL_ALIGNED_16(DCTELEM, temp, [64]); |
1007 | 3659 int i, last, run, bits, level, start_i; |
3660 const int esc_length= s->ac_esc_length; | |
3661 uint8_t * length; | |
3662 uint8_t * last_length; | |
1708 | 3663 |
3664 assert(h==8); | |
2967 | 3665 |
1013 | 3666 s->dsp.diff_pixels(temp, src1, src2, stride); |
1007 | 3667 |
1013 | 3668 s->block_last_index[0/*FIXME*/]= last= s->fast_dct_quantize(s, temp, 0/*FIXME*/, s->qscale, &i); |
3669 | |
3670 bits=0; | |
2967 | 3671 |
1007 | 3672 if (s->mb_intra) { |
2967 | 3673 start_i = 1; |
1007 | 3674 length = s->intra_ac_vlc_length; |
3675 last_length= s->intra_ac_vlc_last_length; | |
1013 | 3676 bits+= s->luma_dc_vlc_length[temp[0] + 256]; //FIXME chroma |
1007 | 3677 } else { |
3678 start_i = 0; | |
3679 length = s->inter_ac_vlc_length; | |
3680 last_length= s->inter_ac_vlc_last_length; | |
3681 } | |
2967 | 3682 |
1013 | 3683 if(last>=start_i){ |
1007 | 3684 run=0; |
3685 for(i=start_i; i<last; i++){ | |
3686 int j= scantable[i]; | |
3687 level= temp[j]; | |
2967 | 3688 |
1007 | 3689 if(level){ |
3690 level+=64; | |
3691 if((level&(~127)) == 0){ | |
3692 bits+= length[UNI_AC_ENC_INDEX(run, level)]; | |
3693 }else | |
3694 bits+= esc_length; | |
3695 run=0; | |
3696 }else | |
3697 run++; | |
3698 } | |
3699 i= scantable[last]; | |
2967 | 3700 |
1013 | 3701 level= temp[i] + 64; |
2967 | 3702 |
1013 | 3703 assert(level - 64); |
2967 | 3704 |
1007 | 3705 if((level&(~127)) == 0){ |
3706 bits+= last_length[UNI_AC_ENC_INDEX(run, level)]; | |
3707 }else | |
3708 bits+= esc_length; | |
3709 } | |
3710 | |
3711 return bits; | |
3712 } | |
3713 | |
8978 | 3714 #define VSAD_INTRA(size) \ |
3715 static int vsad_intra##size##_c(/*MpegEncContext*/ void *c, uint8_t *s, uint8_t *dummy, int stride, int h){ \ | |
3716 int score=0; \ | |
3717 int x,y; \ | |
3718 \ | |
3719 for(y=1; y<h; y++){ \ | |
3720 for(x=0; x<size; x+=4){ \ | |
3721 score+= FFABS(s[x ] - s[x +stride]) + FFABS(s[x+1] - s[x+1+stride]) \ | |
3722 +FFABS(s[x+2] - s[x+2+stride]) + FFABS(s[x+3] - s[x+3+stride]); \ | |
3723 } \ | |
3724 s+= stride; \ | |
3725 } \ | |
3726 \ | |
3727 return score; \ | |
1729 | 3728 } |
8978 | 3729 VSAD_INTRA(8) |
3730 VSAD_INTRA(16) | |
1729 | 3731 |
3732 static int vsad16_c(/*MpegEncContext*/ void *c, uint8_t *s1, uint8_t *s2, int stride, int h){ | |
3733 int score=0; | |
3734 int x,y; | |
2967 | 3735 |
1729 | 3736 for(y=1; y<h; y++){ |
3737 for(x=0; x<16; x++){ | |
4001 | 3738 score+= FFABS(s1[x ] - s2[x ] - s1[x +stride] + s2[x +stride]); |
1729 | 3739 } |
3740 s1+= stride; | |
3741 s2+= stride; | |
3742 } | |
2967 | 3743 |
1729 | 3744 return score; |
3745 } | |
3746 | |
3747 #define SQ(a) ((a)*(a)) | |
8978 | 3748 #define VSSE_INTRA(size) \ |
3749 static int vsse_intra##size##_c(/*MpegEncContext*/ void *c, uint8_t *s, uint8_t *dummy, int stride, int h){ \ | |
3750 int score=0; \ | |
3751 int x,y; \ | |
3752 \ | |
3753 for(y=1; y<h; y++){ \ | |
3754 for(x=0; x<size; x+=4){ \ | |
3755 score+= SQ(s[x ] - s[x +stride]) + SQ(s[x+1] - s[x+1+stride]) \ | |
3756 +SQ(s[x+2] - s[x+2+stride]) + SQ(s[x+3] - s[x+3+stride]); \ | |
3757 } \ | |
3758 s+= stride; \ | |
3759 } \ | |
3760 \ | |
3761 return score; \ | |
1729 | 3762 } |
8978 | 3763 VSSE_INTRA(8) |
3764 VSSE_INTRA(16) | |
1729 | 3765 |
3766 static int vsse16_c(/*MpegEncContext*/ void *c, uint8_t *s1, uint8_t *s2, int stride, int h){ | |
3767 int score=0; | |
3768 int x,y; | |
2967 | 3769 |
1729 | 3770 for(y=1; y<h; y++){ |
3771 for(x=0; x<16; x++){ | |
3772 score+= SQ(s1[x ] - s2[x ] - s1[x +stride] + s2[x +stride]); | |
3773 } | |
3774 s1+= stride; | |
3775 s2+= stride; | |
3776 } | |
2967 | 3777 |
1729 | 3778 return score; |
3779 } | |
3780 | |
5255 | 3781 static int ssd_int8_vs_int16_c(const int8_t *pix1, const int16_t *pix2, |
3782 int size){ | |
4749 | 3783 int score=0; |
3784 int i; | |
3785 for(i=0; i<size; i++) | |
3786 score += (pix1[i]-pix2[i])*(pix1[i]-pix2[i]); | |
3787 return score; | |
3788 } | |
3789 | |
6056
558c1fd0ee72
Fix typo in macro name: WARPER8_16_SQ --> WRAPPER8_16_SQ.
diego
parents:
6054
diff
changeset
|
3790 WRAPPER8_16_SQ(hadamard8_diff8x8_c, hadamard8_diff16_c) |
558c1fd0ee72
Fix typo in macro name: WARPER8_16_SQ --> WRAPPER8_16_SQ.
diego
parents:
6054
diff
changeset
|
3791 WRAPPER8_16_SQ(hadamard8_intra8x8_c, hadamard8_intra16_c) |
558c1fd0ee72
Fix typo in macro name: WARPER8_16_SQ --> WRAPPER8_16_SQ.
diego
parents:
6054
diff
changeset
|
3792 WRAPPER8_16_SQ(dct_sad8x8_c, dct_sad16_c) |
8590 | 3793 #if CONFIG_GPL |
6056
558c1fd0ee72
Fix typo in macro name: WARPER8_16_SQ --> WRAPPER8_16_SQ.
diego
parents:
6054
diff
changeset
|
3794 WRAPPER8_16_SQ(dct264_sad8x8_c, dct264_sad16_c) |
3013 | 3795 #endif |
6056
558c1fd0ee72
Fix typo in macro name: WARPER8_16_SQ --> WRAPPER8_16_SQ.
diego
parents:
6054
diff
changeset
|
3796 WRAPPER8_16_SQ(dct_max8x8_c, dct_max16_c) |
558c1fd0ee72
Fix typo in macro name: WARPER8_16_SQ --> WRAPPER8_16_SQ.
diego
parents:
6054
diff
changeset
|
3797 WRAPPER8_16_SQ(quant_psnr8x8_c, quant_psnr16_c) |
558c1fd0ee72
Fix typo in macro name: WARPER8_16_SQ --> WRAPPER8_16_SQ.
diego
parents:
6054
diff
changeset
|
3798 WRAPPER8_16_SQ(rd8x8_c, rd16_c) |
558c1fd0ee72
Fix typo in macro name: WARPER8_16_SQ --> WRAPPER8_16_SQ.
diego
parents:
6054
diff
changeset
|
3799 WRAPPER8_16_SQ(bit8x8_c, bit16_c) |
936 | 3800 |
3568
945caa35ee9a
sse and 3dnow implementations of float->int conversion and mdct windowing.
lorenm
parents:
3536
diff
changeset
|
3801 static void vector_fmul_c(float *dst, const float *src, int len){ |
945caa35ee9a
sse and 3dnow implementations of float->int conversion and mdct windowing.
lorenm
parents:
3536
diff
changeset
|
3802 int i; |
945caa35ee9a
sse and 3dnow implementations of float->int conversion and mdct windowing.
lorenm
parents:
3536
diff
changeset
|
3803 for(i=0; i<len; i++) |
945caa35ee9a
sse and 3dnow implementations of float->int conversion and mdct windowing.
lorenm
parents:
3536
diff
changeset
|
3804 dst[i] *= src[i]; |
945caa35ee9a
sse and 3dnow implementations of float->int conversion and mdct windowing.
lorenm
parents:
3536
diff
changeset
|
3805 } |
945caa35ee9a
sse and 3dnow implementations of float->int conversion and mdct windowing.
lorenm
parents:
3536
diff
changeset
|
3806 |
945caa35ee9a
sse and 3dnow implementations of float->int conversion and mdct windowing.
lorenm
parents:
3536
diff
changeset
|
3807 static void vector_fmul_reverse_c(float *dst, const float *src0, const float *src1, int len){ |
945caa35ee9a
sse and 3dnow implementations of float->int conversion and mdct windowing.
lorenm
parents:
3536
diff
changeset
|
3808 int i; |
945caa35ee9a
sse and 3dnow implementations of float->int conversion and mdct windowing.
lorenm
parents:
3536
diff
changeset
|
3809 src1 += len-1; |
945caa35ee9a
sse and 3dnow implementations of float->int conversion and mdct windowing.
lorenm
parents:
3536
diff
changeset
|
3810 for(i=0; i<len; i++) |
945caa35ee9a
sse and 3dnow implementations of float->int conversion and mdct windowing.
lorenm
parents:
3536
diff
changeset
|
3811 dst[i] = src0[i] * src1[-i]; |
945caa35ee9a
sse and 3dnow implementations of float->int conversion and mdct windowing.
lorenm
parents:
3536
diff
changeset
|
3812 } |
945caa35ee9a
sse and 3dnow implementations of float->int conversion and mdct windowing.
lorenm
parents:
3536
diff
changeset
|
3813 |
10300
4d1b9ca628fc
Drop unused args from vector_fmul_add_add, simpify code, and rename
mru
parents:
10219
diff
changeset
|
3814 static void vector_fmul_add_c(float *dst, const float *src0, const float *src1, const float *src2, int len){ |
3568
945caa35ee9a
sse and 3dnow implementations of float->int conversion and mdct windowing.
lorenm
parents:
3536
diff
changeset
|
3815 int i; |
945caa35ee9a
sse and 3dnow implementations of float->int conversion and mdct windowing.
lorenm
parents:
3536
diff
changeset
|
3816 for(i=0; i<len; i++) |
10300
4d1b9ca628fc
Drop unused args from vector_fmul_add_add, simpify code, and rename
mru
parents:
10219
diff
changeset
|
3817 dst[i] = src0[i] * src1[i] + src2[i]; |
3568
945caa35ee9a
sse and 3dnow implementations of float->int conversion and mdct windowing.
lorenm
parents:
3536
diff
changeset
|
3818 } |
945caa35ee9a
sse and 3dnow implementations of float->int conversion and mdct windowing.
lorenm
parents:
3536
diff
changeset
|
3819 |
7261 | 3820 void ff_vector_fmul_window_c(float *dst, const float *src0, const float *src1, const float *win, float add_bias, int len){ |
7263 | 3821 int i,j; |
3822 dst += len; | |
3823 win += len; | |
3824 src0+= len; | |
3825 for(i=-len, j=len-1; i<0; i++, j--) { | |
3826 float s0 = src0[i]; | |
3827 float s1 = src1[j]; | |
3828 float wi = win[i]; | |
3829 float wj = win[j]; | |
3830 dst[i] = s0*wj - s1*wi + add_bias; | |
3831 dst[j] = s0*wi + s1*wj + add_bias; | |
3832 } | |
7261 | 3833 } |
3834 | |
10219 | 3835 static void vector_fmul_scalar_c(float *dst, const float *src, float mul, |
3836 int len) | |
3837 { | |
3838 int i; | |
3839 for (i = 0; i < len; i++) | |
3840 dst[i] = src[i] * mul; | |
3841 } | |
3842 | |
3843 static void vector_fmul_sv_scalar_2_c(float *dst, const float *src, | |
3844 const float **sv, float mul, int len) | |
3845 { | |
3846 int i; | |
3847 for (i = 0; i < len; i += 2, sv++) { | |
3848 dst[i ] = src[i ] * sv[0][0] * mul; | |
3849 dst[i+1] = src[i+1] * sv[0][1] * mul; | |
3850 } | |
3851 } | |
3852 | |
3853 static void vector_fmul_sv_scalar_4_c(float *dst, const float *src, | |
3854 const float **sv, float mul, int len) | |
3855 { | |
3856 int i; | |
3857 for (i = 0; i < len; i += 4, sv++) { | |
3858 dst[i ] = src[i ] * sv[0][0] * mul; | |
3859 dst[i+1] = src[i+1] * sv[0][1] * mul; | |
3860 dst[i+2] = src[i+2] * sv[0][2] * mul; | |
3861 dst[i+3] = src[i+3] * sv[0][3] * mul; | |
3862 } | |
3863 } | |
3864 | |
3865 static void sv_fmul_scalar_2_c(float *dst, const float **sv, float mul, | |
3866 int len) | |
3867 { | |
3868 int i; | |
3869 for (i = 0; i < len; i += 2, sv++) { | |
3870 dst[i ] = sv[0][0] * mul; | |
3871 dst[i+1] = sv[0][1] * mul; | |
3872 } | |
3873 } | |
3874 | |
3875 static void sv_fmul_scalar_4_c(float *dst, const float **sv, float mul, | |
3876 int len) | |
3877 { | |
3878 int i; | |
3879 for (i = 0; i < len; i += 4, sv++) { | |
3880 dst[i ] = sv[0][0] * mul; | |
3881 dst[i+1] = sv[0][1] * mul; | |
3882 dst[i+2] = sv[0][2] * mul; | |
3883 dst[i+3] = sv[0][3] * mul; | |
3884 } | |
3885 } | |
3886 | |
3887 static void butterflies_float_c(float *restrict v1, float *restrict v2, | |
3888 int len) | |
3889 { | |
3890 int i; | |
3891 for (i = 0; i < len; i++) { | |
3892 float t = v1[i] - v2[i]; | |
3893 v1[i] += v2[i]; | |
3894 v2[i] = t; | |
3895 } | |
3896 } | |
3897 | |
3898 static float scalarproduct_float_c(const float *v1, const float *v2, int len) | |
3899 { | |
3900 float p = 0.0; | |
3901 int i; | |
3902 | |
3903 for (i = 0; i < len; i++) | |
3904 p += v1[i] * v2[i]; | |
3905 | |
3906 return p; | |
3907 } | |
3908 | |
7564 | 3909 static void int32_to_float_fmul_scalar_c(float *dst, const int *src, float mul, int len){ |
3910 int i; | |
3911 for(i=0; i<len; i++) | |
3912 dst[i] = src[i] * mul; | |
3913 } | |
3914 | |
10104
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3915 static inline uint32_t clipf_c_one(uint32_t a, uint32_t mini, |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3916 uint32_t maxi, uint32_t maxisign) |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3917 { |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3918 |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3919 if(a > mini) return mini; |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3920 else if((a^(1<<31)) > maxisign) return maxi; |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3921 else return a; |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3922 } |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3923 |
10105 | 3924 static void vector_clipf_c_opposite_sign(float *dst, const float *src, float *min, float *max, int len){ |
10104
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3925 int i; |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3926 uint32_t mini = *(uint32_t*)min; |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3927 uint32_t maxi = *(uint32_t*)max; |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3928 uint32_t maxisign = maxi ^ (1<<31); |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3929 uint32_t *dsti = (uint32_t*)dst; |
10105 | 3930 const uint32_t *srci = (const uint32_t*)src; |
10104
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3931 for(i=0; i<len; i+=8) { |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3932 dsti[i + 0] = clipf_c_one(srci[i + 0], mini, maxi, maxisign); |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3933 dsti[i + 1] = clipf_c_one(srci[i + 1], mini, maxi, maxisign); |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3934 dsti[i + 2] = clipf_c_one(srci[i + 2], mini, maxi, maxisign); |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3935 dsti[i + 3] = clipf_c_one(srci[i + 3], mini, maxi, maxisign); |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3936 dsti[i + 4] = clipf_c_one(srci[i + 4], mini, maxi, maxisign); |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3937 dsti[i + 5] = clipf_c_one(srci[i + 5], mini, maxi, maxisign); |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3938 dsti[i + 6] = clipf_c_one(srci[i + 6], mini, maxi, maxisign); |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3939 dsti[i + 7] = clipf_c_one(srci[i + 7], mini, maxi, maxisign); |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3940 } |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3941 } |
10105 | 3942 static void vector_clipf_c(float *dst, const float *src, float min, float max, int len){ |
10104
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3943 int i; |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3944 if(min < 0 && max > 0) { |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3945 vector_clipf_c_opposite_sign(dst, src, &min, &max, len); |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3946 } else { |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3947 for(i=0; i < len; i+=8) { |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3948 dst[i ] = av_clipf(src[i ], min, max); |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3949 dst[i + 1] = av_clipf(src[i + 1], min, max); |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3950 dst[i + 2] = av_clipf(src[i + 2], min, max); |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3951 dst[i + 3] = av_clipf(src[i + 3], min, max); |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3952 dst[i + 4] = av_clipf(src[i + 4], min, max); |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3953 dst[i + 5] = av_clipf(src[i + 5], min, max); |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3954 dst[i + 6] = av_clipf(src[i + 6], min, max); |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3955 dst[i + 7] = av_clipf(src[i + 7], min, max); |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3956 } |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3957 } |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3958 } |
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
3959 |
7261 | 3960 static av_always_inline int float_to_int16_one(const float *src){ |
3961 int_fast32_t tmp = *(const int32_t*)src; | |
3962 if(tmp & 0xf0000){ | |
3963 tmp = (0x43c0ffff - tmp)>>31; | |
3964 // is this faster on some gcc/cpu combinations? | |
3965 // if(tmp > 0x43c0ffff) tmp = 0xFFFF; | |
3966 // else tmp = 0; | |
3967 } | |
3968 return tmp - 0x8000; | |
3969 } | |
3970 | |
7218 | 3971 void ff_float_to_int16_c(int16_t *dst, const float *src, long len){ |
3568
945caa35ee9a
sse and 3dnow implementations of float->int conversion and mdct windowing.
lorenm
parents:
3536
diff
changeset
|
3972 int i; |
7261 | 3973 for(i=0; i<len; i++) |
3974 dst[i] = float_to_int16_one(src+i); | |
3975 } | |
3976 | |
7286
e267f2519248
float_to_int16_interleave: change src to an array of pointers instead of assuming it's contiguous.
lorenm
parents:
7263
diff
changeset
|
3977 void ff_float_to_int16_interleave_c(int16_t *dst, const float **src, long len, int channels){ |
7261 | 3978 int i,j,c; |
3979 if(channels==2){ | |
3980 for(i=0; i<len; i++){ | |
7286
e267f2519248
float_to_int16_interleave: change src to an array of pointers instead of assuming it's contiguous.
lorenm
parents:
7263
diff
changeset
|
3981 dst[2*i] = float_to_int16_one(src[0]+i); |
e267f2519248
float_to_int16_interleave: change src to an array of pointers instead of assuming it's contiguous.
lorenm
parents:
7263
diff
changeset
|
3982 dst[2*i+1] = float_to_int16_one(src[1]+i); |
3568
945caa35ee9a
sse and 3dnow implementations of float->int conversion and mdct windowing.
lorenm
parents:
3536
diff
changeset
|
3983 } |
7261 | 3984 }else{ |
7286
e267f2519248
float_to_int16_interleave: change src to an array of pointers instead of assuming it's contiguous.
lorenm
parents:
7263
diff
changeset
|
3985 for(c=0; c<channels; c++) |
7261 | 3986 for(i=0, j=c; i<len; i++, j+=channels) |
7286
e267f2519248
float_to_int16_interleave: change src to an array of pointers instead of assuming it's contiguous.
lorenm
parents:
7263
diff
changeset
|
3987 dst[j] = float_to_int16_one(src[c]+i); |
3568
945caa35ee9a
sse and 3dnow implementations of float->int conversion and mdct windowing.
lorenm
parents:
3536
diff
changeset
|
3988 } |
945caa35ee9a
sse and 3dnow implementations of float->int conversion and mdct windowing.
lorenm
parents:
3536
diff
changeset
|
3989 } |
945caa35ee9a
sse and 3dnow implementations of float->int conversion and mdct windowing.
lorenm
parents:
3536
diff
changeset
|
3990 |
11981 | 3991 static int32_t scalarproduct_int16_c(const int16_t * v1, const int16_t * v2, int order, int shift) |
7203
87b1dfb5a98d
Add several vector functions used by Monkey's Audio decoder to dsputil
kostya
parents:
6719
diff
changeset
|
3992 { |
87b1dfb5a98d
Add several vector functions used by Monkey's Audio decoder to dsputil
kostya
parents:
6719
diff
changeset
|
3993 int res = 0; |
87b1dfb5a98d
Add several vector functions used by Monkey's Audio decoder to dsputil
kostya
parents:
6719
diff
changeset
|
3994 |
87b1dfb5a98d
Add several vector functions used by Monkey's Audio decoder to dsputil
kostya
parents:
6719
diff
changeset
|
3995 while (order--) |
87b1dfb5a98d
Add several vector functions used by Monkey's Audio decoder to dsputil
kostya
parents:
6719
diff
changeset
|
3996 res += (*v1++ * *v2++) >> shift; |
87b1dfb5a98d
Add several vector functions used by Monkey's Audio decoder to dsputil
kostya
parents:
6719
diff
changeset
|
3997 |
87b1dfb5a98d
Add several vector functions used by Monkey's Audio decoder to dsputil
kostya
parents:
6719
diff
changeset
|
3998 return res; |
87b1dfb5a98d
Add several vector functions used by Monkey's Audio decoder to dsputil
kostya
parents:
6719
diff
changeset
|
3999 } |
87b1dfb5a98d
Add several vector functions used by Monkey's Audio decoder to dsputil
kostya
parents:
6719
diff
changeset
|
4000 |
11981 | 4001 static int32_t scalarproduct_and_madd_int16_c(int16_t *v1, const int16_t *v2, const int16_t *v3, int order, int mul) |
10644 | 4002 { |
4003 int res = 0; | |
4004 while (order--) { | |
4005 res += *v1 * *v2++; | |
4006 *v1++ += mul * *v3++; | |
4007 } | |
4008 return res; | |
4009 } | |
4010 | |
5887 | 4011 #define W0 2048 |
4012 #define W1 2841 /* 2048*sqrt (2)*cos (1*pi/16) */ | |
4013 #define W2 2676 /* 2048*sqrt (2)*cos (2*pi/16) */ | |
4014 #define W3 2408 /* 2048*sqrt (2)*cos (3*pi/16) */ | |
4015 #define W4 2048 /* 2048*sqrt (2)*cos (4*pi/16) */ | |
4016 #define W5 1609 /* 2048*sqrt (2)*cos (5*pi/16) */ | |
4017 #define W6 1108 /* 2048*sqrt (2)*cos (6*pi/16) */ | |
4018 #define W7 565 /* 2048*sqrt (2)*cos (7*pi/16) */ | |
4019 | |
4020 static void wmv2_idct_row(short * b) | |
4021 { | |
4022 int s1,s2; | |
4023 int a0,a1,a2,a3,a4,a5,a6,a7; | |
4024 /*step 1*/ | |
4025 a1 = W1*b[1]+W7*b[7]; | |
4026 a7 = W7*b[1]-W1*b[7]; | |
4027 a5 = W5*b[5]+W3*b[3]; | |
4028 a3 = W3*b[5]-W5*b[3]; | |
4029 a2 = W2*b[2]+W6*b[6]; | |
4030 a6 = W6*b[2]-W2*b[6]; | |
4031 a0 = W0*b[0]+W0*b[4]; | |
4032 a4 = W0*b[0]-W0*b[4]; | |
4033 /*step 2*/ | |
4034 s1 = (181*(a1-a5+a7-a3)+128)>>8;//1,3,5,7, | |
4035 s2 = (181*(a1-a5-a7+a3)+128)>>8; | |
4036 /*step 3*/ | |
4037 b[0] = (a0+a2+a1+a5 + (1<<7))>>8; | |
4038 b[1] = (a4+a6 +s1 + (1<<7))>>8; | |
4039 b[2] = (a4-a6 +s2 + (1<<7))>>8; | |
4040 b[3] = (a0-a2+a7+a3 + (1<<7))>>8; | |
4041 b[4] = (a0-a2-a7-a3 + (1<<7))>>8; | |
4042 b[5] = (a4-a6 -s2 + (1<<7))>>8; | |
4043 b[6] = (a4+a6 -s1 + (1<<7))>>8; | |
4044 b[7] = (a0+a2-a1-a5 + (1<<7))>>8; | |
4045 } | |
4046 static void wmv2_idct_col(short * b) | |
4047 { | |
4048 int s1,s2; | |
4049 int a0,a1,a2,a3,a4,a5,a6,a7; | |
4050 /*step 1, with extended precision*/ | |
4051 a1 = (W1*b[8*1]+W7*b[8*7] + 4)>>3; | |
4052 a7 = (W7*b[8*1]-W1*b[8*7] + 4)>>3; | |
4053 a5 = (W5*b[8*5]+W3*b[8*3] + 4)>>3; | |
4054 a3 = (W3*b[8*5]-W5*b[8*3] + 4)>>3; | |
4055 a2 = (W2*b[8*2]+W6*b[8*6] + 4)>>3; | |
4056 a6 = (W6*b[8*2]-W2*b[8*6] + 4)>>3; | |
4057 a0 = (W0*b[8*0]+W0*b[8*4] )>>3; | |
4058 a4 = (W0*b[8*0]-W0*b[8*4] )>>3; | |
4059 /*step 2*/ | |
4060 s1 = (181*(a1-a5+a7-a3)+128)>>8; | |
4061 s2 = (181*(a1-a5-a7+a3)+128)>>8; | |
4062 /*step 3*/ | |
4063 b[8*0] = (a0+a2+a1+a5 + (1<<13))>>14; | |
4064 b[8*1] = (a4+a6 +s1 + (1<<13))>>14; | |
4065 b[8*2] = (a4-a6 +s2 + (1<<13))>>14; | |
4066 b[8*3] = (a0-a2+a7+a3 + (1<<13))>>14; | |
4067 | |
4068 b[8*4] = (a0-a2-a7-a3 + (1<<13))>>14; | |
4069 b[8*5] = (a4-a6 -s2 + (1<<13))>>14; | |
4070 b[8*6] = (a4+a6 -s1 + (1<<13))>>14; | |
4071 b[8*7] = (a0+a2-a1-a5 + (1<<13))>>14; | |
4072 } | |
4073 void ff_wmv2_idct_c(short * block){ | |
4074 int i; | |
4075 | |
4076 for(i=0;i<64;i+=8){ | |
4077 wmv2_idct_row(block+i); | |
4078 } | |
4079 for(i=0;i<8;i++){ | |
4080 wmv2_idct_col(block+i); | |
4081 } | |
4082 } | |
1092 | 4083 /* XXX: those functions should be suppressed ASAP when all IDCTs are |
4084 converted */ | |
5887 | 4085 static void ff_wmv2_idct_put_c(uint8_t *dest, int line_size, DCTELEM *block) |
4086 { | |
4087 ff_wmv2_idct_c(block); | |
4088 put_pixels_clamped_c(block, dest, line_size); | |
4089 } | |
4090 static void ff_wmv2_idct_add_c(uint8_t *dest, int line_size, DCTELEM *block) | |
4091 { | |
4092 ff_wmv2_idct_c(block); | |
4093 add_pixels_clamped_c(block, dest, line_size); | |
4094 } | |
1092 | 4095 static void ff_jref_idct_put(uint8_t *dest, int line_size, DCTELEM *block) |
4096 { | |
4097 j_rev_dct (block); | |
4098 put_pixels_clamped_c(block, dest, line_size); | |
4099 } | |
4100 static void ff_jref_idct_add(uint8_t *dest, int line_size, DCTELEM *block) | |
4101 { | |
4102 j_rev_dct (block); | |
4103 add_pixels_clamped_c(block, dest, line_size); | |
4104 } | |
4105 | |
2256 | 4106 static void ff_jref_idct4_put(uint8_t *dest, int line_size, DCTELEM *block) |
4107 { | |
4108 j_rev_dct4 (block); | |
4109 put_pixels_clamped4_c(block, dest, line_size); | |
4110 } | |
4111 static void ff_jref_idct4_add(uint8_t *dest, int line_size, DCTELEM *block) | |
4112 { | |
4113 j_rev_dct4 (block); | |
4114 add_pixels_clamped4_c(block, dest, line_size); | |
4115 } | |
4116 | |
2257 | 4117 static void ff_jref_idct2_put(uint8_t *dest, int line_size, DCTELEM *block) |
4118 { | |
4119 j_rev_dct2 (block); | |
4120 put_pixels_clamped2_c(block, dest, line_size); | |
4121 } | |
4122 static void ff_jref_idct2_add(uint8_t *dest, int line_size, DCTELEM *block) | |
4123 { | |
4124 j_rev_dct2 (block); | |
4125 add_pixels_clamped2_c(block, dest, line_size); | |
4126 } | |
4127 | |
2259 | 4128 static void ff_jref_idct1_put(uint8_t *dest, int line_size, DCTELEM *block) |
4129 { | |
4176 | 4130 uint8_t *cm = ff_cropTbl + MAX_NEG_CROP; |
2259 | 4131 |
4132 dest[0] = cm[(block[0] + 4)>>3]; | |
4133 } | |
4134 static void ff_jref_idct1_add(uint8_t *dest, int line_size, DCTELEM *block) | |
4135 { | |
4176 | 4136 uint8_t *cm = ff_cropTbl + MAX_NEG_CROP; |
2259 | 4137 |
4138 dest[0] = cm[dest[0] + ((block[0] + 4)>>3)]; | |
4139 } | |
4140 | |
5143 | 4141 static void just_return(void *mem av_unused, int stride av_unused, int h av_unused) { return; } |
3215
06f98047ff26
prefetch pixels for future motion compensation. 2-5% faster h264.
lorenm
parents:
3199
diff
changeset
|
4142 |
1201 | 4143 /* init static data */ |
10867 | 4144 av_cold void dsputil_static_init(void) |
0 | 4145 { |
751 | 4146 int i; |
0 | 4147 |
4176 | 4148 for(i=0;i<256;i++) ff_cropTbl[i + MAX_NEG_CROP] = i; |
1201 | 4149 for(i=0;i<MAX_NEG_CROP;i++) { |
4176 | 4150 ff_cropTbl[i] = 0; |
4151 ff_cropTbl[i + MAX_NEG_CROP + 256] = 255; | |
1201 | 4152 } |
2967 | 4153 |
1201 | 4154 for(i=0;i<512;i++) { |
4179 | 4155 ff_squareTbl[i] = (i - 256) * (i - 256); |
1201 | 4156 } |
2967 | 4157 |
4197 | 4158 for(i=0; i<64; i++) inv_zigzag_direct16[ff_zigzag_direct[i]]= i+1; |
1201 | 4159 } |
0 | 4160 |
4281
de525a2b41db
ff_check_alignment to warn the user about a missaligned stack
michael
parents:
4240
diff
changeset
|
4161 int ff_check_alignment(void){ |
de525a2b41db
ff_check_alignment to warn the user about a missaligned stack
michael
parents:
4240
diff
changeset
|
4162 static int did_fail=0; |
11369 | 4163 DECLARE_ALIGNED(16, int, aligned); |
4281
de525a2b41db
ff_check_alignment to warn the user about a missaligned stack
michael
parents:
4240
diff
changeset
|
4164 |
9259 | 4165 if((intptr_t)&aligned & 15){ |
4281
de525a2b41db
ff_check_alignment to warn the user about a missaligned stack
michael
parents:
4240
diff
changeset
|
4166 if(!did_fail){ |
8590 | 4167 #if HAVE_MMX || HAVE_ALTIVEC |
4281
de525a2b41db
ff_check_alignment to warn the user about a missaligned stack
michael
parents:
4240
diff
changeset
|
4168 av_log(NULL, AV_LOG_ERROR, |
4292 | 4169 "Compiler did not align stack variables. Libavcodec has been miscompiled\n" |
4170 "and may be very slow or crash. This is not a bug in libavcodec,\n" | |
5542
b0a566346fb1
Add attribute that forces alignment of stack to functions that need it.
ramiro
parents:
5520
diff
changeset
|
4171 "but in the compiler. You may try recompiling using gcc >= 4.2.\n" |
b0a566346fb1
Add attribute that forces alignment of stack to functions that need it.
ramiro
parents:
5520
diff
changeset
|
4172 "Do not report crashes to FFmpeg developers.\n"); |
4281
de525a2b41db
ff_check_alignment to warn the user about a missaligned stack
michael
parents:
4240
diff
changeset
|
4173 #endif |
de525a2b41db
ff_check_alignment to warn the user about a missaligned stack
michael
parents:
4240
diff
changeset
|
4174 did_fail=1; |
de525a2b41db
ff_check_alignment to warn the user about a missaligned stack
michael
parents:
4240
diff
changeset
|
4175 } |
de525a2b41db
ff_check_alignment to warn the user about a missaligned stack
michael
parents:
4240
diff
changeset
|
4176 return -1; |
de525a2b41db
ff_check_alignment to warn the user about a missaligned stack
michael
parents:
4240
diff
changeset
|
4177 } |
de525a2b41db
ff_check_alignment to warn the user about a missaligned stack
michael
parents:
4240
diff
changeset
|
4178 return 0; |
de525a2b41db
ff_check_alignment to warn the user about a missaligned stack
michael
parents:
4240
diff
changeset
|
4179 } |
861 | 4180 |
10867 | 4181 av_cold void dsputil_init(DSPContext* c, AVCodecContext *avctx) |
1201 | 4182 { |
4183 int i; | |
0 | 4184 |
4281
de525a2b41db
ff_check_alignment to warn the user about a missaligned stack
michael
parents:
4240
diff
changeset
|
4185 ff_check_alignment(); |
de525a2b41db
ff_check_alignment to warn the user about a missaligned stack
michael
parents:
4240
diff
changeset
|
4186 |
8590 | 4187 #if CONFIG_ENCODERS |
1567 | 4188 if(avctx->dct_algo==FF_DCT_FASTINT) { |
1092 | 4189 c->fdct = fdct_ifast; |
2979 | 4190 c->fdct248 = fdct_ifast248; |
2967 | 4191 } |
1567 | 4192 else if(avctx->dct_algo==FF_DCT_FAAN) { |
1557 | 4193 c->fdct = ff_faandct; |
2979 | 4194 c->fdct248 = ff_faandct248; |
2967 | 4195 } |
1567 | 4196 else { |
1092 | 4197 c->fdct = ff_jpeg_fdct_islow; //slow/accurate/default |
2979 | 4198 c->fdct248 = ff_fdct248_islow; |
1567 | 4199 } |
1092 | 4200 #endif //CONFIG_ENCODERS |
4201 | |
2256 | 4202 if(avctx->lowres==1){ |
8596
68e959302527
replace all occurrence of ENABLE_ by the corresponding CONFIG_, HAVE_ or ARCH_
aurel
parents:
8590
diff
changeset
|
4203 if(avctx->idct_algo==FF_IDCT_INT || avctx->idct_algo==FF_IDCT_AUTO || !CONFIG_H264_DECODER){ |
2272
cd43603c46f9
move h264 idct to its own file and call via function pointer in DspContext
michael
parents:
2259
diff
changeset
|
4204 c->idct_put= ff_jref_idct4_put; |
cd43603c46f9
move h264 idct to its own file and call via function pointer in DspContext
michael
parents:
2259
diff
changeset
|
4205 c->idct_add= ff_jref_idct4_add; |
cd43603c46f9
move h264 idct to its own file and call via function pointer in DspContext
michael
parents:
2259
diff
changeset
|
4206 }else{ |
cd43603c46f9
move h264 idct to its own file and call via function pointer in DspContext
michael
parents:
2259
diff
changeset
|
4207 c->idct_put= ff_h264_lowres_idct_put_c; |
cd43603c46f9
move h264 idct to its own file and call via function pointer in DspContext
michael
parents:
2259
diff
changeset
|
4208 c->idct_add= ff_h264_lowres_idct_add_c; |
cd43603c46f9
move h264 idct to its own file and call via function pointer in DspContext
michael
parents:
2259
diff
changeset
|
4209 } |
2256 | 4210 c->idct = j_rev_dct4; |
1092 | 4211 c->idct_permutation_type= FF_NO_IDCT_PERM; |
2257 | 4212 }else if(avctx->lowres==2){ |
4213 c->idct_put= ff_jref_idct2_put; | |
4214 c->idct_add= ff_jref_idct2_add; | |
4215 c->idct = j_rev_dct2; | |
4216 c->idct_permutation_type= FF_NO_IDCT_PERM; | |
2259 | 4217 }else if(avctx->lowres==3){ |
4218 c->idct_put= ff_jref_idct1_put; | |
4219 c->idct_add= ff_jref_idct1_add; | |
4220 c->idct = j_rev_dct1; | |
4221 c->idct_permutation_type= FF_NO_IDCT_PERM; | |
2256 | 4222 }else{ |
4223 if(avctx->idct_algo==FF_IDCT_INT){ | |
4224 c->idct_put= ff_jref_idct_put; | |
4225 c->idct_add= ff_jref_idct_add; | |
4226 c->idct = j_rev_dct; | |
4227 c->idct_permutation_type= FF_LIBMPEG2_IDCT_PERM; | |
9975
d6d7e8d4a04d
Do not redundantly check for both CONFIG_THEORA_DECODER and CONFIG_VP3_DECODER.
diego
parents:
9586
diff
changeset
|
4228 }else if((CONFIG_VP3_DECODER || CONFIG_VP5_DECODER || CONFIG_VP6_DECODER ) && |
5007 | 4229 avctx->idct_algo==FF_IDCT_VP3){ |
2693 | 4230 c->idct_put= ff_vp3_idct_put_c; |
4231 c->idct_add= ff_vp3_idct_add_c; | |
4232 c->idct = ff_vp3_idct_c; | |
4233 c->idct_permutation_type= FF_NO_IDCT_PERM; | |
5887 | 4234 }else if(avctx->idct_algo==FF_IDCT_WMV2){ |
4235 c->idct_put= ff_wmv2_idct_put_c; | |
4236 c->idct_add= ff_wmv2_idct_add_c; | |
4237 c->idct = ff_wmv2_idct_c; | |
4238 c->idct_permutation_type= FF_NO_IDCT_PERM; | |
6407 | 4239 }else if(avctx->idct_algo==FF_IDCT_FAAN){ |
4240 c->idct_put= ff_faanidct_put; | |
4241 c->idct_add= ff_faanidct_add; | |
4242 c->idct = ff_faanidct; | |
4243 c->idct_permutation_type= FF_NO_IDCT_PERM; | |
8596
68e959302527
replace all occurrence of ENABLE_ by the corresponding CONFIG_, HAVE_ or ARCH_
aurel
parents:
8590
diff
changeset
|
4244 }else if(CONFIG_EATGQ_DECODER && avctx->idct_algo==FF_IDCT_EA) { |
8120 | 4245 c->idct_put= ff_ea_idct_put_c; |
4246 c->idct_permutation_type= FF_NO_IDCT_PERM; | |
11231 | 4247 }else if(CONFIG_BINK_DECODER && avctx->idct_algo==FF_IDCT_BINK) { |
4248 c->idct = ff_bink_idct_c; | |
4249 c->idct_add = ff_bink_idct_add_c; | |
4250 c->idct_put = ff_bink_idct_put_c; | |
4251 c->idct_permutation_type = FF_NO_IDCT_PERM; | |
2256 | 4252 }else{ //accurate/default |
6001 | 4253 c->idct_put= ff_simple_idct_put; |
4254 c->idct_add= ff_simple_idct_add; | |
4255 c->idct = ff_simple_idct; | |
2256 | 4256 c->idct_permutation_type= FF_NO_IDCT_PERM; |
4257 } | |
1092 | 4258 } |
4259 | |
853
eacc2dd8fd9d
* using DSPContext - so each codec could use its local (sub)set of CPU extension
kabi
parents:
764
diff
changeset
|
4260 c->get_pixels = get_pixels_c; |
eacc2dd8fd9d
* using DSPContext - so each codec could use its local (sub)set of CPU extension
kabi
parents:
764
diff
changeset
|
4261 c->diff_pixels = diff_pixels_c; |
eacc2dd8fd9d
* using DSPContext - so each codec could use its local (sub)set of CPU extension
kabi
parents:
764
diff
changeset
|
4262 c->put_pixels_clamped = put_pixels_clamped_c; |
1984
ef919e9ef73e
separate out put_signed_pixels_clamped() into its own function and
melanson
parents:
1977
diff
changeset
|
4263 c->put_signed_pixels_clamped = put_signed_pixels_clamped_c; |
11231 | 4264 c->put_pixels_nonclamped = put_pixels_nonclamped_c; |
853
eacc2dd8fd9d
* using DSPContext - so each codec could use its local (sub)set of CPU extension
kabi
parents:
764
diff
changeset
|
4265 c->add_pixels_clamped = add_pixels_clamped_c; |
2763 | 4266 c->add_pixels8 = add_pixels8_c; |
4267 c->add_pixels4 = add_pixels4_c; | |
4988
689490842cf5
factor sum_abs_dctelem out of dct_sad, and simd it.
lorenm
parents:
4749
diff
changeset
|
4268 c->sum_abs_dctelem = sum_abs_dctelem_c; |
853
eacc2dd8fd9d
* using DSPContext - so each codec could use its local (sub)set of CPU extension
kabi
parents:
764
diff
changeset
|
4269 c->gmc1 = gmc1_c; |
3248
7aa9f80e7954
mmx implementation of 3-point GMC. (5x faster than C)
lorenm
parents:
3245
diff
changeset
|
4270 c->gmc = ff_gmc_c; |
8288 | 4271 c->clear_block = clear_block_c; |
853
eacc2dd8fd9d
* using DSPContext - so each codec could use its local (sub)set of CPU extension
kabi
parents:
764
diff
changeset
|
4272 c->clear_blocks = clear_blocks_c; |
eacc2dd8fd9d
* using DSPContext - so each codec could use its local (sub)set of CPU extension
kabi
parents:
764
diff
changeset
|
4273 c->pix_sum = pix_sum_c; |
eacc2dd8fd9d
* using DSPContext - so each codec could use its local (sub)set of CPU extension
kabi
parents:
764
diff
changeset
|
4274 c->pix_norm1 = pix_norm1_c; |
eacc2dd8fd9d
* using DSPContext - so each codec could use its local (sub)set of CPU extension
kabi
parents:
764
diff
changeset
|
4275 |
11231 | 4276 c->fill_block_tab[0] = fill_block16_c; |
4277 c->fill_block_tab[1] = fill_block8_c; | |
4278 c->scale_block = scale_block_c; | |
4279 | |
859 | 4280 /* TODO [0] 16 [1] 8 */ |
1708 | 4281 c->pix_abs[0][0] = pix_abs16_c; |
4282 c->pix_abs[0][1] = pix_abs16_x2_c; | |
4283 c->pix_abs[0][2] = pix_abs16_y2_c; | |
4284 c->pix_abs[0][3] = pix_abs16_xy2_c; | |
4285 c->pix_abs[1][0] = pix_abs8_c; | |
4286 c->pix_abs[1][1] = pix_abs8_x2_c; | |
4287 c->pix_abs[1][2] = pix_abs8_y2_c; | |
4288 c->pix_abs[1][3] = pix_abs8_xy2_c; | |
853
eacc2dd8fd9d
* using DSPContext - so each codec could use its local (sub)set of CPU extension
kabi
parents:
764
diff
changeset
|
4289 |
859 | 4290 #define dspfunc(PFX, IDX, NUM) \ |
4291 c->PFX ## _pixels_tab[IDX][0] = PFX ## _pixels ## NUM ## _c; \ | |
4292 c->PFX ## _pixels_tab[IDX][1] = PFX ## _pixels ## NUM ## _x2_c; \ | |
4293 c->PFX ## _pixels_tab[IDX][2] = PFX ## _pixels ## NUM ## _y2_c; \ | |
4294 c->PFX ## _pixels_tab[IDX][3] = PFX ## _pixels ## NUM ## _xy2_c | |
853
eacc2dd8fd9d
* using DSPContext - so each codec could use its local (sub)set of CPU extension
kabi
parents:
764
diff
changeset
|
4295 |
859 | 4296 dspfunc(put, 0, 16); |
4297 dspfunc(put_no_rnd, 0, 16); | |
4298 dspfunc(put, 1, 8); | |
4299 dspfunc(put_no_rnd, 1, 8); | |
1267
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
4300 dspfunc(put, 2, 4); |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
4301 dspfunc(put, 3, 2); |
0 | 4302 |
859 | 4303 dspfunc(avg, 0, 16); |
4304 dspfunc(avg_no_rnd, 0, 16); | |
4305 dspfunc(avg, 1, 8); | |
4306 dspfunc(avg_no_rnd, 1, 8); | |
1319 | 4307 dspfunc(avg, 2, 4); |
4308 dspfunc(avg, 3, 2); | |
859 | 4309 #undef dspfunc |
857 | 4310 |
1864 | 4311 c->put_no_rnd_pixels_l2[0]= put_no_rnd_pixels16_l2_c; |
4312 c->put_no_rnd_pixels_l2[1]= put_no_rnd_pixels8_l2_c; | |
4313 | |
1267
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
4314 c->put_tpel_pixels_tab[ 0] = put_tpel_pixels_mc00_c; |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
4315 c->put_tpel_pixels_tab[ 1] = put_tpel_pixels_mc10_c; |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
4316 c->put_tpel_pixels_tab[ 2] = put_tpel_pixels_mc20_c; |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
4317 c->put_tpel_pixels_tab[ 4] = put_tpel_pixels_mc01_c; |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
4318 c->put_tpel_pixels_tab[ 5] = put_tpel_pixels_mc11_c; |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
4319 c->put_tpel_pixels_tab[ 6] = put_tpel_pixels_mc21_c; |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
4320 c->put_tpel_pixels_tab[ 8] = put_tpel_pixels_mc02_c; |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
4321 c->put_tpel_pixels_tab[ 9] = put_tpel_pixels_mc12_c; |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
4322 c->put_tpel_pixels_tab[10] = put_tpel_pixels_mc22_c; |
85b71f9f7450
moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents:
1264
diff
changeset
|
4323 |
1319 | 4324 c->avg_tpel_pixels_tab[ 0] = avg_tpel_pixels_mc00_c; |
4325 c->avg_tpel_pixels_tab[ 1] = avg_tpel_pixels_mc10_c; | |
4326 c->avg_tpel_pixels_tab[ 2] = avg_tpel_pixels_mc20_c; | |
4327 c->avg_tpel_pixels_tab[ 4] = avg_tpel_pixels_mc01_c; | |
4328 c->avg_tpel_pixels_tab[ 5] = avg_tpel_pixels_mc11_c; | |
4329 c->avg_tpel_pixels_tab[ 6] = avg_tpel_pixels_mc21_c; | |
4330 c->avg_tpel_pixels_tab[ 8] = avg_tpel_pixels_mc02_c; | |
4331 c->avg_tpel_pixels_tab[ 9] = avg_tpel_pixels_mc12_c; | |
4332 c->avg_tpel_pixels_tab[10] = avg_tpel_pixels_mc22_c; | |
4333 | |
859 | 4334 #define dspfunc(PFX, IDX, NUM) \ |
4335 c->PFX ## _pixels_tab[IDX][ 0] = PFX ## NUM ## _mc00_c; \ | |
4336 c->PFX ## _pixels_tab[IDX][ 1] = PFX ## NUM ## _mc10_c; \ | |
4337 c->PFX ## _pixels_tab[IDX][ 2] = PFX ## NUM ## _mc20_c; \ | |
4338 c->PFX ## _pixels_tab[IDX][ 3] = PFX ## NUM ## _mc30_c; \ | |
4339 c->PFX ## _pixels_tab[IDX][ 4] = PFX ## NUM ## _mc01_c; \ | |
4340 c->PFX ## _pixels_tab[IDX][ 5] = PFX ## NUM ## _mc11_c; \ | |
4341 c->PFX ## _pixels_tab[IDX][ 6] = PFX ## NUM ## _mc21_c; \ | |
4342 c->PFX ## _pixels_tab[IDX][ 7] = PFX ## NUM ## _mc31_c; \ | |
4343 c->PFX ## _pixels_tab[IDX][ 8] = PFX ## NUM ## _mc02_c; \ | |
4344 c->PFX ## _pixels_tab[IDX][ 9] = PFX ## NUM ## _mc12_c; \ | |
4345 c->PFX ## _pixels_tab[IDX][10] = PFX ## NUM ## _mc22_c; \ | |
4346 c->PFX ## _pixels_tab[IDX][11] = PFX ## NUM ## _mc32_c; \ | |
4347 c->PFX ## _pixels_tab[IDX][12] = PFX ## NUM ## _mc03_c; \ | |
4348 c->PFX ## _pixels_tab[IDX][13] = PFX ## NUM ## _mc13_c; \ | |
4349 c->PFX ## _pixels_tab[IDX][14] = PFX ## NUM ## _mc23_c; \ | |
4350 c->PFX ## _pixels_tab[IDX][15] = PFX ## NUM ## _mc33_c | |
857 | 4351 |
859 | 4352 dspfunc(put_qpel, 0, 16); |
4353 dspfunc(put_no_rnd_qpel, 0, 16); | |
4354 | |
4355 dspfunc(avg_qpel, 0, 16); | |
4356 /* dspfunc(avg_no_rnd_qpel, 0, 16); */ | |
857 | 4357 |
859 | 4358 dspfunc(put_qpel, 1, 8); |
4359 dspfunc(put_no_rnd_qpel, 1, 8); | |
4360 | |
4361 dspfunc(avg_qpel, 1, 8); | |
4362 /* dspfunc(avg_no_rnd_qpel, 1, 8); */ | |
1168 | 4363 |
4364 dspfunc(put_h264_qpel, 0, 16); | |
4365 dspfunc(put_h264_qpel, 1, 8); | |
4366 dspfunc(put_h264_qpel, 2, 4); | |
3020
c75fb0747e74
use h264 MC functions for 2xX Xx2 blocks in snow too
michael
parents:
3013
diff
changeset
|
4367 dspfunc(put_h264_qpel, 3, 2); |
1168 | 4368 dspfunc(avg_h264_qpel, 0, 16); |
4369 dspfunc(avg_h264_qpel, 1, 8); | |
4370 dspfunc(avg_h264_qpel, 2, 4); | |
4371 | |
859 | 4372 #undef dspfunc |
1168 | 4373 c->put_h264_chroma_pixels_tab[0]= put_h264_chroma_mc8_c; |
4374 c->put_h264_chroma_pixels_tab[1]= put_h264_chroma_mc4_c; | |
4375 c->put_h264_chroma_pixels_tab[2]= put_h264_chroma_mc2_c; | |
4376 c->avg_h264_chroma_pixels_tab[0]= avg_h264_chroma_mc8_c; | |
4377 c->avg_h264_chroma_pixels_tab[1]= avg_h264_chroma_mc4_c; | |
4378 c->avg_h264_chroma_pixels_tab[2]= avg_h264_chroma_mc2_c; | |
9439
ef3a7b711cc0
Rename put_no_rnd_h264_chroma* to reflect its usage in VC1 only
conrad
parents:
9437
diff
changeset
|
4379 c->put_no_rnd_vc1_chroma_pixels_tab[0]= put_no_rnd_vc1_chroma_mc8_c; |
9440 | 4380 c->avg_no_rnd_vc1_chroma_pixels_tab[0]= avg_no_rnd_vc1_chroma_mc8_c; |
857 | 4381 |
6437 | 4382 c->draw_edges = draw_edges_c; |
4383 | |
8590 | 4384 #if CONFIG_CAVS_DECODER |
3395
adccbf4a1040
CAVS decoder by (Stefan Gehrer stefan.gehrer gmx.de)
michael
parents:
3373
diff
changeset
|
4385 ff_cavsdsp_init(c,avctx); |
3432 | 4386 #endif |
9585 | 4387 |
4388 #if CONFIG_MLP_DECODER || CONFIG_TRUEHD_DECODER | |
4389 ff_mlp_init(c, avctx); | |
4390 #endif | |
9995
3141f69e3905
Do not check for both CONFIG_VC1_DECODER and CONFIG_WMV3_DECODER,
diego
parents:
9975
diff
changeset
|
4391 #if CONFIG_VC1_DECODER |
3526 | 4392 ff_vc1dsp_init(c,avctx); |
4393 #endif | |
9995
3141f69e3905
Do not check for both CONFIG_VC1_DECODER and CONFIG_WMV3_DECODER,
diego
parents:
9975
diff
changeset
|
4394 #if CONFIG_WMV2_DECODER || CONFIG_VC1_DECODER |
5887 | 4395 ff_intrax8dsp_init(c,avctx); |
4396 #endif | |
8590 | 4397 #if CONFIG_RV30_DECODER |
8410 | 4398 ff_rv30dsp_init(c,avctx); |
4399 #endif | |
8590 | 4400 #if CONFIG_RV40_DECODER |
8232 | 4401 ff_rv40dsp_init(c,avctx); |
4402 c->put_rv40_qpel_pixels_tab[0][15] = put_rv40_qpel16_mc33_c; | |
4403 c->avg_rv40_qpel_pixels_tab[0][15] = avg_rv40_qpel16_mc33_c; | |
4404 c->put_rv40_qpel_pixels_tab[1][15] = put_rv40_qpel8_mc33_c; | |
4405 c->avg_rv40_qpel_pixels_tab[1][15] = avg_rv40_qpel8_mc33_c; | |
4406 #endif | |
3395
adccbf4a1040
CAVS decoder by (Stefan Gehrer stefan.gehrer gmx.de)
michael
parents:
3373
diff
changeset
|
4407 |
936 | 4408 c->put_mspel_pixels_tab[0]= put_mspel8_mc00_c; |
4409 c->put_mspel_pixels_tab[1]= put_mspel8_mc10_c; | |
4410 c->put_mspel_pixels_tab[2]= put_mspel8_mc20_c; | |
4411 c->put_mspel_pixels_tab[3]= put_mspel8_mc30_c; | |
4412 c->put_mspel_pixels_tab[4]= put_mspel8_mc02_c; | |
4413 c->put_mspel_pixels_tab[5]= put_mspel8_mc12_c; | |
4414 c->put_mspel_pixels_tab[6]= put_mspel8_mc22_c; | |
4415 c->put_mspel_pixels_tab[7]= put_mspel8_mc32_c; | |
2967 | 4416 |
1708 | 4417 #define SET_CMP_FUNC(name) \ |
4418 c->name[0]= name ## 16_c;\ | |
4419 c->name[1]= name ## 8x8_c; | |
2967 | 4420 |
1708 | 4421 SET_CMP_FUNC(hadamard8_diff) |
1729 | 4422 c->hadamard8_diff[4]= hadamard8_intra16_c; |
8978 | 4423 c->hadamard8_diff[5]= hadamard8_intra8x8_c; |
1708 | 4424 SET_CMP_FUNC(dct_sad) |
2382 | 4425 SET_CMP_FUNC(dct_max) |
8590 | 4426 #if CONFIG_GPL |
3010
533c6386eca9
8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents:
2979
diff
changeset
|
4427 SET_CMP_FUNC(dct264_sad) |
3013 | 4428 #endif |
1708 | 4429 c->sad[0]= pix_abs16_c; |
4430 c->sad[1]= pix_abs8_c; | |
4431 c->sse[0]= sse16_c; | |
4432 c->sse[1]= sse8_c; | |
2184 | 4433 c->sse[2]= sse4_c; |
1708 | 4434 SET_CMP_FUNC(quant_psnr) |
4435 SET_CMP_FUNC(rd) | |
4436 SET_CMP_FUNC(bit) | |
1729 | 4437 c->vsad[0]= vsad16_c; |
4438 c->vsad[4]= vsad_intra16_c; | |
8978 | 4439 c->vsad[5]= vsad_intra8_c; |
1729 | 4440 c->vsse[0]= vsse16_c; |
4441 c->vsse[4]= vsse_intra16_c; | |
8978 | 4442 c->vsse[5]= vsse_intra8_c; |
2065
9e4bebc39ade
noise preserving sum of squares comparission function
michael
parents:
2045
diff
changeset
|
4443 c->nsse[0]= nsse16_c; |
9e4bebc39ade
noise preserving sum of squares comparission function
michael
parents:
2045
diff
changeset
|
4444 c->nsse[1]= nsse8_c; |
11485 | 4445 #if CONFIG_DWT |
4446 ff_dsputil_init_dwt(c); | |
3373
b8996cc5ccae
Disable w53 and w97 cmp methods when snow encoder is disabled
gpoirier
parents:
3323
diff
changeset
|
4447 #endif |
2184 | 4448 |
4749 | 4449 c->ssd_int8_vs_int16 = ssd_int8_vs_int16_c; |
4450 | |
866 | 4451 c->add_bytes= add_bytes_c; |
6384 | 4452 c->add_bytes_l2= add_bytes_l2_c; |
866 | 4453 c->diff_bytes= diff_bytes_c; |
8760 | 4454 c->add_hfyu_median_prediction= add_hfyu_median_prediction_c; |
1527 | 4455 c->sub_hfyu_median_prediction= sub_hfyu_median_prediction_c; |
10370 | 4456 c->add_hfyu_left_prediction = add_hfyu_left_prediction_c; |
4457 c->add_hfyu_left_prediction_bgr32 = add_hfyu_left_prediction_bgr32_c; | |
1273 | 4458 c->bswap_buf= bswap_buf; |
8590 | 4459 #if CONFIG_PNG_DECODER |
6384 | 4460 c->add_png_paeth_prediction= ff_add_png_paeth_prediction; |
4461 #endif | |
2633 | 4462 |
10749
5cca4b6c459d
Get rid of pointless CONFIG_ANY_H263 preprocessor definition.
diego
parents:
10748
diff
changeset
|
4463 if (CONFIG_H263_DECODER || CONFIG_H263_ENCODER) { |
5278 | 4464 c->h263_h_loop_filter= h263_h_loop_filter_c; |
4465 c->h263_v_loop_filter= h263_v_loop_filter_c; | |
5277
7b3fcb7c61ce
Avoid linking with h263.c functions when the relevant codecs
aurel
parents:
5256
diff
changeset
|
4466 } |
2967 | 4467 |
9975
d6d7e8d4a04d
Do not redundantly check for both CONFIG_THEORA_DECODER and CONFIG_VP3_DECODER.
diego
parents:
9586
diff
changeset
|
4468 if (CONFIG_VP3_DECODER) { |
7995 | 4469 c->vp3_h_loop_filter= ff_vp3_h_loop_filter_c; |
4470 c->vp3_v_loop_filter= ff_vp3_v_loop_filter_c; | |
11637 | 4471 c->vp3_idct_dc_add= ff_vp3_idct_dc_add_c; |
7995 | 4472 } |
8785
bee83b3f9a6b
move vp6_filter_diag4() to a new vp6dsp.c file and use it throught dsputil
aurel
parents:
8760
diff
changeset
|
4473 if (CONFIG_VP6_DECODER) { |
bee83b3f9a6b
move vp6_filter_diag4() to a new vp6dsp.c file and use it throught dsputil
aurel
parents:
8760
diff
changeset
|
4474 c->vp6_filter_diag4= ff_vp6_filter_diag4_c; |
bee83b3f9a6b
move vp6_filter_diag4() to a new vp6dsp.c file and use it throught dsputil
aurel
parents:
8760
diff
changeset
|
4475 } |
7995 | 4476 |
2045 | 4477 c->h261_loop_filter= h261_loop_filter_c; |
2967 | 4478 |
1784 | 4479 c->try_8x8basis= try_8x8basis_c; |
4480 c->add_8x8basis= add_8x8basis_c; | |
866 | 4481 |
8590 | 4482 #if CONFIG_VORBIS_DECODER |
3536
545a15c19c91
sse & sse2 implementations of vorbis channel coupling.
lorenm
parents:
3526
diff
changeset
|
4483 c->vorbis_inverse_coupling = vorbis_inverse_coupling; |
545a15c19c91
sse & sse2 implementations of vorbis channel coupling.
lorenm
parents:
3526
diff
changeset
|
4484 #endif |
8590 | 4485 #if CONFIG_AC3_DECODER |
7563 | 4486 c->ac3_downmix = ff_ac3_downmix_c; |
4487 #endif | |
10429
289dd8daf4ee
add CONFIG_LPC to the build system for lpc dsputil functions. fixes build
jbr
parents:
10424
diff
changeset
|
4488 #if CONFIG_LPC |
10424
94595d0e617c
Move autocorrelation function from flacenc.c to lpc.c. Also rename the
jbr
parents:
10421
diff
changeset
|
4489 c->lpc_compute_autocorr = ff_lpc_compute_autocorr; |
10429
289dd8daf4ee
add CONFIG_LPC to the build system for lpc dsputil functions. fixes build
jbr
parents:
10424
diff
changeset
|
4490 #endif |
3568
945caa35ee9a
sse and 3dnow implementations of float->int conversion and mdct windowing.
lorenm
parents:
3536
diff
changeset
|
4491 c->vector_fmul = vector_fmul_c; |
945caa35ee9a
sse and 3dnow implementations of float->int conversion and mdct windowing.
lorenm
parents:
3536
diff
changeset
|
4492 c->vector_fmul_reverse = vector_fmul_reverse_c; |
10300
4d1b9ca628fc
Drop unused args from vector_fmul_add_add, simpify code, and rename
mru
parents:
10219
diff
changeset
|
4493 c->vector_fmul_add = vector_fmul_add_c; |
7261 | 4494 c->vector_fmul_window = ff_vector_fmul_window_c; |
7564 | 4495 c->int32_to_float_fmul_scalar = int32_to_float_fmul_scalar_c; |
10104
0fa3d21b317e
SSE optimized vector_clipf(). 10% faster TwinVQ decoding.
vitor
parents:
10094
diff
changeset
|
4496 c->vector_clipf = vector_clipf_c; |
3568
945caa35ee9a
sse and 3dnow implementations of float->int conversion and mdct windowing.
lorenm
parents:
3536
diff
changeset
|
4497 c->float_to_int16 = ff_float_to_int16_c; |
7261 | 4498 c->float_to_int16_interleave = ff_float_to_int16_interleave_c; |
7203
87b1dfb5a98d
Add several vector functions used by Monkey's Audio decoder to dsputil
kostya
parents:
6719
diff
changeset
|
4499 c->scalarproduct_int16 = scalarproduct_int16_c; |
10644 | 4500 c->scalarproduct_and_madd_int16 = scalarproduct_and_madd_int16_c; |
10219 | 4501 c->scalarproduct_float = scalarproduct_float_c; |
4502 c->butterflies_float = butterflies_float_c; | |
4503 c->vector_fmul_scalar = vector_fmul_scalar_c; | |
4504 | |
4505 c->vector_fmul_sv_scalar[0] = vector_fmul_sv_scalar_2_c; | |
4506 c->vector_fmul_sv_scalar[1] = vector_fmul_sv_scalar_4_c; | |
4507 | |
4508 c->sv_fmul_scalar[0] = sv_fmul_scalar_2_c; | |
4509 c->sv_fmul_scalar[1] = sv_fmul_scalar_4_c; | |
3536
545a15c19c91
sse & sse2 implementations of vorbis channel coupling.
lorenm
parents:
3526
diff
changeset
|
4510 |
3245 | 4511 c->shrink[0]= ff_img_copy_plane; |
4512 c->shrink[1]= ff_shrink22; | |
4513 c->shrink[2]= ff_shrink44; | |
4514 c->shrink[3]= ff_shrink88; | |
4515 | |
3215
06f98047ff26
prefetch pixels for future motion compensation. 2-5% faster h264.
lorenm
parents:
3199
diff
changeset
|
4516 c->prefetch= just_return; |
06f98047ff26
prefetch pixels for future motion compensation. 2-5% faster h264.
lorenm
parents:
3199
diff
changeset
|
4517 |
3807
6a40092eb9e6
approximate qpel functions: sacrifice some quality for some decoding speed. enabled on B-frames with -lavdopts fast.
lorenm
parents:
3728
diff
changeset
|
4518 memset(c->put_2tap_qpel_pixels_tab, 0, sizeof(c->put_2tap_qpel_pixels_tab)); |
6a40092eb9e6
approximate qpel functions: sacrifice some quality for some decoding speed. enabled on B-frames with -lavdopts fast.
lorenm
parents:
3728
diff
changeset
|
4519 memset(c->avg_2tap_qpel_pixels_tab, 0, sizeof(c->avg_2tap_qpel_pixels_tab)); |
6a40092eb9e6
approximate qpel functions: sacrifice some quality for some decoding speed. enabled on B-frames with -lavdopts fast.
lorenm
parents:
3728
diff
changeset
|
4520 |
8596
68e959302527
replace all occurrence of ENABLE_ by the corresponding CONFIG_, HAVE_ or ARCH_
aurel
parents:
8590
diff
changeset
|
4521 if (HAVE_MMX) dsputil_init_mmx (c, avctx); |
68e959302527
replace all occurrence of ENABLE_ by the corresponding CONFIG_, HAVE_ or ARCH_
aurel
parents:
8590
diff
changeset
|
4522 if (ARCH_ARM) dsputil_init_arm (c, avctx); |
68e959302527
replace all occurrence of ENABLE_ by the corresponding CONFIG_, HAVE_ or ARCH_
aurel
parents:
8590
diff
changeset
|
4523 if (CONFIG_MLIB) dsputil_init_mlib (c, avctx); |
68e959302527
replace all occurrence of ENABLE_ by the corresponding CONFIG_, HAVE_ or ARCH_
aurel
parents:
8590
diff
changeset
|
4524 if (HAVE_VIS) dsputil_init_vis (c, avctx); |
68e959302527
replace all occurrence of ENABLE_ by the corresponding CONFIG_, HAVE_ or ARCH_
aurel
parents:
8590
diff
changeset
|
4525 if (ARCH_ALPHA) dsputil_init_alpha (c, avctx); |
68e959302527
replace all occurrence of ENABLE_ by the corresponding CONFIG_, HAVE_ or ARCH_
aurel
parents:
8590
diff
changeset
|
4526 if (ARCH_PPC) dsputil_init_ppc (c, avctx); |
68e959302527
replace all occurrence of ENABLE_ by the corresponding CONFIG_, HAVE_ or ARCH_
aurel
parents:
8590
diff
changeset
|
4527 if (HAVE_MMI) dsputil_init_mmi (c, avctx); |
68e959302527
replace all occurrence of ENABLE_ by the corresponding CONFIG_, HAVE_ or ARCH_
aurel
parents:
8590
diff
changeset
|
4528 if (ARCH_SH4) dsputil_init_sh4 (c, avctx); |
68e959302527
replace all occurrence of ENABLE_ by the corresponding CONFIG_, HAVE_ or ARCH_
aurel
parents:
8590
diff
changeset
|
4529 if (ARCH_BFIN) dsputil_init_bfin (c, avctx); |
1092 | 4530 |
3807
6a40092eb9e6
approximate qpel functions: sacrifice some quality for some decoding speed. enabled on B-frames with -lavdopts fast.
lorenm
parents:
3728
diff
changeset
|
4531 for(i=0; i<64; i++){ |
6a40092eb9e6
approximate qpel functions: sacrifice some quality for some decoding speed. enabled on B-frames with -lavdopts fast.
lorenm
parents:
3728
diff
changeset
|
4532 if(!c->put_2tap_qpel_pixels_tab[0][i]) |
6a40092eb9e6
approximate qpel functions: sacrifice some quality for some decoding speed. enabled on B-frames with -lavdopts fast.
lorenm
parents:
3728
diff
changeset
|
4533 c->put_2tap_qpel_pixels_tab[0][i]= c->put_h264_qpel_pixels_tab[0][i]; |
6a40092eb9e6
approximate qpel functions: sacrifice some quality for some decoding speed. enabled on B-frames with -lavdopts fast.
lorenm
parents:
3728
diff
changeset
|
4534 if(!c->avg_2tap_qpel_pixels_tab[0][i]) |
6a40092eb9e6
approximate qpel functions: sacrifice some quality for some decoding speed. enabled on B-frames with -lavdopts fast.
lorenm
parents:
3728
diff
changeset
|
4535 c->avg_2tap_qpel_pixels_tab[0][i]= c->avg_h264_qpel_pixels_tab[0][i]; |
6a40092eb9e6
approximate qpel functions: sacrifice some quality for some decoding speed. enabled on B-frames with -lavdopts fast.
lorenm
parents:
3728
diff
changeset
|
4536 } |
6a40092eb9e6
approximate qpel functions: sacrifice some quality for some decoding speed. enabled on B-frames with -lavdopts fast.
lorenm
parents:
3728
diff
changeset
|
4537 |
11988
e382860b855f
Set rv34 (0,0) subpel mc functions to the optimised h264 ones
mru
parents:
11981
diff
changeset
|
4538 c->put_rv30_tpel_pixels_tab[0][0] = c->put_h264_qpel_pixels_tab[0][0]; |
e382860b855f
Set rv34 (0,0) subpel mc functions to the optimised h264 ones
mru
parents:
11981
diff
changeset
|
4539 c->put_rv30_tpel_pixels_tab[1][0] = c->put_h264_qpel_pixels_tab[1][0]; |
e382860b855f
Set rv34 (0,0) subpel mc functions to the optimised h264 ones
mru
parents:
11981
diff
changeset
|
4540 c->avg_rv30_tpel_pixels_tab[0][0] = c->avg_h264_qpel_pixels_tab[0][0]; |
e382860b855f
Set rv34 (0,0) subpel mc functions to the optimised h264 ones
mru
parents:
11981
diff
changeset
|
4541 c->avg_rv30_tpel_pixels_tab[1][0] = c->avg_h264_qpel_pixels_tab[1][0]; |
e382860b855f
Set rv34 (0,0) subpel mc functions to the optimised h264 ones
mru
parents:
11981
diff
changeset
|
4542 |
e382860b855f
Set rv34 (0,0) subpel mc functions to the optimised h264 ones
mru
parents:
11981
diff
changeset
|
4543 c->put_rv40_qpel_pixels_tab[0][0] = c->put_h264_qpel_pixels_tab[0][0]; |
e382860b855f
Set rv34 (0,0) subpel mc functions to the optimised h264 ones
mru
parents:
11981
diff
changeset
|
4544 c->put_rv40_qpel_pixels_tab[1][0] = c->put_h264_qpel_pixels_tab[1][0]; |
e382860b855f
Set rv34 (0,0) subpel mc functions to the optimised h264 ones
mru
parents:
11981
diff
changeset
|
4545 c->avg_rv40_qpel_pixels_tab[0][0] = c->avg_h264_qpel_pixels_tab[0][0]; |
e382860b855f
Set rv34 (0,0) subpel mc functions to the optimised h264 ones
mru
parents:
11981
diff
changeset
|
4546 c->avg_rv40_qpel_pixels_tab[1][0] = c->avg_h264_qpel_pixels_tab[1][0]; |
e382860b855f
Set rv34 (0,0) subpel mc functions to the optimised h264 ones
mru
parents:
11981
diff
changeset
|
4547 |
1092 | 4548 switch(c->idct_permutation_type){ |
4549 case FF_NO_IDCT_PERM: | |
4550 for(i=0; i<64; i++) | |
4551 c->idct_permutation[i]= i; | |
4552 break; | |
4553 case FF_LIBMPEG2_IDCT_PERM: | |
4554 for(i=0; i<64; i++) | |
4555 c->idct_permutation[i]= (i & 0x38) | ((i & 6) >> 1) | ((i & 1) << 2); | |
4556 break; | |
4557 case FF_SIMPLE_IDCT_PERM: | |
4558 for(i=0; i<64; i++) | |
4559 c->idct_permutation[i]= simple_mmx_permutation[i]; | |
4560 break; | |
4561 case FF_TRANSPOSE_IDCT_PERM: | |
4562 for(i=0; i<64; i++) | |
4563 c->idct_permutation[i]= ((i&7)<<3) | (i>>3); | |
4564 break; | |
2696
9699d325049d
porting the mmx&sse2 (sse2 untested) vp3 idcts to the lavc idct API
michael
parents:
2693
diff
changeset
|
4565 case FF_PARTTRANS_IDCT_PERM: |
9699d325049d
porting the mmx&sse2 (sse2 untested) vp3 idcts to the lavc idct API
michael
parents:
2693
diff
changeset
|
4566 for(i=0; i<64; i++) |
9699d325049d
porting the mmx&sse2 (sse2 untested) vp3 idcts to the lavc idct API
michael
parents:
2693
diff
changeset
|
4567 c->idct_permutation[i]= (i&0x24) | ((i&3)<<3) | ((i>>3)&3); |
9699d325049d
porting the mmx&sse2 (sse2 untested) vp3 idcts to the lavc idct API
michael
parents:
2693
diff
changeset
|
4568 break; |
6600
c3213c91124c
Add a new IDCT permutation, used in xvid_sse2 and possibly future similar IDCTs.
astrange
parents:
6450
diff
changeset
|
4569 case FF_SSE2_IDCT_PERM: |
c3213c91124c
Add a new IDCT permutation, used in xvid_sse2 and possibly future similar IDCTs.
astrange
parents:
6450
diff
changeset
|
4570 for(i=0; i<64; i++) |
c3213c91124c
Add a new IDCT permutation, used in xvid_sse2 and possibly future similar IDCTs.
astrange
parents:
6450
diff
changeset
|
4571 c->idct_permutation[i]= (i&0x38) | idct_sse2_row_perm[i&7]; |
c3213c91124c
Add a new IDCT permutation, used in xvid_sse2 and possibly future similar IDCTs.
astrange
parents:
6450
diff
changeset
|
4572 break; |
1092 | 4573 default: |
1598
932d306bf1dc
av_log() patch by (Michel Bardiaux <mbardiaux at peaktime dot be>)
michael
parents:
1571
diff
changeset
|
4574 av_log(avctx, AV_LOG_ERROR, "Internal error, IDCT permutation not set\n"); |
1092 | 4575 } |
0 | 4576 } |
252
ddb1a0e94cf4
- Added PSNR feature to libavcodec and ffmpeg. By now just Y PSNR until I'm
pulento
parents:
220
diff
changeset
|
4577 |