annotate dsputil.c @ 3010:533c6386eca9 libavcodec

8x8 integer DCT from x264 as a cmp function (under CONFIG_GPL). If this gives better quality than SATD, then someone should port the x86 code too, or maybe we could even just call it from libx264. The 4x4 one could be tried too ...
author michael
date Wed, 04 Jan 2006 16:31:23 +0000
parents bfabfdf9ce55
children b6a90fabaa76
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
1 /*
986e461dc072 Initial revision
glantau
parents:
diff changeset
2 * DSP utils
429
718a22dc121f license/copyright change
glantau
parents: 403
diff changeset
3 * Copyright (c) 2000, 2001 Fabrice Bellard.
1739
07a484280a82 copyright year update of the files i touched and remembered, things look annoyingly unmaintained otherwise
michael
parents: 1729
diff changeset
4 * Copyright (c) 2002-2004 Michael Niedermayer <michaelni@gmx.at>
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
5 *
429
718a22dc121f license/copyright change
glantau
parents: 403
diff changeset
6 * This library is free software; you can redistribute it and/or
718a22dc121f license/copyright change
glantau
parents: 403
diff changeset
7 * modify it under the terms of the GNU Lesser General Public
718a22dc121f license/copyright change
glantau
parents: 403
diff changeset
8 * License as published by the Free Software Foundation; either
718a22dc121f license/copyright change
glantau
parents: 403
diff changeset
9 * version 2 of the License, or (at your option) any later version.
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
10 *
429
718a22dc121f license/copyright change
glantau
parents: 403
diff changeset
11 * This library is distributed in the hope that it will be useful,
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
429
718a22dc121f license/copyright change
glantau
parents: 403
diff changeset
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
718a22dc121f license/copyright change
glantau
parents: 403
diff changeset
14 * Lesser General Public License for more details.
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
15 *
429
718a22dc121f license/copyright change
glantau
parents: 403
diff changeset
16 * You should have received a copy of the GNU Lesser General Public
718a22dc121f license/copyright change
glantau
parents: 403
diff changeset
17 * License along with this library; if not, write to the Free Software
718a22dc121f license/copyright change
glantau
parents: 403
diff changeset
18 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
256
4c1cec7c3c7c q-pel mc fixed
michaelni
parents: 255
diff changeset
19 *
385
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
20 * gmc & q-pel & 32/64 bit based MC by Michael Niedermayer <michaelni@gmx.at>
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
21 */
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
22
1106
1e39f273ecd6 per file doxy
michaelni
parents: 1101
diff changeset
23 /**
1e39f273ecd6 per file doxy
michaelni
parents: 1101
diff changeset
24 * @file dsputil.c
1e39f273ecd6 per file doxy
michaelni
parents: 1101
diff changeset
25 * DSP utils
1e39f273ecd6 per file doxy
michaelni
parents: 1101
diff changeset
26 */
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
27
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
28 #include "avcodec.h"
986e461dc072 Initial revision
glantau
parents:
diff changeset
29 #include "dsputil.h"
936
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
30 #include "mpegvideo.h"
1092
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
31 #include "simple_idct.h"
1557
5d53c03186a1 floating point AAN DCT
michael
parents: 1527
diff changeset
32 #include "faandct.h"
676
c3bdb00a98a9 dont store version for bit-exact tests
michaelni
parents: 651
diff changeset
33
2522
e25782262d7d kill warnings patch by (Mns Rullgrd <mru inprovide com>)
michael
parents: 2448
diff changeset
34 /* snow.c */
e25782262d7d kill warnings patch by (Mns Rullgrd <mru inprovide com>)
michael
parents: 2448
diff changeset
35 void ff_spatial_dwt(int *buffer, int width, int height, int stride, int type, int decomposition_count);
e25782262d7d kill warnings patch by (Mns Rullgrd <mru inprovide com>)
michael
parents: 2448
diff changeset
36
2169
db8baace74d8 Minor Patch for shared libs on Mac OSX by (Bill May <wmay at cisco dot com>)
michael
parents: 2066
diff changeset
37 uint8_t cropTbl[256 + 2 * MAX_NEG_CROP] = {0, };
db8baace74d8 Minor Patch for shared libs on Mac OSX by (Bill May <wmay at cisco dot com>)
michael
parents: 2066
diff changeset
38 uint32_t squareTbl[512] = {0, };
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
39
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
40 const uint8_t ff_zigzag_direct[64] = {
706
e65798d228ea idct permutation cleanup, idct can be selected per context now
michaelni
parents: 689
diff changeset
41 0, 1, 8, 16, 9, 2, 3, 10,
e65798d228ea idct permutation cleanup, idct can be selected per context now
michaelni
parents: 689
diff changeset
42 17, 24, 32, 25, 18, 11, 4, 5,
34
2733a4c1c693 added block permutation functions
glantau
parents: 19
diff changeset
43 12, 19, 26, 33, 40, 48, 41, 34,
706
e65798d228ea idct permutation cleanup, idct can be selected per context now
michaelni
parents: 689
diff changeset
44 27, 20, 13, 6, 7, 14, 21, 28,
34
2733a4c1c693 added block permutation functions
glantau
parents: 19
diff changeset
45 35, 42, 49, 56, 57, 50, 43, 36,
2733a4c1c693 added block permutation functions
glantau
parents: 19
diff changeset
46 29, 22, 15, 23, 30, 37, 44, 51,
2733a4c1c693 added block permutation functions
glantau
parents: 19
diff changeset
47 58, 59, 52, 45, 38, 31, 39, 46,
2733a4c1c693 added block permutation functions
glantau
parents: 19
diff changeset
48 53, 60, 61, 54, 47, 55, 62, 63
2733a4c1c693 added block permutation functions
glantau
parents: 19
diff changeset
49 };
2733a4c1c693 added block permutation functions
glantau
parents: 19
diff changeset
50
1567
e08df4d22d27 * introducing dct248 into the DSP context.
romansh
parents: 1557
diff changeset
51 /* Specific zigzag scan for 248 idct. NOTE that unlike the
e08df4d22d27 * introducing dct248 into the DSP context.
romansh
parents: 1557
diff changeset
52 specification, we interleave the fields */
e08df4d22d27 * introducing dct248 into the DSP context.
romansh
parents: 1557
diff changeset
53 const uint8_t ff_zigzag248_direct[64] = {
e08df4d22d27 * introducing dct248 into the DSP context.
romansh
parents: 1557
diff changeset
54 0, 8, 1, 9, 16, 24, 2, 10,
e08df4d22d27 * introducing dct248 into the DSP context.
romansh
parents: 1557
diff changeset
55 17, 25, 32, 40, 48, 56, 33, 41,
e08df4d22d27 * introducing dct248 into the DSP context.
romansh
parents: 1557
diff changeset
56 18, 26, 3, 11, 4, 12, 19, 27,
e08df4d22d27 * introducing dct248 into the DSP context.
romansh
parents: 1557
diff changeset
57 34, 42, 49, 57, 50, 58, 35, 43,
e08df4d22d27 * introducing dct248 into the DSP context.
romansh
parents: 1557
diff changeset
58 20, 28, 5, 13, 6, 14, 21, 29,
e08df4d22d27 * introducing dct248 into the DSP context.
romansh
parents: 1557
diff changeset
59 36, 44, 51, 59, 52, 60, 37, 45,
e08df4d22d27 * introducing dct248 into the DSP context.
romansh
parents: 1557
diff changeset
60 22, 30, 7, 15, 23, 31, 38, 46,
e08df4d22d27 * introducing dct248 into the DSP context.
romansh
parents: 1557
diff changeset
61 53, 61, 54, 62, 39, 47, 55, 63,
e08df4d22d27 * introducing dct248 into the DSP context.
romansh
parents: 1557
diff changeset
62 };
e08df4d22d27 * introducing dct248 into the DSP context.
romansh
parents: 1557
diff changeset
63
220
0b234715e205 (commit by michael)
arpi_esp
parents: 214
diff changeset
64 /* not permutated inverse zigzag_direct + 1 for MMX quantizer */
2169
db8baace74d8 Minor Patch for shared libs on Mac OSX by (Bill May <wmay at cisco dot com>)
michael
parents: 2066
diff changeset
65 uint16_t __align8 inv_zigzag_direct16[64] = {0, };
220
0b234715e205 (commit by michael)
arpi_esp
parents: 214
diff changeset
66
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
67 const uint8_t ff_alternate_horizontal_scan[64] = {
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
68 0, 1, 2, 3, 8, 9, 16, 17,
34
2733a4c1c693 added block permutation functions
glantau
parents: 19
diff changeset
69 10, 11, 4, 5, 6, 7, 15, 14,
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
70 13, 12, 19, 18, 24, 25, 32, 33,
34
2733a4c1c693 added block permutation functions
glantau
parents: 19
diff changeset
71 26, 27, 20, 21, 22, 23, 28, 29,
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
72 30, 31, 34, 35, 40, 41, 48, 49,
34
2733a4c1c693 added block permutation functions
glantau
parents: 19
diff changeset
73 42, 43, 36, 37, 38, 39, 44, 45,
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
74 46, 47, 50, 51, 56, 57, 58, 59,
34
2733a4c1c693 added block permutation functions
glantau
parents: 19
diff changeset
75 52, 53, 54, 55, 60, 61, 62, 63,
2733a4c1c693 added block permutation functions
glantau
parents: 19
diff changeset
76 };
2733a4c1c693 added block permutation functions
glantau
parents: 19
diff changeset
77
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
78 const uint8_t ff_alternate_vertical_scan[64] = {
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
79 0, 8, 16, 24, 1, 9, 2, 10,
34
2733a4c1c693 added block permutation functions
glantau
parents: 19
diff changeset
80 17, 25, 32, 40, 48, 56, 57, 49,
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
81 41, 33, 26, 18, 3, 11, 4, 12,
34
2733a4c1c693 added block permutation functions
glantau
parents: 19
diff changeset
82 19, 27, 34, 42, 50, 58, 35, 43,
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
83 51, 59, 20, 28, 5, 13, 6, 14,
34
2733a4c1c693 added block permutation functions
glantau
parents: 19
diff changeset
84 21, 29, 36, 44, 52, 60, 37, 45,
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
85 53, 61, 22, 30, 7, 15, 23, 31,
34
2733a4c1c693 added block permutation functions
glantau
parents: 19
diff changeset
86 38, 46, 54, 62, 39, 47, 55, 63,
2733a4c1c693 added block permutation functions
glantau
parents: 19
diff changeset
87 };
2733a4c1c693 added block permutation functions
glantau
parents: 19
diff changeset
88
220
0b234715e205 (commit by michael)
arpi_esp
parents: 214
diff changeset
89 /* a*inverse[b]>>32 == a/b for all 0<=a<=65536 && 2<=b<=255 */
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
90 const uint32_t inverse[256]={
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
91 0, 4294967295U,2147483648U,1431655766, 1073741824, 858993460, 715827883, 613566757,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
92 536870912, 477218589, 429496730, 390451573, 357913942, 330382100, 306783379, 286331154,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
93 268435456, 252645136, 238609295, 226050911, 214748365, 204522253, 195225787, 186737709,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
94 178956971, 171798692, 165191050, 159072863, 153391690, 148102321, 143165577, 138547333,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
95 134217728, 130150525, 126322568, 122713352, 119304648, 116080198, 113025456, 110127367,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
96 107374183, 104755300, 102261127, 99882961, 97612894, 95443718, 93368855, 91382283,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
97 89478486, 87652394, 85899346, 84215046, 82595525, 81037119, 79536432, 78090315,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
98 76695845, 75350304, 74051161, 72796056, 71582789, 70409300, 69273667, 68174085,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
99 67108864, 66076420, 65075263, 64103990, 63161284, 62245903, 61356676, 60492498,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
100 59652324, 58835169, 58040099, 57266231, 56512728, 55778797, 55063684, 54366675,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
101 53687092, 53024288, 52377650, 51746594, 51130564, 50529028, 49941481, 49367441,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
102 48806447, 48258060, 47721859, 47197443, 46684428, 46182445, 45691142, 45210183,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
103 44739243, 44278014, 43826197, 43383509, 42949673, 42524429, 42107523, 41698712,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
104 41297763, 40904451, 40518560, 40139882, 39768216, 39403370, 39045158, 38693400,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
105 38347923, 38008561, 37675152, 37347542, 37025581, 36709123, 36398028, 36092163,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
106 35791395, 35495598, 35204650, 34918434, 34636834, 34359739, 34087043, 33818641,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
107 33554432, 33294321, 33038210, 32786010, 32537632, 32292988, 32051995, 31814573,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
108 31580642, 31350127, 31122952, 30899046, 30678338, 30460761, 30246249, 30034737,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
109 29826162, 29620465, 29417585, 29217465, 29020050, 28825284, 28633116, 28443493,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
110 28256364, 28071682, 27889399, 27709467, 27531842, 27356480, 27183338, 27012373,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
111 26843546, 26676816, 26512144, 26349493, 26188825, 26030105, 25873297, 25718368,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
112 25565282, 25414008, 25264514, 25116768, 24970741, 24826401, 24683721, 24542671,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
113 24403224, 24265352, 24129030, 23994231, 23860930, 23729102, 23598722, 23469767,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
114 23342214, 23216040, 23091223, 22967740, 22845571, 22724695, 22605092, 22486740,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
115 22369622, 22253717, 22139007, 22025474, 21913099, 21801865, 21691755, 21582751,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
116 21474837, 21367997, 21262215, 21157475, 21053762, 20951060, 20849356, 20748635,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
117 20648882, 20550083, 20452226, 20355296, 20259280, 20164166, 20069941, 19976593,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
118 19884108, 19792477, 19701685, 19611723, 19522579, 19434242, 19346700, 19259944,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
119 19173962, 19088744, 19004281, 18920561, 18837576, 18755316, 18673771, 18592933,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
120 18512791, 18433337, 18354562, 18276457, 18199014, 18122225, 18046082, 17970575,
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
121 17895698, 17821442, 17747799, 17674763, 17602325, 17530479, 17459217, 17388532,
220
0b234715e205 (commit by michael)
arpi_esp
parents: 214
diff changeset
122 17318417, 17248865, 17179870, 17111424, 17043522, 16976156, 16909321, 16843010,
0b234715e205 (commit by michael)
arpi_esp
parents: 214
diff changeset
123 };
0b234715e205 (commit by michael)
arpi_esp
parents: 214
diff changeset
124
1092
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
125 /* Input permutation for the simple_idct_mmx */
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
126 static const uint8_t simple_mmx_permutation[64]={
2979
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
127 0x00, 0x08, 0x04, 0x09, 0x01, 0x0C, 0x05, 0x0D,
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
128 0x10, 0x18, 0x14, 0x19, 0x11, 0x1C, 0x15, 0x1D,
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
129 0x20, 0x28, 0x24, 0x29, 0x21, 0x2C, 0x25, 0x2D,
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
130 0x12, 0x1A, 0x16, 0x1B, 0x13, 0x1E, 0x17, 0x1F,
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
131 0x02, 0x0A, 0x06, 0x0B, 0x03, 0x0E, 0x07, 0x0F,
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
132 0x30, 0x38, 0x34, 0x39, 0x31, 0x3C, 0x35, 0x3D,
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
133 0x22, 0x2A, 0x26, 0x2B, 0x23, 0x2E, 0x27, 0x2F,
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
134 0x32, 0x3A, 0x36, 0x3B, 0x33, 0x3E, 0x37, 0x3F,
1092
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
135 };
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
136
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
/**
 * Add up every pixel of a 16x16 block.
 *
 * @param pix       pointer to the top-left pixel of the block
 * @param line_size offset in bytes from the start of one row to the next
 * @return the sum of the 256 pixel values
 */
static int pix_sum_c(uint8_t * pix, int line_size)
{
    int total = 0;
    int row, col;

    for (row = 0; row < 16; row++) {
        const uint8_t *p = pix;

        for (col = 0; col < 16; col++)
            total += p[col];

        /* step to the same column of the next row */
        pix += line_size;
    }
    return total;
}
c0005de2be59 new ratecontrol code
michaelni
parents: 590
diff changeset
158
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
159 static int pix_norm1_c(uint8_t * pix, int line_size)
612
c0005de2be59 new ratecontrol code
michaelni
parents: 590
diff changeset
160 {
c0005de2be59 new ratecontrol code
michaelni
parents: 590
diff changeset
161 int s, i, j;
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
162 uint32_t *sq = squareTbl + 256;
612
c0005de2be59 new ratecontrol code
michaelni
parents: 590
diff changeset
163
c0005de2be59 new ratecontrol code
michaelni
parents: 590
diff changeset
164 s = 0;
c0005de2be59 new ratecontrol code
michaelni
parents: 590
diff changeset
165 for (i = 0; i < 16; i++) {
2979
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
166 for (j = 0; j < 16; j += 8) {
997
4dfe15ae0078 sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents: 996
diff changeset
167 #if 0
2979
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
168 s += sq[pix[0]];
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
169 s += sq[pix[1]];
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
170 s += sq[pix[2]];
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
171 s += sq[pix[3]];
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
172 s += sq[pix[4]];
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
173 s += sq[pix[5]];
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
174 s += sq[pix[6]];
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
175 s += sq[pix[7]];
997
4dfe15ae0078 sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents: 996
diff changeset
176 #else
4dfe15ae0078 sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents: 996
diff changeset
177 #if LONG_MAX > 2147483647
2979
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
178 register uint64_t x=*(uint64_t*)pix;
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
179 s += sq[x&0xff];
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
180 s += sq[(x>>8)&0xff];
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
181 s += sq[(x>>16)&0xff];
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
182 s += sq[(x>>24)&0xff];
997
4dfe15ae0078 sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents: 996
diff changeset
183 s += sq[(x>>32)&0xff];
4dfe15ae0078 sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents: 996
diff changeset
184 s += sq[(x>>40)&0xff];
4dfe15ae0078 sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents: 996
diff changeset
185 s += sq[(x>>48)&0xff];
4dfe15ae0078 sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents: 996
diff changeset
186 s += sq[(x>>56)&0xff];
4dfe15ae0078 sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents: 996
diff changeset
187 #else
2979
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
188 register uint32_t x=*(uint32_t*)pix;
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
189 s += sq[x&0xff];
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
190 s += sq[(x>>8)&0xff];
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
191 s += sq[(x>>16)&0xff];
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
192 s += sq[(x>>24)&0xff];
997
4dfe15ae0078 sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents: 996
diff changeset
193 x=*(uint32_t*)(pix+4);
4dfe15ae0078 sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents: 996
diff changeset
194 s += sq[x&0xff];
4dfe15ae0078 sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents: 996
diff changeset
195 s += sq[(x>>8)&0xff];
4dfe15ae0078 sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents: 996
diff changeset
196 s += sq[(x>>16)&0xff];
4dfe15ae0078 sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents: 996
diff changeset
197 s += sq[(x>>24)&0xff];
4dfe15ae0078 sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents: 996
diff changeset
198 #endif
4dfe15ae0078 sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents: 996
diff changeset
199 #endif
2979
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
200 pix += 8;
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
201 }
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
202 pix += line_size - 16;
612
c0005de2be59 new ratecontrol code
michaelni
parents: 590
diff changeset
203 }
c0005de2be59 new ratecontrol code
michaelni
parents: 590
diff changeset
204 return s;
c0005de2be59 new ratecontrol code
michaelni
parents: 590
diff changeset
205 }
c0005de2be59 new ratecontrol code
michaelni
parents: 590
diff changeset
206
1273
a979fab41ed8 ASV1 codec
michaelni
parents: 1267
diff changeset
/**
 * Apply bswap_32 to w consecutive 32-bit words.
 *
 * Words are processed in ascending index order, reading src[n] and then
 * writing dst[n]. Nothing is written when w is zero or negative.
 *
 * @param dst destination array, at least w words
 * @param src source array, at least w words
 * @param w   number of 32-bit words to convert
 */
static void bswap_buf(uint32_t *dst, uint32_t *src, int w){
    int n;

    for (n = 0; n < w; n++)
        dst[n] = bswap_32(src[n]);
}
612
c0005de2be59 new ratecontrol code
michaelni
parents: 590
diff changeset
224
2184
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
225 static int sse4_c(void *v, uint8_t * pix1, uint8_t * pix2, int line_size, int h)
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
226 {
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
227 int s, i;
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
228 uint32_t *sq = squareTbl + 256;
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
229
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
230 s = 0;
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
231 for (i = 0; i < h; i++) {
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
232 s += sq[pix1[0] - pix2[0]];
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
233 s += sq[pix1[1] - pix2[1]];
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
234 s += sq[pix1[2] - pix2[2]];
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
235 s += sq[pix1[3] - pix2[3]];
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
236 pix1 += line_size;
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
237 pix2 += line_size;
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
238 }
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
239 return s;
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
240 }
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
241
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
242 static int sse8_c(void *v, uint8_t * pix1, uint8_t * pix2, int line_size, int h)
936
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
243 {
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
244 int s, i;
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
245 uint32_t *sq = squareTbl + 256;
936
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
246
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
247 s = 0;
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
248 for (i = 0; i < h; i++) {
936
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
249 s += sq[pix1[0] - pix2[0]];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
250 s += sq[pix1[1] - pix2[1]];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
251 s += sq[pix1[2] - pix2[2]];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
252 s += sq[pix1[3] - pix2[3]];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
253 s += sq[pix1[4] - pix2[4]];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
254 s += sq[pix1[5] - pix2[5]];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
255 s += sq[pix1[6] - pix2[6]];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
256 s += sq[pix1[7] - pix2[7]];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
257 pix1 += line_size;
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
258 pix2 += line_size;
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
259 }
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
260 return s;
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
261 }
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
262
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
263 static int sse16_c(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
884
2cef5c4c0ca6 * altivec and pix_norm patch by Brian Foley
kabi
parents: 882
diff changeset
264 {
1012
7a5038ec769b sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents: 1011
diff changeset
265 int s, i;
7a5038ec769b sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents: 1011
diff changeset
266 uint32_t *sq = squareTbl + 256;
884
2cef5c4c0ca6 * altivec and pix_norm patch by Brian Foley
kabi
parents: 882
diff changeset
267
2cef5c4c0ca6 * altivec and pix_norm patch by Brian Foley
kabi
parents: 882
diff changeset
268 s = 0;
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
269 for (i = 0; i < h; i++) {
1012
7a5038ec769b sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents: 1011
diff changeset
270 s += sq[pix1[ 0] - pix2[ 0]];
7a5038ec769b sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents: 1011
diff changeset
271 s += sq[pix1[ 1] - pix2[ 1]];
7a5038ec769b sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents: 1011
diff changeset
272 s += sq[pix1[ 2] - pix2[ 2]];
7a5038ec769b sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents: 1011
diff changeset
273 s += sq[pix1[ 3] - pix2[ 3]];
7a5038ec769b sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents: 1011
diff changeset
274 s += sq[pix1[ 4] - pix2[ 4]];
7a5038ec769b sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents: 1011
diff changeset
275 s += sq[pix1[ 5] - pix2[ 5]];
7a5038ec769b sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents: 1011
diff changeset
276 s += sq[pix1[ 6] - pix2[ 6]];
7a5038ec769b sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents: 1011
diff changeset
277 s += sq[pix1[ 7] - pix2[ 7]];
7a5038ec769b sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents: 1011
diff changeset
278 s += sq[pix1[ 8] - pix2[ 8]];
7a5038ec769b sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents: 1011
diff changeset
279 s += sq[pix1[ 9] - pix2[ 9]];
7a5038ec769b sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents: 1011
diff changeset
280 s += sq[pix1[10] - pix2[10]];
7a5038ec769b sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents: 1011
diff changeset
281 s += sq[pix1[11] - pix2[11]];
7a5038ec769b sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents: 1011
diff changeset
282 s += sq[pix1[12] - pix2[12]];
7a5038ec769b sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents: 1011
diff changeset
283 s += sq[pix1[13] - pix2[13]];
7a5038ec769b sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents: 1011
diff changeset
284 s += sq[pix1[14] - pix2[14]];
7a5038ec769b sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents: 1011
diff changeset
285 s += sq[pix1[15] - pix2[15]];
997
4dfe15ae0078 sse16 & pix_norm1 optimization patch by (Felix von Leitner <felix-ffmpeg at fefe dot de>) (with some modifications)
michaelni
parents: 996
diff changeset
286
1012
7a5038ec769b sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents: 1011
diff changeset
287 pix1 += line_size;
7a5038ec769b sse16_c is totally fucked up (unaligned loads, LONG_MAX is undefined,
mellum
parents: 1011
diff changeset
288 pix2 += line_size;
884
2cef5c4c0ca6 * altivec and pix_norm patch by Brian Foley
kabi
parents: 882
diff changeset
289 }
2cef5c4c0ca6 * altivec and pix_norm patch by Brian Foley
kabi
parents: 882
diff changeset
290 return s;
2cef5c4c0ca6 * altivec and pix_norm patch by Brian Foley
kabi
parents: 882
diff changeset
291 }
2cef5c4c0ca6 * altivec and pix_norm patch by Brian Foley
kabi
parents: 882
diff changeset
292
2184
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
293
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
/**
 * Wavelet-domain comparison of two pixel blocks.
 *
 * The per-pixel difference, scaled by 16, is stored in a scratch buffer whose
 * rows are 16 entries apart, transformed in place by ff_spatial_dwt(), and the
 * absolute values of the transformed entries are summed.
 *
 * @param v         not used by this function
 * @param pix1      first row of the first block
 * @param pix2      first row of the second block
 * @param line_size step between consecutive rows, applied to both pointers
 * @param w         block width; columns are processed four at a time and a
 *                  scratch row holds 16 entries (callers in this file pass 8 or 16)
 * @param h         number of rows; the scratch buffer has room for 16
 * @param type      forwarded unchanged to ff_spatial_dwt()
 * @return the sum of absolute transformed values shifted right by 2, or 0 when
 *         the file is built without CONFIG_SNOW_ENCODER
 */
static inline int w_c(void *v, uint8_t * pix1, uint8_t * pix2, int line_size, int w, int h, int type){
#ifdef CONFIG_SNOW_ENCODER //idwt is in snow.c
    int s, i, j;
    const int dec_count= w==8 ? 3 : 4;
    int tmp[16*16];
    /* Disabled variant: per-subband weights for the loop that is #if 0'd below. */
#if 0
    int level, ori;
    static const int scale[2][2][4][4]={
      {
        {
            //8x8 dec=3
            {268, 239, 239, 213},
            {  0, 224, 224, 152},
            {  0, 135, 135, 110},
        },{
            //16x16 dec=4
            {344, 310, 310, 280},
            {  0, 320, 320, 228},
            {  0, 175, 175, 136},
            {  0, 129, 129, 102},
        }
      },{
        {//FIXME 5/3
            //8x8 dec=3
            {275, 245, 245, 218},
            {  0, 230, 230, 156},
            {  0, 138, 138, 113},
        },{
            //16x16 dec=4
            {352, 317, 317, 286},
            {  0, 328, 328, 233},
            {  0, 180, 180, 140},
            {  0, 132, 132, 105},
        }
      }
    };
#endif

    for (i = 0; i < h; i++) {
        for (j = 0; j < w; j+=4) {
            /* Multiply instead of shifting: the difference can be negative and
             * left-shifting a negative value is undefined behaviour in C. */
            tmp[16*i+j+0] = (pix1[j+0] - pix2[j+0])*16;
            tmp[16*i+j+1] = (pix1[j+1] - pix2[j+1])*16;
            tmp[16*i+j+2] = (pix1[j+2] - pix2[j+2])*16;
            tmp[16*i+j+3] = (pix1[j+3] - pix2[j+3])*16;
        }
        pix1 += line_size;
        pix2 += line_size;
    }

    ff_spatial_dwt(tmp, w, h, 16, type, dec_count);

    s=0;
#if 0
    for(level=0; level<dec_count; level++){
        for(ori= level ? 1 : 0; ori<4; ori++){
            int sx= (ori&1) ? 1<<level: 0;
            int stride= 16<<(dec_count-level);
            int sy= (ori&2) ? stride>>1 : 0;
            int size= 1<<level;

            for(i=0; i<size; i++){
                for(j=0; j<size; j++){
                    int v= tmp[sx + sy + i*stride + j] * scale[type][dec_count-3][level][ori];
                    s += ABS(v);
                }
            }
        }
    }
#endif
    /* Active variant: unweighted sum of absolute values over the whole block. */
    for (i = 0; i < h; i++) {
        for (j = 0; j < w; j+=4) {
            s+= ABS(tmp[16*i+j+0]);
            s+= ABS(tmp[16*i+j+1]);
            s+= ABS(tmp[16*i+j+2]);
            s+= ABS(tmp[16*i+j+3]);
        }
    }
    assert(s>=0);

    return s>>2;
#else
    /* The transform is not compiled in. Return a defined value instead of
     * falling off the end of a function that returns int. */
    (void)v;
    (void)pix1;
    (void)pix2;
    (void)line_size;
    (void)w;
    (void)h;
    (void)type;
    return 0;
#endif
}
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
376
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
/**
 * 8-pixel-wide wrapper around w_c() that selects transform type 1
 * (the "53" variant, going by this function's name).
 * All other arguments are passed through unchanged; returns w_c()'s result.
 */
static int w53_8_c(void *v, uint8_t * pix1, uint8_t * pix2, int line_size, int h){
    const int block_width  = 8;
    const int wavelet_type = 1;

    return w_c(v, pix1, pix2, line_size, block_width, h, wavelet_type);
}
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
380
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
/**
 * 8-pixel-wide wrapper around w_c() that selects transform type 0
 * (the "97" variant, going by this function's name).
 * All other arguments are passed through unchanged; returns w_c()'s result.
 */
static int w97_8_c(void *v, uint8_t * pix1, uint8_t * pix2, int line_size, int h){
    const int block_width  = 8;
    const int wavelet_type = 0;

    return w_c(v, pix1, pix2, line_size, block_width, h, wavelet_type);
}
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
384
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
/**
 * 16-pixel-wide wrapper around w_c() that selects transform type 1
 * (the "53" variant, going by this function's name).
 * All other arguments are passed through unchanged; returns w_c()'s result.
 */
static int w53_16_c(void *v, uint8_t * pix1, uint8_t * pix2, int line_size, int h){
    const int block_width  = 16;
    const int wavelet_type = 1;

    return w_c(v, pix1, pix2, line_size, block_width, h, wavelet_type);
}
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
388
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
/**
 * 16-pixel-wide wrapper around w_c() that selects transform type 0
 * (the "97" variant, going by this function's name).
 * All other arguments are passed through unchanged; returns w_c()'s result.
 */
static int w97_16_c(void *v, uint8_t * pix1, uint8_t * pix2, int line_size, int h){
    const int block_width  = 16;
    const int wavelet_type = 0;

    return w_c(v, pix1, pix2, line_size, block_width, h, wavelet_type);
}
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
392
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
393 static void get_pixels_c(DCTELEM *restrict block, const uint8_t *pixels, int line_size)
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
394 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
395 int i;
986e461dc072 Initial revision
glantau
parents:
diff changeset
396
986e461dc072 Initial revision
glantau
parents:
diff changeset
397 /* read the pixels */
986e461dc072 Initial revision
glantau
parents:
diff changeset
398 for(i=0;i<8;i++) {
516
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
399 block[0] = pixels[0];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
400 block[1] = pixels[1];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
401 block[2] = pixels[2];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
402 block[3] = pixels[3];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
403 block[4] = pixels[4];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
404 block[5] = pixels[5];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
405 block[6] = pixels[6];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
406 block[7] = pixels[7];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
407 pixels += line_size;
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
408 block += 8;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
409 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
410 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
411
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
412 static void diff_pixels_c(DCTELEM *restrict block, const uint8_t *s1,
2979
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
413 const uint8_t *s2, int stride){
324
9c6f056f0e41 fixed mpeg4 time stuff on encoding
michaelni
parents: 320
diff changeset
414 int i;
9c6f056f0e41 fixed mpeg4 time stuff on encoding
michaelni
parents: 320
diff changeset
415
9c6f056f0e41 fixed mpeg4 time stuff on encoding
michaelni
parents: 320
diff changeset
416 /* read the pixels */
9c6f056f0e41 fixed mpeg4 time stuff on encoding
michaelni
parents: 320
diff changeset
417 for(i=0;i<8;i++) {
516
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
418 block[0] = s1[0] - s2[0];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
419 block[1] = s1[1] - s2[1];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
420 block[2] = s1[2] - s2[2];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
421 block[3] = s1[3] - s2[3];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
422 block[4] = s1[4] - s2[4];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
423 block[5] = s1[5] - s2[5];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
424 block[6] = s1[6] - s2[6];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
425 block[7] = s1[7] - s2[7];
324
9c6f056f0e41 fixed mpeg4 time stuff on encoding
michaelni
parents: 320
diff changeset
426 s1 += stride;
9c6f056f0e41 fixed mpeg4 time stuff on encoding
michaelni
parents: 320
diff changeset
427 s2 += stride;
516
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
428 block += 8;
324
9c6f056f0e41 fixed mpeg4 time stuff on encoding
michaelni
parents: 320
diff changeset
429 }
9c6f056f0e41 fixed mpeg4 time stuff on encoding
michaelni
parents: 320
diff changeset
430 }
9c6f056f0e41 fixed mpeg4 time stuff on encoding
michaelni
parents: 320
diff changeset
431
9c6f056f0e41 fixed mpeg4 time stuff on encoding
michaelni
parents: 320
diff changeset
432
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
433 static void put_pixels_clamped_c(const DCTELEM *block, uint8_t *restrict pixels,
2979
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
434 int line_size)
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
435 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
436 int i;
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
437 uint8_t *cm = cropTbl + MAX_NEG_CROP;
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
438
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
439 /* read the pixels */
986e461dc072 Initial revision
glantau
parents:
diff changeset
440 for(i=0;i<8;i++) {
516
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
441 pixels[0] = cm[block[0]];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
442 pixels[1] = cm[block[1]];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
443 pixels[2] = cm[block[2]];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
444 pixels[3] = cm[block[3]];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
445 pixels[4] = cm[block[4]];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
446 pixels[5] = cm[block[5]];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
447 pixels[6] = cm[block[6]];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
448 pixels[7] = cm[block[7]];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
449
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
450 pixels += line_size;
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
451 block += 8;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
452 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
453 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
454
2256
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
455 static void put_pixels_clamped4_c(const DCTELEM *block, uint8_t *restrict pixels,
2979
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
456 int line_size)
2256
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
457 {
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
458 int i;
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
459 uint8_t *cm = cropTbl + MAX_NEG_CROP;
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
460
2256
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
461 /* read the pixels */
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
462 for(i=0;i<4;i++) {
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
463 pixels[0] = cm[block[0]];
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
464 pixels[1] = cm[block[1]];
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
465 pixels[2] = cm[block[2]];
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
466 pixels[3] = cm[block[3]];
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
467
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
468 pixels += line_size;
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
469 block += 8;
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
470 }
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
471 }
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
472
2257
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
473 static void put_pixels_clamped2_c(const DCTELEM *block, uint8_t *restrict pixels,
2979
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
474 int line_size)
2257
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
475 {
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
476 int i;
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
477 uint8_t *cm = cropTbl + MAX_NEG_CROP;
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
478
2257
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
479 /* read the pixels */
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
480 for(i=0;i<2;i++) {
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
481 pixels[0] = cm[block[0]];
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
482 pixels[1] = cm[block[1]];
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
483
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
484 pixels += line_size;
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
485 block += 8;
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
486 }
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
487 }
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
488
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
489 static void put_signed_pixels_clamped_c(const DCTELEM *block,
1984
ef919e9ef73e separate out put_signed_pixels_clamped() into its own function and
melanson
parents: 1977
diff changeset
490 uint8_t *restrict pixels,
ef919e9ef73e separate out put_signed_pixels_clamped() into its own function and
melanson
parents: 1977
diff changeset
491 int line_size)
ef919e9ef73e separate out put_signed_pixels_clamped() into its own function and
melanson
parents: 1977
diff changeset
492 {
ef919e9ef73e separate out put_signed_pixels_clamped() into its own function and
melanson
parents: 1977
diff changeset
493 int i, j;
ef919e9ef73e separate out put_signed_pixels_clamped() into its own function and
melanson
parents: 1977
diff changeset
494
ef919e9ef73e separate out put_signed_pixels_clamped() into its own function and
melanson
parents: 1977
diff changeset
495 for (i = 0; i < 8; i++) {
ef919e9ef73e separate out put_signed_pixels_clamped() into its own function and
melanson
parents: 1977
diff changeset
496 for (j = 0; j < 8; j++) {
ef919e9ef73e separate out put_signed_pixels_clamped() into its own function and
melanson
parents: 1977
diff changeset
497 if (*block < -128)
ef919e9ef73e separate out put_signed_pixels_clamped() into its own function and
melanson
parents: 1977
diff changeset
498 *pixels = 0;
ef919e9ef73e separate out put_signed_pixels_clamped() into its own function and
melanson
parents: 1977
diff changeset
499 else if (*block > 127)
ef919e9ef73e separate out put_signed_pixels_clamped() into its own function and
melanson
parents: 1977
diff changeset
500 *pixels = 255;
ef919e9ef73e separate out put_signed_pixels_clamped() into its own function and
melanson
parents: 1977
diff changeset
501 else
ef919e9ef73e separate out put_signed_pixels_clamped() into its own function and
melanson
parents: 1977
diff changeset
502 *pixels = (uint8_t)(*block + 128);
ef919e9ef73e separate out put_signed_pixels_clamped() into its own function and
melanson
parents: 1977
diff changeset
503 block++;
ef919e9ef73e separate out put_signed_pixels_clamped() into its own function and
melanson
parents: 1977
diff changeset
504 pixels++;
ef919e9ef73e separate out put_signed_pixels_clamped() into its own function and
melanson
parents: 1977
diff changeset
505 }
ef919e9ef73e separate out put_signed_pixels_clamped() into its own function and
melanson
parents: 1977
diff changeset
506 pixels += (line_size - 8);
ef919e9ef73e separate out put_signed_pixels_clamped() into its own function and
melanson
parents: 1977
diff changeset
507 }
ef919e9ef73e separate out put_signed_pixels_clamped() into its own function and
melanson
parents: 1977
diff changeset
508 }
ef919e9ef73e separate out put_signed_pixels_clamped() into its own function and
melanson
parents: 1977
diff changeset
509
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
510 static void add_pixels_clamped_c(const DCTELEM *block, uint8_t *restrict pixels,
516
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
511 int line_size)
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
512 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
513 int i;
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
514 uint8_t *cm = cropTbl + MAX_NEG_CROP;
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
515
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
516 /* read the pixels */
986e461dc072 Initial revision
glantau
parents:
diff changeset
517 for(i=0;i<8;i++) {
516
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
518 pixels[0] = cm[pixels[0] + block[0]];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
519 pixels[1] = cm[pixels[1] + block[1]];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
520 pixels[2] = cm[pixels[2] + block[2]];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
521 pixels[3] = cm[pixels[3] + block[3]];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
522 pixels[4] = cm[pixels[4] + block[4]];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
523 pixels[5] = cm[pixels[5] + block[5]];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
524 pixels[6] = cm[pixels[6] + block[6]];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
525 pixels[7] = cm[pixels[7] + block[7]];
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
526 pixels += line_size;
0cb7ab35ccb2 * Detect "retrict" keyword
mellum
parents: 493
diff changeset
527 block += 8;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
528 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
529 }
2256
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
530
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
531 static void add_pixels_clamped4_c(const DCTELEM *block, uint8_t *restrict pixels,
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
532 int line_size)
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
533 {
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
534 int i;
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
535 uint8_t *cm = cropTbl + MAX_NEG_CROP;
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
536
2256
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
537 /* read the pixels */
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
538 for(i=0;i<4;i++) {
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
539 pixels[0] = cm[pixels[0] + block[0]];
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
540 pixels[1] = cm[pixels[1] + block[1]];
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
541 pixels[2] = cm[pixels[2] + block[2]];
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
542 pixels[3] = cm[pixels[3] + block[3]];
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
543 pixels += line_size;
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
544 block += 8;
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
545 }
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
546 }
2257
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
547
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
548 static void add_pixels_clamped2_c(const DCTELEM *block, uint8_t *restrict pixels,
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
549 int line_size)
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
550 {
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
551 int i;
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
552 uint8_t *cm = cropTbl + MAX_NEG_CROP;
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
553
2257
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
554 /* read the pixels */
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
555 for(i=0;i<2;i++) {
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
556 pixels[0] = cm[pixels[0] + block[0]];
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
557 pixels[1] = cm[pixels[1] + block[1]];
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
558 pixels += line_size;
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
559 block += 8;
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
560 }
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
561 }
2763
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
562
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
563 static void add_pixels8_c(uint8_t *restrict pixels, DCTELEM *block, int line_size)
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
564 {
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
565 int i;
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
566 for(i=0;i<8;i++) {
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
567 pixels[0] += block[0];
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
568 pixels[1] += block[1];
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
569 pixels[2] += block[2];
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
570 pixels[3] += block[3];
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
571 pixels[4] += block[4];
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
572 pixels[5] += block[5];
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
573 pixels[6] += block[6];
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
574 pixels[7] += block[7];
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
575 pixels += line_size;
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
576 block += 8;
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
577 }
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
578 }
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
579
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
580 static void add_pixels4_c(uint8_t *restrict pixels, DCTELEM *block, int line_size)
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
581 {
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
582 int i;
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
583 for(i=0;i<4;i++) {
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
584 pixels[0] += block[0];
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
585 pixels[1] += block[1];
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
586 pixels[2] += block[2];
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
587 pixels[3] += block[3];
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
588 pixels += line_size;
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
589 block += 4;
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
590 }
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
591 }
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
592
385
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
593 #if 0
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
594
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
/*
 * PIXOP2(OPNAME, OP) -- variant that processes one uint64_t (8 pixels) per row.
 *
 * This definition sits in the "#if 0" branch, so it is currently compiled out.
 *
 * For a given OPNAME prefix and store operation OP(dst, value) it expands to
 * seven static functions, each taking (block, pixels, line_size, h) and
 * handling h rows of 8 bytes:
 *
 *   OPNAME_pixels             plain transfer of one row via OP
 *   OPNAME_no_rnd_pixels_x2_c per-byte (p[x] + p[x+1]) >> 1
 *   OPNAME_pixels_x2_c        per-byte (p[x] + p[x+1] + 1) >> 1
 *   OPNAME_no_rnd_pixels_y2_c per-byte (p[y] + p[y+1]) >> 1
 *   OPNAME_pixels_y2_c        per-byte (p[y] + p[y+1] + 1) >> 1
 *   OPNAME_pixels_xy2_c       per-byte (sum of 2x2 neighbours + 2) >> 2
 *   OPNAME_no_rnd_pixels_xy2_c per-byte (sum of 2x2 neighbours + 1) >> 2
 *
 * (the x2/y2/xy2 cases are presumably the half-pel interpolation positions)
 *
 * Two-input averages use the identities
 *   (a + b)     >> 1  ==  (a & b) + ((a ^ b) >> 1)
 *   (a + b + 1) >> 1  ==  (a | b) - ((a ^ b) >> 1)
 * applied to all eight bytes at once; masking (a ^ b) with 0xFE.. before the
 * shift keeps a byte's low bit from leaking into its neighbour.
 *
 * The xy2 functions split every byte into its low 2 bits (l*) and its high
 * 6 bits already shifted right by 2 (h*), so four such values can be summed
 * without overflowing a byte lane.  The rounding constant is carried in l0.
 * Each loop iteration emits two rows, reusing the previous row's (l, h) pair;
 * because of the "i += 2" step, two rows are written per iteration even if h
 * is odd.  The loop-local a/b shadow the function-scope const a/b.
 *
 * LD64 and CALL_2X_PIXELS are defined elsewhere; the trailing CALL_2X_PIXELS
 * lines presumably build the 16-pixel-wide versions from the 8-wide ones.
 * block is accessed through a uint64_t pointer, which assumes the caller
 * supplies suitably aligned destinations -- TODO confirm.
 *
 * NOTE(review): the first function is named OPNAME_pixels, but the first
 * CALL_2X_PIXELS line refers to OPNAME_pixels_c; as written the two names do
 * not match.
 */
#define PIXOP2(OPNAME, OP) \
static void OPNAME ## _pixels(uint8_t *block, const uint8_t *pixels, int line_size, int h)\
{\
    int i;\
    for(i=0; i<h; i++){\
        OP(*((uint64_t*)block), LD64(pixels));\
        pixels+=line_size;\
        block +=line_size;\
    }\
}\
\
static void OPNAME ## _no_rnd_pixels_x2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h)\
{\
    int i;\
    for(i=0; i<h; i++){\
        const uint64_t a= LD64(pixels  );\
        const uint64_t b= LD64(pixels+1);\
        /* truncating per-byte average of a and b */\
        OP(*((uint64_t*)block), (a&b) + (((a^b)&0xFEFEFEFEFEFEFEFEULL)>>1));\
        pixels+=line_size;\
        block +=line_size;\
    }\
}\
\
static void OPNAME ## _pixels_x2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h)\
{\
    int i;\
    for(i=0; i<h; i++){\
        const uint64_t a= LD64(pixels  );\
        const uint64_t b= LD64(pixels+1);\
        /* per-byte average of a and b, rounded up */\
        OP(*((uint64_t*)block), (a|b) - (((a^b)&0xFEFEFEFEFEFEFEFEULL)>>1));\
        pixels+=line_size;\
        block +=line_size;\
    }\
}\
\
static void OPNAME ## _no_rnd_pixels_y2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h)\
{\
    int i;\
    for(i=0; i<h; i++){\
        const uint64_t a= LD64(pixels          );\
        const uint64_t b= LD64(pixels+line_size);\
        /* truncating per-byte average of this row and the next */\
        OP(*((uint64_t*)block), (a&b) + (((a^b)&0xFEFEFEFEFEFEFEFEULL)>>1));\
        pixels+=line_size;\
        block +=line_size;\
    }\
}\
\
static void OPNAME ## _pixels_y2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h)\
{\
    int i;\
    for(i=0; i<h; i++){\
        const uint64_t a= LD64(pixels          );\
        const uint64_t b= LD64(pixels+line_size);\
        /* per-byte average of this row and the next, rounded up */\
        OP(*((uint64_t*)block), (a|b) - (((a^b)&0xFEFEFEFEFEFEFEFEULL)>>1));\
        pixels+=line_size;\
        block +=line_size;\
    }\
}\
\
static void OPNAME ## _pixels_xy2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h)\
{\
        int i;\
        const uint64_t a= LD64(pixels  );\
        const uint64_t b= LD64(pixels+1);\
        /* low 2 bits of both neighbours plus the rounding constant 2 */\
        uint64_t l0=  (a&0x0303030303030303ULL)\
                    + (b&0x0303030303030303ULL)\
                    + 0x0202020202020202ULL;\
        /* high 6 bits of both neighbours, pre-divided by 4 */\
        uint64_t h0= ((a&0xFCFCFCFCFCFCFCFCULL)>>2)\
                   + ((b&0xFCFCFCFCFCFCFCFCULL)>>2);\
        uint64_t l1,h1;\
\
        pixels+=line_size;\
        for(i=0; i<h; i+=2){\
            uint64_t a= LD64(pixels  );\
            uint64_t b= LD64(pixels+1);\
            l1=  (a&0x0303030303030303ULL)\
               + (b&0x0303030303030303ULL);\
            h1= ((a&0xFCFCFCFCFCFCFCFCULL)>>2)\
              + ((b&0xFCFCFCFCFCFCFCFCULL)>>2);\
            /* 0x0F mask drops bits shifted in from the neighbouring byte */\
            OP(*((uint64_t*)block), h0+h1+(((l0+l1)>>2)&0x0F0F0F0F0F0F0F0FULL));\
            pixels+=line_size;\
            block +=line_size;\
            a= LD64(pixels  );\
            b= LD64(pixels+1);\
            l0=  (a&0x0303030303030303ULL)\
               + (b&0x0303030303030303ULL)\
               + 0x0202020202020202ULL;\
            h0= ((a&0xFCFCFCFCFCFCFCFCULL)>>2)\
              + ((b&0xFCFCFCFCFCFCFCFCULL)>>2);\
            OP(*((uint64_t*)block), h0+h1+(((l0+l1)>>2)&0x0F0F0F0F0F0F0F0FULL));\
            pixels+=line_size;\
            block +=line_size;\
        }\
}\
\
static void OPNAME ## _no_rnd_pixels_xy2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h)\
{\
        int i;\
        const uint64_t a= LD64(pixels  );\
        const uint64_t b= LD64(pixels+1);\
        /* same scheme as _pixels_xy2_c, but the rounding constant is 1 */\
        uint64_t l0=  (a&0x0303030303030303ULL)\
                    + (b&0x0303030303030303ULL)\
                    + 0x0101010101010101ULL;\
        uint64_t h0= ((a&0xFCFCFCFCFCFCFCFCULL)>>2)\
                   + ((b&0xFCFCFCFCFCFCFCFCULL)>>2);\
        uint64_t l1,h1;\
\
        pixels+=line_size;\
        for(i=0; i<h; i+=2){\
            uint64_t a= LD64(pixels  );\
            uint64_t b= LD64(pixels+1);\
            l1=  (a&0x0303030303030303ULL)\
               + (b&0x0303030303030303ULL);\
            h1= ((a&0xFCFCFCFCFCFCFCFCULL)>>2)\
              + ((b&0xFCFCFCFCFCFCFCFCULL)>>2);\
            OP(*((uint64_t*)block), h0+h1+(((l0+l1)>>2)&0x0F0F0F0F0F0F0F0FULL));\
            pixels+=line_size;\
            block +=line_size;\
            a= LD64(pixels  );\
            b= LD64(pixels+1);\
            l0=  (a&0x0303030303030303ULL)\
               + (b&0x0303030303030303ULL)\
               + 0x0101010101010101ULL;\
            h0= ((a&0xFCFCFCFCFCFCFCFCULL)>>2)\
              + ((b&0xFCFCFCFCFCFCFCFCULL)>>2);\
            OP(*((uint64_t*)block), h0+h1+(((l0+l1)>>2)&0x0F0F0F0F0F0F0F0FULL));\
            pixels+=line_size;\
            block +=line_size;\
        }\
}\
\
CALL_2X_PIXELS(OPNAME ## _pixels16_c    , OPNAME ## _pixels_c    , 8)\
CALL_2X_PIXELS(OPNAME ## _pixels16_x2_c , OPNAME ## _pixels_x2_c , 8)\
CALL_2X_PIXELS(OPNAME ## _pixels16_y2_c , OPNAME ## _pixels_y2_c , 8)\
CALL_2X_PIXELS(OPNAME ## _pixels16_xy2_c, OPNAME ## _pixels_xy2_c, 8)\
CALL_2X_PIXELS(OPNAME ## _no_rnd_pixels16_x2_c , OPNAME ## _no_rnd_pixels_x2_c , 8)\
CALL_2X_PIXELS(OPNAME ## _no_rnd_pixels16_y2_c , OPNAME ## _no_rnd_pixels_y2_c , 8)\
CALL_2X_PIXELS(OPNAME ## _no_rnd_pixels16_xy2_c, OPNAME ## _no_rnd_pixels_xy2_c, 8)
385
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
733
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
/*
 * Store operation for the 64-bit-word PIXOP2 variant: replaces a with the
 * per-byte average of a and b, rounded up ((a|b) - ((a^b)>>1), with the
 * 0xFE.. mask keeping each byte's low bit from shifting into its neighbour).
 * Note that a is evaluated more than once and is assigned to, so it must be
 * a side-effect-free lvalue.
 */
#define op_avg(a, b) a = ( ((a)|(b)) - ((((a)^(b))&0xFEFEFEFEFEFEFEFEULL)>>1) )
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
735 #else // 64 bit variant
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
736
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
737 #define PIXOP2(OPNAME, OP) \
1267
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
738 static void OPNAME ## _pixels2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h){\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
739 int i;\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
740 for(i=0; i<h; i++){\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
741 OP(*((uint16_t*)(block )), LD16(pixels ));\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
742 pixels+=line_size;\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
743 block +=line_size;\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
744 }\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
745 }\
1168
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
746 static void OPNAME ## _pixels4_c(uint8_t *block, const uint8_t *pixels, int line_size, int h){\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
747 int i;\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
748 for(i=0; i<h; i++){\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
749 OP(*((uint32_t*)(block )), LD32(pixels ));\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
750 pixels+=line_size;\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
751 block +=line_size;\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
752 }\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
753 }\
859
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
754 static void OPNAME ## _pixels8_c(uint8_t *block, const uint8_t *pixels, int line_size, int h){\
385
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
755 int i;\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
756 for(i=0; i<h; i++){\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
757 OP(*((uint32_t*)(block )), LD32(pixels ));\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
758 OP(*((uint32_t*)(block+4)), LD32(pixels+4));\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
759 pixels+=line_size;\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
760 block +=line_size;\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
761 }\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
762 }\
859
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
763 static inline void OPNAME ## _no_rnd_pixels8_c(uint8_t *block, const uint8_t *pixels, int line_size, int h){\
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
764 OPNAME ## _pixels8_c(block, pixels, line_size, h);\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
765 }\
385
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
766 \
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
767 static inline void OPNAME ## _no_rnd_pixels8_l2(uint8_t *dst, const uint8_t *src1, const uint8_t *src2, int dst_stride, \
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
768 int src_stride1, int src_stride2, int h){\
385
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
769 int i;\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
770 for(i=0; i<h; i++){\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
771 uint32_t a,b;\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
772 a= LD32(&src1[i*src_stride1 ]);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
773 b= LD32(&src2[i*src_stride2 ]);\
1264
2fa34e615c76 cleanup
michaelni
parents: 1259
diff changeset
774 OP(*((uint32_t*)&dst[i*dst_stride ]), no_rnd_avg32(a, b));\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
775 a= LD32(&src1[i*src_stride1+4]);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
776 b= LD32(&src2[i*src_stride2+4]);\
1264
2fa34e615c76 cleanup
michaelni
parents: 1259
diff changeset
777 OP(*((uint32_t*)&dst[i*dst_stride+4]), no_rnd_avg32(a, b));\
385
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
778 }\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
779 }\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
780 \
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
781 static inline void OPNAME ## _pixels8_l2(uint8_t *dst, const uint8_t *src1, const uint8_t *src2, int dst_stride, \
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
782 int src_stride1, int src_stride2, int h){\
385
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
783 int i;\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
784 for(i=0; i<h; i++){\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
785 uint32_t a,b;\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
786 a= LD32(&src1[i*src_stride1 ]);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
787 b= LD32(&src2[i*src_stride2 ]);\
1264
2fa34e615c76 cleanup
michaelni
parents: 1259
diff changeset
788 OP(*((uint32_t*)&dst[i*dst_stride ]), rnd_avg32(a, b));\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
789 a= LD32(&src1[i*src_stride1+4]);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
790 b= LD32(&src2[i*src_stride2+4]);\
1264
2fa34e615c76 cleanup
michaelni
parents: 1259
diff changeset
791 OP(*((uint32_t*)&dst[i*dst_stride+4]), rnd_avg32(a, b));\
385
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
792 }\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
793 }\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
794 \
1168
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
795 static inline void OPNAME ## _pixels4_l2(uint8_t *dst, const uint8_t *src1, const uint8_t *src2, int dst_stride, \
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
796 int src_stride1, int src_stride2, int h){\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
797 int i;\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
798 for(i=0; i<h; i++){\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
799 uint32_t a,b;\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
800 a= LD32(&src1[i*src_stride1 ]);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
801 b= LD32(&src2[i*src_stride2 ]);\
1264
2fa34e615c76 cleanup
michaelni
parents: 1259
diff changeset
802 OP(*((uint32_t*)&dst[i*dst_stride ]), rnd_avg32(a, b));\
1168
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
803 }\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
804 }\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
805 \
1267
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
806 static inline void OPNAME ## _pixels2_l2(uint8_t *dst, const uint8_t *src1, const uint8_t *src2, int dst_stride, \
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
807 int src_stride1, int src_stride2, int h){\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
808 int i;\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
809 for(i=0; i<h; i++){\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
810 uint32_t a,b;\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
811 a= LD16(&src1[i*src_stride1 ]);\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
812 b= LD16(&src2[i*src_stride2 ]);\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
813 OP(*((uint16_t*)&dst[i*dst_stride ]), rnd_avg32(a, b));\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
814 }\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
815 }\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
816 \
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
817 static inline void OPNAME ## _pixels16_l2(uint8_t *dst, const uint8_t *src1, const uint8_t *src2, int dst_stride, \
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
818 int src_stride1, int src_stride2, int h){\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
819 OPNAME ## _pixels8_l2(dst , src1 , src2 , dst_stride, src_stride1, src_stride2, h);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
820 OPNAME ## _pixels8_l2(dst+8, src1+8, src2+8, dst_stride, src_stride1, src_stride2, h);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
821 }\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
822 \
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
823 static inline void OPNAME ## _no_rnd_pixels16_l2(uint8_t *dst, const uint8_t *src1, const uint8_t *src2, int dst_stride, \
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
824 int src_stride1, int src_stride2, int h){\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
825 OPNAME ## _no_rnd_pixels8_l2(dst , src1 , src2 , dst_stride, src_stride1, src_stride2, h);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
826 OPNAME ## _no_rnd_pixels8_l2(dst+8, src1+8, src2+8, dst_stride, src_stride1, src_stride2, h);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
827 }\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
828 \
859
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
829 static inline void OPNAME ## _no_rnd_pixels8_x2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h){\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
830 OPNAME ## _no_rnd_pixels8_l2(block, pixels, pixels+1, line_size, line_size, line_size, h);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
831 }\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
832 \
859
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
833 static inline void OPNAME ## _pixels8_x2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h){\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
834 OPNAME ## _pixels8_l2(block, pixels, pixels+1, line_size, line_size, line_size, h);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
835 }\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
836 \
859
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
837 static inline void OPNAME ## _no_rnd_pixels8_y2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h){\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
838 OPNAME ## _no_rnd_pixels8_l2(block, pixels, pixels+line_size, line_size, line_size, line_size, h);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
839 }\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
840 \
859
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
841 static inline void OPNAME ## _pixels8_y2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h){\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
842 OPNAME ## _pixels8_l2(block, pixels, pixels+line_size, line_size, line_size, line_size, h);\
385
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
843 }\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
844 \
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
845 static inline void OPNAME ## _pixels8_l4(uint8_t *dst, const uint8_t *src1, uint8_t *src2, uint8_t *src3, uint8_t *src4,\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
846 int dst_stride, int src_stride1, int src_stride2,int src_stride3,int src_stride4, int h){\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
847 int i;\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
848 for(i=0; i<h; i++){\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
849 uint32_t a, b, c, d, l0, l1, h0, h1;\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
850 a= LD32(&src1[i*src_stride1]);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
851 b= LD32(&src2[i*src_stride2]);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
852 c= LD32(&src3[i*src_stride3]);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
853 d= LD32(&src4[i*src_stride4]);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
854 l0= (a&0x03030303UL)\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
855 + (b&0x03030303UL)\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
856 + 0x02020202UL;\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
857 h0= ((a&0xFCFCFCFCUL)>>2)\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
858 + ((b&0xFCFCFCFCUL)>>2);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
859 l1= (c&0x03030303UL)\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
860 + (d&0x03030303UL);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
861 h1= ((c&0xFCFCFCFCUL)>>2)\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
862 + ((d&0xFCFCFCFCUL)>>2);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
863 OP(*((uint32_t*)&dst[i*dst_stride]), h0+h1+(((l0+l1)>>2)&0x0F0F0F0FUL));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
864 a= LD32(&src1[i*src_stride1+4]);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
865 b= LD32(&src2[i*src_stride2+4]);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
866 c= LD32(&src3[i*src_stride3+4]);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
867 d= LD32(&src4[i*src_stride4+4]);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
868 l0= (a&0x03030303UL)\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
869 + (b&0x03030303UL)\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
870 + 0x02020202UL;\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
871 h0= ((a&0xFCFCFCFCUL)>>2)\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
872 + ((b&0xFCFCFCFCUL)>>2);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
873 l1= (c&0x03030303UL)\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
874 + (d&0x03030303UL);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
875 h1= ((c&0xFCFCFCFCUL)>>2)\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
876 + ((d&0xFCFCFCFCUL)>>2);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
877 OP(*((uint32_t*)&dst[i*dst_stride+4]), h0+h1+(((l0+l1)>>2)&0x0F0F0F0FUL));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
878 }\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
879 }\
1267
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
880 \
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
881 static inline void OPNAME ## _pixels4_x2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h){\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
882 OPNAME ## _pixels4_l2(block, pixels, pixels+1, line_size, line_size, line_size, h);\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
883 }\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
884 \
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
885 static inline void OPNAME ## _pixels4_y2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h){\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
886 OPNAME ## _pixels4_l2(block, pixels, pixels+line_size, line_size, line_size, line_size, h);\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
887 }\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
888 \
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
889 static inline void OPNAME ## _pixels2_x2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h){\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
890 OPNAME ## _pixels2_l2(block, pixels, pixels+1, line_size, line_size, line_size, h);\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
891 }\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
892 \
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
893 static inline void OPNAME ## _pixels2_y2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h){\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
894 OPNAME ## _pixels2_l2(block, pixels, pixels+line_size, line_size, line_size, line_size, h);\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
895 }\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
896 \
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
897 static inline void OPNAME ## _no_rnd_pixels8_l4(uint8_t *dst, const uint8_t *src1, uint8_t *src2, uint8_t *src3, uint8_t *src4,\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
898 int dst_stride, int src_stride1, int src_stride2,int src_stride3,int src_stride4, int h){\
385
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
899 int i;\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
900 for(i=0; i<h; i++){\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
901 uint32_t a, b, c, d, l0, l1, h0, h1;\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
902 a= LD32(&src1[i*src_stride1]);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
903 b= LD32(&src2[i*src_stride2]);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
904 c= LD32(&src3[i*src_stride3]);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
905 d= LD32(&src4[i*src_stride4]);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
906 l0= (a&0x03030303UL)\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
907 + (b&0x03030303UL)\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
908 + 0x01010101UL;\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
909 h0= ((a&0xFCFCFCFCUL)>>2)\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
910 + ((b&0xFCFCFCFCUL)>>2);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
911 l1= (c&0x03030303UL)\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
912 + (d&0x03030303UL);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
913 h1= ((c&0xFCFCFCFCUL)>>2)\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
914 + ((d&0xFCFCFCFCUL)>>2);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
915 OP(*((uint32_t*)&dst[i*dst_stride]), h0+h1+(((l0+l1)>>2)&0x0F0F0F0FUL));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
916 a= LD32(&src1[i*src_stride1+4]);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
917 b= LD32(&src2[i*src_stride2+4]);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
918 c= LD32(&src3[i*src_stride3+4]);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
919 d= LD32(&src4[i*src_stride4+4]);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
920 l0= (a&0x03030303UL)\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
921 + (b&0x03030303UL)\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
922 + 0x01010101UL;\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
923 h0= ((a&0xFCFCFCFCUL)>>2)\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
924 + ((b&0xFCFCFCFCUL)>>2);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
925 l1= (c&0x03030303UL)\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
926 + (d&0x03030303UL);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
927 h1= ((c&0xFCFCFCFCUL)>>2)\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
928 + ((d&0xFCFCFCFCUL)>>2);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
929 OP(*((uint32_t*)&dst[i*dst_stride+4]), h0+h1+(((l0+l1)>>2)&0x0F0F0F0FUL));\
385
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
930 }\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
931 }\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
932 static inline void OPNAME ## _pixels16_l4(uint8_t *dst, const uint8_t *src1, uint8_t *src2, uint8_t *src3, uint8_t *src4,\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
933 int dst_stride, int src_stride1, int src_stride2,int src_stride3,int src_stride4, int h){\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
934 OPNAME ## _pixels8_l4(dst , src1 , src2 , src3 , src4 , dst_stride, src_stride1, src_stride2, src_stride3, src_stride4, h);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
935 OPNAME ## _pixels8_l4(dst+8, src1+8, src2+8, src3+8, src4+8, dst_stride, src_stride1, src_stride2, src_stride3, src_stride4, h);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
936 }\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
937 static inline void OPNAME ## _no_rnd_pixels16_l4(uint8_t *dst, const uint8_t *src1, uint8_t *src2, uint8_t *src3, uint8_t *src4,\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
938 int dst_stride, int src_stride1, int src_stride2,int src_stride3,int src_stride4, int h){\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
939 OPNAME ## _no_rnd_pixels8_l4(dst , src1 , src2 , src3 , src4 , dst_stride, src_stride1, src_stride2, src_stride3, src_stride4, h);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
940 OPNAME ## _no_rnd_pixels8_l4(dst+8, src1+8, src2+8, src3+8, src4+8, dst_stride, src_stride1, src_stride2, src_stride3, src_stride4, h);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
941 }\
385
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
942 \
1267
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
943 static inline void OPNAME ## _pixels2_xy2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h)\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
944 {\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
945 int i, a0, b0, a1, b1;\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
946 a0= pixels[0];\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
947 b0= pixels[1] + 2;\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
948 a0 += b0;\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
949 b0 += pixels[2];\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
950 \
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
951 pixels+=line_size;\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
952 for(i=0; i<h; i+=2){\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
953 a1= pixels[0];\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
954 b1= pixels[1];\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
955 a1 += b1;\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
956 b1 += pixels[2];\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
957 \
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
958 block[0]= (a1+a0)>>2; /* FIXME non put */\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
959 block[1]= (b1+b0)>>2;\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
960 \
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
961 pixels+=line_size;\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
962 block +=line_size;\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
963 \
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
964 a0= pixels[0];\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
965 b0= pixels[1] + 2;\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
966 a0 += b0;\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
967 b0 += pixels[2];\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
968 \
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
969 block[0]= (a1+a0)>>2;\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
970 block[1]= (b1+b0)>>2;\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
971 pixels+=line_size;\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
972 block +=line_size;\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
973 }\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
974 }\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
975 \
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
976 static inline void OPNAME ## _pixels4_xy2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h)\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
977 {\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
978 int i;\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
979 const uint32_t a= LD32(pixels );\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
980 const uint32_t b= LD32(pixels+1);\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
981 uint32_t l0= (a&0x03030303UL)\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
982 + (b&0x03030303UL)\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
983 + 0x02020202UL;\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
984 uint32_t h0= ((a&0xFCFCFCFCUL)>>2)\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
985 + ((b&0xFCFCFCFCUL)>>2);\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
986 uint32_t l1,h1;\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
987 \
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
988 pixels+=line_size;\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
989 for(i=0; i<h; i+=2){\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
990 uint32_t a= LD32(pixels );\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
991 uint32_t b= LD32(pixels+1);\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
992 l1= (a&0x03030303UL)\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
993 + (b&0x03030303UL);\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
994 h1= ((a&0xFCFCFCFCUL)>>2)\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
995 + ((b&0xFCFCFCFCUL)>>2);\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
996 OP(*((uint32_t*)block), h0+h1+(((l0+l1)>>2)&0x0F0F0F0FUL));\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
997 pixels+=line_size;\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
998 block +=line_size;\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
999 a= LD32(pixels );\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1000 b= LD32(pixels+1);\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1001 l0= (a&0x03030303UL)\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1002 + (b&0x03030303UL)\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1003 + 0x02020202UL;\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1004 h0= ((a&0xFCFCFCFCUL)>>2)\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1005 + ((b&0xFCFCFCFCUL)>>2);\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1006 OP(*((uint32_t*)block), h0+h1+(((l0+l1)>>2)&0x0F0F0F0FUL));\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1007 pixels+=line_size;\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1008 block +=line_size;\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1009 }\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1010 }\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1011 \
859
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
1012 static inline void OPNAME ## _pixels8_xy2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h)\
385
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1013 {\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1014 int j;\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1015 for(j=0; j<2; j++){\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1016 int i;\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1017 const uint32_t a= LD32(pixels );\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1018 const uint32_t b= LD32(pixels+1);\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1019 uint32_t l0= (a&0x03030303UL)\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1020 + (b&0x03030303UL)\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1021 + 0x02020202UL;\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1022 uint32_t h0= ((a&0xFCFCFCFCUL)>>2)\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1023 + ((b&0xFCFCFCFCUL)>>2);\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1024 uint32_t l1,h1;\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1025 \
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1026 pixels+=line_size;\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1027 for(i=0; i<h; i+=2){\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1028 uint32_t a= LD32(pixels );\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1029 uint32_t b= LD32(pixels+1);\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1030 l1= (a&0x03030303UL)\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1031 + (b&0x03030303UL);\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1032 h1= ((a&0xFCFCFCFCUL)>>2)\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1033 + ((b&0xFCFCFCFCUL)>>2);\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1034 OP(*((uint32_t*)block), h0+h1+(((l0+l1)>>2)&0x0F0F0F0FUL));\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1035 pixels+=line_size;\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1036 block +=line_size;\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1037 a= LD32(pixels );\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1038 b= LD32(pixels+1);\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1039 l0= (a&0x03030303UL)\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1040 + (b&0x03030303UL)\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1041 + 0x02020202UL;\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1042 h0= ((a&0xFCFCFCFCUL)>>2)\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1043 + ((b&0xFCFCFCFCUL)>>2);\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1044 OP(*((uint32_t*)block), h0+h1+(((l0+l1)>>2)&0x0F0F0F0FUL));\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1045 pixels+=line_size;\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1046 block +=line_size;\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1047 }\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1048 pixels+=4-line_size*(h+1);\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1049 block +=4-line_size*h;\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1050 }\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1051 }\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1052 \
859
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
1053 static inline void OPNAME ## _no_rnd_pixels8_xy2_c(uint8_t *block, const uint8_t *pixels, int line_size, int h)\
385
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1054 {\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1055 int j;\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1056 for(j=0; j<2; j++){\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1057 int i;\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1058 const uint32_t a= LD32(pixels );\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1059 const uint32_t b= LD32(pixels+1);\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1060 uint32_t l0= (a&0x03030303UL)\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1061 + (b&0x03030303UL)\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1062 + 0x01010101UL;\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1063 uint32_t h0= ((a&0xFCFCFCFCUL)>>2)\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1064 + ((b&0xFCFCFCFCUL)>>2);\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1065 uint32_t l1,h1;\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1066 \
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1067 pixels+=line_size;\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1068 for(i=0; i<h; i+=2){\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1069 uint32_t a= LD32(pixels );\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1070 uint32_t b= LD32(pixels+1);\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1071 l1= (a&0x03030303UL)\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1072 + (b&0x03030303UL);\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1073 h1= ((a&0xFCFCFCFCUL)>>2)\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1074 + ((b&0xFCFCFCFCUL)>>2);\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1075 OP(*((uint32_t*)block), h0+h1+(((l0+l1)>>2)&0x0F0F0F0FUL));\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1076 pixels+=line_size;\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1077 block +=line_size;\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1078 a= LD32(pixels );\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1079 b= LD32(pixels+1);\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1080 l0= (a&0x03030303UL)\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1081 + (b&0x03030303UL)\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1082 + 0x01010101UL;\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1083 h0= ((a&0xFCFCFCFCUL)>>2)\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1084 + ((b&0xFCFCFCFCUL)>>2);\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1085 OP(*((uint32_t*)block), h0+h1+(((l0+l1)>>2)&0x0F0F0F0FUL));\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1086 pixels+=line_size;\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1087 block +=line_size;\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1088 }\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1089 pixels+=4-line_size*(h+1);\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1090 block +=4-line_size*h;\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1091 }\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1092 }\
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1093 \
859
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
1094 CALL_2X_PIXELS(OPNAME ## _pixels16_c , OPNAME ## _pixels8_c , 8)\
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
1095 CALL_2X_PIXELS(OPNAME ## _pixels16_x2_c , OPNAME ## _pixels8_x2_c , 8)\
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
1096 CALL_2X_PIXELS(OPNAME ## _pixels16_y2_c , OPNAME ## _pixels8_y2_c , 8)\
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
1097 CALL_2X_PIXELS(OPNAME ## _pixels16_xy2_c, OPNAME ## _pixels8_xy2_c, 8)\
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
1098 CALL_2X_PIXELS(OPNAME ## _no_rnd_pixels16_c , OPNAME ## _pixels8_c , 8)\
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
1099 CALL_2X_PIXELS(OPNAME ## _no_rnd_pixels16_x2_c , OPNAME ## _no_rnd_pixels8_x2_c , 8)\
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
1100 CALL_2X_PIXELS(OPNAME ## _no_rnd_pixels16_y2_c , OPNAME ## _no_rnd_pixels8_y2_c , 8)\
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
1101 CALL_2X_PIXELS(OPNAME ## _no_rnd_pixels16_xy2_c, OPNAME ## _no_rnd_pixels8_xy2_c, 8)\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1102
1264
2fa34e615c76 cleanup
michaelni
parents: 1259
diff changeset
1103 #define op_avg(a, b) a = rnd_avg32(a, b)
385
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1104 #endif
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1105 #define op_put(a, b) a = b
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1106
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1107 PIXOP2(avg, op_avg)
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1108 PIXOP2(put, op_put)
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1109 #undef op_avg
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1110 #undef op_put
7ac7a48fbe5e new hopefully faster MC
michaelni
parents: 324
diff changeset
1111
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
/*
 * Rounded integer averages of two and four values.
 * Every argument is parenthesized so that expressions containing operators
 * of lower precedence than '+' (shifts, bitwise ops, ?:) are averaged as a
 * whole instead of being torn apart by the expansion.
 */
#define avg2(a,b) (((a)+(b)+1)>>1)
#define avg4(a,b,c,d) (((a)+(b)+(c)+(d)+2)>>2)
986e461dc072 Initial revision
glantau
parents:
diff changeset
1114
1864
9a73e6dc5d68 fix motion compensation with (x+1/2,y+1/2) MVs
michael
parents: 1784
diff changeset
/**
 * Single-stride front end for put_no_rnd_pixels16_l2().
 * The one stride supplied by the caller is forwarded for all three stride
 * arguments of the underlying routine.
 */
static void put_no_rnd_pixels16_l2_c(uint8_t *dst, const uint8_t *a, const uint8_t *b, int stride, int h){
    put_no_rnd_pixels16_l2(dst, a, b, stride, stride, stride, h);
}
9a73e6dc5d68 fix motion compensation with (x+1/2,y+1/2) MVs
michael
parents: 1784
diff changeset
1118
9a73e6dc5d68 fix motion compensation with (x+1/2,y+1/2) MVs
michael
parents: 1784
diff changeset
/**
 * Single-stride front end for put_no_rnd_pixels8_l2().
 * The one stride supplied by the caller is forwarded for all three stride
 * arguments of the underlying routine.
 */
static void put_no_rnd_pixels8_l2_c(uint8_t *dst, const uint8_t *a, const uint8_t *b, int stride, int h){
    put_no_rnd_pixels8_l2(dst, a, b, stride, stride, stride, h);
}
753
8e1f0939d15d complete mpeg4 GMC decoding support
michaelni
parents: 751
diff changeset
1122
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
/**
 * Bilinear interpolation of an 8-pixel-wide, h-row block.
 *
 * Each output pixel is a weighted sum of the 2x2 source neighbourhood whose
 * top-left corner is the pixel at the same position in src. The four weights
 * are derived from x16/y16 and always add up to 256, hence the final >>8.
 *
 * @param dst     destination, 8 bytes written per row
 * @param src     source; 9 bytes are read from each of h+1 rows
 * @param stride  byte distance between rows, shared by dst and src
 * @param h       number of rows to produce
 * @param x16     horizontal weight of the right-hand column (0..16 gives
 *                non-negative weights)
 * @param y16     vertical weight of the lower row (same range)
 * @param rounder value added before the >>8
 */
static void gmc1_c(uint8_t *dst, uint8_t *src, int stride, int h, int x16, int y16, int rounder)
{
    const int w_tl = (16 - x16) * (16 - y16);   /* top-left weight     */
    const int w_tr = (     x16) * (16 - y16);   /* top-right weight    */
    const int w_bl = (16 - x16) * (     y16);   /* bottom-left weight  */
    const int w_br = (     x16) * (     y16);   /* bottom-right weight */
    int row, col;

    for (row = 0; row < h; row++) {
        for (col = 0; col < 8; col++) {
            dst[col] = (w_tl * src[col]          + w_tr * src[col + 1]
                      + w_bl * src[stride + col] + w_br * src[stride + col + 1]
                      + rounder) >> 8;
        }
        dst += stride;
        src += stride;
    }
}
db20b987c32d divx5-gmc support
michaelni
parents: 252
diff changeset
1145
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
/**
 * Warp an 8-pixel-wide, h-row block through an affine coordinate mapping
 * with bilinear interpolation.
 *
 * For output pixel (x, y) the source coordinate is
 *   (ox + x*dxx + y*dxy,  oy + x*dyx + y*dyy).
 * The low 16 bits of each coordinate are discarded; of what remains, the
 * low `shift` bits are the interpolation fraction and the rest is the
 * integer sample position.
 *
 * A position whose 2x2 neighbourhood lies inside the picture gets full
 * bilinear interpolation. If it leaves the picture in one direction, the
 * position is clamped in that direction and interpolation is done along the
 * other axis only. If it leaves in both directions, the clamped sample is
 * copied unmodified.
 *
 * @param dst     destination block
 * @param src     source picture, addressed as src[x + y*stride]
 * @param stride  byte distance between rows, shared by dst and src
 * @param h       number of rows to produce
 * @param ox,oy   source coordinate of output pixel (0, 0)
 * @param dxx,dyx coordinate increments per output column
 * @param dxy,dyy coordinate increments per output row
 * @param shift   number of fraction bits used for interpolation
 * @param r       value added before the final >>(2*shift)
 * @param width   source picture width in samples
 * @param height  source picture height in samples
 */
static void gmc_c(uint8_t *dst, uint8_t *src, int stride, int h, int ox, int oy,
                  int dxx, int dxy, int dyx, int dyy, int shift, int r, int width, int height)
{
    const int s = 1 << shift;   /* weight corresponding to a fraction of 1.0 */
    int y;

    /* From here on width/height hold the last valid column/row index. */
    width--;
    height--;

    for (y = 0; y < h; y++) {
        int vx = ox;
        int vy = oy;
        int x;

        for (x = 0; x < 8; x++) { //XXX FIXME optimize
            const int pos_x  = vx >> 16;
            const int pos_y  = vy >> 16;
            const int frac_x = pos_x & (s - 1);
            const int frac_y = pos_y & (s - 1);
            const int src_x  = pos_x >> shift;
            const int src_y  = pos_y >> shift;
            /* The unsigned compare rejects negative positions as well. */
            const int x_inside = (unsigned)src_x < width;
            const int y_inside = (unsigned)src_y < height;
            int index;

            if (x_inside && y_inside) {
                /* Full bilinear interpolation over the 2x2 neighbourhood. */
                index = src_x + src_y * stride;
                dst[y * stride + x] = ( ( src[index             ] * (s - frac_x)
                                        + src[index          + 1] *      frac_x ) * (s - frac_y)
                                      + ( src[index + stride    ] * (s - frac_x)
                                        + src[index + stride + 1] *      frac_x ) *      frac_y
                                      + r) >> (shift * 2);
            } else if (x_inside) {
                /* Row clamped: interpolate horizontally only. */
                index = src_x + clip(src_y, 0, height) * stride;
                dst[y * stride + x] = ( ( src[index    ] * (s - frac_x)
                                        + src[index + 1] *      frac_x ) * s
                                      + r) >> (shift * 2);
            } else if (y_inside) {
                /* Column clamped: interpolate vertically only. */
                index = clip(src_x, 0, width) + src_y * stride;
                dst[y * stride + x] = ( ( src[index         ] * (s - frac_y)
                                        + src[index + stride] *      frac_y ) * s
                                      + r) >> (shift * 2);
            } else {
                /* Clamped in both directions: plain copy of the edge sample. */
                index = clip(src_x, 0, width) + clip(src_y, 0, height) * stride;
                dst[y * stride + x] = src[index];
            }

            vx += dxx;
            vy += dyx;
        }
        ox += dxy;
        oy += dyy;
    }
}
1267
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1203
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
/**
 * Copy case (no interpolation): dispatches to the fixed-width copy routine
 * matching `width`.
 * Only widths 2, 4, 8 and 16 are handled; for any other width nothing is
 * written.
 */
static inline void put_tpel_pixels_mc00_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
    switch(width){
    case 2:  put_pixels2_c (dst, src, stride, height); break;
    case 4:  put_pixels4_c (dst, src, stride, height); break;
    case 8:  put_pixels8_c (dst, src, stride, height); break;
    case 16: put_pixels16_c(dst, src, stride, height); break;
    default: break; /* unsupported width: leave dst untouched */
    }
}
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1212
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
/**
 * Horizontal interpolation with weights 2/3 (current pixel) and 1/3 (right
 * neighbour).
 * Reads width+1 bytes from each of `height` source rows and writes `width`
 * bytes per destination row; dst and src share `stride`.
 */
static inline void put_tpel_pixels_mc10_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
    int row, col;

    for (row = 0; row < height; row++) {
        for (col = 0; col < width; col++) {
            /* 683/2048 stands in for 1/3; with the +1 bias the result is
             * the weighted sum divided by 3, rounded to nearest. */
            dst[col] = (683 * (2 * src[col] + src[col + 1] + 1)) >> 11;
        }
        src += stride;
        dst += stride;
    }
}
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1223
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
/**
 * Horizontal interpolation with weights 1/3 (current pixel) and 2/3 (right
 * neighbour).
 * Reads width+1 bytes from each of `height` source rows and writes `width`
 * bytes per destination row; dst and src share `stride`.
 */
static inline void put_tpel_pixels_mc20_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
    int row, col;

    for (row = 0; row < height; row++) {
        for (col = 0; col < width; col++) {
            /* 683/2048 stands in for 1/3; with the +1 bias the result is
             * the weighted sum divided by 3, rounded to nearest. */
            dst[col] = (683 * (src[col] + 2 * src[col + 1] + 1)) >> 11;
        }
        src += stride;
        dst += stride;
    }
}
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
1234
1267
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
/**
 * Vertical interpolation with weights 2/3 (current pixel) and 1/3 (pixel
 * one row below).
 * Reads `width` bytes from each of height+1 source rows and writes `width`
 * bytes per destination row; dst and src share `stride`.
 */
static inline void put_tpel_pixels_mc01_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
    int row, col;

    for (row = 0; row < height; row++) {
        for (col = 0; col < width; col++) {
            /* 683/2048 stands in for 1/3; with the +1 bias the result is
             * the weighted sum divided by 3, rounded to nearest. */
            dst[col] = (683 * (2 * src[col] + src[col + stride] + 1)) >> 11;
        }
        src += stride;
        dst += stride;
    }
}
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
1245
1267
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
/**
 * Two-dimensional interpolation over the 2x2 neighbourhood with weights
 *   4 3
 *   3 2
 * (current pixel weighted most), normalised by their sum of 12.
 * Reads width+1 bytes from each of height+1 source rows and writes `width`
 * bytes per destination row; dst and src share `stride`.
 */
static inline void put_tpel_pixels_mc11_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
    int row, col;

    for (row = 0; row < height; row++) {
        for (col = 0; col < width; col++) {
            /* 2731/32768 stands in for 1/12; +6 is half the weight sum. */
            dst[col] = (2731 * (4 * src[col]          + 3 * src[col + 1]
                              + 3 * src[col + stride] + 2 * src[col + stride + 1]
                              + 6)) >> 15;
        }
        src += stride;
        dst += stride;
    }
}
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1256
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
/**
 * Two-dimensional interpolation over the 2x2 neighbourhood with weights
 *   3 2
 *   4 3
 * (pixel below the current one weighted most), normalised by their sum of 12.
 * Reads width+1 bytes from each of height+1 source rows and writes `width`
 * bytes per destination row; dst and src share `stride`.
 */
static inline void put_tpel_pixels_mc12_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
    int row, col;

    for (row = 0; row < height; row++) {
        for (col = 0; col < width; col++) {
            /* 2731/32768 stands in for 1/12; +6 is half the weight sum. */
            dst[col] = (2731 * (3 * src[col]          + 2 * src[col + 1]
                              + 4 * src[col + stride] + 3 * src[col + stride + 1]
                              + 6)) >> 15;
        }
        src += stride;
        dst += stride;
    }
}
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1267
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
/**
 * Vertical interpolation with weights 1/3 (current pixel) and 2/3 (pixel
 * one row below).
 * Reads `width` bytes from each of height+1 source rows and writes `width`
 * bytes per destination row; dst and src share `stride`.
 */
static inline void put_tpel_pixels_mc02_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
    int row, col;

    for (row = 0; row < height; row++) {
        for (col = 0; col < width; col++) {
            /* 683/2048 stands in for 1/3; with the +1 bias the result is
             * the weighted sum divided by 3, rounded to nearest. */
            dst[col] = (683 * (src[col] + 2 * src[col + stride] + 1)) >> 11;
        }
        src += stride;
        dst += stride;
    }
}
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1278
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1279 static inline void put_tpel_pixels_mc21_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1280 int i,j;
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1281 for (i=0; i < height; i++) {
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1282 for (j=0; j < width; j++) {
2979
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
1283 dst[j] = (2731*(3*src[j] + 4*src[j+1] + 2*src[j+stride] + 3*src[j+stride+1] + 6)) >> 15;
1267
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1284 }
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1285 src += stride;
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1286 dst += stride;
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1287 }
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1288 }
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1289
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1290 static inline void put_tpel_pixels_mc22_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1291 int i,j;
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1292 for (i=0; i < height; i++) {
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1293 for (j=0; j < width; j++) {
2979
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
1294 dst[j] = (2731*(2*src[j] + 3*src[j+1] + 3*src[j+stride] + 4*src[j+stride+1] + 6)) >> 15;
1267
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1295 }
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1296 src += stride;
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1297 dst += stride;
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1298 }
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1299 }
1319
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1300
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1301 static inline void avg_tpel_pixels_mc00_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1302 switch(width){
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1303 case 2: avg_pixels2_c (dst, src, stride, height); break;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1304 case 4: avg_pixels4_c (dst, src, stride, height); break;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1305 case 8: avg_pixels8_c (dst, src, stride, height); break;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1306 case 16:avg_pixels16_c(dst, src, stride, height); break;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1307 }
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1308 }
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1309
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1310 static inline void avg_tpel_pixels_mc10_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1311 int i,j;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1312 for (i=0; i < height; i++) {
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1313 for (j=0; j < width; j++) {
2979
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
1314 dst[j] = (dst[j] + ((683*(2*src[j] + src[j+1] + 1)) >> 11) + 1) >> 1;
1319
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1315 }
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1316 src += stride;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1317 dst += stride;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1318 }
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1319 }
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1320
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1321 static inline void avg_tpel_pixels_mc20_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1322 int i,j;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1323 for (i=0; i < height; i++) {
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1324 for (j=0; j < width; j++) {
2979
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
1325 dst[j] = (dst[j] + ((683*(src[j] + 2*src[j+1] + 1)) >> 11) + 1) >> 1;
1319
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1326 }
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1327 src += stride;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1328 dst += stride;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1329 }
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1330 }
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
1331
1319
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1332 static inline void avg_tpel_pixels_mc01_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1333 int i,j;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1334 for (i=0; i < height; i++) {
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1335 for (j=0; j < width; j++) {
2979
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
1336 dst[j] = (dst[j] + ((683*(2*src[j] + src[j+stride] + 1)) >> 11) + 1) >> 1;
1319
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1337 }
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1338 src += stride;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1339 dst += stride;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1340 }
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1341 }
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
1342
1319
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1343 static inline void avg_tpel_pixels_mc11_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1344 int i,j;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1345 for (i=0; i < height; i++) {
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1346 for (j=0; j < width; j++) {
2979
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
1347 dst[j] = (dst[j] + ((2731*(4*src[j] + 3*src[j+1] + 3*src[j+stride] + 2*src[j+stride+1] + 6)) >> 15) + 1) >> 1;
1319
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1348 }
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1349 src += stride;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1350 dst += stride;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1351 }
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1352 }
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1353
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1354 static inline void avg_tpel_pixels_mc12_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1355 int i,j;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1356 for (i=0; i < height; i++) {
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1357 for (j=0; j < width; j++) {
2979
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
1358 dst[j] = (dst[j] + ((2731*(3*src[j] + 2*src[j+1] + 4*src[j+stride] + 3*src[j+stride+1] + 6)) >> 15) + 1) >> 1;
1319
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1359 }
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1360 src += stride;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1361 dst += stride;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1362 }
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1363 }
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1364
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1365 static inline void avg_tpel_pixels_mc02_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1366 int i,j;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1367 for (i=0; i < height; i++) {
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1368 for (j=0; j < width; j++) {
2979
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
1369 dst[j] = (dst[j] + ((683*(src[j] + 2*src[j+stride] + 1)) >> 11) + 1) >> 1;
1319
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1370 }
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1371 src += stride;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1372 dst += stride;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1373 }
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1374 }
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1375
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1376 static inline void avg_tpel_pixels_mc21_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1377 int i,j;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1378 for (i=0; i < height; i++) {
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1379 for (j=0; j < width; j++) {
2979
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
1380 dst[j] = (dst[j] + ((2731*(3*src[j] + 4*src[j+1] + 2*src[j+stride] + 3*src[j+stride+1] + 6)) >> 15) + 1) >> 1;
1319
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1381 }
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1382 src += stride;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1383 dst += stride;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1384 }
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1385 }
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1386
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1387 static inline void avg_tpel_pixels_mc22_c(uint8_t *dst, const uint8_t *src, int stride, int width, int height){
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1388 int i,j;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1389 for (i=0; i < height; i++) {
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1390 for (j=0; j < width; j++) {
2979
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
1391 dst[j] = (dst[j] + ((2731*(2*src[j] + 3*src[j+1] + 3*src[j+stride] + 4*src[j+stride+1] + 6)) >> 15) + 1) >> 1;
1319
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1392 }
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1393 src += stride;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1394 dst += stride;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1395 }
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
1396 }
1267
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1397 #if 0
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1398 #define TPEL_WIDTH(width)\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1399 static void put_tpel_pixels ## width ## _mc00_c(uint8_t *dst, const uint8_t *src, int stride, int height){\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1400 void put_tpel_pixels_mc00_c(dst, src, stride, width, height);}\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1401 static void put_tpel_pixels ## width ## _mc10_c(uint8_t *dst, const uint8_t *src, int stride, int height){\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1402 void put_tpel_pixels_mc10_c(dst, src, stride, width, height);}\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1403 static void put_tpel_pixels ## width ## _mc20_c(uint8_t *dst, const uint8_t *src, int stride, int height){\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1404 void put_tpel_pixels_mc20_c(dst, src, stride, width, height);}\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1405 static void put_tpel_pixels ## width ## _mc01_c(uint8_t *dst, const uint8_t *src, int stride, int height){\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1406 void put_tpel_pixels_mc01_c(dst, src, stride, width, height);}\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1407 static void put_tpel_pixels ## width ## _mc11_c(uint8_t *dst, const uint8_t *src, int stride, int height){\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1408 void put_tpel_pixels_mc11_c(dst, src, stride, width, height);}\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1409 static void put_tpel_pixels ## width ## _mc21_c(uint8_t *dst, const uint8_t *src, int stride, int height){\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1410 void put_tpel_pixels_mc21_c(dst, src, stride, width, height);}\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1411 static void put_tpel_pixels ## width ## _mc02_c(uint8_t *dst, const uint8_t *src, int stride, int height){\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1412 void put_tpel_pixels_mc02_c(dst, src, stride, width, height);}\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1413 static void put_tpel_pixels ## width ## _mc12_c(uint8_t *dst, const uint8_t *src, int stride, int height){\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1414 void put_tpel_pixels_mc12_c(dst, src, stride, width, height);}\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1415 static void put_tpel_pixels ## width ## _mc22_c(uint8_t *dst, const uint8_t *src, int stride, int height){\
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1416 void put_tpel_pixels_mc22_c(dst, src, stride, width, height);}
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1417 #endif
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
1418
1168
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1419 #define H264_CHROMA_MC(OPNAME, OP)\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1420 static void OPNAME ## h264_chroma_mc2_c(uint8_t *dst/*align 8*/, uint8_t *src/*align 1*/, int stride, int h, int x, int y){\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1421 const int A=(8-x)*(8-y);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1422 const int B=( x)*(8-y);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1423 const int C=(8-x)*( y);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1424 const int D=( x)*( y);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1425 int i;\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1426 \
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1427 assert(x<8 && y<8 && x>=0 && y>=0);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1428 \
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1429 for(i=0; i<h; i++)\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1430 {\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1431 OP(dst[0], (A*src[0] + B*src[1] + C*src[stride+0] + D*src[stride+1]));\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1432 OP(dst[1], (A*src[1] + B*src[2] + C*src[stride+1] + D*src[stride+2]));\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1433 dst+= stride;\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1434 src+= stride;\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1435 }\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1436 }\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1437 \
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1438 static void OPNAME ## h264_chroma_mc4_c(uint8_t *dst/*align 8*/, uint8_t *src/*align 1*/, int stride, int h, int x, int y){\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1439 const int A=(8-x)*(8-y);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1440 const int B=( x)*(8-y);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1441 const int C=(8-x)*( y);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1442 const int D=( x)*( y);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1443 int i;\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1444 \
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1445 assert(x<8 && y<8 && x>=0 && y>=0);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1446 \
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1447 for(i=0; i<h; i++)\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1448 {\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1449 OP(dst[0], (A*src[0] + B*src[1] + C*src[stride+0] + D*src[stride+1]));\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1450 OP(dst[1], (A*src[1] + B*src[2] + C*src[stride+1] + D*src[stride+2]));\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1451 OP(dst[2], (A*src[2] + B*src[3] + C*src[stride+2] + D*src[stride+3]));\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1452 OP(dst[3], (A*src[3] + B*src[4] + C*src[stride+3] + D*src[stride+4]));\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1453 dst+= stride;\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1454 src+= stride;\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1455 }\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1456 }\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1457 \
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1458 static void OPNAME ## h264_chroma_mc8_c(uint8_t *dst/*align 8*/, uint8_t *src/*align 1*/, int stride, int h, int x, int y){\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1459 const int A=(8-x)*(8-y);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1460 const int B=( x)*(8-y);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1461 const int C=(8-x)*( y);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1462 const int D=( x)*( y);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1463 int i;\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1464 \
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1465 assert(x<8 && y<8 && x>=0 && y>=0);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1466 \
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1467 for(i=0; i<h; i++)\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1468 {\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1469 OP(dst[0], (A*src[0] + B*src[1] + C*src[stride+0] + D*src[stride+1]));\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1470 OP(dst[1], (A*src[1] + B*src[2] + C*src[stride+1] + D*src[stride+2]));\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1471 OP(dst[2], (A*src[2] + B*src[3] + C*src[stride+2] + D*src[stride+3]));\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1472 OP(dst[3], (A*src[3] + B*src[4] + C*src[stride+3] + D*src[stride+4]));\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1473 OP(dst[4], (A*src[4] + B*src[5] + C*src[stride+4] + D*src[stride+5]));\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1474 OP(dst[5], (A*src[5] + B*src[6] + C*src[stride+5] + D*src[stride+6]));\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1475 OP(dst[6], (A*src[6] + B*src[7] + C*src[stride+6] + D*src[stride+7]));\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1476 OP(dst[7], (A*src[7] + B*src[8] + C*src[stride+7] + D*src[stride+8]));\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1477 dst+= stride;\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1478 src+= stride;\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1479 }\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1480 }
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1481
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1482 #define op_avg(a, b) a = (((a)+(((b) + 32)>>6)+1)>>1)
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1483 #define op_put(a, b) a = (((b) + 32)>>6)
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1484
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1485 H264_CHROMA_MC(put_ , op_put)
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1486 H264_CHROMA_MC(avg_ , op_avg)
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1487 #undef op_avg
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1488 #undef op_put
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1489
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
/**
 * Copy h rows from src to dst, one LD32/ST32 transfer per row.
 *
 * LD32 and ST32 are defined outside this part of the file; presumably they
 * load/store 32 bits, which makes the block 4 bytes wide -- confirm against
 * their definition.
 *
 * @param dst       first row of the destination
 * @param src       first row of the source
 * @param dstStride added to dst after every row
 * @param srcStride added to src after every row
 * @param h         number of rows; nothing is copied when h <= 0
 */
static inline void copy_block4(uint8_t *dst, uint8_t *src, int dstStride, int srcStride, int h)
{
    int rows_left;

    for(rows_left = h; rows_left > 0; rows_left--){
        ST32(dst, LD32(src));
        src += srcStride;
        dst += dstStride;
    }
}
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1500
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
/**
 * Copy h rows from src to dst, two LD32/ST32 transfers per row
 * (byte offsets 0 and 4).
 *
 * LD32 and ST32 are defined outside this part of the file; presumably each
 * moves 32 bits, giving an 8-byte-wide block -- confirm against their
 * definition.
 *
 * @param dst       first row of the destination
 * @param src       first row of the source
 * @param dstStride added to dst after every row
 * @param srcStride added to src after every row
 * @param h         number of rows; nothing is copied when h <= 0
 */
static inline void copy_block8(uint8_t *dst, uint8_t *src, int dstStride, int srcStride, int h)
{
    int row = 0;

    while(row < h){
        ST32(dst    , LD32(src    ));
        ST32(dst + 4, LD32(src + 4));
        src += srcStride;
        dst += dstStride;
        row++;
    }
}
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
1512
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
/**
 * Copy h rows from src to dst, four LD32/ST32 transfers per row
 * (byte offsets 0, 4, 8 and 12).
 *
 * LD32 and ST32 are defined outside this part of the file; presumably each
 * moves 32 bits, giving a 16-byte-wide block -- confirm against their
 * definition.
 *
 * @param dst       first row of the destination
 * @param src       first row of the source
 * @param dstStride added to dst after every row
 * @param srcStride added to src after every row
 * @param h         number of rows; nothing is copied when h <= 0
 */
static inline void copy_block16(uint8_t *dst, uint8_t *src, int dstStride, int srcStride, int h)
{
    int row, off;

    for(row = 0; row < h; row++){
        /* same transfers as the unrolled form, in the same ascending order */
        for(off = 0; off < 16; off += 4){
            ST32(dst + off, LD32(src + off));
        }
        dst += dstStride;
        src += srcStride;
    }
}
753
8e1f0939d15d complete mpeg4 GMC decoding support
michaelni
parents: 751
diff changeset
1526
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
/**
 * Copy h rows from src to dst: four LD32/ST32 transfers per row
 * (byte offsets 0, 4, 8 and 12) followed by the single byte at index 16.
 *
 * LD32 and ST32 are defined outside this part of the file; presumably each
 * moves 32 bits, so a row is 17 bytes wide -- confirm against their
 * definition.
 *
 * @param dst       first row of the destination
 * @param src       first row of the source
 * @param dstStride added to dst after every row
 * @param srcStride added to src after every row
 * @param h         number of rows; nothing is copied when h <= 0
 */
static inline void copy_block17(uint8_t *dst, uint8_t *src, int dstStride, int srcStride, int h)
{
    int rows_left, off;

    for(rows_left = h; rows_left > 0; rows_left--){
        for(off = 0; off < 16; off += 4){
            ST32(dst + off, LD32(src + off));
        }
        /* trailing column is copied as a plain byte */
        dst[16] = src[16];
        src += srcStride;
        dst += dstStride;
    }
}
db20b987c32d divx5-gmc support
michaelni
parents: 252
diff changeset
1541
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
/**
 * Copy h rows from src to dst: two LD32/ST32 transfers per row
 * (byte offsets 0 and 4) followed by the single byte at index 8.
 *
 * LD32 and ST32 are defined outside this part of the file; presumably each
 * moves 32 bits, so a row is 9 bytes wide -- confirm against their
 * definition.
 *
 * The qpel8 functions below call this to stage a 9-row source area into a
 * local buffer with a stride of 16.
 *
 * @param dst       first row of the destination
 * @param src       first row of the source
 * @param dstStride added to dst after every row
 * @param srcStride added to src after every row
 * @param h         number of rows; nothing is copied when h <= 0
 */
static inline void copy_block9(uint8_t *dst, uint8_t *src, int dstStride, int srcStride, int h)
{
    int row = 0;

    while(row < h){
        ST32(dst    , LD32(src    ));
        ST32(dst + 4, LD32(src + 4));
        /* trailing column is copied as a plain byte */
        dst[8] = src[8];
        src += srcStride;
        dst += dstStride;
        row++;
    }
}
db20b987c32d divx5-gmc support
michaelni
parents: 252
diff changeset
1554
954
13aec7e50c52 qpel in mmx2/3dnow
michaelni
parents: 945
diff changeset
1555
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1556 #define QPEL_MC(r, OPNAME, RND, OP) \
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1557 static void OPNAME ## mpeg4_qpel8_h_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride, int h){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1558 uint8_t *cm = cropTbl + MAX_NEG_CROP;\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1559 int i;\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1560 for(i=0; i<h; i++)\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1561 {\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1562 OP(dst[0], (src[0]+src[1])*20 - (src[0]+src[2])*6 + (src[1]+src[3])*3 - (src[2]+src[4]));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1563 OP(dst[1], (src[1]+src[2])*20 - (src[0]+src[3])*6 + (src[0]+src[4])*3 - (src[1]+src[5]));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1564 OP(dst[2], (src[2]+src[3])*20 - (src[1]+src[4])*6 + (src[0]+src[5])*3 - (src[0]+src[6]));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1565 OP(dst[3], (src[3]+src[4])*20 - (src[2]+src[5])*6 + (src[1]+src[6])*3 - (src[0]+src[7]));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1566 OP(dst[4], (src[4]+src[5])*20 - (src[3]+src[6])*6 + (src[2]+src[7])*3 - (src[1]+src[8]));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1567 OP(dst[5], (src[5]+src[6])*20 - (src[4]+src[7])*6 + (src[3]+src[8])*3 - (src[2]+src[8]));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1568 OP(dst[6], (src[6]+src[7])*20 - (src[5]+src[8])*6 + (src[4]+src[8])*3 - (src[3]+src[7]));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1569 OP(dst[7], (src[7]+src[8])*20 - (src[6]+src[8])*6 + (src[5]+src[7])*3 - (src[4]+src[6]));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1570 dst+=dstStride;\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1571 src+=srcStride;\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1572 }\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1573 }\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1574 \
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1575 static void OPNAME ## mpeg4_qpel8_v_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride){\
984
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1576 const int w=8;\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1577 uint8_t *cm = cropTbl + MAX_NEG_CROP;\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1578 int i;\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1579 for(i=0; i<w; i++)\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1580 {\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1581 const int src0= src[0*srcStride];\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1582 const int src1= src[1*srcStride];\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1583 const int src2= src[2*srcStride];\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1584 const int src3= src[3*srcStride];\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1585 const int src4= src[4*srcStride];\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1586 const int src5= src[5*srcStride];\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1587 const int src6= src[6*srcStride];\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1588 const int src7= src[7*srcStride];\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1589 const int src8= src[8*srcStride];\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1590 OP(dst[0*dstStride], (src0+src1)*20 - (src0+src2)*6 + (src1+src3)*3 - (src2+src4));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1591 OP(dst[1*dstStride], (src1+src2)*20 - (src0+src3)*6 + (src0+src4)*3 - (src1+src5));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1592 OP(dst[2*dstStride], (src2+src3)*20 - (src1+src4)*6 + (src0+src5)*3 - (src0+src6));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1593 OP(dst[3*dstStride], (src3+src4)*20 - (src2+src5)*6 + (src1+src6)*3 - (src0+src7));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1594 OP(dst[4*dstStride], (src4+src5)*20 - (src3+src6)*6 + (src2+src7)*3 - (src1+src8));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1595 OP(dst[5*dstStride], (src5+src6)*20 - (src4+src7)*6 + (src3+src8)*3 - (src2+src8));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1596 OP(dst[6*dstStride], (src6+src7)*20 - (src5+src8)*6 + (src4+src8)*3 - (src3+src7));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1597 OP(dst[7*dstStride], (src7+src8)*20 - (src6+src8)*6 + (src5+src7)*3 - (src4+src6));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1598 dst++;\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1599 src++;\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1600 }\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1601 }\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1602 \
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1603 static void OPNAME ## mpeg4_qpel16_h_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride, int h){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1604 uint8_t *cm = cropTbl + MAX_NEG_CROP;\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1605 int i;\
954
13aec7e50c52 qpel in mmx2/3dnow
michaelni
parents: 945
diff changeset
1606 \
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1607 for(i=0; i<h; i++)\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1608 {\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1609 OP(dst[ 0], (src[ 0]+src[ 1])*20 - (src[ 0]+src[ 2])*6 + (src[ 1]+src[ 3])*3 - (src[ 2]+src[ 4]));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1610 OP(dst[ 1], (src[ 1]+src[ 2])*20 - (src[ 0]+src[ 3])*6 + (src[ 0]+src[ 4])*3 - (src[ 1]+src[ 5]));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1611 OP(dst[ 2], (src[ 2]+src[ 3])*20 - (src[ 1]+src[ 4])*6 + (src[ 0]+src[ 5])*3 - (src[ 0]+src[ 6]));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1612 OP(dst[ 3], (src[ 3]+src[ 4])*20 - (src[ 2]+src[ 5])*6 + (src[ 1]+src[ 6])*3 - (src[ 0]+src[ 7]));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1613 OP(dst[ 4], (src[ 4]+src[ 5])*20 - (src[ 3]+src[ 6])*6 + (src[ 2]+src[ 7])*3 - (src[ 1]+src[ 8]));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1614 OP(dst[ 5], (src[ 5]+src[ 6])*20 - (src[ 4]+src[ 7])*6 + (src[ 3]+src[ 8])*3 - (src[ 2]+src[ 9]));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1615 OP(dst[ 6], (src[ 6]+src[ 7])*20 - (src[ 5]+src[ 8])*6 + (src[ 4]+src[ 9])*3 - (src[ 3]+src[10]));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1616 OP(dst[ 7], (src[ 7]+src[ 8])*20 - (src[ 6]+src[ 9])*6 + (src[ 5]+src[10])*3 - (src[ 4]+src[11]));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1617 OP(dst[ 8], (src[ 8]+src[ 9])*20 - (src[ 7]+src[10])*6 + (src[ 6]+src[11])*3 - (src[ 5]+src[12]));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1618 OP(dst[ 9], (src[ 9]+src[10])*20 - (src[ 8]+src[11])*6 + (src[ 7]+src[12])*3 - (src[ 6]+src[13]));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1619 OP(dst[10], (src[10]+src[11])*20 - (src[ 9]+src[12])*6 + (src[ 8]+src[13])*3 - (src[ 7]+src[14]));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1620 OP(dst[11], (src[11]+src[12])*20 - (src[10]+src[13])*6 + (src[ 9]+src[14])*3 - (src[ 8]+src[15]));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1621 OP(dst[12], (src[12]+src[13])*20 - (src[11]+src[14])*6 + (src[10]+src[15])*3 - (src[ 9]+src[16]));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1622 OP(dst[13], (src[13]+src[14])*20 - (src[12]+src[15])*6 + (src[11]+src[16])*3 - (src[10]+src[16]));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1623 OP(dst[14], (src[14]+src[15])*20 - (src[13]+src[16])*6 + (src[12]+src[16])*3 - (src[11]+src[15]));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1624 OP(dst[15], (src[15]+src[16])*20 - (src[14]+src[16])*6 + (src[13]+src[15])*3 - (src[12]+src[14]));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1625 dst+=dstStride;\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1626 src+=srcStride;\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1627 }\
255
db20b987c32d divx5-gmc support
michaelni
parents: 252
diff changeset
1628 }\
db20b987c32d divx5-gmc support
michaelni
parents: 252
diff changeset
1629 \
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1630 static void OPNAME ## mpeg4_qpel16_v_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1631 uint8_t *cm = cropTbl + MAX_NEG_CROP;\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1632 int i;\
954
13aec7e50c52 qpel in mmx2/3dnow
michaelni
parents: 945
diff changeset
1633 const int w=16;\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1634 for(i=0; i<w; i++)\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1635 {\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1636 const int src0= src[0*srcStride];\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1637 const int src1= src[1*srcStride];\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1638 const int src2= src[2*srcStride];\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1639 const int src3= src[3*srcStride];\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1640 const int src4= src[4*srcStride];\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1641 const int src5= src[5*srcStride];\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1642 const int src6= src[6*srcStride];\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1643 const int src7= src[7*srcStride];\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1644 const int src8= src[8*srcStride];\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1645 const int src9= src[9*srcStride];\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1646 const int src10= src[10*srcStride];\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1647 const int src11= src[11*srcStride];\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1648 const int src12= src[12*srcStride];\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1649 const int src13= src[13*srcStride];\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1650 const int src14= src[14*srcStride];\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1651 const int src15= src[15*srcStride];\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1652 const int src16= src[16*srcStride];\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1653 OP(dst[ 0*dstStride], (src0 +src1 )*20 - (src0 +src2 )*6 + (src1 +src3 )*3 - (src2 +src4 ));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1654 OP(dst[ 1*dstStride], (src1 +src2 )*20 - (src0 +src3 )*6 + (src0 +src4 )*3 - (src1 +src5 ));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1655 OP(dst[ 2*dstStride], (src2 +src3 )*20 - (src1 +src4 )*6 + (src0 +src5 )*3 - (src0 +src6 ));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1656 OP(dst[ 3*dstStride], (src3 +src4 )*20 - (src2 +src5 )*6 + (src1 +src6 )*3 - (src0 +src7 ));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1657 OP(dst[ 4*dstStride], (src4 +src5 )*20 - (src3 +src6 )*6 + (src2 +src7 )*3 - (src1 +src8 ));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1658 OP(dst[ 5*dstStride], (src5 +src6 )*20 - (src4 +src7 )*6 + (src3 +src8 )*3 - (src2 +src9 ));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1659 OP(dst[ 6*dstStride], (src6 +src7 )*20 - (src5 +src8 )*6 + (src4 +src9 )*3 - (src3 +src10));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1660 OP(dst[ 7*dstStride], (src7 +src8 )*20 - (src6 +src9 )*6 + (src5 +src10)*3 - (src4 +src11));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1661 OP(dst[ 8*dstStride], (src8 +src9 )*20 - (src7 +src10)*6 + (src6 +src11)*3 - (src5 +src12));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1662 OP(dst[ 9*dstStride], (src9 +src10)*20 - (src8 +src11)*6 + (src7 +src12)*3 - (src6 +src13));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1663 OP(dst[10*dstStride], (src10+src11)*20 - (src9 +src12)*6 + (src8 +src13)*3 - (src7 +src14));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1664 OP(dst[11*dstStride], (src11+src12)*20 - (src10+src13)*6 + (src9 +src14)*3 - (src8 +src15));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1665 OP(dst[12*dstStride], (src12+src13)*20 - (src11+src14)*6 + (src10+src15)*3 - (src9 +src16));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1666 OP(dst[13*dstStride], (src13+src14)*20 - (src12+src15)*6 + (src11+src16)*3 - (src10+src16));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1667 OP(dst[14*dstStride], (src14+src15)*20 - (src13+src16)*6 + (src12+src16)*3 - (src11+src15));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1668 OP(dst[15*dstStride], (src15+src16)*20 - (src14+src16)*6 + (src13+src15)*3 - (src12+src14));\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1669 dst++;\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1670 src++;\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1671 }\
255
db20b987c32d divx5-gmc support
michaelni
parents: 252
diff changeset
1672 }\
db20b987c32d divx5-gmc support
michaelni
parents: 252
diff changeset
1673 \
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1674 static void OPNAME ## qpel8_mc00_c (uint8_t *dst, uint8_t *src, int stride){\
859
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
1675 OPNAME ## pixels8_c(dst, src, stride, 8);\
255
db20b987c32d divx5-gmc support
michaelni
parents: 252
diff changeset
1676 }\
db20b987c32d divx5-gmc support
michaelni
parents: 252
diff changeset
1677 \
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1678 static void OPNAME ## qpel8_mc10_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1679 uint8_t half[64];\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1680 put ## RND ## mpeg4_qpel8_h_lowpass(half, src, 8, stride, 8);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1681 OPNAME ## pixels8_l2(dst, src, half, stride, stride, 8, 8);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1682 }\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1683 \
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1684 static void OPNAME ## qpel8_mc20_c(uint8_t *dst, uint8_t *src, int stride){\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1685 OPNAME ## mpeg4_qpel8_h_lowpass(dst, src, stride, stride, 8);\
255
db20b987c32d divx5-gmc support
michaelni
parents: 252
diff changeset
1686 }\
db20b987c32d divx5-gmc support
michaelni
parents: 252
diff changeset
1687 \
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1688 static void OPNAME ## qpel8_mc30_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1689 uint8_t half[64];\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1690 put ## RND ## mpeg4_qpel8_h_lowpass(half, src, 8, stride, 8);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1691 OPNAME ## pixels8_l2(dst, src+1, half, stride, stride, 8, 8);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1692 }\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1693 \
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1694 static void OPNAME ## qpel8_mc01_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1695 uint8_t full[16*9];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1696 uint8_t half[64];\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1697 copy_block9(full, src, 16, stride, 9);\
984
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1698 put ## RND ## mpeg4_qpel8_v_lowpass(half, full, 8, 16);\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1699 OPNAME ## pixels8_l2(dst, full, half, stride, 16, 8, 8);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1700 }\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1701 \
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1702 static void OPNAME ## qpel8_mc02_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1703 uint8_t full[16*9];\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1704 copy_block9(full, src, 16, stride, 9);\
984
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1705 OPNAME ## mpeg4_qpel8_v_lowpass(dst, full, stride, 16);\
255
db20b987c32d divx5-gmc support
michaelni
parents: 252
diff changeset
1706 }\
db20b987c32d divx5-gmc support
michaelni
parents: 252
diff changeset
1707 \
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1708 static void OPNAME ## qpel8_mc03_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1709 uint8_t full[16*9];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1710 uint8_t half[64];\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1711 copy_block9(full, src, 16, stride, 9);\
984
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1712 put ## RND ## mpeg4_qpel8_v_lowpass(half, full, 8, 16);\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1713 OPNAME ## pixels8_l2(dst, full+16, half, stride, 16, 8, 8);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1714 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1715 void ff_ ## OPNAME ## qpel8_mc11_old_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1716 uint8_t full[16*9];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1717 uint8_t halfH[72];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1718 uint8_t halfV[64];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1719 uint8_t halfHV[64];\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1720 copy_block9(full, src, 16, stride, 9);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1721 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9);\
984
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1722 put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full, 8, 16);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1723 put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8);\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1724 OPNAME ## pixels8_l4(dst, full, halfH, halfV, halfHV, stride, 16, 8, 8, 8, 8);\
255
db20b987c32d divx5-gmc support
michaelni
parents: 252
diff changeset
1725 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1726 static void OPNAME ## qpel8_mc11_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1727 uint8_t full[16*9];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1728 uint8_t halfH[72];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1729 uint8_t halfHV[64];\
984
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1730 copy_block9(full, src, 16, stride, 9);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1731 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1732 put ## RND ## pixels8_l2(halfH, halfH, full, 8, 8, 16, 9);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1733 put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1734 OPNAME ## pixels8_l2(dst, halfH, halfHV, stride, 8, 8, 8);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1735 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1736 void ff_ ## OPNAME ## qpel8_mc31_old_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1737 uint8_t full[16*9];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1738 uint8_t halfH[72];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1739 uint8_t halfV[64];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1740 uint8_t halfHV[64];\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1741 copy_block9(full, src, 16, stride, 9);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1742 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9);\
984
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1743 put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full+1, 8, 16);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1744 put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8);\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1745 OPNAME ## pixels8_l4(dst, full+1, halfH, halfV, halfHV, stride, 16, 8, 8, 8, 8);\
255
db20b987c32d divx5-gmc support
michaelni
parents: 252
diff changeset
1746 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1747 static void OPNAME ## qpel8_mc31_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1748 uint8_t full[16*9];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1749 uint8_t halfH[72];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1750 uint8_t halfHV[64];\
984
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1751 copy_block9(full, src, 16, stride, 9);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1752 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1753 put ## RND ## pixels8_l2(halfH, halfH, full+1, 8, 8, 16, 9);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1754 put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1755 OPNAME ## pixels8_l2(dst, halfH, halfHV, stride, 8, 8, 8);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1756 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1757 void ff_ ## OPNAME ## qpel8_mc13_old_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1758 uint8_t full[16*9];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1759 uint8_t halfH[72];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1760 uint8_t halfV[64];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1761 uint8_t halfHV[64];\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1762 copy_block9(full, src, 16, stride, 9);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1763 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9);\
984
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1764 put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full, 8, 16);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1765 put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8);\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1766 OPNAME ## pixels8_l4(dst, full+16, halfH+8, halfV, halfHV, stride, 16, 8, 8, 8, 8);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1767 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1768 static void OPNAME ## qpel8_mc13_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1769 uint8_t full[16*9];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1770 uint8_t halfH[72];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1771 uint8_t halfHV[64];\
984
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1772 copy_block9(full, src, 16, stride, 9);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1773 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1774 put ## RND ## pixels8_l2(halfH, halfH, full, 8, 8, 16, 9);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1775 put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1776 OPNAME ## pixels8_l2(dst, halfH+8, halfHV, stride, 8, 8, 8);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1777 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1778 void ff_ ## OPNAME ## qpel8_mc33_old_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1779 uint8_t full[16*9];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1780 uint8_t halfH[72];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1781 uint8_t halfV[64];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1782 uint8_t halfHV[64];\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1783 copy_block9(full, src, 16, stride, 9);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1784 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full , 8, 16, 9);\
984
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1785 put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full+1, 8, 16);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1786 put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8);\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1787 OPNAME ## pixels8_l4(dst, full+17, halfH+8, halfV, halfHV, stride, 16, 8, 8, 8, 8);\
255
db20b987c32d divx5-gmc support
michaelni
parents: 252
diff changeset
1788 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1789 static void OPNAME ## qpel8_mc33_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1790 uint8_t full[16*9];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1791 uint8_t halfH[72];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1792 uint8_t halfHV[64];\
984
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1793 copy_block9(full, src, 16, stride, 9);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1794 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1795 put ## RND ## pixels8_l2(halfH, halfH, full+1, 8, 8, 16, 9);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1796 put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1797 OPNAME ## pixels8_l2(dst, halfH+8, halfHV, stride, 8, 8, 8);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1798 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1799 static void OPNAME ## qpel8_mc21_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1800 uint8_t halfH[72];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1801 uint8_t halfHV[64];\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1802 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, src, 8, stride, 9);\
984
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1803 put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8);\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1804 OPNAME ## pixels8_l2(dst, halfH, halfHV, stride, 8, 8, 8);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1805 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1806 static void OPNAME ## qpel8_mc23_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1807 uint8_t halfH[72];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1808 uint8_t halfHV[64];\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1809 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, src, 8, stride, 9);\
984
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1810 put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8);\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1811 OPNAME ## pixels8_l2(dst, halfH+8, halfHV, stride, 8, 8, 8);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1812 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1813 void ff_ ## OPNAME ## qpel8_mc12_old_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1814 uint8_t full[16*9];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1815 uint8_t halfH[72];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1816 uint8_t halfV[64];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1817 uint8_t halfHV[64];\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1818 copy_block9(full, src, 16, stride, 9);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1819 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9);\
984
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1820 put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full, 8, 16);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1821 put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8);\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1822 OPNAME ## pixels8_l2(dst, halfV, halfHV, stride, 8, 8, 8);\
255
db20b987c32d divx5-gmc support
michaelni
parents: 252
diff changeset
1823 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1824 static void OPNAME ## qpel8_mc12_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1825 uint8_t full[16*9];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1826 uint8_t halfH[72];\
984
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1827 copy_block9(full, src, 16, stride, 9);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1828 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1829 put ## RND ## pixels8_l2(halfH, halfH, full, 8, 8, 16, 9);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1830 OPNAME ## mpeg4_qpel8_v_lowpass(dst, halfH, stride, 8);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1831 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1832 void ff_ ## OPNAME ## qpel8_mc32_old_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1833 uint8_t full[16*9];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1834 uint8_t halfH[72];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1835 uint8_t halfV[64];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1836 uint8_t halfHV[64];\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1837 copy_block9(full, src, 16, stride, 9);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1838 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9);\
984
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1839 put ## RND ## mpeg4_qpel8_v_lowpass(halfV, full+1, 8, 16);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1840 put ## RND ## mpeg4_qpel8_v_lowpass(halfHV, halfH, 8, 8);\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1841 OPNAME ## pixels8_l2(dst, halfV, halfHV, stride, 8, 8, 8);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1842 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1843 static void OPNAME ## qpel8_mc32_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1844 uint8_t full[16*9];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1845 uint8_t halfH[72];\
984
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1846 copy_block9(full, src, 16, stride, 9);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1847 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, full, 8, 16, 9);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1848 put ## RND ## pixels8_l2(halfH, halfH, full+1, 8, 8, 16, 9);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1849 OPNAME ## mpeg4_qpel8_v_lowpass(dst, halfH, stride, 8);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1850 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1851 static void OPNAME ## qpel8_mc22_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1852 uint8_t halfH[72];\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1853 put ## RND ## mpeg4_qpel8_h_lowpass(halfH, src, 8, stride, 9);\
984
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1854 OPNAME ## mpeg4_qpel8_v_lowpass(dst, halfH, stride, 8);\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1855 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1856 static void OPNAME ## qpel16_mc00_c (uint8_t *dst, uint8_t *src, int stride){\
859
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
1857 OPNAME ## pixels16_c(dst, src, stride, 16);\
255
db20b987c32d divx5-gmc support
michaelni
parents: 252
diff changeset
1858 }\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1859 \
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1860 static void OPNAME ## qpel16_mc10_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1861 uint8_t half[256];\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1862 put ## RND ## mpeg4_qpel16_h_lowpass(half, src, 16, stride, 16);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1863 OPNAME ## pixels16_l2(dst, src, half, stride, stride, 16, 16);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1864 }\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1865 \
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1866 static void OPNAME ## qpel16_mc20_c(uint8_t *dst, uint8_t *src, int stride){\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1867 OPNAME ## mpeg4_qpel16_h_lowpass(dst, src, stride, stride, 16);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1868 }\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1869 \
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1870 static void OPNAME ## qpel16_mc30_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1871 uint8_t half[256];\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1872 put ## RND ## mpeg4_qpel16_h_lowpass(half, src, 16, stride, 16);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1873 OPNAME ## pixels16_l2(dst, src+1, half, stride, stride, 16, 16);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1874 }\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1875 \
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1876 static void OPNAME ## qpel16_mc01_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1877 uint8_t full[24*17];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1878 uint8_t half[256];\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1879 copy_block17(full, src, 24, stride, 17);\
954
13aec7e50c52 qpel in mmx2/3dnow
michaelni
parents: 945
diff changeset
1880 put ## RND ## mpeg4_qpel16_v_lowpass(half, full, 16, 24);\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1881 OPNAME ## pixels16_l2(dst, full, half, stride, 24, 16, 16);\
255
db20b987c32d divx5-gmc support
michaelni
parents: 252
diff changeset
1882 }\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1883 \
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1884 static void OPNAME ## qpel16_mc02_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1885 uint8_t full[24*17];\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1886 copy_block17(full, src, 24, stride, 17);\
954
13aec7e50c52 qpel in mmx2/3dnow
michaelni
parents: 945
diff changeset
1887 OPNAME ## mpeg4_qpel16_v_lowpass(dst, full, stride, 24);\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1888 }\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1889 \
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1890 static void OPNAME ## qpel16_mc03_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1891 uint8_t full[24*17];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1892 uint8_t half[256];\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1893 copy_block17(full, src, 24, stride, 17);\
954
13aec7e50c52 qpel in mmx2/3dnow
michaelni
parents: 945
diff changeset
1894 put ## RND ## mpeg4_qpel16_v_lowpass(half, full, 16, 24);\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1895 OPNAME ## pixels16_l2(dst, full+24, half, stride, 24, 16, 16);\
255
db20b987c32d divx5-gmc support
michaelni
parents: 252
diff changeset
1896 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1897 void ff_ ## OPNAME ## qpel16_mc11_old_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1898 uint8_t full[24*17];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1899 uint8_t halfH[272];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1900 uint8_t halfV[256];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1901 uint8_t halfHV[256];\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1902 copy_block17(full, src, 24, stride, 17);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1903 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17);\
954
13aec7e50c52 qpel in mmx2/3dnow
michaelni
parents: 945
diff changeset
1904 put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full, 16, 24);\
13aec7e50c52 qpel in mmx2/3dnow
michaelni
parents: 945
diff changeset
1905 put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16);\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1906 OPNAME ## pixels16_l4(dst, full, halfH, halfV, halfHV, stride, 24, 16, 16, 16, 16);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1907 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1908 static void OPNAME ## qpel16_mc11_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1909 uint8_t full[24*17];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1910 uint8_t halfH[272];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1911 uint8_t halfHV[256];\
984
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1912 copy_block17(full, src, 24, stride, 17);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1913 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1914 put ## RND ## pixels16_l2(halfH, halfH, full, 16, 16, 24, 17);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1915 put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1916 OPNAME ## pixels16_l2(dst, halfH, halfHV, stride, 16, 16, 16);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1917 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1918 void ff_ ## OPNAME ## qpel16_mc31_old_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1919 uint8_t full[24*17];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1920 uint8_t halfH[272];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1921 uint8_t halfV[256];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1922 uint8_t halfHV[256];\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1923 copy_block17(full, src, 24, stride, 17);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1924 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17);\
954
13aec7e50c52 qpel in mmx2/3dnow
michaelni
parents: 945
diff changeset
1925 put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full+1, 16, 24);\
13aec7e50c52 qpel in mmx2/3dnow
michaelni
parents: 945
diff changeset
1926 put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16);\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1927 OPNAME ## pixels16_l4(dst, full+1, halfH, halfV, halfHV, stride, 24, 16, 16, 16, 16);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1928 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1929 static void OPNAME ## qpel16_mc31_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1930 uint8_t full[24*17];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1931 uint8_t halfH[272];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1932 uint8_t halfHV[256];\
984
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1933 copy_block17(full, src, 24, stride, 17);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1934 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1935 put ## RND ## pixels16_l2(halfH, halfH, full+1, 16, 16, 24, 17);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1936 put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1937 OPNAME ## pixels16_l2(dst, halfH, halfHV, stride, 16, 16, 16);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1938 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1939 void ff_ ## OPNAME ## qpel16_mc13_old_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1940 uint8_t full[24*17];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1941 uint8_t halfH[272];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1942 uint8_t halfV[256];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1943 uint8_t halfHV[256];\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1944 copy_block17(full, src, 24, stride, 17);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1945 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17);\
954
13aec7e50c52 qpel in mmx2/3dnow
michaelni
parents: 945
diff changeset
1946 put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full, 16, 24);\
13aec7e50c52 qpel in mmx2/3dnow
michaelni
parents: 945
diff changeset
1947 put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16);\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1948 OPNAME ## pixels16_l4(dst, full+24, halfH+16, halfV, halfHV, stride, 24, 16, 16, 16, 16);\
255
db20b987c32d divx5-gmc support
michaelni
parents: 252
diff changeset
1949 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1950 static void OPNAME ## qpel16_mc13_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1951 uint8_t full[24*17];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1952 uint8_t halfH[272];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1953 uint8_t halfHV[256];\
984
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1954 copy_block17(full, src, 24, stride, 17);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1955 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1956 put ## RND ## pixels16_l2(halfH, halfH, full, 16, 16, 24, 17);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1957 put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1958 OPNAME ## pixels16_l2(dst, halfH+16, halfHV, stride, 16, 16, 16);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1959 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1960 void ff_ ## OPNAME ## qpel16_mc33_old_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1961 uint8_t full[24*17];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1962 uint8_t halfH[272];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1963 uint8_t halfV[256];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1964 uint8_t halfHV[256];\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1965 copy_block17(full, src, 24, stride, 17);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1966 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full , 16, 24, 17);\
954
13aec7e50c52 qpel in mmx2/3dnow
michaelni
parents: 945
diff changeset
1967 put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full+1, 16, 24);\
13aec7e50c52 qpel in mmx2/3dnow
michaelni
parents: 945
diff changeset
1968 put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16);\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1969 OPNAME ## pixels16_l4(dst, full+25, halfH+16, halfV, halfHV, stride, 24, 16, 16, 16, 16);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1970 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1971 static void OPNAME ## qpel16_mc33_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1972 uint8_t full[24*17];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1973 uint8_t halfH[272];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1974 uint8_t halfHV[256];\
984
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1975 copy_block17(full, src, 24, stride, 17);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1976 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1977 put ## RND ## pixels16_l2(halfH, halfH, full+1, 16, 16, 24, 17);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1978 put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1979 OPNAME ## pixels16_l2(dst, halfH+16, halfHV, stride, 16, 16, 16);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
1980 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1981 static void OPNAME ## qpel16_mc21_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1982 uint8_t halfH[272];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1983 uint8_t halfHV[256];\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1984 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, src, 16, stride, 17);\
954
13aec7e50c52 qpel in mmx2/3dnow
michaelni
parents: 945
diff changeset
1985 put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16);\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1986 OPNAME ## pixels16_l2(dst, halfH, halfHV, stride, 16, 16, 16);\
255
db20b987c32d divx5-gmc support
michaelni
parents: 252
diff changeset
1987 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1988 static void OPNAME ## qpel16_mc23_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1989 uint8_t halfH[272];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1990 uint8_t halfHV[256];\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1991 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, src, 16, stride, 17);\
954
13aec7e50c52 qpel in mmx2/3dnow
michaelni
parents: 945
diff changeset
1992 put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16);\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1993 OPNAME ## pixels16_l2(dst, halfH+16, halfHV, stride, 16, 16, 16);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
1994 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1995 void ff_ ## OPNAME ## qpel16_mc12_old_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1996 uint8_t full[24*17];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1997 uint8_t halfH[272];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1998 uint8_t halfV[256];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
1999 uint8_t halfHV[256];\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
2000 copy_block17(full, src, 24, stride, 17);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
2001 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17);\
954
13aec7e50c52 qpel in mmx2/3dnow
michaelni
parents: 945
diff changeset
2002 put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full, 16, 24);\
13aec7e50c52 qpel in mmx2/3dnow
michaelni
parents: 945
diff changeset
2003 put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16);\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
2004 OPNAME ## pixels16_l2(dst, halfV, halfHV, stride, 16, 16, 16);\
255
db20b987c32d divx5-gmc support
michaelni
parents: 252
diff changeset
2005 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
2006 static void OPNAME ## qpel16_mc12_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
2007 uint8_t full[24*17];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
2008 uint8_t halfH[272];\
984
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
2009 copy_block17(full, src, 24, stride, 17);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
2010 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
2011 put ## RND ## pixels16_l2(halfH, halfH, full, 16, 16, 24, 17);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
2012 OPNAME ## mpeg4_qpel16_v_lowpass(dst, halfH, stride, 16);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
2013 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
2014 void ff_ ## OPNAME ## qpel16_mc32_old_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
2015 uint8_t full[24*17];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
2016 uint8_t halfH[272];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
2017 uint8_t halfV[256];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
2018 uint8_t halfHV[256];\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
2019 copy_block17(full, src, 24, stride, 17);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
2020 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17);\
954
13aec7e50c52 qpel in mmx2/3dnow
michaelni
parents: 945
diff changeset
2021 put ## RND ## mpeg4_qpel16_v_lowpass(halfV, full+1, 16, 24);\
13aec7e50c52 qpel in mmx2/3dnow
michaelni
parents: 945
diff changeset
2022 put ## RND ## mpeg4_qpel16_v_lowpass(halfHV, halfH, 16, 16);\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
2023 OPNAME ## pixels16_l2(dst, halfV, halfHV, stride, 16, 16, 16);\
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
2024 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
2025 static void OPNAME ## qpel16_mc32_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
2026 uint8_t full[24*17];\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
2027 uint8_t halfH[272];\
984
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
2028 copy_block17(full, src, 24, stride, 17);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
2029 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, full, 16, 24, 17);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
2030 put ## RND ## pixels16_l2(halfH, halfH, full+1, 16, 16, 24, 17);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
2031 OPNAME ## mpeg4_qpel16_v_lowpass(dst, halfH, stride, 16);\
e162c09efbe7 qpel fix
michaelni
parents: 954
diff changeset
2032 }\
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
2033 static void OPNAME ## qpel16_mc22_c(uint8_t *dst, uint8_t *src, int stride){\
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
2034 uint8_t halfH[272];\
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
2035 put ## RND ## mpeg4_qpel16_h_lowpass(halfH, src, 16, stride, 17);\
954
13aec7e50c52 qpel in mmx2/3dnow
michaelni
parents: 945
diff changeset
2036 OPNAME ## mpeg4_qpel16_v_lowpass(dst, halfH, stride, 16);\
859
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
2037 }
255
db20b987c32d divx5-gmc support
michaelni
parents: 252
diff changeset
2038
651
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
2039 #define op_avg(a, b) a = (((a)+cm[((b) + 16)>>5]+1)>>1)
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
2040 #define op_avg_no_rnd(a, b) a = (((a)+cm[((b) + 15)>>5])>>1)
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
2041 #define op_put(a, b) a = cm[((b) + 16)>>5]
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
2042 #define op_put_no_rnd(a, b) a = cm[((b) + 15)>>5]
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
2043
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
2044 QPEL_MC(0, put_ , _ , op_put)
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
2045 QPEL_MC(1, put_no_rnd_, _no_rnd_, op_put_no_rnd)
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
2046 QPEL_MC(0, avg_ , _ , op_avg)
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
2047 //QPEL_MC(1, avg_no_rnd , _ , op_avg)
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
2048 #undef op_avg
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
2049 #undef op_avg_no_rnd
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
2050 #undef op_put
45e8f39fda50 put/avg_pixels16
michaelni
parents: 638
diff changeset
2051 #undef op_put_no_rnd
255
db20b987c32d divx5-gmc support
michaelni
parents: 252
diff changeset
2052
1168
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2053 #if 1
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
/*
 * H264_LOWPASS(OPNAME, OP, OP2) expands to a family of static functions that
 * apply the 6-tap kernel (1, -5, 20, 20, -5, 1) to 8-bit samples:
 *
 *   OPNAME##h264_qpelN_h_lowpass   filter along each row        (N = 4, 8, 16)
 *   OPNAME##h264_qpelN_v_lowpass   filter along each column     (N = 4, 8, 16)
 *   OPNAME##h264_qpelN_hv_lowpass  filter rows into the int16_t scratch
 *                                  buffer `tmp`, then filter its columns
 *
 * OP(lvalue, sum) stores the sum of one filter pass, OP2(lvalue, sum) stores
 * the sum after two passes. Both are provided by the instantiating code and
 * may use the local pointer `cm` (cropTbl + MAX_NEG_CROP).
 *
 * Access pattern visible in the code:
 *   - h pass: reads src[-2] .. src[N+2] on each of the N rows
 *   - v pass: reads rows -2 .. N+2 of each of the N columns
 *   - hv pass (N = 4, 8): reads rows -2 .. N+2 and columns -2 .. N+2 of src
 *     and writes N+5 rows of N values into `tmp`
 *   - the 16-wide functions are four calls of the 8-wide ones; the hv variant
 *     passes `tmp` / `tmp+8` and reuses the same scratch rows for the lower half
 *
 * In the v and hv column passes every input sample of a column is loaded
 * before the first store to dst.
 */
#define H264_LOWPASS(OPNAME, OP, OP2) \
static void OPNAME ## h264_qpel4_h_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride){\
    uint8_t *cm = cropTbl + MAX_NEG_CROP;\
    int row, x;\
    for(row=0; row<4; row++){\
        for(x=0; x<4; x++){\
            OP(dst[x], (src[x]+src[x+1])*20 - (src[x-1]+src[x+2])*5 + (src[x-2]+src[x+3]));\
        }\
        dst+=dstStride;\
        src+=srcStride;\
    }\
}\
\
static void OPNAME ## h264_qpel4_v_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride){\
    uint8_t *cm = cropTbl + MAX_NEG_CROP;\
    int col, k;\
    for(col=0; col<4; col++){\
        int s[4+5]; /* s[k] holds the sample of row k-2 */\
        for(k=0; k<4+5; k++){\
            s[k]= src[(k-2)*srcStride];\
        }\
        for(k=0; k<4; k++){\
            OP(dst[k*dstStride], (s[k+2]+s[k+3])*20 - (s[k+1]+s[k+4])*5 + (s[k]+s[k+5]));\
        }\
        dst++;\
        src++;\
    }\
}\
\
static void OPNAME ## h264_qpel4_hv_lowpass(uint8_t *dst, int16_t *tmp, uint8_t *src, int dstStride, int tmpStride, int srcStride){\
    uint8_t *cm = cropTbl + MAX_NEG_CROP;\
    int row, col, k;\
    /* first pass: horizontal filter over rows -2 .. 6, unscaled sums go to tmp */\
    src -= 2*srcStride;\
    for(row=0; row<4+5; row++){\
        for(k=0; k<4; k++){\
            tmp[k]= (src[k]+src[k+1])*20 - (src[k-1]+src[k+2])*5 + (src[k-2]+src[k+3]);\
        }\
        tmp+=tmpStride;\
        src+=srcStride;\
    }\
    /* rewind so that tmp points at the row that corresponds to output row 0 */\
    tmp -= tmpStride*(4+5-2);\
    /* second pass: vertical filter over the intermediate sums */\
    for(col=0; col<4; col++){\
        int t[4+5]; /* t[k] holds the intermediate of row k-2 */\
        for(k=0; k<4+5; k++){\
            t[k]= tmp[(k-2)*tmpStride];\
        }\
        for(k=0; k<4; k++){\
            OP2(dst[k*dstStride], (t[k+2]+t[k+3])*20 - (t[k+1]+t[k+4])*5 + (t[k]+t[k+5]));\
        }\
        dst++;\
        tmp++;\
    }\
}\
\
static void OPNAME ## h264_qpel8_h_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride){\
    uint8_t *cm = cropTbl + MAX_NEG_CROP;\
    int row, x;\
    for(row=0; row<8; row++){\
        for(x=0; x<8; x++){\
            OP(dst[x], (src[x]+src[x+1])*20 - (src[x-1]+src[x+2])*5 + (src[x-2]+src[x+3]));\
        }\
        dst+=dstStride;\
        src+=srcStride;\
    }\
}\
\
static void OPNAME ## h264_qpel8_v_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride){\
    uint8_t *cm = cropTbl + MAX_NEG_CROP;\
    int col, k;\
    for(col=0; col<8; col++){\
        int s[8+5]; /* s[k] holds the sample of row k-2 */\
        for(k=0; k<8+5; k++){\
            s[k]= src[(k-2)*srcStride];\
        }\
        for(k=0; k<8; k++){\
            OP(dst[k*dstStride], (s[k+2]+s[k+3])*20 - (s[k+1]+s[k+4])*5 + (s[k]+s[k+5]));\
        }\
        dst++;\
        src++;\
    }\
}\
\
static void OPNAME ## h264_qpel8_hv_lowpass(uint8_t *dst, int16_t *tmp, uint8_t *src, int dstStride, int tmpStride, int srcStride){\
    uint8_t *cm = cropTbl + MAX_NEG_CROP;\
    int row, col, k;\
    /* first pass: horizontal filter over rows -2 .. 10, unscaled sums go to tmp */\
    src -= 2*srcStride;\
    for(row=0; row<8+5; row++){\
        for(k=0; k<8; k++){\
            tmp[k]= (src[k]+src[k+1])*20 - (src[k-1]+src[k+2])*5 + (src[k-2]+src[k+3]);\
        }\
        tmp+=tmpStride;\
        src+=srcStride;\
    }\
    /* rewind so that tmp points at the row that corresponds to output row 0 */\
    tmp -= tmpStride*(8+5-2);\
    /* second pass: vertical filter over the intermediate sums */\
    for(col=0; col<8; col++){\
        int t[8+5]; /* t[k] holds the intermediate of row k-2 */\
        for(k=0; k<8+5; k++){\
            t[k]= tmp[(k-2)*tmpStride];\
        }\
        for(k=0; k<8; k++){\
            OP2(dst[k*dstStride], (t[k+2]+t[k+3])*20 - (t[k+1]+t[k+4])*5 + (t[k]+t[k+5]));\
        }\
        dst++;\
        tmp++;\
    }\
}\
\
static void OPNAME ## h264_qpel16_v_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride){\
    uint8_t * const dstLow= dst + 8*dstStride;\
    uint8_t * const srcLow= src + 8*srcStride;\
    /* upper two 8x8 quadrants, then the lower two */\
    OPNAME ## h264_qpel8_v_lowpass(dst     , src     , dstStride, srcStride);\
    OPNAME ## h264_qpel8_v_lowpass(dst+8   , src+8   , dstStride, srcStride);\
    OPNAME ## h264_qpel8_v_lowpass(dstLow  , srcLow  , dstStride, srcStride);\
    OPNAME ## h264_qpel8_v_lowpass(dstLow+8, srcLow+8, dstStride, srcStride);\
}\
\
static void OPNAME ## h264_qpel16_h_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride){\
    uint8_t * const dstLow= dst + 8*dstStride;\
    uint8_t * const srcLow= src + 8*srcStride;\
    /* upper two 8x8 quadrants, then the lower two */\
    OPNAME ## h264_qpel8_h_lowpass(dst     , src     , dstStride, srcStride);\
    OPNAME ## h264_qpel8_h_lowpass(dst+8   , src+8   , dstStride, srcStride);\
    OPNAME ## h264_qpel8_h_lowpass(dstLow  , srcLow  , dstStride, srcStride);\
    OPNAME ## h264_qpel8_h_lowpass(dstLow+8, srcLow+8, dstStride, srcStride);\
}\
\
static void OPNAME ## h264_qpel16_hv_lowpass(uint8_t *dst, int16_t *tmp, uint8_t *src, int dstStride, int tmpStride, int srcStride){\
    uint8_t * const dstLow= dst + 8*dstStride;\
    uint8_t * const srcLow= src + 8*srcStride;\
    /* tmp is not advanced for the lower half: the scratch rows are reused */\
    OPNAME ## h264_qpel8_hv_lowpass(dst     , tmp  , src     , dstStride, tmpStride, srcStride);\
    OPNAME ## h264_qpel8_hv_lowpass(dst+8   , tmp+8, src+8   , dstStride, tmpStride, srcStride);\
    OPNAME ## h264_qpel8_hv_lowpass(dstLow  , tmp  , srcLow  , dstStride, tmpStride, srcStride);\
    OPNAME ## h264_qpel8_hv_lowpass(dstLow+8, tmp+8, srcLow+8, dstStride, tmpStride, srcStride);\
}
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2255
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2256 #define H264_MC(OPNAME, SIZE) \
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2257 static void OPNAME ## h264_qpel ## SIZE ## _mc00_c (uint8_t *dst, uint8_t *src, int stride){\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2258 OPNAME ## pixels ## SIZE ## _c(dst, src, stride, SIZE);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2259 }\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2260 \
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2261 static void OPNAME ## h264_qpel ## SIZE ## _mc10_c(uint8_t *dst, uint8_t *src, int stride){\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2262 uint8_t half[SIZE*SIZE];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2263 put_h264_qpel ## SIZE ## _h_lowpass(half, src, SIZE, stride);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2264 OPNAME ## pixels ## SIZE ## _l2(dst, src, half, stride, stride, SIZE, SIZE);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2265 }\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2266 \
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2267 static void OPNAME ## h264_qpel ## SIZE ## _mc20_c(uint8_t *dst, uint8_t *src, int stride){\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2268 OPNAME ## h264_qpel ## SIZE ## _h_lowpass(dst, src, stride, stride);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2269 }\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2270 \
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2271 static void OPNAME ## h264_qpel ## SIZE ## _mc30_c(uint8_t *dst, uint8_t *src, int stride){\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2272 uint8_t half[SIZE*SIZE];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2273 put_h264_qpel ## SIZE ## _h_lowpass(half, src, SIZE, stride);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2274 OPNAME ## pixels ## SIZE ## _l2(dst, src+1, half, stride, stride, SIZE, SIZE);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2275 }\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2276 \
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2277 static void OPNAME ## h264_qpel ## SIZE ## _mc01_c(uint8_t *dst, uint8_t *src, int stride){\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2278 uint8_t full[SIZE*(SIZE+5)];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2279 uint8_t * const full_mid= full + SIZE*2;\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2280 uint8_t half[SIZE*SIZE];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2281 copy_block ## SIZE (full, src - stride*2, SIZE, stride, SIZE + 5);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2282 put_h264_qpel ## SIZE ## _v_lowpass(half, full_mid, SIZE, SIZE);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2283 OPNAME ## pixels ## SIZE ## _l2(dst, full_mid, half, stride, SIZE, SIZE, SIZE);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2284 }\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2285 \
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2286 static void OPNAME ## h264_qpel ## SIZE ## _mc02_c(uint8_t *dst, uint8_t *src, int stride){\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2287 uint8_t full[SIZE*(SIZE+5)];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2288 uint8_t * const full_mid= full + SIZE*2;\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2289 copy_block ## SIZE (full, src - stride*2, SIZE, stride, SIZE + 5);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2290 OPNAME ## h264_qpel ## SIZE ## _v_lowpass(dst, full_mid, stride, SIZE);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2291 }\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2292 \
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2293 static void OPNAME ## h264_qpel ## SIZE ## _mc03_c(uint8_t *dst, uint8_t *src, int stride){\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2294 uint8_t full[SIZE*(SIZE+5)];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2295 uint8_t * const full_mid= full + SIZE*2;\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2296 uint8_t half[SIZE*SIZE];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2297 copy_block ## SIZE (full, src - stride*2, SIZE, stride, SIZE + 5);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2298 put_h264_qpel ## SIZE ## _v_lowpass(half, full_mid, SIZE, SIZE);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2299 OPNAME ## pixels ## SIZE ## _l2(dst, full_mid+SIZE, half, stride, SIZE, SIZE, SIZE);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2300 }\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2301 \
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2302 static void OPNAME ## h264_qpel ## SIZE ## _mc11_c(uint8_t *dst, uint8_t *src, int stride){\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2303 uint8_t full[SIZE*(SIZE+5)];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2304 uint8_t * const full_mid= full + SIZE*2;\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2305 uint8_t halfH[SIZE*SIZE];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2306 uint8_t halfV[SIZE*SIZE];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2307 put_h264_qpel ## SIZE ## _h_lowpass(halfH, src, SIZE, stride);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2308 copy_block ## SIZE (full, src - stride*2, SIZE, stride, SIZE + 5);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2309 put_h264_qpel ## SIZE ## _v_lowpass(halfV, full_mid, SIZE, SIZE);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2310 OPNAME ## pixels ## SIZE ## _l2(dst, halfH, halfV, stride, SIZE, SIZE, SIZE);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2311 }\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2312 \
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2313 static void OPNAME ## h264_qpel ## SIZE ## _mc31_c(uint8_t *dst, uint8_t *src, int stride){\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2314 uint8_t full[SIZE*(SIZE+5)];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2315 uint8_t * const full_mid= full + SIZE*2;\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2316 uint8_t halfH[SIZE*SIZE];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2317 uint8_t halfV[SIZE*SIZE];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2318 put_h264_qpel ## SIZE ## _h_lowpass(halfH, src, SIZE, stride);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2319 copy_block ## SIZE (full, src - stride*2 + 1, SIZE, stride, SIZE + 5);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2320 put_h264_qpel ## SIZE ## _v_lowpass(halfV, full_mid, SIZE, SIZE);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2321 OPNAME ## pixels ## SIZE ## _l2(dst, halfH, halfV, stride, SIZE, SIZE, SIZE);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2322 }\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2323 \
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2324 static void OPNAME ## h264_qpel ## SIZE ## _mc13_c(uint8_t *dst, uint8_t *src, int stride){\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2325 uint8_t full[SIZE*(SIZE+5)];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2326 uint8_t * const full_mid= full + SIZE*2;\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2327 uint8_t halfH[SIZE*SIZE];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2328 uint8_t halfV[SIZE*SIZE];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2329 put_h264_qpel ## SIZE ## _h_lowpass(halfH, src + stride, SIZE, stride);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2330 copy_block ## SIZE (full, src - stride*2, SIZE, stride, SIZE + 5);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2331 put_h264_qpel ## SIZE ## _v_lowpass(halfV, full_mid, SIZE, SIZE);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2332 OPNAME ## pixels ## SIZE ## _l2(dst, halfH, halfV, stride, SIZE, SIZE, SIZE);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2333 }\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2334 \
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2335 static void OPNAME ## h264_qpel ## SIZE ## _mc33_c(uint8_t *dst, uint8_t *src, int stride){\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2336 uint8_t full[SIZE*(SIZE+5)];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2337 uint8_t * const full_mid= full + SIZE*2;\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2338 uint8_t halfH[SIZE*SIZE];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2339 uint8_t halfV[SIZE*SIZE];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2340 put_h264_qpel ## SIZE ## _h_lowpass(halfH, src + stride, SIZE, stride);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2341 copy_block ## SIZE (full, src - stride*2 + 1, SIZE, stride, SIZE + 5);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2342 put_h264_qpel ## SIZE ## _v_lowpass(halfV, full_mid, SIZE, SIZE);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2343 OPNAME ## pixels ## SIZE ## _l2(dst, halfH, halfV, stride, SIZE, SIZE, SIZE);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2344 }\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2345 \
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2346 static void OPNAME ## h264_qpel ## SIZE ## _mc22_c(uint8_t *dst, uint8_t *src, int stride){\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2347 int16_t tmp[SIZE*(SIZE+5)];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2348 OPNAME ## h264_qpel ## SIZE ## _hv_lowpass(dst, tmp, src, stride, SIZE, stride);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2349 }\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2350 \
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2351 static void OPNAME ## h264_qpel ## SIZE ## _mc21_c(uint8_t *dst, uint8_t *src, int stride){\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2352 int16_t tmp[SIZE*(SIZE+5)];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2353 uint8_t halfH[SIZE*SIZE];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2354 uint8_t halfHV[SIZE*SIZE];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2355 put_h264_qpel ## SIZE ## _h_lowpass(halfH, src, SIZE, stride);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2356 put_h264_qpel ## SIZE ## _hv_lowpass(halfHV, tmp, src, SIZE, SIZE, stride);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2357 OPNAME ## pixels ## SIZE ## _l2(dst, halfH, halfHV, stride, SIZE, SIZE, SIZE);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2358 }\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2359 \
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2360 static void OPNAME ## h264_qpel ## SIZE ## _mc23_c(uint8_t *dst, uint8_t *src, int stride){\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2361 int16_t tmp[SIZE*(SIZE+5)];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2362 uint8_t halfH[SIZE*SIZE];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2363 uint8_t halfHV[SIZE*SIZE];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2364 put_h264_qpel ## SIZE ## _h_lowpass(halfH, src + stride, SIZE, stride);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2365 put_h264_qpel ## SIZE ## _hv_lowpass(halfHV, tmp, src, SIZE, SIZE, stride);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2366 OPNAME ## pixels ## SIZE ## _l2(dst, halfH, halfHV, stride, SIZE, SIZE, SIZE);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2367 }\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2368 \
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2369 static void OPNAME ## h264_qpel ## SIZE ## _mc12_c(uint8_t *dst, uint8_t *src, int stride){\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2370 uint8_t full[SIZE*(SIZE+5)];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2371 uint8_t * const full_mid= full + SIZE*2;\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2372 int16_t tmp[SIZE*(SIZE+5)];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2373 uint8_t halfV[SIZE*SIZE];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2374 uint8_t halfHV[SIZE*SIZE];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2375 copy_block ## SIZE (full, src - stride*2, SIZE, stride, SIZE + 5);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2376 put_h264_qpel ## SIZE ## _v_lowpass(halfV, full_mid, SIZE, SIZE);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2377 put_h264_qpel ## SIZE ## _hv_lowpass(halfHV, tmp, src, SIZE, SIZE, stride);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2378 OPNAME ## pixels ## SIZE ## _l2(dst, halfV, halfHV, stride, SIZE, SIZE, SIZE);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2379 }\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2380 \
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2381 static void OPNAME ## h264_qpel ## SIZE ## _mc32_c(uint8_t *dst, uint8_t *src, int stride){\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2382 uint8_t full[SIZE*(SIZE+5)];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2383 uint8_t * const full_mid= full + SIZE*2;\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2384 int16_t tmp[SIZE*(SIZE+5)];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2385 uint8_t halfV[SIZE*SIZE];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2386 uint8_t halfHV[SIZE*SIZE];\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2387 copy_block ## SIZE (full, src - stride*2 + 1, SIZE, stride, SIZE + 5);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2388 put_h264_qpel ## SIZE ## _v_lowpass(halfV, full_mid, SIZE, SIZE);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2389 put_h264_qpel ## SIZE ## _hv_lowpass(halfHV, tmp, src, SIZE, SIZE, stride);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2390 OPNAME ## pixels ## SIZE ## _l2(dst, halfV, halfHV, stride, SIZE, SIZE, SIZE);\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2391 }\
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2392
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2393 #define op_avg(a, b) a = (((a)+cm[((b) + 16)>>5]+1)>>1)
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2394 //#define op_avg2(a, b) a = (((a)*w1+cm[((b) + 16)>>5]*w2 + o + 64)>>7)
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2395 #define op_put(a, b) a = cm[((b) + 16)>>5]
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2396 #define op2_avg(a, b) a = (((a)+cm[((b) + 512)>>10]+1)>>1)
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2397 #define op2_put(a, b) a = cm[((b) + 512)>>10]
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2398
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2399 H264_LOWPASS(put_ , op_put, op2_put)
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2400 H264_LOWPASS(avg_ , op_avg, op2_avg)
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2401 H264_MC(put_, 4)
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2402 H264_MC(put_, 8)
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2403 H264_MC(put_, 16)
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2404 H264_MC(avg_, 4)
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2405 H264_MC(avg_, 8)
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2406 H264_MC(avg_, 16)
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2407
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2408 #undef op_avg
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2409 #undef op_put
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2410 #undef op2_avg
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2411 #undef op2_put
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2412 #endif
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
2413
2448
bfa9192a22ce use clip_uint8()
michael
parents: 2415
diff changeset
/*
 * H.264 weighted-prediction templates.
 *
 * op_scale1(x): explicit (single reference) weighting of block[x] in place.
 * op_scale2(x): bi-directional weighting, combining src[x] into dst[x].
 * Both rely on names of the function they are expanded in (block/dst/src,
 * weight/weights/weightd, offset, log2_denom) and on clip_uint8().
 *
 * H264_WEIGHT(W,H) emits two functions for a W x H pixel block:
 *
 *   weight_h264_pixels<W>x<H>_c(block, stride, log2_denom, weight, offset)
 *       block[x] = clip((block[x]*weight + offset') >> log2_denom)
 *       where offset' = offset * 2^log2_denom, plus the rounding term
 *       2^(log2_denom-1) when log2_denom is non-zero.
 *
 *   biweight_h264_pixels<W>x<H>_c(dst, src, stride, log2_denom,
 *                                 weightd, weights, offsetd, offsets)
 *       dst[x] = clip((src[x]*weights + dst[x]*weightd + offset')
 *                     >> (log2_denom+1))
 *       where offset' = (2*o + 1) * 2^log2_denom and
 *       o = (offsets + offsetd + 1) >> 1; the "+1" contributes 2^log2_denom,
 *       i.e. half of the 2^(log2_denom+1) divisor, as the rounding term.
 *
 * The offsets are scaled by multiplication rather than with "<<": they may
 * be negative, and left-shifting a negative signed value is undefined
 * behaviour in C. The remaining right shifts of possibly negative values are
 * implementation-defined and are kept as they were.
 *
 * Rows are processed fully unrolled; the "if(W==n) continue" tests compare
 * against the macro argument W and end the row after n pixels.
 */
#define op_scale1(x) \
    block[x] = clip_uint8( (block[x]*weight + offset) >> log2_denom )
#define op_scale2(x) \
    dst[x] = clip_uint8( (src[x]*weights + dst[x]*weightd + offset) >> (log2_denom+1))

#define H264_WEIGHT(W,H) \
static void weight_h264_pixels ## W ## x ## H ## _c(uint8_t *block, int stride, int log2_denom, int weight, int offset){ \
    int y; \
    /* multiply instead of shifting: offset may be negative */ \
    offset *= (1 << log2_denom); \
    if(log2_denom) offset += 1<<(log2_denom-1); \
    for(y=0; y<H; y++, block += stride){ \
        op_scale1(0); \
        op_scale1(1); \
        if(W==2) continue; \
        op_scale1(2); \
        op_scale1(3); \
        if(W==4) continue; \
        op_scale1(4); \
        op_scale1(5); \
        op_scale1(6); \
        op_scale1(7); \
        if(W==8) continue; \
        op_scale1(8); \
        op_scale1(9); \
        op_scale1(10); \
        op_scale1(11); \
        op_scale1(12); \
        op_scale1(13); \
        op_scale1(14); \
        op_scale1(15); \
    } \
} \
static void biweight_h264_pixels ## W ## x ## H ## _c(uint8_t *dst, uint8_t *src, int stride, int log2_denom, int weightd, int weights, int offsetd, int offsets){ \
    int y; \
    int offset = (offsets + offsetd + 1) >> 1; \
    /* multiply instead of shifting: offset may be negative */ \
    offset = (2*offset + 1) * (1 << log2_denom); \
    for(y=0; y<H; y++, dst += stride, src += stride){ \
        op_scale2(0); \
        op_scale2(1); \
        if(W==2) continue; \
        op_scale2(2); \
        op_scale2(3); \
        if(W==4) continue; \
        op_scale2(4); \
        op_scale2(5); \
        op_scale2(6); \
        op_scale2(7); \
        if(W==8) continue; \
        op_scale2(8); \
        op_scale2(9); \
        op_scale2(10); \
        op_scale2(11); \
        op_scale2(12); \
        op_scale2(13); \
        op_scale2(14); \
        op_scale2(15); \
    } \
}
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
2469
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
2470 H264_WEIGHT(16,16)
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
2471 H264_WEIGHT(16,8)
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
2472 H264_WEIGHT(8,16)
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
2473 H264_WEIGHT(8,8)
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
2474 H264_WEIGHT(8,4)
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
2475 H264_WEIGHT(4,8)
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
2476 H264_WEIGHT(4,4)
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
2477 H264_WEIGHT(4,2)
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
2478 H264_WEIGHT(2,4)
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
2479 H264_WEIGHT(2,2)
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
2480
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
2481 #undef op_scale1
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
2482 #undef op_scale2
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
2483 #undef H264_WEIGHT
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
2484
936
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2485 static void wmv2_mspel8_h_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride, int h){
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2486 uint8_t *cm = cropTbl + MAX_NEG_CROP;
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2487 int i;
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2488
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2489 for(i=0; i<h; i++){
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2490 dst[0]= cm[(9*(src[0] + src[1]) - (src[-1] + src[2]) + 8)>>4];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2491 dst[1]= cm[(9*(src[1] + src[2]) - (src[ 0] + src[3]) + 8)>>4];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2492 dst[2]= cm[(9*(src[2] + src[3]) - (src[ 1] + src[4]) + 8)>>4];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2493 dst[3]= cm[(9*(src[3] + src[4]) - (src[ 2] + src[5]) + 8)>>4];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2494 dst[4]= cm[(9*(src[4] + src[5]) - (src[ 3] + src[6]) + 8)>>4];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2495 dst[5]= cm[(9*(src[5] + src[6]) - (src[ 4] + src[7]) + 8)>>4];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2496 dst[6]= cm[(9*(src[6] + src[7]) - (src[ 5] + src[8]) + 8)>>4];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2497 dst[7]= cm[(9*(src[7] + src[8]) - (src[ 6] + src[9]) + 8)>>4];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2498 dst+=dstStride;
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
2499 src+=srcStride;
936
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2500 }
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2501 }
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2502
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2503 static void wmv2_mspel8_v_lowpass(uint8_t *dst, uint8_t *src, int dstStride, int srcStride, int w){
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2504 uint8_t *cm = cropTbl + MAX_NEG_CROP;
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2505 int i;
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2506
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2507 for(i=0; i<w; i++){
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2508 const int src_1= src[ -srcStride];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2509 const int src0 = src[0 ];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2510 const int src1 = src[ srcStride];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2511 const int src2 = src[2*srcStride];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2512 const int src3 = src[3*srcStride];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2513 const int src4 = src[4*srcStride];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2514 const int src5 = src[5*srcStride];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2515 const int src6 = src[6*srcStride];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2516 const int src7 = src[7*srcStride];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2517 const int src8 = src[8*srcStride];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2518 const int src9 = src[9*srcStride];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2519 dst[0*dstStride]= cm[(9*(src0 + src1) - (src_1 + src2) + 8)>>4];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2520 dst[1*dstStride]= cm[(9*(src1 + src2) - (src0 + src3) + 8)>>4];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2521 dst[2*dstStride]= cm[(9*(src2 + src3) - (src1 + src4) + 8)>>4];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2522 dst[3*dstStride]= cm[(9*(src3 + src4) - (src2 + src5) + 8)>>4];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2523 dst[4*dstStride]= cm[(9*(src4 + src5) - (src3 + src6) + 8)>>4];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2524 dst[5*dstStride]= cm[(9*(src5 + src6) - (src4 + src7) + 8)>>4];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2525 dst[6*dstStride]= cm[(9*(src6 + src7) - (src5 + src8) + 8)>>4];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2526 dst[7*dstStride]= cm[(9*(src7 + src8) - (src6 + src9) + 8)>>4];
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2527 src++;
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2528 dst++;
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2529 }
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2530 }
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2531
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
/**
 * mspel position (0,0): no filtering, the block is handed to put_pixels8_c
 * with a height of 8 rows and the same stride for source and destination.
 */
static void put_mspel8_mc00_c (uint8_t *dst, uint8_t *src, int stride){
    const int rows = 8;

    put_pixels8_c(dst, src, stride, rows);
}
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2535
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
/**
 * mspel position (1,0): the horizontally filtered block is combined with the
 * unshifted source by put_pixels8_l2 (presumably a rounded average of its two
 * inputs -- confirm against put_pixels8_l2).
 */
static void put_mspel8_mc10_c(uint8_t *dst, uint8_t *src, int stride){
    uint8_t hfilt[8 * 8]; /* 8 rows of 8 filtered pixels, row stride 8 */

    wmv2_mspel8_h_lowpass(hfilt, src, 8, stride, 8);
    put_pixels8_l2(dst, src, hfilt, stride, stride, 8, 8);
}
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2541
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
/**
 * mspel position (2,0): horizontal filter written straight to dst, 8 rows,
 * source and destination sharing the same stride.
 */
static void put_mspel8_mc20_c(uint8_t *dst, uint8_t *src, int stride){
    const int rows = 8;

    wmv2_mspel8_h_lowpass(dst, src, stride, stride, rows);
}
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2545
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
/**
 * mspel position (3,0): the horizontally filtered block is combined with the
 * source shifted one pixel to the right by put_pixels8_l2 (presumably a
 * rounded average of its two inputs -- confirm against put_pixels8_l2).
 */
static void put_mspel8_mc30_c(uint8_t *dst, uint8_t *src, int stride){
    uint8_t hfilt[8 * 8]; /* 8 rows of 8 filtered pixels, row stride 8 */

    wmv2_mspel8_h_lowpass(hfilt, src, 8, stride, 8);
    put_pixels8_l2(dst, src + 1, hfilt, stride, stride, 8, 8);
}
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2551
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
/**
 * mspel position (0,2): vertical filter written straight to dst, 8 columns,
 * source and destination sharing the same stride.
 */
static void put_mspel8_mc02_c(uint8_t *dst, uint8_t *src, int stride){
    const int cols = 8;

    wmv2_mspel8_v_lowpass(dst, src, stride, stride, cols);
}
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2555
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
/**
 * mspel position (1,2): combines the vertically filtered source with the
 * horizontally-then-vertically filtered source via put_pixels8_l2
 * (presumably a rounded average of its two inputs -- confirm against
 * put_pixels8_l2).
 *
 * The horizontal pass covers 11 rows starting one row above src, because the
 * vertical pass that follows reads one row above and two rows below the
 * 8 output rows; it therefore starts at the second row of that buffer.
 */
static void put_mspel8_mc12_c(uint8_t *dst, uint8_t *src, int stride){
    uint8_t hpass[8 * 11]; /* rows -1 .. 9, row stride 8 */
    uint8_t vpass[8 * 8];
    uint8_t hvpass[8 * 8];

    wmv2_mspel8_v_lowpass(vpass, src, 8, stride, 8);
    wmv2_mspel8_h_lowpass(hpass, src - stride, 8, stride, 11);
    wmv2_mspel8_v_lowpass(hvpass, hpass + 8, 8, 8, 8);
    put_pixels8_l2(dst, vpass, hvpass, stride, 8, 8, 8);
}
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
/**
 * mspel position (3,2): combines the vertically filtered source, taken one
 * pixel to the right, with the horizontally-then-vertically filtered source
 * via put_pixels8_l2 (presumably a rounded average of its two inputs --
 * confirm against put_pixels8_l2).
 *
 * The horizontal pass covers 11 rows starting one row above src, because the
 * vertical pass that follows reads one row above and two rows below the
 * 8 output rows; it therefore starts at the second row of that buffer.
 */
static void put_mspel8_mc32_c(uint8_t *dst, uint8_t *src, int stride){
    uint8_t hpass[8 * 11]; /* rows -1 .. 9, row stride 8 */
    uint8_t vpass[8 * 8];
    uint8_t hvpass[8 * 8];

    wmv2_mspel8_v_lowpass(vpass, src + 1, 8, stride, 8);
    wmv2_mspel8_h_lowpass(hpass, src - stride, 8, stride, 11);
    wmv2_mspel8_v_lowpass(hvpass, hpass + 8, 8, 8, 8);
    put_pixels8_l2(dst, vpass, hvpass, stride, 8, 8, 8);
}
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
/**
 * mspel position (2,2): horizontal filter into a temporary, then vertical
 * filter of that temporary straight into dst.
 *
 * The horizontal pass covers 11 rows starting one row above src, because the
 * vertical pass reads one row above and two rows below the 8 output rows; it
 * therefore starts at the second row of the temporary.
 */
static void put_mspel8_mc22_c(uint8_t *dst, uint8_t *src, int stride){
    uint8_t hpass[8 * 11]; /* rows -1 .. 9, row stride 8 */

    wmv2_mspel8_h_lowpass(hpass, src - stride, 8, stride, 11);
    wmv2_mspel8_v_lowpass(dst, hpass + 8, stride, 8, 8);
}
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2579
1644
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2580 static void h263_v_loop_filter_c(uint8_t *src, int stride, int qscale){
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2581 int x;
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2582 const int strength= ff_h263_loop_filter_strength[qscale];
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
2583
1644
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2584 for(x=0; x<8; x++){
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2585 int d1, d2, ad1;
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2586 int p0= src[x-2*stride];
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2587 int p1= src[x-1*stride];
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2588 int p2= src[x+0*stride];
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2589 int p3= src[x+1*stride];
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2590 int d = (p0 - p3 + 4*(p2 - p1)) / 8;
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2591
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2592 if (d<-2*strength) d1= 0;
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2593 else if(d<- strength) d1=-2*strength - d;
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2594 else if(d< strength) d1= d;
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2595 else if(d< 2*strength) d1= 2*strength - d;
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2596 else d1= 0;
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
2597
1644
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2598 p1 += d1;
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2599 p2 -= d1;
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2600 if(p1&256) p1= ~(p1>>31);
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2601 if(p2&256) p2= ~(p2>>31);
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
2602
1644
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2603 src[x-1*stride] = p1;
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2604 src[x+0*stride] = p2;
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2605
1645
michael
parents: 1644
diff changeset
2606 ad1= ABS(d1)>>1;
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
2607
1644
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2608 d2= clip((p0-p3)/4, -ad1, ad1);
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
2609
1644
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2610 src[x-2*stride] = p0 - d2;
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2611 src[x+ stride] = p3 + d2;
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2612 }
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2613 }
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2614
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2615 static void h263_h_loop_filter_c(uint8_t *src, int stride, int qscale){
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2616 int y;
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2617 const int strength= ff_h263_loop_filter_strength[qscale];
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
2618
1644
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2619 for(y=0; y<8; y++){
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2620 int d1, d2, ad1;
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2621 int p0= src[y*stride-2];
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2622 int p1= src[y*stride-1];
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2623 int p2= src[y*stride+0];
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2624 int p3= src[y*stride+1];
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2625 int d = (p0 - p3 + 4*(p2 - p1)) / 8;
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2626
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2627 if (d<-2*strength) d1= 0;
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2628 else if(d<- strength) d1=-2*strength - d;
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2629 else if(d< strength) d1= d;
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2630 else if(d< 2*strength) d1= 2*strength - d;
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2631 else d1= 0;
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
2632
1644
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2633 p1 += d1;
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2634 p2 -= d1;
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2635 if(p1&256) p1= ~(p1>>31);
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2636 if(p2&256) p2= ~(p2>>31);
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
2637
1644
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2638 src[y*stride-1] = p1;
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2639 src[y*stride+0] = p2;
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2640
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2641 ad1= ABS(d1)>>1;
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
2642
1644
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2643 d2= clip((p0-p3)/4, -ad1, ad1);
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
2644
1644
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2645 src[y*stride-2] = p0 - d2;
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2646 src[y*stride+1] = p3 + d2;
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2647 }
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
2648 }
936
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
2649
2045
9447bbd8a7e9 rewrite h261 loop filter
michael
parents: 2044
diff changeset
/**
 * H.261 loop filter on one 8x8 block, in place (C reference version).
 *
 * A separable (1,2,1) smoothing is applied: first vertically into an int
 * scratch array, then horizontally back into src. Samples on the block
 * border are not smoothed in the direction that would leave the block:
 * rows 0 and 7 skip the vertical pass (stored scaled by 4 instead) and
 * columns 0 and 7 skip the horizontal pass (rounded and divided by 4).
 *
 * @param src    top-left sample of the 8x8 block
 * @param stride distance in bytes between consecutive rows
 */
static void h261_loop_filter_c(uint8_t *src, int stride){
    int vert[8][8];
    int row, col;

    /* Top and bottom rows: no vertical neighbours inside the block, so use
     * the sample times 4 to match the gain of the (1,2,1) kernel. */
    for(col = 0; col < 8; col++){
        vert[0][col] = 4 * src[col];
        vert[7][col] = 4 * src[col + 7*stride];
    }

    /* Vertical (1,2,1) pass for the six interior rows. */
    for(row = 1; row < 7; row++){
        const uint8_t *cur = src + row*stride;

        for(col = 0; col < 8; col++)
            vert[row][col] = cur[col - stride] + 2*cur[col] + cur[col + stride];
    }

    /* Horizontal pass and write-back; from here on src is only written. */
    for(row = 0; row < 8; row++){
        uint8_t   *out = src + row*stride;
        const int *v   = vert[row];

        out[0] = (v[0] + 2) >> 2;
        out[7] = (v[7] + 2) >> 2;
        for(col = 1; col < 7; col++)
            out[col] = (v[col-1] + 2*v[col] + v[col+1] + 8) >> 4;
    }
}
b6f2add2511e h261 decoder by (Maarten Daniels <maarten.daniels at student dot luc dot ac dot be>)
michael
parents: 1984
diff changeset
2676
2707
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2677 static inline void h264_loop_filter_luma_c(uint8_t *pix, int xstride, int ystride, int alpha, int beta, int8_t *tc0)
2633
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2678 {
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2679 int i, d;
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2680 for( i = 0; i < 4; i++ ) {
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2681 if( tc0[i] < 0 ) {
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2682 pix += 4*ystride;
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2683 continue;
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2684 }
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2685 for( d = 0; d < 4; d++ ) {
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2686 const int p0 = pix[-1*xstride];
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2687 const int p1 = pix[-2*xstride];
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2688 const int p2 = pix[-3*xstride];
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2689 const int q0 = pix[0];
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2690 const int q1 = pix[1*xstride];
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2691 const int q2 = pix[2*xstride];
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
2692
2633
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2693 if( ABS( p0 - q0 ) < alpha &&
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2694 ABS( p1 - p0 ) < beta &&
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2695 ABS( q1 - q0 ) < beta ) {
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
2696
2633
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2697 int tc = tc0[i];
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2698 int i_delta;
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
2699
2633
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2700 if( ABS( p2 - p0 ) < beta ) {
2651
534f3b47afda minor optimization of the h264 loop filter
michael
parents: 2639
diff changeset
2701 pix[-2*xstride] = p1 + clip( (( p2 + ( ( p0 + q0 + 1 ) >> 1 ) ) >> 1) - p1, -tc0[i], tc0[i] );
2633
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2702 tc++;
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2703 }
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2704 if( ABS( q2 - q0 ) < beta ) {
2651
534f3b47afda minor optimization of the h264 loop filter
michael
parents: 2639
diff changeset
2705 pix[ xstride] = q1 + clip( (( q2 + ( ( p0 + q0 + 1 ) >> 1 ) ) >> 1) - q1, -tc0[i], tc0[i] );
2633
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2706 tc++;
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2707 }
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
2708
2633
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2709 i_delta = clip( (((q0 - p0 ) << 2) + (p1 - q1) + 4) >> 3, -tc, tc );
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2710 pix[-xstride] = clip_uint8( p0 + i_delta ); /* p0' */
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2711 pix[0] = clip_uint8( q0 - i_delta ); /* q0' */
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2712 }
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2713 pix += ystride;
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2714 }
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2715 }
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2716 }
2707
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2717 static void h264_v_loop_filter_luma_c(uint8_t *pix, int stride, int alpha, int beta, int8_t *tc0)
2633
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2718 {
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2719 h264_loop_filter_luma_c(pix, stride, 1, alpha, beta, tc0);
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2720 }
2707
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2721 static void h264_h_loop_filter_luma_c(uint8_t *pix, int stride, int alpha, int beta, int8_t *tc0)
2633
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2722 {
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2723 h264_loop_filter_luma_c(pix, 1, stride, alpha, beta, tc0);
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2724 }
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2725
2707
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2726 static inline void h264_loop_filter_chroma_c(uint8_t *pix, int xstride, int ystride, int alpha, int beta, int8_t *tc0)
2633
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2727 {
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2728 int i, d;
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2729 for( i = 0; i < 4; i++ ) {
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2730 const int tc = tc0[i];
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2731 if( tc <= 0 ) {
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2732 pix += 2*ystride;
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2733 continue;
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2734 }
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2735 for( d = 0; d < 2; d++ ) {
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2736 const int p0 = pix[-1*xstride];
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2737 const int p1 = pix[-2*xstride];
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2738 const int q0 = pix[0];
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2739 const int q1 = pix[1*xstride];
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2740
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2741 if( ABS( p0 - q0 ) < alpha &&
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2742 ABS( p1 - p0 ) < beta &&
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2743 ABS( q1 - q0 ) < beta ) {
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2744
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2745 int delta = clip( (((q0 - p0 ) << 2) + (p1 - q1) + 4) >> 3, -tc, tc );
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2746
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2747 pix[-xstride] = clip_uint8( p0 + delta ); /* p0' */
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2748 pix[0] = clip_uint8( q0 - delta ); /* q0' */
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2749 }
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2750 pix += ystride;
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2751 }
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2752 }
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2753 }
2707
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2754 static void h264_v_loop_filter_chroma_c(uint8_t *pix, int stride, int alpha, int beta, int8_t *tc0)
2633
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2755 {
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2756 h264_loop_filter_chroma_c(pix, stride, 1, alpha, beta, tc0);
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2757 }
2707
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2758 static void h264_h_loop_filter_chroma_c(uint8_t *pix, int stride, int alpha, int beta, int8_t *tc0)
2633
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2759 {
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2760 h264_loop_filter_chroma_c(pix, 1, stride, alpha, beta, tc0);
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2761 }
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
2762
2707
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2763 static inline void h264_loop_filter_chroma_intra_c(uint8_t *pix, int xstride, int ystride, int alpha, int beta)
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2764 {
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2765 int d;
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2766 for( d = 0; d < 8; d++ ) {
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2767 const int p0 = pix[-1*xstride];
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2768 const int p1 = pix[-2*xstride];
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2769 const int q0 = pix[0];
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2770 const int q1 = pix[1*xstride];
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2771
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2772 if( ABS( p0 - q0 ) < alpha &&
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2773 ABS( p1 - p0 ) < beta &&
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2774 ABS( q1 - q0 ) < beta ) {
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2775
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2776 pix[-xstride] = ( 2*p1 + p0 + q1 + 2 ) >> 2; /* p0' */
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2777 pix[0] = ( 2*q1 + q0 + p1 + 2 ) >> 2; /* q0' */
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2778 }
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2779 pix += ystride;
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2780 }
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2781 }
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2782 static void h264_v_loop_filter_chroma_intra_c(uint8_t *pix, int stride, int alpha, int beta)
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2783 {
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2784 h264_loop_filter_chroma_intra_c(pix, stride, 1, alpha, beta);
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2785 }
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2786 static void h264_h_loop_filter_chroma_intra_c(uint8_t *pix, int stride, int alpha, int beta)
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2787 {
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2788 h264_loop_filter_chroma_intra_c(pix, 1, stride, alpha, beta);
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2789 }
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
2790
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
/**
 * Sum of absolute differences between two blocks that are 16 samples wide
 * and h rows high.
 *
 * @param v         unused
 * @param pix1      top-left sample of the first block
 * @param pix2      top-left sample of the second block
 * @param line_size distance in bytes between consecutive rows (both blocks)
 * @param h         number of rows to compare
 * @return the accumulated sum of |pix1 - pix2| over all 16*h samples
 */
static inline int pix_abs16_c(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
{
    int sad = 0;
    int row, col;

    for(row = 0; row < h; row++) {
        for(col = 0; col < 16; col++)
            sad += abs(pix1[col] - pix2[col]);
        pix1 += line_size;
        pix2 += line_size;
    }
    return sad;
}
986e461dc072 Initial revision
glantau
parents:
diff changeset
2818
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
/**
 * Sum of absolute differences between a 16-wide block and a reference block
 * in which each sample is combined with its right-hand neighbour via avg2().
 * NOTE(review): avg2() is defined elsewhere in this file; presumably a
 * rounded two-sample average - confirm.
 *
 * Row n of the reference reads samples 0..16 of pix2, i.e. one more column
 * than the block width.
 *
 * @param v         unused
 * @param pix1      top-left sample of the block being compared
 * @param pix2      top-left sample of the reference block
 * @param line_size distance in bytes between consecutive rows (both blocks)
 * @param h         number of rows to compare
 * @return the accumulated sum over all 16*h samples
 */
static int pix_abs16_x2_c(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
{
    int sad = 0;
    int row, col;

    for(row = 0; row < h; row++) {
        for(col = 0; col < 16; col++)
            sad += abs(pix1[col] - avg2(pix2[col], pix2[col + 1]));
        pix1 += line_size;
        pix2 += line_size;
    }
    return sad;
}
986e461dc072 Initial revision
glantau
parents:
diff changeset
2846
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
/**
 * Sum of absolute differences between a 16-wide block and a reference block
 * in which each sample is combined with the sample directly below it via
 * avg2().
 * NOTE(review): avg2() is defined elsewhere in this file; presumably a
 * rounded two-sample average - confirm.
 *
 * The reference therefore reads h+1 rows of pix2.
 *
 * @param v         unused
 * @param pix1      top-left sample of the block being compared
 * @param pix2      top-left sample of the reference block
 * @param line_size distance in bytes between consecutive rows (both blocks)
 * @param h         number of rows to compare
 * @return the accumulated sum over all 16*h samples
 */
static int pix_abs16_y2_c(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
{
    int sad = 0;
    int row, col;

    for(row = 0; row < h; row++) {
        const uint8_t *below = pix2 + line_size;

        for(col = 0; col < 16; col++)
            sad += abs(pix1[col] - avg2(pix2[col], below[col]));
        pix1 += line_size;
        pix2 += line_size;
    }
    return sad;
}
986e461dc072 Initial revision
glantau
parents:
diff changeset
2876
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
/**
 * Accumulates, over h rows of 16 columns, the absolute difference between
 * pix1[x] and avg4() of the four pix2 samples at columns x and x+1 on the
 * current row and on the row line_size bytes further on.
 *
 * @param v         unused
 * @param pix1      first block
 * @param pix2      second block; columns 0..16 are read on each row, and the
 *                  row following the last accumulated one is read as well
 * @param line_size distance in bytes between the starts of consecutive rows
 * @param h         number of rows to accumulate
 * @return the accumulated sum (0 when h <= 0)
 */
static int pix_abs16_xy2_c(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
{
    uint8_t *below = pix2 + line_size;
    int total = 0;
    int row, col;

    for (row = 0; row < h; row++) {
        for (col = 0; col < 16; col++)
            total += abs(pix1[col] - avg4(pix2[col], pix2[col + 1], below[col], below[col + 1]));

        pix1  += line_size;
        pix2  += line_size;
        below += line_size;
    }
    return total;
}
986e461dc072 Initial revision
glantau
parents:
diff changeset
2906
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
/**
 * Sum of absolute differences between two blocks that are 8 columns wide
 * and h rows high.
 *
 * @param v         unused
 * @param pix1      first block
 * @param pix2      second block
 * @param line_size distance in bytes between the starts of consecutive rows
 * @param h         number of rows to accumulate
 * @return the accumulated sum (0 when h <= 0)
 */
static inline int pix_abs8_c(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
{
    int total = 0;
    int row, col;

    for (row = 0; row < h; row++) {
        for (col = 0; col < 8; col++)
            total += abs(pix1[col] - pix2[col]);

        pix1 += line_size;
        pix2 += line_size;
    }
    return total;
}
944632089814 4MV motion estimation (not finished yet)
michaelni
parents: 256
diff changeset
2926
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
/**
 * Accumulates, over h rows of 8 columns, the absolute difference between
 * pix1[x] and avg2() of the two horizontally adjacent pix2 samples at
 * columns x and x+1.
 *
 * @param v         unused
 * @param pix1      first block
 * @param pix2      second block; columns 0..8 are read on each row
 * @param line_size distance in bytes between the starts of consecutive rows
 * @param h         number of rows to accumulate
 * @return the accumulated sum (0 when h <= 0)
 */
static int pix_abs8_x2_c(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
{
    int total = 0;
    int row, col;

    for (row = 0; row < h; row++) {
        for (col = 0; col < 8; col++)
            total += abs(pix1[col] - avg2(pix2[col], pix2[col + 1]));

        pix1 += line_size;
        pix2 += line_size;
    }
    return total;
}
944632089814 4MV motion estimation (not finished yet)
michaelni
parents: 256
diff changeset
2946
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
/**
 * Accumulates, over h rows of 8 columns, the absolute difference between
 * pix1[x] and avg2() of the pix2 sample at column x and the sample at the
 * same column one row (line_size bytes) further on.
 *
 * @param v         unused
 * @param pix1      first block
 * @param pix2      second block; the row following the last accumulated one
 *                  is read as well
 * @param line_size distance in bytes between the starts of consecutive rows
 * @param h         number of rows to accumulate
 * @return the accumulated sum (0 when h <= 0)
 */
static int pix_abs8_y2_c(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
{
    uint8_t *below = pix2 + line_size;
    int total = 0;
    int row, col;

    for (row = 0; row < h; row++) {
        for (col = 0; col < 8; col++)
            total += abs(pix1[col] - avg2(pix2[col], below[col]));

        pix1  += line_size;
        pix2  += line_size;
        below += line_size;
    }
    return total;
}
944632089814 4MV motion estimation (not finished yet)
michaelni
parents: 256
diff changeset
2968
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
/**
 * Accumulates, over h rows of 8 columns, the absolute difference between
 * pix1[x] and avg4() of the four pix2 samples at columns x and x+1 on the
 * current row and on the row line_size bytes further on.
 *
 * @param v         unused
 * @param pix1      first block
 * @param pix2      second block; columns 0..8 are read on each row, and the
 *                  row following the last accumulated one is read as well
 * @param line_size distance in bytes between the starts of consecutive rows
 * @param h         number of rows to accumulate
 * @return the accumulated sum (0 when h <= 0)
 */
static int pix_abs8_xy2_c(void *v, uint8_t *pix1, uint8_t *pix2, int line_size, int h)
{
    uint8_t *below = pix2 + line_size;
    int total = 0;
    int row, col;

    for (row = 0; row < h; row++) {
        for (col = 0; col < 8; col++)
            total += abs(pix1[col] - avg4(pix2[col], pix2[col + 1], below[col], below[col + 1]));

        pix1  += line_size;
        pix2  += line_size;
        below += line_size;
    }
    return total;
}
944632089814 4MV motion estimation (not finished yet)
michaelni
parents: 256
diff changeset
2990
2834
fd5d7c732c6b kill a bunch of compiler warnings
mru
parents: 2763
diff changeset
2991 static int nsse16_c(void *v, uint8_t *s1, uint8_t *s2, int stride, int h){
fd5d7c732c6b kill a bunch of compiler warnings
mru
parents: 2763
diff changeset
2992 MpegEncContext *c = v;
2065
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
2993 int score1=0;
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
2994 int score2=0;
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
2995 int x,y;
2066
4bfb146e701b nsse weight
michael
parents: 2065
diff changeset
2996
2065
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
2997 for(y=0; y<h; y++){
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
2998 for(x=0; x<16; x++){
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
2999 score1+= (s1[x ] - s2[x ])*(s1[x ] - s2[x ]);
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3000 }
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3001 if(y+1<h){
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3002 for(x=0; x<15; x++){
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3003 score2+= ABS( s1[x ] - s1[x +stride]
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3004 - s1[x+1] + s1[x+1+stride])
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3005 -ABS( s2[x ] - s2[x +stride]
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3006 - s2[x+1] + s2[x+1+stride]);
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3007 }
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3008 }
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3009 s1+= stride;
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3010 s2+= stride;
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3011 }
2066
4bfb146e701b nsse weight
michael
parents: 2065
diff changeset
3012
4bfb146e701b nsse weight
michael
parents: 2065
diff changeset
3013 if(c) return score1 + ABS(score2)*c->avctx->nsse_weight;
4bfb146e701b nsse weight
michael
parents: 2065
diff changeset
3014 else return score1 + ABS(score2)*8;
2065
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3015 }
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3016
2834
fd5d7c732c6b kill a bunch of compiler warnings
mru
parents: 2763
diff changeset
3017 static int nsse8_c(void *v, uint8_t *s1, uint8_t *s2, int stride, int h){
fd5d7c732c6b kill a bunch of compiler warnings
mru
parents: 2763
diff changeset
3018 MpegEncContext *c = v;
2065
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3019 int score1=0;
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3020 int score2=0;
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3021 int x,y;
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3022
2065
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3023 for(y=0; y<h; y++){
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3024 for(x=0; x<8; x++){
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3025 score1+= (s1[x ] - s2[x ])*(s1[x ] - s2[x ]);
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3026 }
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3027 if(y+1<h){
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3028 for(x=0; x<7; x++){
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3029 score2+= ABS( s1[x ] - s1[x +stride]
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3030 - s1[x+1] + s1[x+1+stride])
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3031 -ABS( s2[x ] - s2[x +stride]
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3032 - s2[x+1] + s2[x+1+stride]);
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3033 }
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3034 }
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3035 s1+= stride;
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3036 s2+= stride;
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3037 }
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3038
2066
4bfb146e701b nsse weight
michael
parents: 2065
diff changeset
3039 if(c) return score1 + ABS(score2)*c->avctx->nsse_weight;
4bfb146e701b nsse weight
michael
parents: 2065
diff changeset
3040 else return score1 + ABS(score2)*8;
2065
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3041 }
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3042
1784
65f7bd09f37b quantizer noise shaping optimization
michael
parents: 1739
diff changeset
3043 static int try_8x8basis_c(int16_t rem[64], int16_t weight[64], int16_t basis[64], int scale){
65f7bd09f37b quantizer noise shaping optimization
michael
parents: 1739
diff changeset
3044 int i;
65f7bd09f37b quantizer noise shaping optimization
michael
parents: 1739
diff changeset
3045 unsigned int sum=0;
65f7bd09f37b quantizer noise shaping optimization
michael
parents: 1739
diff changeset
3046
65f7bd09f37b quantizer noise shaping optimization
michael
parents: 1739
diff changeset
3047 for(i=0; i<8*8; i++){
65f7bd09f37b quantizer noise shaping optimization
michael
parents: 1739
diff changeset
3048 int b= rem[i] + ((basis[i]*scale + (1<<(BASIS_SHIFT - RECON_SHIFT-1)))>>(BASIS_SHIFT - RECON_SHIFT));
65f7bd09f37b quantizer noise shaping optimization
michael
parents: 1739
diff changeset
3049 int w= weight[i];
65f7bd09f37b quantizer noise shaping optimization
michael
parents: 1739
diff changeset
3050 b>>= RECON_SHIFT;
65f7bd09f37b quantizer noise shaping optimization
michael
parents: 1739
diff changeset
3051 assert(-512<b && b<512);
65f7bd09f37b quantizer noise shaping optimization
michael
parents: 1739
diff changeset
3052
65f7bd09f37b quantizer noise shaping optimization
michael
parents: 1739
diff changeset
3053 sum += (w*b)*(w*b)>>4;
65f7bd09f37b quantizer noise shaping optimization
michael
parents: 1739
diff changeset
3054 }
65f7bd09f37b quantizer noise shaping optimization
michael
parents: 1739
diff changeset
3055 return sum>>2;
65f7bd09f37b quantizer noise shaping optimization
michael
parents: 1739
diff changeset
3056 }
65f7bd09f37b quantizer noise shaping optimization
michael
parents: 1739
diff changeset
3057
65f7bd09f37b quantizer noise shaping optimization
michael
parents: 1739
diff changeset
3058 static void add_8x8basis_c(int16_t rem[64], int16_t basis[64], int scale){
65f7bd09f37b quantizer noise shaping optimization
michael
parents: 1739
diff changeset
3059 int i;
65f7bd09f37b quantizer noise shaping optimization
michael
parents: 1739
diff changeset
3060
65f7bd09f37b quantizer noise shaping optimization
michael
parents: 1739
diff changeset
3061 for(i=0; i<8*8; i++){
65f7bd09f37b quantizer noise shaping optimization
michael
parents: 1739
diff changeset
3062 rem[i] += (basis[i]*scale + (1<<(BASIS_SHIFT - RECON_SHIFT-1)))>>(BASIS_SHIFT - RECON_SHIFT);
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3063 }
1784
65f7bd09f37b quantizer noise shaping optimization
michael
parents: 1739
diff changeset
3064 }
65f7bd09f37b quantizer noise shaping optimization
michael
parents: 1739
diff changeset
3065
1100
207f27932628 ff_block_permute() dox
michaelni
parents: 1092
diff changeset
3066 /**
207f27932628 ff_block_permute() dox
michaelni
parents: 1092
diff changeset
3067 * permutes an 8x8 block.
1101
a3a8017dee70 more idiot proof dox
michaelni
parents: 1100
diff changeset
3068 * @param block the block which will be permuted according to the given permutation vector
1100
207f27932628 ff_block_permute() dox
michaelni
parents: 1092
diff changeset
3069 * @param permutation the permutation vector
207f27932628 ff_block_permute() dox
michaelni
parents: 1092
diff changeset
3070 * @param last the last non zero coefficient in scantable order, used to speed the permutation up
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3071 * @param scantable the used scantable, this is only used to speed the permutation up, the block is not
1101
a3a8017dee70 more idiot proof dox
michaelni
parents: 1100
diff changeset
3072 * (inverse) permutated to scantable order!
1100
207f27932628 ff_block_permute() dox
michaelni
parents: 1092
diff changeset
3073 */
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
3074 void ff_block_permute(DCTELEM *block, uint8_t *permutation, const uint8_t *scantable, int last)
174
ac5075a55488 new IDCT code by Michael Niedermayer (michaelni@gmx.at) - #define SIMPLE_IDCT to enable
arpi_esp
parents: 88
diff changeset
3075 {
764
d4726182dfd2 optimize block_permute()
michaelni
parents: 753
diff changeset
3076 int i;
945
463f7260b155 trellis quantization
michaelni
parents: 936
diff changeset
3077 DCTELEM temp[64];
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3078
764
d4726182dfd2 optimize block_permute()
michaelni
parents: 753
diff changeset
3079 if(last<=0) return;
882
34943cb0c2fb * remaining part of John Ryland's patch
kabi
parents: 866
diff changeset
3080 //if(permutation[1]==1) return; //FIXME its ok but not clean and might fail for some perms
174
ac5075a55488 new IDCT code by Michael Niedermayer (michaelni@gmx.at) - #define SIMPLE_IDCT to enable
arpi_esp
parents: 88
diff changeset
3081
764
d4726182dfd2 optimize block_permute()
michaelni
parents: 753
diff changeset
3082 for(i=0; i<=last; i++){
d4726182dfd2 optimize block_permute()
michaelni
parents: 753
diff changeset
3083 const int j= scantable[i];
d4726182dfd2 optimize block_permute()
michaelni
parents: 753
diff changeset
3084 temp[j]= block[j];
d4726182dfd2 optimize block_permute()
michaelni
parents: 753
diff changeset
3085 block[j]=0;
d4726182dfd2 optimize block_permute()
michaelni
parents: 753
diff changeset
3086 }
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3087
764
d4726182dfd2 optimize block_permute()
michaelni
parents: 753
diff changeset
3088 for(i=0; i<=last; i++){
d4726182dfd2 optimize block_permute()
michaelni
parents: 753
diff changeset
3089 const int j= scantable[i];
d4726182dfd2 optimize block_permute()
michaelni
parents: 753
diff changeset
3090 const int perm_j= permutation[j];
d4726182dfd2 optimize block_permute()
michaelni
parents: 753
diff changeset
3091 block[perm_j]= temp[j];
d4726182dfd2 optimize block_permute()
michaelni
parents: 753
diff changeset
3092 }
174
ac5075a55488 new IDCT code by Michael Niedermayer (michaelni@gmx.at) - #define SIMPLE_IDCT to enable
arpi_esp
parents: 88
diff changeset
3093 }
34
2733a4c1c693 added block permutation functions
glantau
parents: 19
diff changeset
3094
1729
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
/**
 * Comparison function that ignores all of its arguments.
 *
 * @return always 0
 */
static int zero_cmp(void *s, uint8_t *a, uint8_t *b, int stride, int h){
    (void)s;
    (void)a;
    (void)b;
    (void)stride;
    (void)h;

    return 0;
}
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3098
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3099 void ff_set_cmp(DSPContext* c, me_cmp_func *cmp, int type){
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3100 int i;
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3101
1729
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3102 memset(cmp, 0, sizeof(void*)*5);
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3103
1729
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3104 for(i=0; i<5; i++){
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3105 switch(type&0xFF){
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3106 case FF_CMP_SAD:
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3107 cmp[i]= c->sad[i];
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3108 break;
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3109 case FF_CMP_SATD:
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3110 cmp[i]= c->hadamard8_diff[i];
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3111 break;
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3112 case FF_CMP_SSE:
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3113 cmp[i]= c->sse[i];
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3114 break;
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3115 case FF_CMP_DCT:
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3116 cmp[i]= c->dct_sad[i];
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3117 break;
3010
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3118 case FF_CMP_DCT264:
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3119 cmp[i]= c->dct264_sad[i];
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3120 break;
2382
23e7af611c34 more flexible frame skip decission
michael
parents: 2272
diff changeset
3121 case FF_CMP_DCTMAX:
23e7af611c34 more flexible frame skip decission
michael
parents: 2272
diff changeset
3122 cmp[i]= c->dct_max[i];
23e7af611c34 more flexible frame skip decission
michael
parents: 2272
diff changeset
3123 break;
1729
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3124 case FF_CMP_PSNR:
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3125 cmp[i]= c->quant_psnr[i];
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3126 break;
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3127 case FF_CMP_BIT:
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3128 cmp[i]= c->bit[i];
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3129 break;
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3130 case FF_CMP_RD:
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3131 cmp[i]= c->rd[i];
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3132 break;
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3133 case FF_CMP_VSAD:
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3134 cmp[i]= c->vsad[i];
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3135 break;
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3136 case FF_CMP_VSSE:
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3137 cmp[i]= c->vsse[i];
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3138 break;
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3139 case FF_CMP_ZERO:
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3140 cmp[i]= zero_cmp;
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3141 break;
2065
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3142 case FF_CMP_NSSE:
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3143 cmp[i]= c->nsse[i];
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3144 break;
2184
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
3145 case FF_CMP_W53:
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
3146 cmp[i]= c->w53[i];
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
3147 break;
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
3148 case FF_CMP_W97:
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
3149 cmp[i]= c->w97[i];
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
3150 break;
1729
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3151 default:
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3152 av_log(NULL, AV_LOG_ERROR,"internal error in cmp function selection\n");
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3153 }
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3154 }
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3155 }
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3156
1101
a3a8017dee70 more idiot proof dox
michaelni
parents: 1100
diff changeset
3157 /**
a3a8017dee70 more idiot proof dox
michaelni
parents: 1100
diff changeset
3158 * memset(blocks, 0, sizeof(DCTELEM)*6*64)
a3a8017dee70 more idiot proof dox
michaelni
parents: 1100
diff changeset
3159 */
853
eacc2dd8fd9d * using DSPContext - so each codec could use its local (sub)set of CPU extension
kabi
parents: 764
diff changeset
3160 static void clear_blocks_c(DCTELEM *blocks)
296
c1a8a1b4a24b sizeof(s->block) isnt 64*6*2 anymore bugfix
michaelni
parents: 294
diff changeset
3161 {
c1a8a1b4a24b sizeof(s->block) isnt 64*6*2 anymore bugfix
michaelni
parents: 294
diff changeset
3162 memset(blocks, 0, sizeof(DCTELEM)*6*64);
c1a8a1b4a24b sizeof(s->block) isnt 64*6*2 anymore bugfix
michaelni
parents: 294
diff changeset
3163 }
c1a8a1b4a24b sizeof(s->block) isnt 64*6*2 anymore bugfix
michaelni
parents: 294
diff changeset
3164
866
725ef4ea3ecc huffyuv
michaelni
parents: 861
diff changeset
/**
 * Add src to dst byte by byte (results wrap modulo 256).
 * @param dst accumulator, updated in place
 * @param src bytes to add
 * @param w   number of bytes to process; nothing is done for w <= 0
 */
static void add_bytes_c(uint8_t *dst, uint8_t *src, int w){
    int pos= 0;

    /* bulk part: groups of eight bytes */
    while(pos+7 < w){
        int k;
        for(k=0; k<8; k++)
            dst[pos+k] += src[pos+k];
        pos += 8;
    }

    /* remaining 0..7 bytes */
    while(pos < w){
        dst[pos] += src[pos];
        pos++;
    }
}
725ef4ea3ecc huffyuv
michaelni
parents: 861
diff changeset
3180
725ef4ea3ecc huffyuv
michaelni
parents: 861
diff changeset
/**
 * Store the byte-wise difference src1 - src2 in dst (results wrap modulo 256).
 * @param dst  destination
 * @param src1 minuend bytes
 * @param src2 subtrahend bytes
 * @param w    number of bytes to process; nothing is done for w <= 0
 */
static void diff_bytes_c(uint8_t *dst, uint8_t *src1, uint8_t *src2, int w){
    int pos= 0;

    /* bulk part: groups of eight bytes */
    while(pos+7 < w){
        int k;
        for(k=0; k<8; k++)
            dst[pos+k] = src1[pos+k]-src2[pos+k];
        pos += 8;
    }

    /* remaining 0..7 bytes */
    for(; pos<w; pos++)
        dst[pos] = src1[pos]-src2[pos];
}
725ef4ea3ecc huffyuv
michaelni
parents: 861
diff changeset
3196
1527
8ffd0c00e6df mmx2 optimization of huffyuv median encoding
michael
parents: 1329
diff changeset
/**
 * Write the residual of a median predictor to dst.
 * For every position the prediction is mid_pred() of the running left value,
 * src1[i], and (left + src1[i] - left_top) masked to 8 bits; dst[i] receives
 * src2[i] minus that prediction.
 * @param dst      residual output
 * @param src1     bytes used as the second predictor input
 *                 (presumably the line above -- confirm against callers)
 * @param src2     bytes being predicted
 * @param w        number of bytes to process
 * @param left     in: initial left value, out: last src2 byte processed
 * @param left_top in: initial top-left value, out: last src1 byte processed
 */
static void sub_hfyu_median_prediction_c(uint8_t *dst, uint8_t *src1, uint8_t *src2, int w, int *left, int *left_top){
    /* the running state is deliberately kept in 8 bits, like the samples */
    uint8_t run_left    = *left;
    uint8_t run_left_top= *left_top;
    int x;

    for(x=0; x<w; x++){
        const int grad= (run_left + src1[x] - run_left_top)&0xFF;
        const int pred= mid_pred(run_left, src1[x], grad);

        run_left_top= src1[x];
        run_left    = src2[x];
        dst[x]      = run_left - pred;
    }

    *left    = run_left;
    *left_top= run_left_top;
}
8ffd0c00e6df mmx2 optimization of huffyuv median encoding
michael
parents: 1329
diff changeset
3214
936
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
/**
 * Butterfly with separate outputs: o1 = i1+i2, o2 = i1-i2.
 * o1 is stored before o2 is computed and i1/i2 are evaluated twice, so the
 * inputs must be side-effect free and must not alias o1.
 * Expands to a single statement; terminate the invocation with ';'.
 */
#define BUTTERFLY2(o1,o2,i1,i2) \
do{\
    (o1)= (i1)+(i2);\
    (o2)= (i1)-(i2);\
}while(0)

/**
 * In-place butterfly: x becomes x+y and y becomes x-y (using the old values).
 * The temporaries use names that cannot collide with caller variables.
 * Expands to a single statement; terminate the invocation with ';'.
 */
#define BUTTERFLY1(x,y) \
do{\
    const int bfly1_a_= (x);\
    const int bfly1_b_= (y);\
    (x)= bfly1_a_+bfly1_b_;\
    (y)= bfly1_a_-bfly1_b_;\
}while(0)

/** Final butterfly stage folded into the sum: |x+y| + |x-y|. */
#define BUTTERFLYA(x,y) (ABS((x)+(y)) + ABS((x)-(y)))
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3229
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
/**
 * Sum of absolute values of the 8x8 butterfly (Hadamard-style) transform of
 * the difference src - dst.
 * @param s      unused
 * @param dst    first block, rows are stride bytes apart
 * @param src    second block, rows are stride bytes apart
 * @param stride distance in bytes between two rows
 * @param h      must be 8 (asserted)
 * @return the summed absolute transform coefficients
 */
static int hadamard8_diff8x8_c(/*MpegEncContext*/ void *s, uint8_t *dst, uint8_t *src, int stride, int h){
    int coef[64];
    int total= 0;
    int n;

    assert(h==8);

    /* horizontal pass: difference plus all three butterfly stages per row */
    for(n=0; n<8; n++){
        const uint8_t * const srow= src + stride*n;
        const uint8_t * const drow= dst + stride*n;
        int * const row= coef + 8*n;

        BUTTERFLY2(row[0], row[1], srow[0]-drow[0], srow[1]-drow[1]);
        BUTTERFLY2(row[2], row[3], srow[2]-drow[2], srow[3]-drow[3]);
        BUTTERFLY2(row[4], row[5], srow[4]-drow[4], srow[5]-drow[5]);
        BUTTERFLY2(row[6], row[7], srow[6]-drow[6], srow[7]-drow[7]);

        BUTTERFLY1(row[0], row[2]);
        BUTTERFLY1(row[1], row[3]);
        BUTTERFLY1(row[4], row[6]);
        BUTTERFLY1(row[5], row[7]);

        BUTTERFLY1(row[0], row[4]);
        BUTTERFLY1(row[1], row[5]);
        BUTTERFLY1(row[2], row[6]);
        BUTTERFLY1(row[3], row[7]);
    }

    /* vertical pass: two stages in place, the third is folded into the sum */
    for(n=0; n<8; n++){
        int * const col= coef + n;

        BUTTERFLY1(col[8*0], col[8*1]);
        BUTTERFLY1(col[8*2], col[8*3]);
        BUTTERFLY1(col[8*4], col[8*5]);
        BUTTERFLY1(col[8*6], col[8*7]);

        BUTTERFLY1(col[8*0], col[8*2]);
        BUTTERFLY1(col[8*1], col[8*3]);
        BUTTERFLY1(col[8*4], col[8*6]);
        BUTTERFLY1(col[8*5], col[8*7]);

        total +=
             BUTTERFLYA(col[8*0], col[8*4])
            +BUTTERFLYA(col[8*1], col[8*5])
            +BUTTERFLYA(col[8*2], col[8*6])
            +BUTTERFLYA(col[8*3], col[8*7]);
    }

    return total;
}
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3281
1729
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
/**
 * Sum of absolute values of the 8x8 butterfly (Hadamard-style) transform of
 * src itself, with the all-sum coefficient left out.
 * @param s      unused
 * @param src    block to measure, rows are stride bytes apart
 * @param dummy  unused
 * @param stride distance in bytes between two rows
 * @param h      must be 8 (asserted)
 * @return the summed absolute transform coefficients minus the sum term
 */
static int hadamard8_intra8x8_c(/*MpegEncContext*/ void *s, uint8_t *src, uint8_t *dummy, int stride, int h){
    int coef[64];
    int total= 0;
    int n;

    assert(h==8);

    /* horizontal pass: all three butterfly stages per row */
    for(n=0; n<8; n++){
        const uint8_t * const srow= src + stride*n;
        int * const row= coef + 8*n;

        BUTTERFLY2(row[0], row[1], srow[0],srow[1]);
        BUTTERFLY2(row[2], row[3], srow[2],srow[3]);
        BUTTERFLY2(row[4], row[5], srow[4],srow[5]);
        BUTTERFLY2(row[6], row[7], srow[6],srow[7]);

        BUTTERFLY1(row[0], row[2]);
        BUTTERFLY1(row[1], row[3]);
        BUTTERFLY1(row[4], row[6]);
        BUTTERFLY1(row[5], row[7]);

        BUTTERFLY1(row[0], row[4]);
        BUTTERFLY1(row[1], row[5]);
        BUTTERFLY1(row[2], row[6]);
        BUTTERFLY1(row[3], row[7]);
    }

    /* vertical pass: two stages in place, the third is folded into the sum */
    for(n=0; n<8; n++){
        int * const col= coef + n;

        BUTTERFLY1(col[8*0], col[8*1]);
        BUTTERFLY1(col[8*2], col[8*3]);
        BUTTERFLY1(col[8*4], col[8*5]);
        BUTTERFLY1(col[8*6], col[8*7]);

        BUTTERFLY1(col[8*0], col[8*2]);
        BUTTERFLY1(col[8*1], col[8*3]);
        BUTTERFLY1(col[8*4], col[8*6]);
        BUTTERFLY1(col[8*5], col[8*7]);

        total +=
             BUTTERFLYA(col[8*0], col[8*4])
            +BUTTERFLYA(col[8*1], col[8*5])
            +BUTTERFLYA(col[8*2], col[8*6])
            +BUTTERFLYA(col[8*3], col[8*7]);
    }

    /* take the |coef[0]+coef[32]| term added for column 0 back out (-mean) */
    total -= ABS(coef[8*0] + coef[8*4]);

    return total;
}
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3329
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3330 static int dct_sad8x8_c(/*MpegEncContext*/ void *c, uint8_t *src1, uint8_t *src2, int stride, int h){
936
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3331 MpegEncContext * const s= (MpegEncContext *)c;
1016
michaelni
parents: 1013
diff changeset
3332 uint64_t __align8 aligned_temp[sizeof(DCTELEM)*64/8];
michaelni
parents: 1013
diff changeset
3333 DCTELEM * const temp= (DCTELEM*)aligned_temp;
936
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3334 int sum=0, i;
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3335
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3336 assert(h==8);
936
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3337
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3338 s->dsp.diff_pixels(temp, src1, src2, stride);
1092
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3339 s->dsp.fdct(temp);
936
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3340
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3341 for(i=0; i<64; i++)
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3342 sum+= ABS(temp[i]);
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3343
936
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3344 return sum;
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3345 }
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3346
3010
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3347 #ifdef CONFIG_GPL
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3348 #define DCT8_1D {\
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3349 const int s07 = SRC(0) + SRC(7);\
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3350 const int s16 = SRC(1) + SRC(6);\
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3351 const int s25 = SRC(2) + SRC(5);\
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3352 const int s34 = SRC(3) + SRC(4);\
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3353 const int a0 = s07 + s34;\
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3354 const int a1 = s16 + s25;\
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3355 const int a2 = s07 - s34;\
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3356 const int a3 = s16 - s25;\
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3357 const int d07 = SRC(0) - SRC(7);\
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3358 const int d16 = SRC(1) - SRC(6);\
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3359 const int d25 = SRC(2) - SRC(5);\
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3360 const int d34 = SRC(3) - SRC(4);\
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3361 const int a4 = d16 + d25 + (d07 + (d07>>1));\
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3362 const int a5 = d07 - d34 - (d25 + (d25>>1));\
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3363 const int a6 = d07 + d34 - (d16 + (d16>>1));\
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3364 const int a7 = d16 - d25 + (d34 + (d34>>1));\
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3365 DST(0, a0 + a1 ) ;\
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3366 DST(1, a4 + (a7>>2)) ;\
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3367 DST(2, a2 + (a3>>1)) ;\
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3368 DST(3, a5 + (a6>>2)) ;\
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3369 DST(4, a0 - a1 ) ;\
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3370 DST(5, a6 - (a5>>2)) ;\
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3371 DST(6, (a2>>1) - a3 ) ;\
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3372 DST(7, (a4>>2) - a7 ) ;\
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3373 }
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3374
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3375 static int dct264_sad8x8_c(/*MpegEncContext*/ void *c, uint8_t *src1, uint8_t *src2, int stride, int h){
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3376 MpegEncContext * const s= (MpegEncContext *)c;
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3377 int16_t dct[8][8];
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3378 int i;
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3379 int sum=0;
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3380
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3381 s->dsp.diff_pixels(dct, src1, src2, stride);
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3382
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3383 #define SRC(x) dct[i][x]
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3384 #define DST(x,v) dct[i][x]= v
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3385 for( i = 0; i < 8; i++ )
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3386 DCT8_1D
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3387 #undef SRC
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3388 #undef DST
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3389
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3390 #define SRC(x) dct[x][i]
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3391 #define DST(x,v) sum += ABS(v)
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3392 for( i = 0; i < 8; i++ )
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3393 DCT8_1D
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3394 #undef SRC
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3395 #undef DST
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3396 return sum;
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3397 }
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3398 #endif
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3399
2382
23e7af611c34 more flexible frame skip decission
michael
parents: 2272
diff changeset
3400 static int dct_max8x8_c(/*MpegEncContext*/ void *c, uint8_t *src1, uint8_t *src2, int stride, int h){
23e7af611c34 more flexible frame skip decission
michael
parents: 2272
diff changeset
3401 MpegEncContext * const s= (MpegEncContext *)c;
23e7af611c34 more flexible frame skip decission
michael
parents: 2272
diff changeset
3402 uint64_t __align8 aligned_temp[sizeof(DCTELEM)*64/8];
23e7af611c34 more flexible frame skip decission
michael
parents: 2272
diff changeset
3403 DCTELEM * const temp= (DCTELEM*)aligned_temp;
23e7af611c34 more flexible frame skip decission
michael
parents: 2272
diff changeset
3404 int sum=0, i;
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3405
2382
23e7af611c34 more flexible frame skip decission
michael
parents: 2272
diff changeset
3406 assert(h==8);
23e7af611c34 more flexible frame skip decission
michael
parents: 2272
diff changeset
3407
23e7af611c34 more flexible frame skip decission
michael
parents: 2272
diff changeset
3408 s->dsp.diff_pixels(temp, src1, src2, stride);
23e7af611c34 more flexible frame skip decission
michael
parents: 2272
diff changeset
3409 s->dsp.fdct(temp);
23e7af611c34 more flexible frame skip decission
michael
parents: 2272
diff changeset
3410
23e7af611c34 more flexible frame skip decission
michael
parents: 2272
diff changeset
3411 for(i=0; i<64; i++)
23e7af611c34 more flexible frame skip decission
michael
parents: 2272
diff changeset
3412 sum= FFMAX(sum, ABS(temp[i]));
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3413
2382
23e7af611c34 more flexible frame skip decission
michael
parents: 2272
diff changeset
3414 return sum;
23e7af611c34 more flexible frame skip decission
michael
parents: 2272
diff changeset
3415 }
23e7af611c34 more flexible frame skip decission
michael
parents: 2272
diff changeset
3416
1008
fb6cbb8a04a3 fixing DCTELEM != short
michaelni
parents: 1007
diff changeset
3417 void simple_idct(DCTELEM *block); //FIXME
936
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3418
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3419 static int quant_psnr8x8_c(/*MpegEncContext*/ void *c, uint8_t *src1, uint8_t *src2, int stride, int h){
936
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3420 MpegEncContext * const s= (MpegEncContext *)c;
1016
michaelni
parents: 1013
diff changeset
3421 uint64_t __align8 aligned_temp[sizeof(DCTELEM)*64*2/8];
michaelni
parents: 1013
diff changeset
3422 DCTELEM * const temp= (DCTELEM*)aligned_temp;
michaelni
parents: 1013
diff changeset
3423 DCTELEM * const bak = ((DCTELEM*)aligned_temp)+64;
936
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3424 int sum=0, i;
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3425
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3426 assert(h==8);
936
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3427 s->mb_intra=0;
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3428
936
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3429 s->dsp.diff_pixels(temp, src1, src2, stride);
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3430
936
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3431 memcpy(bak, temp, 64*sizeof(DCTELEM));
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3432
1013
5d4c95f323d0 finetuneing thresholds/factors
michaelni
parents: 1012
diff changeset
3433 s->block_last_index[0/*FIXME*/]= s->fast_dct_quantize(s, temp, 0/*FIXME*/, s->qscale, &i);
1689
1a2db2073848 split intra / inter dequantization
michael
parents: 1645
diff changeset
3434 s->dct_unquantize_inter(s, temp, 0, s->qscale);
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3435 simple_idct(temp); //FIXME
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3436
936
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3437 for(i=0; i<64; i++)
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3438 sum+= (temp[i]-bak[i])*(temp[i]-bak[i]);
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3439
936
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3440 return sum;
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3441 }
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3442
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3443 static int rd8x8_c(/*MpegEncContext*/ void *c, uint8_t *src1, uint8_t *src2, int stride, int h){
1007
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3444 MpegEncContext * const s= (MpegEncContext *)c;
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
3445 const uint8_t *scantable= s->intra_scantable.permutated;
1016
michaelni
parents: 1013
diff changeset
3446 uint64_t __align8 aligned_temp[sizeof(DCTELEM)*64/8];
michaelni
parents: 1013
diff changeset
3447 uint64_t __align8 aligned_bak[stride];
michaelni
parents: 1013
diff changeset
3448 DCTELEM * const temp= (DCTELEM*)aligned_temp;
michaelni
parents: 1013
diff changeset
3449 uint8_t * const bak= (uint8_t*)aligned_bak;
1007
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3450 int i, last, run, bits, level, distoration, start_i;
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3451 const int esc_length= s->ac_esc_length;
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3452 uint8_t * length;
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3453 uint8_t * last_length;
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3454
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3455 assert(h==8);
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3456
1007
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3457 for(i=0; i<8; i++){
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3458 ((uint32_t*)(bak + i*stride))[0]= ((uint32_t*)(src2 + i*stride))[0];
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3459 ((uint32_t*)(bak + i*stride))[1]= ((uint32_t*)(src2 + i*stride))[1];
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3460 }
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3461
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3462 s->dsp.diff_pixels(temp, src1, src2, stride);
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3463
1013
5d4c95f323d0 finetuneing thresholds/factors
michaelni
parents: 1012
diff changeset
3464 s->block_last_index[0/*FIXME*/]= last= s->fast_dct_quantize(s, temp, 0/*FIXME*/, s->qscale, &i);
5d4c95f323d0 finetuneing thresholds/factors
michaelni
parents: 1012
diff changeset
3465
5d4c95f323d0 finetuneing thresholds/factors
michaelni
parents: 1012
diff changeset
3466 bits=0;
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3467
1013
5d4c95f323d0 finetuneing thresholds/factors
michaelni
parents: 1012
diff changeset
3468 if (s->mb_intra) {
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3469 start_i = 1;
1013
5d4c95f323d0 finetuneing thresholds/factors
michaelni
parents: 1012
diff changeset
3470 length = s->intra_ac_vlc_length;
5d4c95f323d0 finetuneing thresholds/factors
michaelni
parents: 1012
diff changeset
3471 last_length= s->intra_ac_vlc_last_length;
5d4c95f323d0 finetuneing thresholds/factors
michaelni
parents: 1012
diff changeset
3472 bits+= s->luma_dc_vlc_length[temp[0] + 256]; //FIXME chroma
5d4c95f323d0 finetuneing thresholds/factors
michaelni
parents: 1012
diff changeset
3473 } else {
5d4c95f323d0 finetuneing thresholds/factors
michaelni
parents: 1012
diff changeset
3474 start_i = 0;
5d4c95f323d0 finetuneing thresholds/factors
michaelni
parents: 1012
diff changeset
3475 length = s->inter_ac_vlc_length;
5d4c95f323d0 finetuneing thresholds/factors
michaelni
parents: 1012
diff changeset
3476 last_length= s->inter_ac_vlc_last_length;
5d4c95f323d0 finetuneing thresholds/factors
michaelni
parents: 1012
diff changeset
3477 }
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3478
1013
5d4c95f323d0 finetuneing thresholds/factors
michaelni
parents: 1012
diff changeset
3479 if(last>=start_i){
1007
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3480 run=0;
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3481 for(i=start_i; i<last; i++){
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3482 int j= scantable[i];
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3483 level= temp[j];
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3484
1007
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3485 if(level){
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3486 level+=64;
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3487 if((level&(~127)) == 0){
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3488 bits+= length[UNI_AC_ENC_INDEX(run, level)];
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3489 }else
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3490 bits+= esc_length;
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3491 run=0;
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3492 }else
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3493 run++;
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3494 }
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3495 i= scantable[last];
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3496
1011
michaelni
parents: 1008
diff changeset
3497 level= temp[i] + 64;
michaelni
parents: 1008
diff changeset
3498
michaelni
parents: 1008
diff changeset
3499 assert(level - 64);
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3500
1007
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3501 if((level&(~127)) == 0){
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3502 bits+= last_length[UNI_AC_ENC_INDEX(run, level)];
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3503 }else
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3504 bits+= esc_length;
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3505
1013
5d4c95f323d0 finetuneing thresholds/factors
michaelni
parents: 1012
diff changeset
3506 }
5d4c95f323d0 finetuneing thresholds/factors
michaelni
parents: 1012
diff changeset
3507
5d4c95f323d0 finetuneing thresholds/factors
michaelni
parents: 1012
diff changeset
3508 if(last>=0){
1689
1a2db2073848 split intra / inter dequantization
michael
parents: 1645
diff changeset
3509 if(s->mb_intra)
1a2db2073848 split intra / inter dequantization
michael
parents: 1645
diff changeset
3510 s->dct_unquantize_intra(s, temp, 0, s->qscale);
1a2db2073848 split intra / inter dequantization
michael
parents: 1645
diff changeset
3511 else
1a2db2073848 split intra / inter dequantization
michael
parents: 1645
diff changeset
3512 s->dct_unquantize_inter(s, temp, 0, s->qscale);
1007
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3513 }
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3514
1092
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3515 s->dsp.idct_add(bak, stride, temp);
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3516
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3517 distoration= s->dsp.sse[1](NULL, bak, src1, stride, 8);
1007
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3518
1013
5d4c95f323d0 finetuneing thresholds/factors
michaelni
parents: 1012
diff changeset
3519 return distoration + ((bits*s->qscale*s->qscale*109 + 64)>>7);
1007
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3520 }
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3521
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3522 static int bit8x8_c(/*MpegEncContext*/ void *c, uint8_t *src1, uint8_t *src2, int stride, int h){
1007
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3523 MpegEncContext * const s= (MpegEncContext *)c;
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1016
diff changeset
3524 const uint8_t *scantable= s->intra_scantable.permutated;
1016
michaelni
parents: 1013
diff changeset
3525 uint64_t __align8 aligned_temp[sizeof(DCTELEM)*64/8];
michaelni
parents: 1013
diff changeset
3526 DCTELEM * const temp= (DCTELEM*)aligned_temp;
1007
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3527 int i, last, run, bits, level, start_i;
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3528 const int esc_length= s->ac_esc_length;
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3529 uint8_t * length;
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3530 uint8_t * last_length;
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3531
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3532 assert(h==8);
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3533
1013
5d4c95f323d0 finetuneing thresholds/factors
michaelni
parents: 1012
diff changeset
3534 s->dsp.diff_pixels(temp, src1, src2, stride);
1007
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3535
1013
5d4c95f323d0 finetuneing thresholds/factors
michaelni
parents: 1012
diff changeset
3536 s->block_last_index[0/*FIXME*/]= last= s->fast_dct_quantize(s, temp, 0/*FIXME*/, s->qscale, &i);
5d4c95f323d0 finetuneing thresholds/factors
michaelni
parents: 1012
diff changeset
3537
5d4c95f323d0 finetuneing thresholds/factors
michaelni
parents: 1012
diff changeset
3538 bits=0;
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3539
1007
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3540 if (s->mb_intra) {
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3541 start_i = 1;
1007
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3542 length = s->intra_ac_vlc_length;
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3543 last_length= s->intra_ac_vlc_last_length;
1013
5d4c95f323d0 finetuneing thresholds/factors
michaelni
parents: 1012
diff changeset
3544 bits+= s->luma_dc_vlc_length[temp[0] + 256]; //FIXME chroma
1007
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3545 } else {
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3546 start_i = 0;
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3547 length = s->inter_ac_vlc_length;
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3548 last_length= s->inter_ac_vlc_last_length;
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3549 }
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3550
1013
5d4c95f323d0 finetuneing thresholds/factors
michaelni
parents: 1012
diff changeset
3551 if(last>=start_i){
1007
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3552 run=0;
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3553 for(i=start_i; i<last; i++){
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3554 int j= scantable[i];
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3555 level= temp[j];
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3556
1007
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3557 if(level){
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3558 level+=64;
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3559 if((level&(~127)) == 0){
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3560 bits+= length[UNI_AC_ENC_INDEX(run, level)];
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3561 }else
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3562 bits+= esc_length;
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3563 run=0;
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3564 }else
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3565 run++;
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3566 }
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3567 i= scantable[last];
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3568
1013
5d4c95f323d0 finetuneing thresholds/factors
michaelni
parents: 1012
diff changeset
3569 level= temp[i] + 64;
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3570
1013
5d4c95f323d0 finetuneing thresholds/factors
michaelni
parents: 1012
diff changeset
3571 assert(level - 64);
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3572
1007
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3573 if((level&(~127)) == 0){
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3574 bits+= last_length[UNI_AC_ENC_INDEX(run, level)];
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3575 }else
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3576 bits+= esc_length;
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3577 }
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3578
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3579 return bits;
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3580 }
b2cf2a1d9a51 more compare functions (rd & bit)
michaelni
parents: 997
diff changeset
3581
1729
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
/**
 * Vertical sum of absolute differences inside a single 16-pixel-wide block.
 *
 * For each of the h-1 pairs of vertically adjacent lines, adds up the
 * absolute difference of the 16 pixel pairs.
 *
 * @param c      unused
 * @param s      top-left pixel of the block
 * @param dummy  unused
 * @param stride distance in bytes between consecutive lines
 * @param h      number of lines in the block
 * @return accumulated absolute differences (0 when h <= 1)
 */
static int vsad_intra16_c(/*MpegEncContext*/ void *c, uint8_t *s, uint8_t *dummy, int stride, int h){
    int total= 0;
    int row, col;

    for(row= 1; row < h; row++, s+= stride){
        const uint8_t * const below= s + stride;

        for(col= 0; col < 16; col++)
            total+= ABS(s[col] - below[col]);
    }

    return total;
}
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3596
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
/**
 * Vertical sum of absolute differences of the residual s1 - s2, 16 wide.
 *
 * For every pair of vertically adjacent lines, the per-pixel residual of the
 * upper line minus the residual of the lower line is taken in absolute value
 * and accumulated.
 *
 * @param c      unused
 * @param s1     top-left pixel of the first block
 * @param s2     top-left pixel of the second block
 * @param stride distance in bytes between consecutive lines (both blocks)
 * @param h      number of lines in the blocks
 * @return accumulated absolute differences (0 when h <= 1)
 */
static int vsad16_c(/*MpegEncContext*/ void *c, uint8_t *s1, uint8_t *s2, int stride, int h){
    int total= 0;
    int row, col;

    for(row= 1; row < h; row++){
        const uint8_t * const next1= s1 + stride;
        const uint8_t * const next2= s2 + stride;

        for(col= 0; col < 16; col++){
            const int upper= s1[col]    - s2[col];
            const int lower= next1[col] - next2[col];

            total+= ABS(upper - lower);
        }
        s1= (uint8_t*)next1;
        s2= (uint8_t*)next2;
    }

    return total;
}
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3611
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
#define SQ(a) ((a)*(a))

/**
 * Vertical sum of squared differences inside a single 16-pixel-wide block.
 *
 * For each of the h-1 pairs of vertically adjacent lines, adds up the
 * squared difference of the 16 pixel pairs.
 *
 * @param c      unused
 * @param s      top-left pixel of the block
 * @param dummy  unused
 * @param stride distance in bytes between consecutive lines
 * @param h      number of lines in the block
 * @return accumulated squared differences (0 when h <= 1)
 */
static int vsse_intra16_c(/*MpegEncContext*/ void *c, uint8_t *s, uint8_t *dummy, int stride, int h){
    int total= 0;
    int row, col;

    for(row= 1; row < h; row++, s+= stride){
        const uint8_t * const below= s + stride;

        for(col= 0; col < 16; col++){
            const int delta= s[col] - below[col];

            total+= SQ(delta);
        }
    }

    return total;
}
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3627
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
/**
 * Vertical sum of squared differences of the residual s1 - s2, 16 wide.
 *
 * For every pair of vertically adjacent lines, the per-pixel residual of the
 * upper line minus the residual of the lower line is squared and accumulated.
 *
 * @param c      unused
 * @param s1     top-left pixel of the first block
 * @param s2     top-left pixel of the second block
 * @param stride distance in bytes between consecutive lines (both blocks)
 * @param h      number of lines in the blocks
 * @return accumulated squared differences (0 when h <= 1)
 */
static int vsse16_c(/*MpegEncContext*/ void *c, uint8_t *s1, uint8_t *s2, int stride, int h){
    int total= 0;
    int row, col;

    for(row= 1; row < h; row++){
        const uint8_t * const next1= s1 + stride;
        const uint8_t * const next2= s2 + stride;

        for(col= 0; col < 16; col++){
            const int upper= s1[col]    - s2[col];
            const int lower= next1[col] - next2[col];
            const int delta= upper - lower;

            total+= SQ(delta);
        }
        s1= (uint8_t*)next1;
        s2= (uint8_t*)next2;
    }

    return total;
}
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3642
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3643 WARPER8_16_SQ(hadamard8_diff8x8_c, hadamard8_diff16_c)
1729
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3644 WARPER8_16_SQ(hadamard8_intra8x8_c, hadamard8_intra16_c)
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3645 WARPER8_16_SQ(dct_sad8x8_c, dct_sad16_c)
3010
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3646 WARPER8_16_SQ(dct264_sad8x8_c, dct264_sad16_c)
2382
23e7af611c34 more flexible frame skip decission
michael
parents: 2272
diff changeset
3647 WARPER8_16_SQ(dct_max8x8_c, dct_max16_c)
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3648 WARPER8_16_SQ(quant_psnr8x8_c, quant_psnr16_c)
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3649 WARPER8_16_SQ(rd8x8_c, rd16_c)
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3650 WARPER8_16_SQ(bit8x8_c, bit16_c)
936
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3651
1092
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3652 /* XXX: those functions should be suppressed ASAP when all IDCTs are
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3653 converted */
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3654 static void ff_jref_idct_put(uint8_t *dest, int line_size, DCTELEM *block)
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3655 {
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3656 j_rev_dct (block);
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3657 put_pixels_clamped_c(block, dest, line_size);
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3658 }
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3659 static void ff_jref_idct_add(uint8_t *dest, int line_size, DCTELEM *block)
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3660 {
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3661 j_rev_dct (block);
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3662 add_pixels_clamped_c(block, dest, line_size);
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3663 }
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3664
2256
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
3665 static void ff_jref_idct4_put(uint8_t *dest, int line_size, DCTELEM *block)
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
3666 {
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
3667 j_rev_dct4 (block);
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
3668 put_pixels_clamped4_c(block, dest, line_size);
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
3669 }
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
3670 static void ff_jref_idct4_add(uint8_t *dest, int line_size, DCTELEM *block)
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
3671 {
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
3672 j_rev_dct4 (block);
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
3673 add_pixels_clamped4_c(block, dest, line_size);
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
3674 }
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
3675
2257
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
3676 static void ff_jref_idct2_put(uint8_t *dest, int line_size, DCTELEM *block)
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
3677 {
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
3678 j_rev_dct2 (block);
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
3679 put_pixels_clamped2_c(block, dest, line_size);
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
3680 }
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
3681 static void ff_jref_idct2_add(uint8_t *dest, int line_size, DCTELEM *block)
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
3682 {
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
3683 j_rev_dct2 (block);
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
3684 add_pixels_clamped2_c(block, dest, line_size);
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
3685 }
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
3686
2259
12e75af1d44c 1/8 resolution decoding
michael
parents: 2257
diff changeset
3687 static void ff_jref_idct1_put(uint8_t *dest, int line_size, DCTELEM *block)
12e75af1d44c 1/8 resolution decoding
michael
parents: 2257
diff changeset
3688 {
12e75af1d44c 1/8 resolution decoding
michael
parents: 2257
diff changeset
3689 uint8_t *cm = cropTbl + MAX_NEG_CROP;
12e75af1d44c 1/8 resolution decoding
michael
parents: 2257
diff changeset
3690
12e75af1d44c 1/8 resolution decoding
michael
parents: 2257
diff changeset
3691 dest[0] = cm[(block[0] + 4)>>3];
12e75af1d44c 1/8 resolution decoding
michael
parents: 2257
diff changeset
3692 }
12e75af1d44c 1/8 resolution decoding
michael
parents: 2257
diff changeset
3693 static void ff_jref_idct1_add(uint8_t *dest, int line_size, DCTELEM *block)
12e75af1d44c 1/8 resolution decoding
michael
parents: 2257
diff changeset
3694 {
12e75af1d44c 1/8 resolution decoding
michael
parents: 2257
diff changeset
3695 uint8_t *cm = cropTbl + MAX_NEG_CROP;
12e75af1d44c 1/8 resolution decoding
michael
parents: 2257
diff changeset
3696
12e75af1d44c 1/8 resolution decoding
michael
parents: 2257
diff changeset
3697 dest[0] = cm[dest[0] + ((block[0] + 4)>>3)];
12e75af1d44c 1/8 resolution decoding
michael
parents: 2257
diff changeset
3698 }
12e75af1d44c 1/8 resolution decoding
michael
parents: 2257
diff changeset
3699
1201
e0fc95a6eb4e fixed static init
bellard
parents: 1168
diff changeset
3700 /* init static data */
e0fc95a6eb4e fixed static init
bellard
parents: 1168
diff changeset
3701 void dsputil_static_init(void)
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
3702 {
751
cbe316f082bc warning fixes
michaelni
parents: 706
diff changeset
3703 int i;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
3704
1201
e0fc95a6eb4e fixed static init
bellard
parents: 1168
diff changeset
3705 for(i=0;i<256;i++) cropTbl[i + MAX_NEG_CROP] = i;
e0fc95a6eb4e fixed static init
bellard
parents: 1168
diff changeset
3706 for(i=0;i<MAX_NEG_CROP;i++) {
e0fc95a6eb4e fixed static init
bellard
parents: 1168
diff changeset
3707 cropTbl[i] = 0;
e0fc95a6eb4e fixed static init
bellard
parents: 1168
diff changeset
3708 cropTbl[i + MAX_NEG_CROP + 256] = 255;
e0fc95a6eb4e fixed static init
bellard
parents: 1168
diff changeset
3709 }
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3710
1201
e0fc95a6eb4e fixed static init
bellard
parents: 1168
diff changeset
3711 for(i=0;i<512;i++) {
e0fc95a6eb4e fixed static init
bellard
parents: 1168
diff changeset
3712 squareTbl[i] = (i - 256) * (i - 256);
e0fc95a6eb4e fixed static init
bellard
parents: 1168
diff changeset
3713 }
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3714
1201
e0fc95a6eb4e fixed static init
bellard
parents: 1168
diff changeset
3715 for(i=0; i<64; i++) inv_zigzag_direct16[ff_zigzag_direct[i]]= i+1;
e0fc95a6eb4e fixed static init
bellard
parents: 1168
diff changeset
3716 }
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
3717
861
243cc33da3eb * init for inv_zigzag_direct16 moved to init block
kabi
parents: 860
diff changeset
3718
1201
e0fc95a6eb4e fixed static init
bellard
parents: 1168
diff changeset
3719 void dsputil_init(DSPContext* c, AVCodecContext *avctx)
e0fc95a6eb4e fixed static init
bellard
parents: 1168
diff changeset
3720 {
e0fc95a6eb4e fixed static init
bellard
parents: 1168
diff changeset
3721 int i;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
3722
1092
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3723 #ifdef CONFIG_ENCODERS
1567
e08df4d22d27 * introducing dct248 into the DSP context.
romansh
parents: 1557
diff changeset
3724 if(avctx->dct_algo==FF_DCT_FASTINT) {
1092
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3725 c->fdct = fdct_ifast;
2979
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
3726 c->fdct248 = fdct_ifast248;
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3727 }
1567
e08df4d22d27 * introducing dct248 into the DSP context.
romansh
parents: 1557
diff changeset
3728 else if(avctx->dct_algo==FF_DCT_FAAN) {
1557
5d53c03186a1 floating point AAN DCT
michael
parents: 1527
diff changeset
3729 c->fdct = ff_faandct;
2979
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
3730 c->fdct248 = ff_faandct248;
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3731 }
1567
e08df4d22d27 * introducing dct248 into the DSP context.
romansh
parents: 1557
diff changeset
3732 else {
1092
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3733 c->fdct = ff_jpeg_fdct_islow; //slow/accurate/default
2979
bfabfdf9ce55 COSMETICS: tabs --> spaces, some prettyprinting
diego
parents: 2967
diff changeset
3734 c->fdct248 = ff_fdct248_islow;
1567
e08df4d22d27 * introducing dct248 into the DSP context.
romansh
parents: 1557
diff changeset
3735 }
1092
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3736 #endif //CONFIG_ENCODERS
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3737
2256
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
3738 if(avctx->lowres==1){
2272
cd43603c46f9 move h264 idct to its own file and call via function pointer in DspContext
michael
parents: 2259
diff changeset
3739 if(avctx->idct_algo==FF_IDCT_INT || avctx->idct_algo==FF_IDCT_AUTO){
cd43603c46f9 move h264 idct to its own file and call via function pointer in DspContext
michael
parents: 2259
diff changeset
3740 c->idct_put= ff_jref_idct4_put;
cd43603c46f9 move h264 idct to its own file and call via function pointer in DspContext
michael
parents: 2259
diff changeset
3741 c->idct_add= ff_jref_idct4_add;
cd43603c46f9 move h264 idct to its own file and call via function pointer in DspContext
michael
parents: 2259
diff changeset
3742 }else{
cd43603c46f9 move h264 idct to its own file and call via function pointer in DspContext
michael
parents: 2259
diff changeset
3743 c->idct_put= ff_h264_lowres_idct_put_c;
cd43603c46f9 move h264 idct to its own file and call via function pointer in DspContext
michael
parents: 2259
diff changeset
3744 c->idct_add= ff_h264_lowres_idct_add_c;
cd43603c46f9 move h264 idct to its own file and call via function pointer in DspContext
michael
parents: 2259
diff changeset
3745 }
2256
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
3746 c->idct = j_rev_dct4;
1092
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3747 c->idct_permutation_type= FF_NO_IDCT_PERM;
2257
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
3748 }else if(avctx->lowres==2){
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
3749 c->idct_put= ff_jref_idct2_put;
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
3750 c->idct_add= ff_jref_idct2_add;
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
3751 c->idct = j_rev_dct2;
5f64a30339e5 1/4 resolution decoding
michael
parents: 2256
diff changeset
3752 c->idct_permutation_type= FF_NO_IDCT_PERM;
2259
12e75af1d44c 1/8 resolution decoding
michael
parents: 2257
diff changeset
3753 }else if(avctx->lowres==3){
12e75af1d44c 1/8 resolution decoding
michael
parents: 2257
diff changeset
3754 c->idct_put= ff_jref_idct1_put;
12e75af1d44c 1/8 resolution decoding
michael
parents: 2257
diff changeset
3755 c->idct_add= ff_jref_idct1_add;
12e75af1d44c 1/8 resolution decoding
michael
parents: 2257
diff changeset
3756 c->idct = j_rev_dct1;
12e75af1d44c 1/8 resolution decoding
michael
parents: 2257
diff changeset
3757 c->idct_permutation_type= FF_NO_IDCT_PERM;
2256
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
3758 }else{
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
3759 if(avctx->idct_algo==FF_IDCT_INT){
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
3760 c->idct_put= ff_jref_idct_put;
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
3761 c->idct_add= ff_jref_idct_add;
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
3762 c->idct = j_rev_dct;
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
3763 c->idct_permutation_type= FF_LIBMPEG2_IDCT_PERM;
2693
02925a3903b6 porting vp3 idct over to lavc idct api
michael
parents: 2651
diff changeset
3764 }else if(avctx->idct_algo==FF_IDCT_VP3){
02925a3903b6 porting vp3 idct over to lavc idct api
michael
parents: 2651
diff changeset
3765 c->idct_put= ff_vp3_idct_put_c;
02925a3903b6 porting vp3 idct over to lavc idct api
michael
parents: 2651
diff changeset
3766 c->idct_add= ff_vp3_idct_add_c;
02925a3903b6 porting vp3 idct over to lavc idct api
michael
parents: 2651
diff changeset
3767 c->idct = ff_vp3_idct_c;
02925a3903b6 porting vp3 idct over to lavc idct api
michael
parents: 2651
diff changeset
3768 c->idct_permutation_type= FF_NO_IDCT_PERM;
2256
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
3769 }else{ //accurate/default
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
3770 c->idct_put= simple_idct_put;
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
3771 c->idct_add= simple_idct_add;
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
3772 c->idct = simple_idct;
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
3773 c->idct_permutation_type= FF_NO_IDCT_PERM;
7e0b2e86afa9 1/2 resolution decoding
michael
parents: 2208
diff changeset
3774 }
1092
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3775 }
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3776
2272
cd43603c46f9 move h264 idct to its own file and call via function pointer in DspContext
michael
parents: 2259
diff changeset
3777 c->h264_idct_add= ff_h264_idct_add_c;
2755
975074f04b95 decode H.264 with 8x8 transform.
lorenm
parents: 2707
diff changeset
3778 c->h264_idct8_add= ff_h264_idct8_add_c;
2272
cd43603c46f9 move h264 idct to its own file and call via function pointer in DspContext
michael
parents: 2259
diff changeset
3779
853
eacc2dd8fd9d * using DSPContext - so each codec could use its local (sub)set of CPU extension
kabi
parents: 764
diff changeset
3780 c->get_pixels = get_pixels_c;
eacc2dd8fd9d * using DSPContext - so each codec could use its local (sub)set of CPU extension
kabi
parents: 764
diff changeset
3781 c->diff_pixels = diff_pixels_c;
eacc2dd8fd9d * using DSPContext - so each codec could use its local (sub)set of CPU extension
kabi
parents: 764
diff changeset
3782 c->put_pixels_clamped = put_pixels_clamped_c;
1984
ef919e9ef73e separate out put_signed_pixels_clamped() into its own function and
melanson
parents: 1977
diff changeset
3783 c->put_signed_pixels_clamped = put_signed_pixels_clamped_c;
853
eacc2dd8fd9d * using DSPContext - so each codec could use its local (sub)set of CPU extension
kabi
parents: 764
diff changeset
3784 c->add_pixels_clamped = add_pixels_clamped_c;
2763
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
3785 c->add_pixels8 = add_pixels8_c;
01ed2c3b8f08 H.264 lossless mode
lorenm
parents: 2755
diff changeset
3786 c->add_pixels4 = add_pixels4_c;
853
eacc2dd8fd9d * using DSPContext - so each codec could use its local (sub)set of CPU extension
kabi
parents: 764
diff changeset
3787 c->gmc1 = gmc1_c;
eacc2dd8fd9d * using DSPContext - so each codec could use its local (sub)set of CPU extension
kabi
parents: 764
diff changeset
3788 c->gmc = gmc_c;
eacc2dd8fd9d * using DSPContext - so each codec could use its local (sub)set of CPU extension
kabi
parents: 764
diff changeset
3789 c->clear_blocks = clear_blocks_c;
eacc2dd8fd9d * using DSPContext - so each codec could use its local (sub)set of CPU extension
kabi
parents: 764
diff changeset
3790 c->pix_sum = pix_sum_c;
eacc2dd8fd9d * using DSPContext - so each codec could use its local (sub)set of CPU extension
kabi
parents: 764
diff changeset
3791 c->pix_norm1 = pix_norm1_c;
eacc2dd8fd9d * using DSPContext - so each codec could use its local (sub)set of CPU extension
kabi
parents: 764
diff changeset
3792
859
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3793 /* TODO [0] 16 [1] 8 */
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3794 c->pix_abs[0][0] = pix_abs16_c;
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3795 c->pix_abs[0][1] = pix_abs16_x2_c;
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3796 c->pix_abs[0][2] = pix_abs16_y2_c;
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3797 c->pix_abs[0][3] = pix_abs16_xy2_c;
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3798 c->pix_abs[1][0] = pix_abs8_c;
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3799 c->pix_abs[1][1] = pix_abs8_x2_c;
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3800 c->pix_abs[1][2] = pix_abs8_y2_c;
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3801 c->pix_abs[1][3] = pix_abs8_xy2_c;
853
eacc2dd8fd9d * using DSPContext - so each codec could use its local (sub)set of CPU extension
kabi
parents: 764
diff changeset
3802
859
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3803 #define dspfunc(PFX, IDX, NUM) \
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3804 c->PFX ## _pixels_tab[IDX][0] = PFX ## _pixels ## NUM ## _c; \
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3805 c->PFX ## _pixels_tab[IDX][1] = PFX ## _pixels ## NUM ## _x2_c; \
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3806 c->PFX ## _pixels_tab[IDX][2] = PFX ## _pixels ## NUM ## _y2_c; \
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3807 c->PFX ## _pixels_tab[IDX][3] = PFX ## _pixels ## NUM ## _xy2_c
853
eacc2dd8fd9d * using DSPContext - so each codec could use its local (sub)set of CPU extension
kabi
parents: 764
diff changeset
3808
859
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3809 dspfunc(put, 0, 16);
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3810 dspfunc(put_no_rnd, 0, 16);
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3811 dspfunc(put, 1, 8);
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3812 dspfunc(put_no_rnd, 1, 8);
1267
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
3813 dspfunc(put, 2, 4);
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
3814 dspfunc(put, 3, 2);
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
3815
859
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3816 dspfunc(avg, 0, 16);
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3817 dspfunc(avg_no_rnd, 0, 16);
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3818 dspfunc(avg, 1, 8);
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3819 dspfunc(avg_no_rnd, 1, 8);
1319
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
3820 dspfunc(avg, 2, 4);
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
3821 dspfunc(avg, 3, 2);
859
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3822 #undef dspfunc
857
b510a7b6decd 100l for kabi (fixing qpel)
michaelni
parents: 853
diff changeset
3823
1864
9a73e6dc5d68 fix motion compensation with (x+1/2,y+1/2) MVs
michael
parents: 1784
diff changeset
3824 c->put_no_rnd_pixels_l2[0]= put_no_rnd_pixels16_l2_c;
9a73e6dc5d68 fix motion compensation with (x+1/2,y+1/2) MVs
michael
parents: 1784
diff changeset
3825 c->put_no_rnd_pixels_l2[1]= put_no_rnd_pixels8_l2_c;
9a73e6dc5d68 fix motion compensation with (x+1/2,y+1/2) MVs
michael
parents: 1784
diff changeset
3826
1267
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
3827 c->put_tpel_pixels_tab[ 0] = put_tpel_pixels_mc00_c;
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
3828 c->put_tpel_pixels_tab[ 1] = put_tpel_pixels_mc10_c;
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
3829 c->put_tpel_pixels_tab[ 2] = put_tpel_pixels_mc20_c;
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
3830 c->put_tpel_pixels_tab[ 4] = put_tpel_pixels_mc01_c;
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
3831 c->put_tpel_pixels_tab[ 5] = put_tpel_pixels_mc11_c;
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
3832 c->put_tpel_pixels_tab[ 6] = put_tpel_pixels_mc21_c;
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
3833 c->put_tpel_pixels_tab[ 8] = put_tpel_pixels_mc02_c;
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
3834 c->put_tpel_pixels_tab[ 9] = put_tpel_pixels_mc12_c;
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
3835 c->put_tpel_pixels_tab[10] = put_tpel_pixels_mc22_c;
85b71f9f7450 moving the svq3 motion compensation stuff to dsputil (this also means that existing optimized halfpel code is used now ...)
michaelni
parents: 1264
diff changeset
3836
1319
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
3837 c->avg_tpel_pixels_tab[ 0] = avg_tpel_pixels_mc00_c;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
3838 c->avg_tpel_pixels_tab[ 1] = avg_tpel_pixels_mc10_c;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
3839 c->avg_tpel_pixels_tab[ 2] = avg_tpel_pixels_mc20_c;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
3840 c->avg_tpel_pixels_tab[ 4] = avg_tpel_pixels_mc01_c;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
3841 c->avg_tpel_pixels_tab[ 5] = avg_tpel_pixels_mc11_c;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
3842 c->avg_tpel_pixels_tab[ 6] = avg_tpel_pixels_mc21_c;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
3843 c->avg_tpel_pixels_tab[ 8] = avg_tpel_pixels_mc02_c;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
3844 c->avg_tpel_pixels_tab[ 9] = avg_tpel_pixels_mc12_c;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
3845 c->avg_tpel_pixels_tab[10] = avg_tpel_pixels_mc22_c;
449f6e32b425 added support for B-frames and multiple slices
tmmm
parents: 1273
diff changeset
3846
859
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3847 #define dspfunc(PFX, IDX, NUM) \
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3848 c->PFX ## _pixels_tab[IDX][ 0] = PFX ## NUM ## _mc00_c; \
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3849 c->PFX ## _pixels_tab[IDX][ 1] = PFX ## NUM ## _mc10_c; \
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3850 c->PFX ## _pixels_tab[IDX][ 2] = PFX ## NUM ## _mc20_c; \
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3851 c->PFX ## _pixels_tab[IDX][ 3] = PFX ## NUM ## _mc30_c; \
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3852 c->PFX ## _pixels_tab[IDX][ 4] = PFX ## NUM ## _mc01_c; \
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3853 c->PFX ## _pixels_tab[IDX][ 5] = PFX ## NUM ## _mc11_c; \
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3854 c->PFX ## _pixels_tab[IDX][ 6] = PFX ## NUM ## _mc21_c; \
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3855 c->PFX ## _pixels_tab[IDX][ 7] = PFX ## NUM ## _mc31_c; \
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3856 c->PFX ## _pixels_tab[IDX][ 8] = PFX ## NUM ## _mc02_c; \
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3857 c->PFX ## _pixels_tab[IDX][ 9] = PFX ## NUM ## _mc12_c; \
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3858 c->PFX ## _pixels_tab[IDX][10] = PFX ## NUM ## _mc22_c; \
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3859 c->PFX ## _pixels_tab[IDX][11] = PFX ## NUM ## _mc32_c; \
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3860 c->PFX ## _pixels_tab[IDX][12] = PFX ## NUM ## _mc03_c; \
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3861 c->PFX ## _pixels_tab[IDX][13] = PFX ## NUM ## _mc13_c; \
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3862 c->PFX ## _pixels_tab[IDX][14] = PFX ## NUM ## _mc23_c; \
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3863 c->PFX ## _pixels_tab[IDX][15] = PFX ## NUM ## _mc33_c
857
b510a7b6decd 100l for kabi (fixing qpel)
michaelni
parents: 853
diff changeset
3864
859
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3865 dspfunc(put_qpel, 0, 16);
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3866 dspfunc(put_no_rnd_qpel, 0, 16);
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3867
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3868 dspfunc(avg_qpel, 0, 16);
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3869 /* dspfunc(avg_no_rnd_qpel, 0, 16); */
857
b510a7b6decd 100l for kabi (fixing qpel)
michaelni
parents: 853
diff changeset
3870
859
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3871 dspfunc(put_qpel, 1, 8);
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3872 dspfunc(put_no_rnd_qpel, 1, 8);
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3873
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3874 dspfunc(avg_qpel, 1, 8);
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3875 /* dspfunc(avg_no_rnd_qpel, 1, 8); */
1168
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
3876
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
3877 dspfunc(put_h264_qpel, 0, 16);
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
3878 dspfunc(put_h264_qpel, 1, 8);
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
3879 dspfunc(put_h264_qpel, 2, 4);
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
3880 dspfunc(avg_h264_qpel, 0, 16);
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
3881 dspfunc(avg_h264_qpel, 1, 8);
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
3882 dspfunc(avg_h264_qpel, 2, 4);
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
3883
859
9512471dec40 * using macros to shorten init part
kabi
parents: 858
diff changeset
3884 #undef dspfunc
1168
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
3885 c->put_h264_chroma_pixels_tab[0]= put_h264_chroma_mc8_c;
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
3886 c->put_h264_chroma_pixels_tab[1]= put_h264_chroma_mc4_c;
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
3887 c->put_h264_chroma_pixels_tab[2]= put_h264_chroma_mc2_c;
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
3888 c->avg_h264_chroma_pixels_tab[0]= avg_h264_chroma_mc8_c;
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
3889 c->avg_h264_chroma_pixels_tab[1]= avg_h264_chroma_mc4_c;
5af9aeadbdc3 H264 decoder & demuxer
michaelni
parents: 1106
diff changeset
3890 c->avg_h264_chroma_pixels_tab[2]= avg_h264_chroma_mc2_c;
857
b510a7b6decd 100l for kabi (fixing qpel)
michaelni
parents: 853
diff changeset
3891
2415
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
3892 c->weight_h264_pixels_tab[0]= weight_h264_pixels16x16_c;
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
3893 c->weight_h264_pixels_tab[1]= weight_h264_pixels16x8_c;
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
3894 c->weight_h264_pixels_tab[2]= weight_h264_pixels8x16_c;
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
3895 c->weight_h264_pixels_tab[3]= weight_h264_pixels8x8_c;
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
3896 c->weight_h264_pixels_tab[4]= weight_h264_pixels8x4_c;
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
3897 c->weight_h264_pixels_tab[5]= weight_h264_pixels4x8_c;
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
3898 c->weight_h264_pixels_tab[6]= weight_h264_pixels4x4_c;
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
3899 c->weight_h264_pixels_tab[7]= weight_h264_pixels4x2_c;
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
3900 c->weight_h264_pixels_tab[8]= weight_h264_pixels2x4_c;
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
3901 c->weight_h264_pixels_tab[9]= weight_h264_pixels2x2_c;
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
3902 c->biweight_h264_pixels_tab[0]= biweight_h264_pixels16x16_c;
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
3903 c->biweight_h264_pixels_tab[1]= biweight_h264_pixels16x8_c;
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
3904 c->biweight_h264_pixels_tab[2]= biweight_h264_pixels8x16_c;
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
3905 c->biweight_h264_pixels_tab[3]= biweight_h264_pixels8x8_c;
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
3906 c->biweight_h264_pixels_tab[4]= biweight_h264_pixels8x4_c;
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
3907 c->biweight_h264_pixels_tab[5]= biweight_h264_pixels4x8_c;
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
3908 c->biweight_h264_pixels_tab[6]= biweight_h264_pixels4x4_c;
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
3909 c->biweight_h264_pixels_tab[7]= biweight_h264_pixels4x2_c;
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
3910 c->biweight_h264_pixels_tab[8]= biweight_h264_pixels2x4_c;
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
3911 c->biweight_h264_pixels_tab[9]= biweight_h264_pixels2x2_c;
db2cf6005d19 H.264 weighted prediction.
lorenm
parents: 2382
diff changeset
3912
936
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3913 c->put_mspel_pixels_tab[0]= put_mspel8_mc00_c;
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3914 c->put_mspel_pixels_tab[1]= put_mspel8_mc10_c;
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3915 c->put_mspel_pixels_tab[2]= put_mspel8_mc20_c;
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3916 c->put_mspel_pixels_tab[3]= put_mspel8_mc30_c;
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3917 c->put_mspel_pixels_tab[4]= put_mspel8_mc02_c;
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3918 c->put_mspel_pixels_tab[5]= put_mspel8_mc12_c;
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3919 c->put_mspel_pixels_tab[6]= put_mspel8_mc22_c;
caa77cd960c0 qpel encoding
michaelni
parents: 909
diff changeset
3920 c->put_mspel_pixels_tab[7]= put_mspel8_mc32_c;
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3921
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3922 #define SET_CMP_FUNC(name) \
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3923 c->name[0]= name ## 16_c;\
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3924 c->name[1]= name ## 8x8_c;
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3925
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3926 SET_CMP_FUNC(hadamard8_diff)
1729
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3927 c->hadamard8_diff[4]= hadamard8_intra16_c;
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3928 SET_CMP_FUNC(dct_sad)
2382
23e7af611c34 more flexible frame skip decission
michael
parents: 2272
diff changeset
3929 SET_CMP_FUNC(dct_max)
3010
533c6386eca9 8x8 integer dct from x264 as cmp function (under CONFIG_GPL)
michael
parents: 2979
diff changeset
3930 SET_CMP_FUNC(dct264_sad)
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3931 c->sad[0]= pix_abs16_c;
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3932 c->sad[1]= pix_abs8_c;
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3933 c->sse[0]= sse16_c;
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3934 c->sse[1]= sse8_c;
2184
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
3935 c->sse[2]= sse4_c;
1708
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3936 SET_CMP_FUNC(quant_psnr)
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3937 SET_CMP_FUNC(rd)
dea5b2946999 interlaced motion estimation
michael
parents: 1689
diff changeset
3938 SET_CMP_FUNC(bit)
1729
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3939 c->vsad[0]= vsad16_c;
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3940 c->vsad[4]= vsad_intra16_c;
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3941 c->vsse[0]= vsse16_c;
a4a5e7521339 interlaced dct decision cleanup
michael
parents: 1708
diff changeset
3942 c->vsse[4]= vsse_intra16_c;
2065
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3943 c->nsse[0]= nsse16_c;
9e4bebc39ade noise preserving sum of squares comparission function
michael
parents: 2045
diff changeset
3944 c->nsse[1]= nsse8_c;
2184
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
3945 c->w53[0]= w53_16_c;
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
3946 c->w53[1]= w53_8_c;
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
3947 c->w97[0]= w97_16_c;
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
3948 c->w97[1]= w97_8_c;
3378d0677903 4x4 SSE compare function
michael
parents: 2169
diff changeset
3949
866
725ef4ea3ecc huffyuv
michaelni
parents: 861
diff changeset
3950 c->add_bytes= add_bytes_c;
725ef4ea3ecc huffyuv
michaelni
parents: 861
diff changeset
3951 c->diff_bytes= diff_bytes_c;
1527
8ffd0c00e6df mmx2 optimization of huffyuv median encoding
michael
parents: 1329
diff changeset
3952 c->sub_hfyu_median_prediction= sub_hfyu_median_prediction_c;
1273
a979fab41ed8 ASV1 codec
michaelni
parents: 1267
diff changeset
3953 c->bswap_buf= bswap_buf;
2633
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
3954
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
3955 c->h264_v_loop_filter_luma= h264_v_loop_filter_luma_c;
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
3956 c->h264_h_loop_filter_luma= h264_h_loop_filter_luma_c;
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
3957 c->h264_v_loop_filter_chroma= h264_v_loop_filter_chroma_c;
72e6ffa1f3a5 MMX for H.264 deblocking filter
lorenm
parents: 2522
diff changeset
3958 c->h264_h_loop_filter_chroma= h264_h_loop_filter_chroma_c;
2707
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
3959 c->h264_v_loop_filter_chroma_intra= h264_v_loop_filter_chroma_intra_c;
360024d31dab H.264 deblocking optimizations (mmx for chroma_bS4 case, convert existing cases to 8-bit math)
lorenm
parents: 2696
diff changeset
3960 c->h264_h_loop_filter_chroma_intra= h264_h_loop_filter_chroma_intra_c;
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3961
1644
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
3962 c->h263_h_loop_filter= h263_h_loop_filter_c;
835cf346975e h263 loop filter
michael
parents: 1598
diff changeset
3963 c->h263_v_loop_filter= h263_v_loop_filter_c;
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3964
2045
9447bbd8a7e9 rewrite h261 loop filter
michael
parents: 2044
diff changeset
3965 c->h261_loop_filter= h261_loop_filter_c;
2967
ef2149182f1c COSMETICS: Remove all trailing whitespace.
diego
parents: 2834
diff changeset
3966
1784
65f7bd09f37b quantizer noise shaping optimization
michael
parents: 1739
diff changeset
3967 c->try_8x8basis= try_8x8basis_c;
65f7bd09f37b quantizer noise shaping optimization
michael
parents: 1739
diff changeset
3968 c->add_8x8basis= add_8x8basis_c;
866
725ef4ea3ecc huffyuv
michaelni
parents: 861
diff changeset
3969
2
2e2c46c87460 fixed config for direct mplayer build compatibility
glantau
parents: 0
diff changeset
3970 #ifdef HAVE_MMX
1092
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3971 dsputil_init_mmx(c, avctx);
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
3972 #endif
62
4bfc845cdfea arm optimizations
glantau
parents: 50
diff changeset
3973 #ifdef ARCH_ARMV4L
1092
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3974 dsputil_init_armv4l(c, avctx);
62
4bfc845cdfea arm optimizations
glantau
parents: 50
diff changeset
3975 #endif
88
06f63b58d2a8 mlib merge
glantau
parents: 62
diff changeset
3976 #ifdef HAVE_MLIB
1092
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3977 dsputil_init_mlib(c, avctx);
88
06f63b58d2a8 mlib merge
glantau
parents: 62
diff changeset
3978 #endif
1959
55b7435c59b8 VIS optimized motion compensation code. by (David S. Miller <davem at redhat dot com>)
michael
parents: 1866
diff changeset
3979 #ifdef ARCH_SPARC
55b7435c59b8 VIS optimized motion compensation code. by (David S. Miller <davem at redhat dot com>)
michael
parents: 1866
diff changeset
3980 dsputil_init_vis(c,avctx);
55b7435c59b8 VIS optimized motion compensation code. by (David S. Miller <davem at redhat dot com>)
michael
parents: 1866
diff changeset
3981 #endif
214
73df666cacc7 Alpha optimizations by Falk Hueffner <falk.hueffner@student.uni-tuebingen.de>
nickols_k
parents: 209
diff changeset
3982 #ifdef ARCH_ALPHA
1092
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3983 dsputil_init_alpha(c, avctx);
214
73df666cacc7 Alpha optimizations by Falk Hueffner <falk.hueffner@student.uni-tuebingen.de>
nickols_k
parents: 209
diff changeset
3984 #endif
623
92e99e506920 first cut at altivec support on darwin patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 612
diff changeset
3985 #ifdef ARCH_POWERPC
1092
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3986 dsputil_init_ppc(c, avctx);
626
23a093d6e450 patch by Heliodoro Tammaro <helio at interactives dot org>
michaelni
parents: 625
diff changeset
3987 #endif
689
efcbfbd18864 ps2 idct patch by (Leon van Stuivenberg <leonvs at iae dot nl>)
michaelni
parents: 676
diff changeset
3988 #ifdef HAVE_MMI
1092
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3989 dsputil_init_mmi(c, avctx);
689
efcbfbd18864 ps2 idct patch by (Leon van Stuivenberg <leonvs at iae dot nl>)
michaelni
parents: 676
diff changeset
3990 #endif
1259
e8c3884f2c7e sh4 optimized idct & bswap patch by (BERO <bero at geocities dot co dot jp>)
michaelni
parents: 1201
diff changeset
3991 #ifdef ARCH_SH4
e8c3884f2c7e sh4 optimized idct & bswap patch by (BERO <bero at geocities dot co dot jp>)
michaelni
parents: 1201
diff changeset
3992 dsputil_init_sh4(c,avctx);
e8c3884f2c7e sh4 optimized idct & bswap patch by (BERO <bero at geocities dot co dot jp>)
michaelni
parents: 1201
diff changeset
3993 #endif
1092
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3994
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3995 switch(c->idct_permutation_type){
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3996 case FF_NO_IDCT_PERM:
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3997 for(i=0; i<64; i++)
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3998 c->idct_permutation[i]= i;
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
3999 break;
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
4000 case FF_LIBMPEG2_IDCT_PERM:
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
4001 for(i=0; i<64; i++)
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
4002 c->idct_permutation[i]= (i & 0x38) | ((i & 6) >> 1) | ((i & 1) << 2);
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
4003 break;
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
4004 case FF_SIMPLE_IDCT_PERM:
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
4005 for(i=0; i<64; i++)
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
4006 c->idct_permutation[i]= simple_mmx_permutation[i];
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
4007 break;
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
4008 case FF_TRANSPOSE_IDCT_PERM:
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
4009 for(i=0; i<64; i++)
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
4010 c->idct_permutation[i]= ((i&7)<<3) | (i>>3);
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
4011 break;
2696
9699d325049d porting the mmx&sse2 (sse2 untested) vp3 idcts to the lavc idct API
michael
parents: 2693
diff changeset
4012 case FF_PARTTRANS_IDCT_PERM:
9699d325049d porting the mmx&sse2 (sse2 untested) vp3 idcts to the lavc idct API
michael
parents: 2693
diff changeset
4013 for(i=0; i<64; i++)
9699d325049d porting the mmx&sse2 (sse2 untested) vp3 idcts to the lavc idct API
michael
parents: 2693
diff changeset
4014 c->idct_permutation[i]= (i&0x24) | ((i&3)<<3) | ((i>>3)&3);
9699d325049d porting the mmx&sse2 (sse2 untested) vp3 idcts to the lavc idct API
michael
parents: 2693
diff changeset
4015 break;
1092
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
4016 default:
1598
932d306bf1dc av_log() patch by (Michel Bardiaux <mbardiaux at peaktime dot be>)
michael
parents: 1571
diff changeset
4017 av_log(avctx, AV_LOG_ERROR, "Internal error, IDCT permutation not set\n");
1092
f59c3f66363b MpegEncContext.(i)dct_* -> DspContext.(i)dct_*
michaelni
parents: 1064
diff changeset
4018 }
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
4019 }
252
ddb1a0e94cf4 - Added PSNR feature to libavcodec and ffmpeg. By now just Y PSNR until I'm
pulento
parents: 220
diff changeset
4020