annotate imgresample.c @ 1157:57fe9c4e0c6e libavcodec

fixing clipping of C deinterlacers; 5 tap lowpass deinterlacer
author michaelni
date Sat, 29 Mar 2003 13:31:12 +0000
parents 1e39f273ecd6
children 766a2f4edbea
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
1 /*
986e461dc072 Initial revision
glantau
parents:
diff changeset
2 * High quality image resampling with polyphase filters
429
718a22dc121f license/copyright change
glantau
parents: 412
diff changeset
3 * Copyright (c) 2001 Fabrice Bellard.
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
4 *
429
718a22dc121f license/copyright change
glantau
parents: 412
diff changeset
5 * This library is free software; you can redistribute it and/or
718a22dc121f license/copyright change
glantau
parents: 412
diff changeset
6 * modify it under the terms of the GNU Lesser General Public
718a22dc121f license/copyright change
glantau
parents: 412
diff changeset
7 * License as published by the Free Software Foundation; either
718a22dc121f license/copyright change
glantau
parents: 412
diff changeset
8 * version 2 of the License, or (at your option) any later version.
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
9 *
429
718a22dc121f license/copyright change
glantau
parents: 412
diff changeset
10 * This library is distributed in the hope that it will be useful,
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
429
718a22dc121f license/copyright change
glantau
parents: 412
diff changeset
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
718a22dc121f license/copyright change
glantau
parents: 412
diff changeset
13 * Lesser General Public License for more details.
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
14 *
429
718a22dc121f license/copyright change
glantau
parents: 412
diff changeset
15 * You should have received a copy of the GNU Lesser General Public
718a22dc121f license/copyright change
glantau
parents: 412
diff changeset
16 * License along with this library; if not, write to the Free Software
718a22dc121f license/copyright change
glantau
parents: 412
diff changeset
17 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
18 */
1106
1e39f273ecd6 per file doxy
michaelni
parents: 1064
diff changeset
19
1e39f273ecd6 per file doxy
michaelni
parents: 1064
diff changeset
20 /**
1e39f273ecd6 per file doxy
michaelni
parents: 1064
diff changeset
21 * @file imgresample.c
1e39f273ecd6 per file doxy
michaelni
parents: 1064
diff changeset
22 * High quality image resampling with polyphase filters.
1e39f273ecd6 per file doxy
michaelni
parents: 1064
diff changeset
23 */
1e39f273ecd6 per file doxy
michaelni
parents: 1064
diff changeset
24
396
fce0a2520551 removed useless header includes - use av memory functions
glantau
parents: 18
diff changeset
25 #include "avcodec.h"
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
26 #include "dsputil.h"
986e461dc072 Initial revision
glantau
parents:
diff changeset
27
17
b69fe46fd708 Adding fastmemcpy stuff to speedup mplayer project
nickols_k
parents: 2
diff changeset
28 #ifdef USE_FASTMEMCPY
b69fe46fd708 Adding fastmemcpy stuff to speedup mplayer project
nickols_k
parents: 2
diff changeset
29 #include "fastmemcpy.h"
b69fe46fd708 Adding fastmemcpy stuff to speedup mplayer project
nickols_k
parents: 2
diff changeset
30 #endif
b69fe46fd708 Adding fastmemcpy stuff to speedup mplayer project
nickols_k
parents: 2
diff changeset
31
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
/* NOTE(review): not referenced by the code visible in this part of the file;
   presumably the number of image planes per picture - confirm. */
#define NB_COMPONENTS 3

/* A source position selects one of NB_PHASES filters: get_phase() keeps the
   top PHASE_BITS bits of the fractional part of the position. */
#define PHASE_BITS 4
#define NB_PHASES (1 << PHASE_BITS)
/* Number of coefficients in each per-phase filter (and of source samples
   combined into one output sample). */
#define NB_TAPS 4
#define FCENTER 1 /* index of the center of the filter */
/* When TEST is defined, h_resample_fast() aborts if a source position falls
   outside [0, src_width - NB_TAPS]. */
//#define TEST 1 /* Test it */

/* Source positions are fixed point: the integer sample index is
   pos >> POS_FRAC_BITS, the low POS_FRAC_BITS bits are the fraction. */
#define POS_FRAC_BITS 16
#define POS_FRAC (1 << POS_FRAC_BITS)
/* 6 bits precision is needed for MMX */
/* Filtered sums are shifted right by FILTER_BITS before being clamped.
   NOTE(review): the comment above mentions 6 bits while the value is 8 -
   confirm which one the MMX paths are meant to run with. */
#define FILTER_BITS 8

/* NOTE(review): not used in the code visible here; presumably the number of
   rows kept in ImgReSampleContext.line_buf - confirm. */
#define LINE_BUF_HEIGHT (NB_TAPS * 4)
986e461dc072 Initial revision
glantau
parents:
diff changeset
46
986e461dc072 Initial revision
glantau
parents:
diff changeset
47 struct ImgReSampleContext {
630
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
48 int iwidth, iheight, owidth, oheight, topBand, bottomBand, leftBand, rightBand;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
49 int h_incr, v_incr;
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
50 int16_t h_filters[NB_PHASES][NB_TAPS] __align8; /* horizontal filters */
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
51 int16_t v_filters[NB_PHASES][NB_TAPS] __align8; /* vertical filters */
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
52 uint8_t *line_buf;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
53 };
986e461dc072 Initial revision
glantau
parents:
diff changeset
54
986e461dc072 Initial revision
glantau
parents:
diff changeset
55 static inline int get_phase(int pos)
986e461dc072 Initial revision
glantau
parents:
diff changeset
56 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
57 return ((pos) >> (POS_FRAC_BITS - PHASE_BITS)) & ((1 << PHASE_BITS) - 1);
986e461dc072 Initial revision
glantau
parents:
diff changeset
58 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
59
986e461dc072 Initial revision
glantau
parents:
diff changeset
60 /* This function must be optimized */
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
61 static void h_resample_fast(uint8_t *dst, int dst_width, uint8_t *src, int src_width,
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
62 int src_start, int src_incr, int16_t *filters)
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
63 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
64 int src_pos, phase, sum, i;
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
65 uint8_t *s;
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
66 int16_t *filter;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
67
986e461dc072 Initial revision
glantau
parents:
diff changeset
68 src_pos = src_start;
986e461dc072 Initial revision
glantau
parents:
diff changeset
69 for(i=0;i<dst_width;i++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
70 #ifdef TEST
986e461dc072 Initial revision
glantau
parents:
diff changeset
71 /* test */
986e461dc072 Initial revision
glantau
parents:
diff changeset
72 if ((src_pos >> POS_FRAC_BITS) < 0 ||
986e461dc072 Initial revision
glantau
parents:
diff changeset
73 (src_pos >> POS_FRAC_BITS) > (src_width - NB_TAPS))
653
714795876872 Change abort() calls to av_abort() calls.
philipjsg
parents: 644
diff changeset
74 av_abort();
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
75 #endif
986e461dc072 Initial revision
glantau
parents:
diff changeset
76 s = src + (src_pos >> POS_FRAC_BITS);
986e461dc072 Initial revision
glantau
parents:
diff changeset
77 phase = get_phase(src_pos);
986e461dc072 Initial revision
glantau
parents:
diff changeset
78 filter = filters + phase * NB_TAPS;
986e461dc072 Initial revision
glantau
parents:
diff changeset
79 #if NB_TAPS == 4
986e461dc072 Initial revision
glantau
parents:
diff changeset
80 sum = s[0] * filter[0] +
986e461dc072 Initial revision
glantau
parents:
diff changeset
81 s[1] * filter[1] +
986e461dc072 Initial revision
glantau
parents:
diff changeset
82 s[2] * filter[2] +
986e461dc072 Initial revision
glantau
parents:
diff changeset
83 s[3] * filter[3];
986e461dc072 Initial revision
glantau
parents:
diff changeset
84 #else
986e461dc072 Initial revision
glantau
parents:
diff changeset
85 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
86 int j;
986e461dc072 Initial revision
glantau
parents:
diff changeset
87 sum = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
88 for(j=0;j<NB_TAPS;j++)
986e461dc072 Initial revision
glantau
parents:
diff changeset
89 sum += s[j] * filter[j];
986e461dc072 Initial revision
glantau
parents:
diff changeset
90 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
91 #endif
986e461dc072 Initial revision
glantau
parents:
diff changeset
92 sum = sum >> FILTER_BITS;
986e461dc072 Initial revision
glantau
parents:
diff changeset
93 if (sum < 0)
986e461dc072 Initial revision
glantau
parents:
diff changeset
94 sum = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
95 else if (sum > 255)
986e461dc072 Initial revision
glantau
parents:
diff changeset
96 sum = 255;
986e461dc072 Initial revision
glantau
parents:
diff changeset
97 dst[0] = sum;
986e461dc072 Initial revision
glantau
parents:
diff changeset
98 src_pos += src_incr;
986e461dc072 Initial revision
glantau
parents:
diff changeset
99 dst++;
986e461dc072 Initial revision
glantau
parents:
diff changeset
100 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
101 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
102
986e461dc072 Initial revision
glantau
parents:
diff changeset
103 /* This function must be optimized */
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
104 static void v_resample(uint8_t *dst, int dst_width, uint8_t *src, int wrap,
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
105 int16_t *filter)
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
106 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
107 int sum, i;
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
108 uint8_t *s;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
109
986e461dc072 Initial revision
glantau
parents:
diff changeset
110 s = src;
986e461dc072 Initial revision
glantau
parents:
diff changeset
111 for(i=0;i<dst_width;i++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
112 #if NB_TAPS == 4
986e461dc072 Initial revision
glantau
parents:
diff changeset
113 sum = s[0 * wrap] * filter[0] +
986e461dc072 Initial revision
glantau
parents:
diff changeset
114 s[1 * wrap] * filter[1] +
986e461dc072 Initial revision
glantau
parents:
diff changeset
115 s[2 * wrap] * filter[2] +
986e461dc072 Initial revision
glantau
parents:
diff changeset
116 s[3 * wrap] * filter[3];
986e461dc072 Initial revision
glantau
parents:
diff changeset
117 #else
986e461dc072 Initial revision
glantau
parents:
diff changeset
118 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
119 int j;
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
120 uint8_t *s1 = s;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
121
986e461dc072 Initial revision
glantau
parents:
diff changeset
122 sum = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
123 for(j=0;j<NB_TAPS;j++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
124 sum += s1[0] * filter[j];
986e461dc072 Initial revision
glantau
parents:
diff changeset
125 s1 += wrap;
986e461dc072 Initial revision
glantau
parents:
diff changeset
126 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
127 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
128 #endif
986e461dc072 Initial revision
glantau
parents:
diff changeset
129 sum = sum >> FILTER_BITS;
986e461dc072 Initial revision
glantau
parents:
diff changeset
130 if (sum < 0)
986e461dc072 Initial revision
glantau
parents:
diff changeset
131 sum = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
132 else if (sum > 255)
986e461dc072 Initial revision
glantau
parents:
diff changeset
133 sum = 255;
986e461dc072 Initial revision
glantau
parents:
diff changeset
134 dst[0] = sum;
986e461dc072 Initial revision
glantau
parents:
diff changeset
135 dst++;
986e461dc072 Initial revision
glantau
parents:
diff changeset
136 s++;
986e461dc072 Initial revision
glantau
parents:
diff changeset
137 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
138 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
139
2
2e2c46c87460 fixed config for direct mplayer build compatibility
glantau
parents: 0
diff changeset
140 #ifdef HAVE_MMX
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
141
986e461dc072 Initial revision
glantau
parents:
diff changeset
142 #include "i386/mmx.h"
986e461dc072 Initial revision
glantau
parents:
diff changeset
143
986e461dc072 Initial revision
glantau
parents:
diff changeset
/*
 * FILTER4(reg): compute one horizontally filtered sample into MMX register
 * `reg` and advance src_pos by src_incr.
 *
 * The macro is not self-contained: it assigns the caller's locals s, phase,
 * filter and src_pos, reads src, filters and src_incr, overwrites mm6, and
 * uses mm7 as the zero operand for unpacking (the caller clears mm7 with
 * pxor before the first use). On exit the low 32 bits of `reg` hold the
 * filtered sum already shifted right by FILTER_BITS but not yet clamped;
 * the upper 32 bits hold a leftover partial sum.
 *
 * NOTE(review): movq loads 8 bytes from s although only the low 4 are
 * unpacked, so up to 4 bytes past the last tap are read - confirm the
 * source buffer is padded accordingly.
 */
#define FILTER4(reg) \
{\
    s = src + (src_pos >> POS_FRAC_BITS);\
    phase = get_phase(src_pos);\
    filter = filters + phase * NB_TAPS;\
    movq_m2r(*s, reg);             /* load 8 source bytes */\
    punpcklbw_r2r(mm7, reg);       /* widen the low 4 bytes to 16-bit words */\
    movq_m2r(*filter, mm6);        /* load the 4 coefficients of this phase */\
    pmaddwd_r2r(reg, mm6);         /* mm6 = two 32-bit sums of adjacent products */\
    movq_r2r(mm6, reg);\
    psrlq_i2r(32, reg);            /* bring the upper partial sum down */\
    paddd_r2r(mm6, reg);           /* low dword = sum of all 4 products */\
    psrad_i2r(FILTER_BITS, reg);   /* drop the coefficient scaling */\
    src_pos += src_incr;\
}
986e461dc072 Initial revision
glantau
parents:
diff changeset
159
986e461dc072 Initial revision
glantau
parents:
diff changeset
/*
 * Debug helper: store MMX register `reg` into the caller's local `tmp` and
 * print its 64-bit contents as 16 hex digits, prefixed with the register
 * name. Requires a local `mmx_t tmp` in the calling scope.
 *
 * The value is printed with %llx and an explicit cast because the `L`
 * length modifier is only defined for floating-point conversions in
 * standard C. The body is braced, like FILTER4, so the macro expands to a
 * single statement and stays intact under an unbraced if.
 */
#define DUMP(reg) \
{\
    movq_r2m(reg, tmp);\
    printf(#reg "=%016llx\n", (unsigned long long)tmp.uq);\
}
986e461dc072 Initial revision
glantau
parents:
diff changeset
161
986e461dc072 Initial revision
glantau
parents:
diff changeset
/* XXX: do four pixels at a time */
/**
 * Horizontally resample one line using MMX, for 4-tap filters.
 *
 * Same arguments as h_resample_fast(). Each output sample is produced by
 * one FILTER4() expansion, which also advances src_pos; the locals s, phase
 * and filter exist because FILTER4 assigns them by name. The main loop
 * emits four samples per iteration and the second loop handles the
 * remaining 0..3 samples.
 *
 * @param dst        output line, dst_width bytes are written
 * @param dst_width  number of output samples
 * @param src        source line
 * @param src_width  not used by this function
 * @param src_start  initial position (POS_FRAC_BITS fractional bits)
 * @param src_incr   position step per output sample
 * @param filters    filter bank, NB_TAPS coefficients per phase
 */
static void h_resample_fast4_mmx(uint8_t *dst, int dst_width, uint8_t *src, int src_width,
                                 int src_start, int src_incr, int16_t *filters)
{
    int src_pos, phase;
    uint8_t *s;
    int16_t *filter;
    mmx_t tmp;

    src_pos = src_start;
    pxor_r2r(mm7, mm7); /* mm7 = 0, the zero operand used by FILTER4 and the packs */

    while (dst_width >= 4) {

        FILTER4(mm0);
        FILTER4(mm1);
        FILTER4(mm2);
        FILTER4(mm3);

        /* Saturate each result to 0..255; the clamped sample ends up in
           byte 0 of the register. packuswb works on signed 16-bit words,
           so this relies on the shifted sum fitting in 16 bits. */
        packuswb_r2r(mm7, mm0);
        packuswb_r2r(mm7, mm1);
        packuswb_r2r(mm7, mm3);
        packuswb_r2r(mm7, mm2);
        /* Spill each register to memory and keep only its lowest byte. */
        movq_r2m(mm0, tmp);
        dst[0] = tmp.ub[0];
        movq_r2m(mm1, tmp);
        dst[1] = tmp.ub[0];
        movq_r2m(mm2, tmp);
        dst[2] = tmp.ub[0];
        movq_r2m(mm3, tmp);
        dst[3] = tmp.ub[0];
        dst += 4;
        dst_width -= 4;
    }
    /* Remaining samples, one at a time. */
    while (dst_width > 0) {
        FILTER4(mm0);
        packuswb_r2r(mm7, mm0);
        movq_r2m(mm0, tmp);
        dst[0] = tmp.ub[0];
        dst++;
        dst_width--;
    }
    emms(); /* leave MMX state so that floating-point code can run afterwards */
}
986e461dc072 Initial revision
glantau
parents:
diff changeset
206
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
/**
 * Vertically filter four source lines into one output line using MMX.
 *
 * Same arguments as v_resample(). Four output samples are produced per
 * iteration of the main loop; the remaining 0..3 samples are computed with
 * the same scalar code as v_resample().
 *
 * NOTE(review): pmullw keeps only the low 16 bits of each product and paddw
 * wraps, so the sum is only correct while it fits in a signed 16-bit word.
 * With 8-bit samples and FILTER_BITS == 8 that range can be exceeded, which
 * is presumably what the "6 bits precision is needed for MMX" remark next
 * to FILTER_BITS refers to - confirm how callers guard this path.
 *
 * NOTE(review): each movq reads 8 bytes per row although only 4 are used,
 * and the result is stored through a uint32_t cast of dst (no alignment
 * guarantee is visible here) - confirm buffer padding and alignment.
 *
 * @param dst        output line, dst_width bytes are written
 * @param dst_width  number of output samples
 * @param src        first of the four source lines
 * @param wrap       distance in bytes between consecutive source lines
 * @param filter     the four coefficients to apply
 */
static void v_resample4_mmx(uint8_t *dst, int dst_width, uint8_t *src, int wrap,
                            int16_t *filter)
{
    int sum, i, v;
    uint8_t *s;
    mmx_t tmp;
    mmx_t coefs[4];

    /* Replicate each coefficient into all four 16-bit lanes. */
    for(i=0;i<4;i++) {
        v = filter[i];
        coefs[i].uw[0] = v;
        coefs[i].uw[1] = v;
        coefs[i].uw[2] = v;
        coefs[i].uw[3] = v;
    }

    pxor_r2r(mm7, mm7); /* mm7 = 0, used for unpacking and packing */
    s = src;
    while (dst_width >= 4) {
        /* Load one row per register and widen its low 4 bytes to words. */
        movq_m2r(s[0 * wrap], mm0);
        punpcklbw_r2r(mm7, mm0);
        movq_m2r(s[1 * wrap], mm1);
        punpcklbw_r2r(mm7, mm1);
        movq_m2r(s[2 * wrap], mm2);
        punpcklbw_r2r(mm7, mm2);
        movq_m2r(s[3 * wrap], mm3);
        punpcklbw_r2r(mm7, mm3);

        /* Weight each row (low 16 bits of the products only). */
        pmullw_m2r(coefs[0], mm0);
        pmullw_m2r(coefs[1], mm1);
        pmullw_m2r(coefs[2], mm2);
        pmullw_m2r(coefs[3], mm3);

        /* Sum the four rows into mm0 and drop the coefficient scaling. */
        paddw_r2r(mm1, mm0);
        paddw_r2r(mm3, mm2);
        paddw_r2r(mm2, mm0);
        psraw_i2r(FILTER_BITS, mm0);

        /* Saturate the four words to bytes in the low half of mm0. */
        packuswb_r2r(mm7, mm0);
        movq_r2m(mm0, tmp);

        /* Store the four result bytes at once. */
        *(uint32_t *)dst = tmp.ud[0];
        dst += 4;
        s += 4;
        dst_width -= 4;
    }
    /* Scalar tail for the last 0..3 samples. */
    while (dst_width > 0) {
        sum = s[0 * wrap] * filter[0] +
            s[1 * wrap] * filter[1] +
            s[2 * wrap] * filter[2] +
            s[3 * wrap] * filter[3];
        sum = sum >> FILTER_BITS;
        if (sum < 0)
            sum = 0;
        else if (sum > 255)
            sum = 255;
        dst[0] = sum;
        dst++;
        s++;
        dst_width--;
    }
    emms(); /* leave MMX state so that floating-point code can run afterwards */
}
986e461dc072 Initial revision
glantau
parents:
diff changeset
270 #endif
986e461dc072 Initial revision
glantau
parents:
diff changeset
271
894
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
272 #ifdef HAVE_ALTIVEC
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
/* Overlays an AltiVec vector of unsigned chars with a plain 16-element
   array so that individual elements can be accessed from scalar code. */
typedef union {
    vector unsigned char v;
    unsigned char c[16];
} vec_uc_t;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
277
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
/* Overlays an AltiVec vector of signed shorts with a plain 8-element array;
   v_resample16_altivec() writes element 0 through s[] and then splats it
   across the vector through v. */
typedef union {
    vector signed short v;
    signed short s[8];
} vec_ss_t;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
282
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
283 void v_resample16_altivec(uint8_t *dst, int dst_width, uint8_t *src, int wrap,
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
284 int16_t *filter)
894
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
285 {
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
286 int sum, i;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
287 uint8_t *s;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
288 vector unsigned char *tv, tmp, dstv, zero;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
289 vec_ss_t srchv[4], srclv[4], fv[4];
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
290 vector signed short zeros, sumhv, sumlv;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
291 s = src;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
292
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
293 for(i=0;i<4;i++)
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
294 {
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
295 /*
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
296 The vec_madds later on does an implicit >>15 on the result.
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
297 Since FILTER_BITS is 8, and we have 15 bits of magnitude in
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
298 a signed short, we have just enough bits to pre-shift our
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
299 filter constants <<7 to compensate for vec_madds.
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
300 */
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
301 fv[i].s[0] = filter[i] << (15-FILTER_BITS);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
302 fv[i].v = vec_splat(fv[i].v, 0);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
303 }
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
304
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
305 zero = vec_splat_u8(0);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
306 zeros = vec_splat_s16(0);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
307
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
308
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
309 /*
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
310 When we're resampling, we'd ideally like both our input buffers,
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
311 and output buffers to be 16-byte aligned, so we can do both aligned
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
312 reads and writes. Sadly we can't always have this at the moment, so
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
313 we opt for aligned writes, as unaligned writes have a huge overhead.
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
314 To do this, do enough scalar resamples to get dst 16-byte aligned.
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
315 */
898
6d5e3fe7aea1 Simplify an expression and eliminate a compile warning
philipjsg
parents: 894
diff changeset
316 i = (-(int)dst) & 0xf;
894
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
317 while(i>0) {
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
318 sum = s[0 * wrap] * filter[0] +
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
319 s[1 * wrap] * filter[1] +
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
320 s[2 * wrap] * filter[2] +
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
321 s[3 * wrap] * filter[3];
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
322 sum = sum >> FILTER_BITS;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
323 if (sum<0) sum = 0; else if (sum>255) sum=255;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
324 dst[0] = sum;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
325 dst++;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
326 s++;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
327 dst_width--;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
328 i--;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
329 }
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
330
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
331 /* Do our altivec resampling on 16 pixels at once. */
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
332 while(dst_width>=16) {
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
333 /*
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
334 Read 16 (potentially unaligned) bytes from each of
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
335 4 lines into 4 vectors, and split them into shorts.
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
336 Interleave the multiply/accumulate for the resample
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
337 filter with the loads to hide the 3 cycle latency
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
338 the vec_madds have.
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
339 */
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
340 tv = (vector unsigned char *) &s[0 * wrap];
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
341 tmp = vec_perm(tv[0], tv[1], vec_lvsl(0, &s[i * wrap]));
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
342 srchv[0].v = (vector signed short) vec_mergeh(zero, tmp);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
343 srclv[0].v = (vector signed short) vec_mergel(zero, tmp);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
344 sumhv = vec_madds(srchv[0].v, fv[0].v, zeros);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
345 sumlv = vec_madds(srclv[0].v, fv[0].v, zeros);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
346
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
347 tv = (vector unsigned char *) &s[1 * wrap];
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
348 tmp = vec_perm(tv[0], tv[1], vec_lvsl(0, &s[1 * wrap]));
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
349 srchv[1].v = (vector signed short) vec_mergeh(zero, tmp);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
350 srclv[1].v = (vector signed short) vec_mergel(zero, tmp);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
351 sumhv = vec_madds(srchv[1].v, fv[1].v, sumhv);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
352 sumlv = vec_madds(srclv[1].v, fv[1].v, sumlv);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
353
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
354 tv = (vector unsigned char *) &s[2 * wrap];
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
355 tmp = vec_perm(tv[0], tv[1], vec_lvsl(0, &s[2 * wrap]));
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
356 srchv[2].v = (vector signed short) vec_mergeh(zero, tmp);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
357 srclv[2].v = (vector signed short) vec_mergel(zero, tmp);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
358 sumhv = vec_madds(srchv[2].v, fv[2].v, sumhv);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
359 sumlv = vec_madds(srclv[2].v, fv[2].v, sumlv);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
360
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
361 tv = (vector unsigned char *) &s[3 * wrap];
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
362 tmp = vec_perm(tv[0], tv[1], vec_lvsl(0, &s[3 * wrap]));
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
363 srchv[3].v = (vector signed short) vec_mergeh(zero, tmp);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
364 srclv[3].v = (vector signed short) vec_mergel(zero, tmp);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
365 sumhv = vec_madds(srchv[3].v, fv[3].v, sumhv);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
366 sumlv = vec_madds(srclv[3].v, fv[3].v, sumlv);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
367
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
368 /*
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
369 Pack the results into our destination vector,
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
370 and do an aligned write of that back to memory.
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
371 */
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
372 dstv = vec_packsu(sumhv, sumlv) ;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
373 vec_st(dstv, 0, (vector unsigned char *) dst);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
374
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
375 dst+=16;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
376 s+=16;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
377 dst_width-=16;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
378 }
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
379
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
380 /*
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
381 If there are any leftover pixels, resample them
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
382 with the slow scalar method.
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
383 */
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
384 while(dst_width>0) {
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
385 sum = s[0 * wrap] * filter[0] +
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
386 s[1 * wrap] * filter[1] +
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
387 s[2 * wrap] * filter[2] +
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
388 s[3 * wrap] * filter[3];
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
389 sum = sum >> FILTER_BITS;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
390 if (sum<0) sum = 0; else if (sum>255) sum=255;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
391 dst[0] = sum;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
392 dst++;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
393 s++;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
394 dst_width--;
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
395 }
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
396 }
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
397 #endif
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
398
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
399 /* slow version to handle limit cases. Does not need optimisation */
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
400 static void h_resample_slow(uint8_t *dst, int dst_width, uint8_t *src, int src_width,
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
401 int src_start, int src_incr, int16_t *filters)
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
402 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
403 int src_pos, phase, sum, j, v, i;
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
404 uint8_t *s, *src_end;
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
405 int16_t *filter;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
406
986e461dc072 Initial revision
glantau
parents:
diff changeset
407 src_end = src + src_width;
986e461dc072 Initial revision
glantau
parents:
diff changeset
408 src_pos = src_start;
986e461dc072 Initial revision
glantau
parents:
diff changeset
409 for(i=0;i<dst_width;i++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
410 s = src + (src_pos >> POS_FRAC_BITS);
986e461dc072 Initial revision
glantau
parents:
diff changeset
411 phase = get_phase(src_pos);
986e461dc072 Initial revision
glantau
parents:
diff changeset
412 filter = filters + phase * NB_TAPS;
986e461dc072 Initial revision
glantau
parents:
diff changeset
413 sum = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
414 for(j=0;j<NB_TAPS;j++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
415 if (s < src)
986e461dc072 Initial revision
glantau
parents:
diff changeset
416 v = src[0];
986e461dc072 Initial revision
glantau
parents:
diff changeset
417 else if (s >= src_end)
986e461dc072 Initial revision
glantau
parents:
diff changeset
418 v = src_end[-1];
986e461dc072 Initial revision
glantau
parents:
diff changeset
419 else
986e461dc072 Initial revision
glantau
parents:
diff changeset
420 v = s[0];
986e461dc072 Initial revision
glantau
parents:
diff changeset
421 sum += v * filter[j];
986e461dc072 Initial revision
glantau
parents:
diff changeset
422 s++;
986e461dc072 Initial revision
glantau
parents:
diff changeset
423 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
424 sum = sum >> FILTER_BITS;
986e461dc072 Initial revision
glantau
parents:
diff changeset
425 if (sum < 0)
986e461dc072 Initial revision
glantau
parents:
diff changeset
426 sum = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
427 else if (sum > 255)
986e461dc072 Initial revision
glantau
parents:
diff changeset
428 sum = 255;
986e461dc072 Initial revision
glantau
parents:
diff changeset
429 dst[0] = sum;
986e461dc072 Initial revision
glantau
parents:
diff changeset
430 src_pos += src_incr;
986e461dc072 Initial revision
glantau
parents:
diff changeset
431 dst++;
986e461dc072 Initial revision
glantau
parents:
diff changeset
432 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
433 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
434
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
435 static void h_resample(uint8_t *dst, int dst_width, uint8_t *src, int src_width,
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
436 int src_start, int src_incr, int16_t *filters)
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
437 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
438 int n, src_end;
986e461dc072 Initial revision
glantau
parents:
diff changeset
439
986e461dc072 Initial revision
glantau
parents:
diff changeset
440 if (src_start < 0) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
441 n = (0 - src_start + src_incr - 1) / src_incr;
986e461dc072 Initial revision
glantau
parents:
diff changeset
442 h_resample_slow(dst, n, src, src_width, src_start, src_incr, filters);
986e461dc072 Initial revision
glantau
parents:
diff changeset
443 dst += n;
986e461dc072 Initial revision
glantau
parents:
diff changeset
444 dst_width -= n;
986e461dc072 Initial revision
glantau
parents:
diff changeset
445 src_start += n * src_incr;
986e461dc072 Initial revision
glantau
parents:
diff changeset
446 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
447 src_end = src_start + dst_width * src_incr;
986e461dc072 Initial revision
glantau
parents:
diff changeset
448 if (src_end > ((src_width - NB_TAPS) << POS_FRAC_BITS)) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
449 n = (((src_width - NB_TAPS + 1) << POS_FRAC_BITS) - 1 - src_start) /
986e461dc072 Initial revision
glantau
parents:
diff changeset
450 src_incr;
986e461dc072 Initial revision
glantau
parents:
diff changeset
451 } else {
986e461dc072 Initial revision
glantau
parents:
diff changeset
452 n = dst_width;
986e461dc072 Initial revision
glantau
parents:
diff changeset
453 }
2
2e2c46c87460 fixed config for direct mplayer build compatibility
glantau
parents: 0
diff changeset
454 #ifdef HAVE_MMX
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
455 if ((mm_flags & MM_MMX) && NB_TAPS == 4)
986e461dc072 Initial revision
glantau
parents:
diff changeset
456 h_resample_fast4_mmx(dst, n,
986e461dc072 Initial revision
glantau
parents:
diff changeset
457 src, src_width, src_start, src_incr, filters);
986e461dc072 Initial revision
glantau
parents:
diff changeset
458 else
986e461dc072 Initial revision
glantau
parents:
diff changeset
459 #endif
986e461dc072 Initial revision
glantau
parents:
diff changeset
460 h_resample_fast(dst, n,
986e461dc072 Initial revision
glantau
parents:
diff changeset
461 src, src_width, src_start, src_incr, filters);
986e461dc072 Initial revision
glantau
parents:
diff changeset
462 if (n < dst_width) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
463 dst += n;
986e461dc072 Initial revision
glantau
parents:
diff changeset
464 dst_width -= n;
986e461dc072 Initial revision
glantau
parents:
diff changeset
465 src_start += n * src_incr;
986e461dc072 Initial revision
glantau
parents:
diff changeset
466 h_resample_slow(dst, dst_width,
986e461dc072 Initial revision
glantau
parents:
diff changeset
467 src, src_width, src_start, src_incr, filters);
986e461dc072 Initial revision
glantau
parents:
diff changeset
468 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
469 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
470
986e461dc072 Initial revision
glantau
parents:
diff changeset
471 static void component_resample(ImgReSampleContext *s,
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
472 uint8_t *output, int owrap, int owidth, int oheight,
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
473 uint8_t *input, int iwrap, int iwidth, int iheight)
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
474 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
475 int src_y, src_y1, last_src_y, ring_y, phase_y, y1, y;
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
476 uint8_t *new_line, *src_line;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
477
986e461dc072 Initial revision
glantau
parents:
diff changeset
478 last_src_y = - FCENTER - 1;
986e461dc072 Initial revision
glantau
parents:
diff changeset
479 /* position of the bottom of the filter in the source image */
986e461dc072 Initial revision
glantau
parents:
diff changeset
480 src_y = (last_src_y + NB_TAPS) * POS_FRAC;
986e461dc072 Initial revision
glantau
parents:
diff changeset
481 ring_y = NB_TAPS; /* position in ring buffer */
986e461dc072 Initial revision
glantau
parents:
diff changeset
482 for(y=0;y<oheight;y++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
483 /* apply horizontal filter on new lines from input if needed */
986e461dc072 Initial revision
glantau
parents:
diff changeset
484 src_y1 = src_y >> POS_FRAC_BITS;
986e461dc072 Initial revision
glantau
parents:
diff changeset
485 while (last_src_y < src_y1) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
486 if (++ring_y >= LINE_BUF_HEIGHT + NB_TAPS)
986e461dc072 Initial revision
glantau
parents:
diff changeset
487 ring_y = NB_TAPS;
986e461dc072 Initial revision
glantau
parents:
diff changeset
488 last_src_y++;
630
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
489 /* handle limit conditions : replicate line (slightly
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
490 inefficient because we filter multiple times) */
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
491 y1 = last_src_y;
986e461dc072 Initial revision
glantau
parents:
diff changeset
492 if (y1 < 0) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
493 y1 = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
494 } else if (y1 >= iheight) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
495 y1 = iheight - 1;
986e461dc072 Initial revision
glantau
parents:
diff changeset
496 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
497 src_line = input + y1 * iwrap;
986e461dc072 Initial revision
glantau
parents:
diff changeset
498 new_line = s->line_buf + ring_y * owidth;
986e461dc072 Initial revision
glantau
parents:
diff changeset
499 /* apply filter and handle limit cases correctly */
986e461dc072 Initial revision
glantau
parents:
diff changeset
500 h_resample(new_line, owidth,
986e461dc072 Initial revision
glantau
parents:
diff changeset
501 src_line, iwidth, - FCENTER * POS_FRAC, s->h_incr,
986e461dc072 Initial revision
glantau
parents:
diff changeset
502 &s->h_filters[0][0]);
986e461dc072 Initial revision
glantau
parents:
diff changeset
503 /* handle ring buffer wraping */
986e461dc072 Initial revision
glantau
parents:
diff changeset
504 if (ring_y >= LINE_BUF_HEIGHT) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
505 memcpy(s->line_buf + (ring_y - LINE_BUF_HEIGHT) * owidth,
986e461dc072 Initial revision
glantau
parents:
diff changeset
506 new_line, owidth);
986e461dc072 Initial revision
glantau
parents:
diff changeset
507 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
508 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
509 /* apply vertical filter */
986e461dc072 Initial revision
glantau
parents:
diff changeset
510 phase_y = get_phase(src_y);
2
2e2c46c87460 fixed config for direct mplayer build compatibility
glantau
parents: 0
diff changeset
511 #ifdef HAVE_MMX
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
512 /* desactivated MMX because loss of precision */
986e461dc072 Initial revision
glantau
parents:
diff changeset
513 if ((mm_flags & MM_MMX) && NB_TAPS == 4 && 0)
986e461dc072 Initial revision
glantau
parents:
diff changeset
514 v_resample4_mmx(output, owidth,
986e461dc072 Initial revision
glantau
parents:
diff changeset
515 s->line_buf + (ring_y - NB_TAPS + 1) * owidth, owidth,
986e461dc072 Initial revision
glantau
parents:
diff changeset
516 &s->v_filters[phase_y][0]);
986e461dc072 Initial revision
glantau
parents:
diff changeset
517 else
986e461dc072 Initial revision
glantau
parents:
diff changeset
518 #endif
894
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
519 #ifdef HAVE_ALTIVEC
920
a0ad8e3452f2 practically disabling altivec resampling code (some ppl said its broken) patch by (Dieter Shirley <dieters at schemasoft dot com>)
michaelni
parents: 898
diff changeset
520 if ((mm_flags & MM_ALTIVEC) && NB_TAPS == 4 && FILTER_BITS <= 6)
894
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
521 v_resample16_altivec(output, owidth,
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
522 s->line_buf + (ring_y - NB_TAPS + 1) * owidth, owidth,
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
523 &s->v_filters[phase_y][0]);
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
524 else
a408778eff87 altivec accelerated v-resample patch by (Brian Foley <bfoley at compsoc dot nuigalway dot ie>)
michaelni
parents: 653
diff changeset
525 #endif
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
526 v_resample(output, owidth,
986e461dc072 Initial revision
glantau
parents:
diff changeset
527 s->line_buf + (ring_y - NB_TAPS + 1) * owidth, owidth,
986e461dc072 Initial revision
glantau
parents:
diff changeset
528 &s->v_filters[phase_y][0]);
986e461dc072 Initial revision
glantau
parents:
diff changeset
529
986e461dc072 Initial revision
glantau
parents:
diff changeset
530 src_y += s->v_incr;
986e461dc072 Initial revision
glantau
parents:
diff changeset
531 output += owrap;
986e461dc072 Initial revision
glantau
parents:
diff changeset
532 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
533 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
534
986e461dc072 Initial revision
glantau
parents:
diff changeset
535 /* XXX: the following filter is quite naive, but it seems to suffice
986e461dc072 Initial revision
glantau
parents:
diff changeset
536 for 4 taps */
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
537 static void build_filter(int16_t *filter, float factor)
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
538 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
539 int ph, i, v;
986e461dc072 Initial revision
glantau
parents:
diff changeset
540 float x, y, tab[NB_TAPS], norm, mult;
986e461dc072 Initial revision
glantau
parents:
diff changeset
541
986e461dc072 Initial revision
glantau
parents:
diff changeset
542 /* if upsampling, only need to interpolate, no filter */
986e461dc072 Initial revision
glantau
parents:
diff changeset
543 if (factor > 1.0)
986e461dc072 Initial revision
glantau
parents:
diff changeset
544 factor = 1.0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
545
986e461dc072 Initial revision
glantau
parents:
diff changeset
546 for(ph=0;ph<NB_PHASES;ph++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
547 norm = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
548 for(i=0;i<NB_TAPS;i++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
549
986e461dc072 Initial revision
glantau
parents:
diff changeset
550 x = M_PI * ((float)(i - FCENTER) - (float)ph / NB_PHASES) * factor;
986e461dc072 Initial revision
glantau
parents:
diff changeset
551 if (x == 0)
986e461dc072 Initial revision
glantau
parents:
diff changeset
552 y = 1.0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
553 else
986e461dc072 Initial revision
glantau
parents:
diff changeset
554 y = sin(x) / x;
986e461dc072 Initial revision
glantau
parents:
diff changeset
555 tab[i] = y;
986e461dc072 Initial revision
glantau
parents:
diff changeset
556 norm += y;
986e461dc072 Initial revision
glantau
parents:
diff changeset
557 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
558
986e461dc072 Initial revision
glantau
parents:
diff changeset
559 /* normalize so that an uniform color remains the same */
986e461dc072 Initial revision
glantau
parents:
diff changeset
560 mult = (float)(1 << FILTER_BITS) / norm;
986e461dc072 Initial revision
glantau
parents:
diff changeset
561 for(i=0;i<NB_TAPS;i++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
562 v = (int)(tab[i] * mult);
986e461dc072 Initial revision
glantau
parents:
diff changeset
563 filter[ph * NB_TAPS + i] = v;
986e461dc072 Initial revision
glantau
parents:
diff changeset
564 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
565 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
566 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
567
986e461dc072 Initial revision
glantau
parents:
diff changeset
568 ImgReSampleContext *img_resample_init(int owidth, int oheight,
986e461dc072 Initial revision
glantau
parents:
diff changeset
569 int iwidth, int iheight)
986e461dc072 Initial revision
glantau
parents:
diff changeset
570 {
630
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
571 return img_resample_full_init(owidth, oheight, iwidth, iheight, 0, 0, 0, 0);
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
572 }
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
573
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
574 ImgReSampleContext *img_resample_full_init(int owidth, int oheight,
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
575 int iwidth, int iheight,
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
576 int topBand, int bottomBand,
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
577 int leftBand, int rightBand)
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
578 {
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
579 ImgReSampleContext *s;
986e461dc072 Initial revision
glantau
parents:
diff changeset
580
986e461dc072 Initial revision
glantau
parents:
diff changeset
581 s = av_mallocz(sizeof(ImgReSampleContext));
986e461dc072 Initial revision
glantau
parents:
diff changeset
582 if (!s)
986e461dc072 Initial revision
glantau
parents:
diff changeset
583 return NULL;
986e461dc072 Initial revision
glantau
parents:
diff changeset
584 s->line_buf = av_mallocz(owidth * (LINE_BUF_HEIGHT + NB_TAPS));
986e461dc072 Initial revision
glantau
parents:
diff changeset
585 if (!s->line_buf)
986e461dc072 Initial revision
glantau
parents:
diff changeset
586 goto fail;
986e461dc072 Initial revision
glantau
parents:
diff changeset
587
986e461dc072 Initial revision
glantau
parents:
diff changeset
588 s->owidth = owidth;
986e461dc072 Initial revision
glantau
parents:
diff changeset
589 s->oheight = oheight;
986e461dc072 Initial revision
glantau
parents:
diff changeset
590 s->iwidth = iwidth;
986e461dc072 Initial revision
glantau
parents:
diff changeset
591 s->iheight = iheight;
630
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
592 s->topBand = topBand;
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
593 s->bottomBand = bottomBand;
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
594 s->leftBand = leftBand;
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
595 s->rightBand = rightBand;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
596
630
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
597 s->h_incr = ((iwidth - leftBand - rightBand) * POS_FRAC) / owidth;
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
598 s->v_incr = ((iheight - topBand - bottomBand) * POS_FRAC) / oheight;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
599
630
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
600 build_filter(&s->h_filters[0][0], (float) owidth / (float) (iwidth - leftBand - rightBand));
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
601 build_filter(&s->v_filters[0][0], (float) oheight / (float) (iheight - topBand - bottomBand));
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
602
986e461dc072 Initial revision
glantau
parents:
diff changeset
603 return s;
986e461dc072 Initial revision
glantau
parents:
diff changeset
604 fail:
396
fce0a2520551 removed useless header includes - use av memory functions
glantau
parents: 18
diff changeset
605 av_free(s);
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
606 return NULL;
986e461dc072 Initial revision
glantau
parents:
diff changeset
607 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
608
986e461dc072 Initial revision
glantau
parents:
diff changeset
609 void img_resample(ImgReSampleContext *s,
986e461dc072 Initial revision
glantau
parents:
diff changeset
610 AVPicture *output, AVPicture *input)
986e461dc072 Initial revision
glantau
parents:
diff changeset
611 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
612 int i, shift;
986e461dc072 Initial revision
glantau
parents:
diff changeset
613
986e461dc072 Initial revision
glantau
parents:
diff changeset
614 for(i=0;i<3;i++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
615 shift = (i == 0) ? 0 : 1;
986e461dc072 Initial revision
glantau
parents:
diff changeset
616 component_resample(s, output->data[i], output->linesize[i],
986e461dc072 Initial revision
glantau
parents:
diff changeset
617 s->owidth >> shift, s->oheight >> shift,
630
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
618 input->data[i] + (input->linesize[i] * (s->topBand >> shift)) + (s->leftBand >> shift),
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
619 input->linesize[i], ((s->iwidth - s->leftBand - s->rightBand) >> shift),
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
620 (s->iheight - s->topBand - s->bottomBand) >> shift);
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
621 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
622 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
623
986e461dc072 Initial revision
glantau
parents:
diff changeset
624 void img_resample_close(ImgReSampleContext *s)
986e461dc072 Initial revision
glantau
parents:
diff changeset
625 {
396
fce0a2520551 removed useless header includes - use av memory functions
glantau
parents: 18
diff changeset
626 av_free(s->line_buf);
fce0a2520551 removed useless header includes - use av memory functions
glantau
parents: 18
diff changeset
627 av_free(s);
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
628 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
629
986e461dc072 Initial revision
glantau
parents:
diff changeset
630 #ifdef TEST
986e461dc072 Initial revision
glantau
parents:
diff changeset
631
986e461dc072 Initial revision
glantau
parents:
diff changeset
/**
 * Stand-alone replacement used by the TEST build: allocate size bytes
 * that are all set to zero.
 *
 * @param size number of bytes requested
 * @return the zero-filled block, or NULL if size is negative or the
 *         allocation fails (the block is never written through a NULL
 *         pointer)
 */
void *av_mallocz(int size)
{
    if (size < 0)
        return NULL;
    /* calloc zero-fills and reports failure by returning NULL */
    return calloc(1, (size_t)size);
}
986e461dc072 Initial revision
glantau
parents:
diff changeset
639
630
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
/* Stand-alone replacement used by the TEST build: release a block with
   free(); a NULL pointer is ignored. */
void av_free(void *ptr)
{
    /* XXX: this explicit NULL guard should not be needed on most libcs */
    if (!ptr)
        return;
    free(ptr);
}
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
646
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
/* source picture of the self test: XSIZE x YSIZE, one byte per sample */
#define XSIZE 256
#define YSIZE 256
uint8_t img[(XSIZE) * (YSIZE)];

/* destination pictures: XSIZE1 x YSIZE1, one byte per sample */
#define XSIZE1 512
#define YSIZE1 512
uint8_t img1[(XSIZE1) * (YSIZE1)];
uint8_t img2[(XSIZE1) * (YSIZE1)];
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
657
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
/**
 * Write an 8 bit grey image as a binary PGM ("P5") file.
 *
 * @param filename path of the file to create or overwrite
 * @param img      xsize * ysize samples, written as one contiguous run
 * @param xsize    image width written to the header
 * @param ysize    image height written to the header
 *
 * Failures (file cannot be opened, short write, close error) are reported
 * on stderr; the function then returns without touching a NULL stream.
 */
void save_pgm(const char *filename, uint8_t *img, int xsize, int ysize)
{
    FILE *f;
    size_t count = (size_t)xsize * (size_t)ysize;

    /* "wb": the payload is raw bytes and must not be newline-translated */
    f = fopen(filename, "wb");
    if (!f) {
        perror(filename);
        return;
    }
    fprintf(f, "P5\n%d %d\n%d\n", xsize, ysize, 255);
    if (fwrite(img, 1, count, f) != count)
        fprintf(stderr, "%s: short write\n", filename);
    /* fclose flushes, so a failure here also means lost data */
    if (fclose(f) != 0)
        perror(filename);
}
986e461dc072 Initial revision
glantau
parents:
diff changeset
666
1064
b32afefe7d33 * UINTX -> uintx_t INTX -> intx_t
kabi
parents: 1057
diff changeset
667 static void dump_filter(int16_t *filter)
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
668 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
669 int i, ph;
986e461dc072 Initial revision
glantau
parents:
diff changeset
670
986e461dc072 Initial revision
glantau
parents:
diff changeset
671 for(ph=0;ph<NB_PHASES;ph++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
672 printf("%2d: ", ph);
986e461dc072 Initial revision
glantau
parents:
diff changeset
673 for(i=0;i<NB_TAPS;i++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
674 printf(" %5.2f", filter[ph * NB_TAPS + i] / 256.0);
986e461dc072 Initial revision
glantau
parents:
diff changeset
675 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
676 printf("\n");
986e461dc072 Initial revision
glantau
parents:
diff changeset
677 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
678 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
679
2
2e2c46c87460 fixed config for direct mplayer build compatibility
glantau
parents: 0
diff changeset
680 #ifdef HAVE_MMX
644
641708b5c33c fixing tests
michaelni
parents: 630
diff changeset
681 int mm_flags;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
682 #endif
986e461dc072 Initial revision
glantau
parents:
diff changeset
683
986e461dc072 Initial revision
glantau
parents:
diff changeset
684 int main(int argc, char **argv)
986e461dc072 Initial revision
glantau
parents:
diff changeset
685 {
986e461dc072 Initial revision
glantau
parents:
diff changeset
686 int x, y, v, i, xsize, ysize;
986e461dc072 Initial revision
glantau
parents:
diff changeset
687 ImgReSampleContext *s;
986e461dc072 Initial revision
glantau
parents:
diff changeset
688 float fact, factors[] = { 1/2.0, 3.0/4.0, 1.0, 4.0/3.0, 16.0/9.0, 2.0 };
986e461dc072 Initial revision
glantau
parents:
diff changeset
689 char buf[256];
986e461dc072 Initial revision
glantau
parents:
diff changeset
690
986e461dc072 Initial revision
glantau
parents:
diff changeset
691 /* build test image */
986e461dc072 Initial revision
glantau
parents:
diff changeset
692 for(y=0;y<YSIZE;y++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
693 for(x=0;x<XSIZE;x++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
694 if (x < XSIZE/2 && y < YSIZE/2) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
695 if (x < XSIZE/4 && y < YSIZE/4) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
696 if ((x % 10) <= 6 &&
986e461dc072 Initial revision
glantau
parents:
diff changeset
697 (y % 10) <= 6)
986e461dc072 Initial revision
glantau
parents:
diff changeset
698 v = 0xff;
986e461dc072 Initial revision
glantau
parents:
diff changeset
699 else
986e461dc072 Initial revision
glantau
parents:
diff changeset
700 v = 0x00;
986e461dc072 Initial revision
glantau
parents:
diff changeset
701 } else if (x < XSIZE/4) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
702 if (x & 1)
986e461dc072 Initial revision
glantau
parents:
diff changeset
703 v = 0xff;
986e461dc072 Initial revision
glantau
parents:
diff changeset
704 else
986e461dc072 Initial revision
glantau
parents:
diff changeset
705 v = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
706 } else if (y < XSIZE/4) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
707 if (y & 1)
986e461dc072 Initial revision
glantau
parents:
diff changeset
708 v = 0xff;
986e461dc072 Initial revision
glantau
parents:
diff changeset
709 else
986e461dc072 Initial revision
glantau
parents:
diff changeset
710 v = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
711 } else {
986e461dc072 Initial revision
glantau
parents:
diff changeset
712 if (y < YSIZE*3/8) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
713 if ((y+x) & 1)
986e461dc072 Initial revision
glantau
parents:
diff changeset
714 v = 0xff;
986e461dc072 Initial revision
glantau
parents:
diff changeset
715 else
986e461dc072 Initial revision
glantau
parents:
diff changeset
716 v = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
717 } else {
986e461dc072 Initial revision
glantau
parents:
diff changeset
718 if (((x+3) % 4) <= 1 &&
986e461dc072 Initial revision
glantau
parents:
diff changeset
719 ((y+3) % 4) <= 1)
986e461dc072 Initial revision
glantau
parents:
diff changeset
720 v = 0xff;
986e461dc072 Initial revision
glantau
parents:
diff changeset
721 else
986e461dc072 Initial revision
glantau
parents:
diff changeset
722 v = 0x00;
986e461dc072 Initial revision
glantau
parents:
diff changeset
723 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
724 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
725 } else if (x < XSIZE/2) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
726 v = ((x - (XSIZE/2)) * 255) / (XSIZE/2);
986e461dc072 Initial revision
glantau
parents:
diff changeset
727 } else if (y < XSIZE/2) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
728 v = ((y - (XSIZE/2)) * 255) / (XSIZE/2);
986e461dc072 Initial revision
glantau
parents:
diff changeset
729 } else {
986e461dc072 Initial revision
glantau
parents:
diff changeset
730 v = ((x + y - XSIZE) * 255) / XSIZE;
986e461dc072 Initial revision
glantau
parents:
diff changeset
731 }
630
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
732 img[(YSIZE - y) * XSIZE + (XSIZE - x)] = v;
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
733 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
734 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
735 save_pgm("/tmp/in.pgm", img, XSIZE, YSIZE);
986e461dc072 Initial revision
glantau
parents:
diff changeset
736 for(i=0;i<sizeof(factors)/sizeof(float);i++) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
737 fact = factors[i];
986e461dc072 Initial revision
glantau
parents:
diff changeset
738 xsize = (int)(XSIZE * fact);
630
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
739 ysize = (int)((YSIZE - 100) * fact);
644
641708b5c33c fixing tests
michaelni
parents: 630
diff changeset
740 s = img_resample_full_init(xsize, ysize, XSIZE, YSIZE, 50 ,50, 0, 0);
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
741 printf("Factor=%0.2f\n", fact);
986e461dc072 Initial revision
glantau
parents:
diff changeset
742 dump_filter(&s->h_filters[0][0]);
986e461dc072 Initial revision
glantau
parents:
diff changeset
743 component_resample(s, img1, xsize, xsize, ysize,
630
b4ee42142ad1 croping patch by (talus25 at speakeasy dot net) with fixes from atmos & me
michaelni
parents: 429
diff changeset
744 img + 50 * XSIZE, XSIZE, XSIZE, YSIZE - 100);
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
745 img_resample_close(s);
986e461dc072 Initial revision
glantau
parents:
diff changeset
746
986e461dc072 Initial revision
glantau
parents:
diff changeset
747 sprintf(buf, "/tmp/out%d.pgm", i);
986e461dc072 Initial revision
glantau
parents:
diff changeset
748 save_pgm(buf, img1, xsize, ysize);
986e461dc072 Initial revision
glantau
parents:
diff changeset
749 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
750
986e461dc072 Initial revision
glantau
parents:
diff changeset
751 /* mmx test */
2
2e2c46c87460 fixed config for direct mplayer build compatibility
glantau
parents: 0
diff changeset
752 #ifdef HAVE_MMX
0
986e461dc072 Initial revision
glantau
parents:
diff changeset
753 printf("MMX test\n");
986e461dc072 Initial revision
glantau
parents:
diff changeset
754 fact = 0.72;
986e461dc072 Initial revision
glantau
parents:
diff changeset
755 xsize = (int)(XSIZE * fact);
986e461dc072 Initial revision
glantau
parents:
diff changeset
756 ysize = (int)(YSIZE * fact);
986e461dc072 Initial revision
glantau
parents:
diff changeset
757 mm_flags = MM_MMX;
986e461dc072 Initial revision
glantau
parents:
diff changeset
758 s = img_resample_init(xsize, ysize, XSIZE, YSIZE);
986e461dc072 Initial revision
glantau
parents:
diff changeset
759 component_resample(s, img1, xsize, xsize, ysize,
986e461dc072 Initial revision
glantau
parents:
diff changeset
760 img, XSIZE, XSIZE, YSIZE);
986e461dc072 Initial revision
glantau
parents:
diff changeset
761
986e461dc072 Initial revision
glantau
parents:
diff changeset
762 mm_flags = 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
763 s = img_resample_init(xsize, ysize, XSIZE, YSIZE);
986e461dc072 Initial revision
glantau
parents:
diff changeset
764 component_resample(s, img2, xsize, xsize, ysize,
986e461dc072 Initial revision
glantau
parents:
diff changeset
765 img, XSIZE, XSIZE, YSIZE);
986e461dc072 Initial revision
glantau
parents:
diff changeset
766 if (memcmp(img1, img2, xsize * ysize) != 0) {
986e461dc072 Initial revision
glantau
parents:
diff changeset
767 fprintf(stderr, "mmx error\n");
986e461dc072 Initial revision
glantau
parents:
diff changeset
768 exit(1);
986e461dc072 Initial revision
glantau
parents:
diff changeset
769 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
770 printf("MMX OK\n");
986e461dc072 Initial revision
glantau
parents:
diff changeset
771 #endif
986e461dc072 Initial revision
glantau
parents:
diff changeset
772 return 0;
986e461dc072 Initial revision
glantau
parents:
diff changeset
773 }
986e461dc072 Initial revision
glantau
parents:
diff changeset
774
986e461dc072 Initial revision
glantau
parents:
diff changeset
775 #endif