Mercurial > libavcodec.hg
annotate iff.c @ 11700:6bdec2a0e7e1 libavcodec
Optimize decodeplane32().
Patch by Sebastian Vater <cdgs basty googlemail com>.
author | rbultje |
---|---|
date | Mon, 10 May 2010 17:18:09 +0000 |
parents | 83b49b0997e8 |
children | 269ce565c70b |
rev | line source |
---|---|
11074 | 1 /* |
2 * IFF PBM/ILBM bitmap decoder | |
3 * Copyright (c) 2010 Peter Ross <pross@xvid.org> | |
11661
7a5f3c94b9ad
Switch some ints to unsigned (they can only have positive values, this allows
rbultje
parents:
11660
diff
changeset
|
4 * Copyright (c) 2010 Sebastian Vater <cdgs.basty@googlemail.com> |
11074 | 5 * |
6 * This file is part of FFmpeg. | |
7 * | |
8 * FFmpeg is free software; you can redistribute it and/or | |
9 * modify it under the terms of the GNU Lesser General Public | |
10 * License as published by the Free Software Foundation; either | |
11 * version 2.1 of the License, or (at your option) any later version. | |
12 * | |
13 * FFmpeg is distributed in the hope that it will be useful, | |
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of | |
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | |
16 * Lesser General Public License for more details. | |
17 * | |
18 * You should have received a copy of the GNU Lesser General Public | |
19 * License along with FFmpeg; if not, write to the Free Software | |
20 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA | |
21 */ | |
22 | |
23 /** | |
11644
7dd2a45249a9
Remove explicit filename from Doxygen @file commands.
diego
parents:
11560
diff
changeset
|
24 * @file |
11074 | 25 * IFF PBM/ILBM bitmap decoder |
26 */ | |
27 | |
28 #include "bytestream.h" | |
29 #include "avcodec.h" | |
11175 | 30 #include "get_bits.h" |
11395
5b9d41da4152
IFF: move ff_cmap_read_palette() prototype to a header file
mru
parents:
11336
diff
changeset
|
31 #include "iff.h" |
11175 | 32 |
33 typedef struct { | |
34 AVFrame frame; | |
11678
e1dd1ff1ab27
Revert r22974 int->unsigned parts that don't have any meaningful effect.
rbultje
parents:
11663
diff
changeset
|
35 int planesize; |
11175 | 36 uint8_t * planebuf; |
37 } IffContext; | |
11074 | 38 |
11691
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
39 #define LUT8_PART(plane, v) \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
40 AV_LE2ME64C(UINT64_C(0x0000000)<<32 | v) << plane, \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
41 AV_LE2ME64C(UINT64_C(0x1000000)<<32 | v) << plane, \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
42 AV_LE2ME64C(UINT64_C(0x0010000)<<32 | v) << plane, \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
43 AV_LE2ME64C(UINT64_C(0x1010000)<<32 | v) << plane, \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
44 AV_LE2ME64C(UINT64_C(0x0000100)<<32 | v) << plane, \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
45 AV_LE2ME64C(UINT64_C(0x1000100)<<32 | v) << plane, \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
46 AV_LE2ME64C(UINT64_C(0x0010100)<<32 | v) << plane, \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
47 AV_LE2ME64C(UINT64_C(0x1010100)<<32 | v) << plane, \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
48 AV_LE2ME64C(UINT64_C(0x0000001)<<32 | v) << plane, \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
49 AV_LE2ME64C(UINT64_C(0x1000001)<<32 | v) << plane, \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
50 AV_LE2ME64C(UINT64_C(0x0010001)<<32 | v) << plane, \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
51 AV_LE2ME64C(UINT64_C(0x1010001)<<32 | v) << plane, \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
52 AV_LE2ME64C(UINT64_C(0x0000101)<<32 | v) << plane, \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
53 AV_LE2ME64C(UINT64_C(0x1000101)<<32 | v) << plane, \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
54 AV_LE2ME64C(UINT64_C(0x0010101)<<32 | v) << plane, \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
55 AV_LE2ME64C(UINT64_C(0x1010101)<<32 | v) << plane |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
56 |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
57 #define LUT8(plane) { \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
58 LUT8_PART(plane, 0x0000000), \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
59 LUT8_PART(plane, 0x1000000), \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
60 LUT8_PART(plane, 0x0010000), \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
61 LUT8_PART(plane, 0x1010000), \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
62 LUT8_PART(plane, 0x0000100), \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
63 LUT8_PART(plane, 0x1000100), \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
64 LUT8_PART(plane, 0x0010100), \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
65 LUT8_PART(plane, 0x1010100), \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
66 LUT8_PART(plane, 0x0000001), \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
67 LUT8_PART(plane, 0x1000001), \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
68 LUT8_PART(plane, 0x0010001), \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
69 LUT8_PART(plane, 0x1010001), \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
70 LUT8_PART(plane, 0x0000101), \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
71 LUT8_PART(plane, 0x1000101), \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
72 LUT8_PART(plane, 0x0010101), \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
73 LUT8_PART(plane, 0x1010101), \ |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
74 } |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
75 |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
76 // 8 planes * 8-bit mask |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
77 static const uint64_t plane8_lut[8][256] = { |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
78 LUT8(0), LUT8(1), LUT8(2), LUT8(3), |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
79 LUT8(4), LUT8(5), LUT8(6), LUT8(7), |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
80 }; |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
81 |
/*
 * One 16x4 sub-table for decodeplane32(): row n (0..15) holds the four
 * per-pixel values for the 4-bit pattern n, most significant bit first.
 * A set bit contributes (1 << plane) to its pixel, a clear bit contributes 0.
 * The constant is unsigned so that plane 31 does not shift into the sign bit
 * of an int, which would be undefined behaviour.
 */
#define LUT32(plane) {                                                  \
    0,              0,              0,              0,                  \
    0,              0,              0,              1U << (plane),      \
    0,              0,              1U << (plane),  0,                  \
    0,              0,              1U << (plane),  1U << (plane),      \
    0,              1U << (plane),  0,              0,                  \
    0,              1U << (plane),  0,              1U << (plane),      \
    0,              1U << (plane),  1U << (plane),  0,                  \
    0,              1U << (plane),  1U << (plane),  1U << (plane),      \
    1U << (plane),  0,              0,              0,                  \
    1U << (plane),  0,              0,              1U << (plane),      \
    1U << (plane),  0,              1U << (plane),  0,                  \
    1U << (plane),  0,              1U << (plane),  1U << (plane),      \
    1U << (plane),  1U << (plane),  0,              0,                  \
    1U << (plane),  1U << (plane),  0,              1U << (plane),      \
    1U << (plane),  1U << (plane),  1U << (plane),  0,                  \
    1U << (plane),  1U << (plane),  1U << (plane),  1U << (plane),      \
}

// 32 planes * 4-bit mask * 4 lookup tables each
static const uint32_t plane32_lut[32][16*4] = {
    LUT32( 0), LUT32( 1), LUT32( 2), LUT32( 3),
    LUT32( 4), LUT32( 5), LUT32( 6), LUT32( 7),
    LUT32( 8), LUT32( 9), LUT32(10), LUT32(11),
    LUT32(12), LUT32(13), LUT32(14), LUT32(15),
    LUT32(16), LUT32(17), LUT32(18), LUT32(19),
    LUT32(20), LUT32(21), LUT32(22), LUT32(23),
    LUT32(24), LUT32(25), LUT32(26), LUT32(27),
    LUT32(28), LUT32(29), LUT32(30), LUT32(31),
};
112 | |
11074 | 113 /** |
114 * Convert CMAP buffer (stored in extradata) to lavc palette format | |
115 */ | |
116 int ff_cmap_read_palette(AVCodecContext *avctx, uint32_t *pal) | |
117 { | |
11678
e1dd1ff1ab27
Revert r22974 int->unsigned parts that don't have any meaningful effect.
rbultje
parents:
11663
diff
changeset
|
118 int count, i; |
11074 | 119 |
120 if (avctx->bits_per_coded_sample > 8) { | |
121 av_log(avctx, AV_LOG_ERROR, "bit_per_coded_sample > 8 not supported\n"); | |
122 return AVERROR_INVALIDDATA; | |
123 } | |
124 | |
125 count = 1 << avctx->bits_per_coded_sample; | |
126 if (avctx->extradata_size < count * 3) { | |
127 av_log(avctx, AV_LOG_ERROR, "palette data underflow\n"); | |
128 return AVERROR_INVALIDDATA; | |
129 } | |
130 for (i=0; i < count; i++) { | |
11175 | 131 pal[i] = 0xFF000000 | AV_RB24( avctx->extradata + i*3 ); |
11074 | 132 } |
133 return 0; | |
134 } | |
135 | |
136 static av_cold int decode_init(AVCodecContext *avctx) | |
137 { | |
11175 | 138 IffContext *s = avctx->priv_data; |
11480
534872e7ab38
Make iff.c:decode_init return the value returned by
stefano
parents:
11395
diff
changeset
|
139 int err; |
11074 | 140 |
11175 | 141 if (avctx->bits_per_coded_sample <= 8) { |
142 avctx->pix_fmt = PIX_FMT_PAL8; | |
143 } else if (avctx->bits_per_coded_sample <= 32) { | |
144 avctx->pix_fmt = PIX_FMT_BGR32; | |
145 } else { | |
146 return AVERROR_INVALIDDATA; | |
147 } | |
11074 | 148 |
11699
83b49b0997e8
Ensure that width and height are > 0. avcodec_open() itself only checks that
rbultje
parents:
11693
diff
changeset
|
149 if ((err = avcodec_check_dimensions(avctx, avctx->width, avctx->height))) |
83b49b0997e8
Ensure that width and height are > 0. avcodec_open() itself only checks that
rbultje
parents:
11693
diff
changeset
|
150 return err; |
11679 | 151 s->planesize = FFALIGN(avctx->width, 16) >> 3; // Align plane size in bits to word-boundary |
11175 | 152 s->planebuf = av_malloc(s->planesize + FF_INPUT_BUFFER_PADDING_SIZE); |
153 if (!s->planebuf) | |
154 return AVERROR(ENOMEM); | |
155 | |
156 s->frame.reference = 1; | |
11480
534872e7ab38
Make iff.c:decode_init return the value returned by
stefano
parents:
11395
diff
changeset
|
157 if ((err = avctx->get_buffer(avctx, &s->frame) < 0)) { |
11074 | 158 av_log(avctx, AV_LOG_ERROR, "get_buffer() failed\n"); |
11480
534872e7ab38
Make iff.c:decode_init return the value returned by
stefano
parents:
11395
diff
changeset
|
159 return err; |
11074 | 160 } |
11175 | 161 |
162 return avctx->bits_per_coded_sample <= 8 ? | |
163 ff_cmap_read_palette(avctx, (uint32_t*)s->frame.data[1]) : 0; | |
11074 | 164 } |
165 | |
166 /** | |
11660 | 167 * Decode interleaved plane buffer up to 8bpp |
168 * @param dst Destination buffer | |
169 * @param buf Source buffer | |
170 * @param buf_size | |
171 * @param plane plane number to decode as | |
172 */ | |
11693
3ec57be57312
Remove "bps" parameter to decodeplane8/32(), it's unused.
rbultje
parents:
11692
diff
changeset
|
173 static void decodeplane8(uint8_t *dst, const uint8_t *buf, int buf_size, int plane) |
11660 | 174 { |
11691
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
175 const uint64_t *lut = plane8_lut[plane]; |
11692 | 176 while (buf_size--) { |
11691
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
177 uint64_t v = AV_RN64A(dst) | lut[*buf++]; |
24827da9c8dc
Optimize decodeplane8(), patch by Sebastian Vater <cdgs basty googlemail com>.
rbultje
parents:
11679
diff
changeset
|
178 AV_WN64A(dst, v); |
11692 | 179 dst += 8; |
11660 | 180 } |
181 } | |
182 | |
183 /** | |
184 * Decode interleaved plane buffer up to 24bpp | |
11175 | 185 * @param dst Destination buffer |
186 * @param buf Source buffer | |
187 * @param buf_size | |
188 * @param plane plane number to decode as | |
11074 | 189 */ |
11700 | 190 static void decodeplane32(uint32_t *dst, const uint8_t *buf, int buf_size, int plane) |
11660 | 191 { |
11700 | 192 const uint32_t *lut = plane32_lut[plane]; |
193 do { | |
194 unsigned mask = (*buf >> 2) & ~3; | |
195 dst[0] |= lut[mask++]; | |
196 dst[1] |= lut[mask++]; | |
197 dst[2] |= lut[mask++]; | |
198 dst[3] |= lut[mask]; | |
199 mask = (*buf++ << 2) & 0x3F; | |
200 dst[4] |= lut[mask++]; | |
201 dst[5] |= lut[mask++]; | |
202 dst[6] |= lut[mask++]; | |
203 dst[7] |= lut[mask]; | |
204 dst += 8; | |
205 } while (--buf_size); | |
11074 | 206 } |
207 | |
208 static int decode_frame_ilbm(AVCodecContext *avctx, | |
209 void *data, int *data_size, | |
210 AVPacket *avpkt) | |
211 { | |
11175 | 212 IffContext *s = avctx->priv_data; |
11074 | 213 const uint8_t *buf = avpkt->data; |
11678
e1dd1ff1ab27
Revert r22974 int->unsigned parts that don't have any meaningful effect.
rbultje
parents:
11663
diff
changeset
|
214 int buf_size = avpkt->size; |
11187 | 215 const uint8_t *buf_end = buf+buf_size; |
11678
e1dd1ff1ab27
Revert r22974 int->unsigned parts that don't have any meaningful effect.
rbultje
parents:
11663
diff
changeset
|
216 int y, plane; |
11074 | 217 |
11175 | 218 if (avctx->reget_buffer(avctx, &s->frame) < 0){ |
11074 | 219 av_log(avctx, AV_LOG_ERROR, "get_buffer() failed\n"); |
220 return -1; | |
221 } | |
222 | |
11662
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
223 if (avctx->pix_fmt == PIX_FMT_PAL8) { |
11663 | 224 for(y = 0; y < avctx->height; y++ ) { |
225 uint8_t *row = &s->frame.data[0][ y*s->frame.linesize[0] ]; | |
226 memset(row, 0, avctx->width); | |
227 for (plane = 0; plane < avctx->bits_per_coded_sample && buf < buf_end; plane++) { | |
11693
3ec57be57312
Remove "bps" parameter to decodeplane8/32(), it's unused.
rbultje
parents:
11692
diff
changeset
|
228 decodeplane8(row, buf, FFMIN(s->planesize, buf_end - buf), plane); |
11662
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
229 buf += s->planesize; |
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
230 } |
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
231 } |
11663 | 232 } else { // PIX_FMT_BGR32 |
11662
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
233 for(y = 0; y < avctx->height; y++ ) { |
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
234 uint8_t *row = &s->frame.data[0][y*s->frame.linesize[0]]; |
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
235 memset(row, 0, avctx->width << 2); |
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
236 for (plane = 0; plane < avctx->bits_per_coded_sample && buf < buf_end; plane++) { |
11693
3ec57be57312
Remove "bps" parameter to decodeplane8/32(), it's unused.
rbultje
parents:
11692
diff
changeset
|
237 decodeplane32((uint32_t *) row, buf, FFMIN(s->planesize, buf_end - buf), plane); |
11663 | 238 buf += s->planesize; |
11175 | 239 } |
11074 | 240 } |
241 } | |
242 | |
243 *data_size = sizeof(AVFrame); | |
11175 | 244 *(AVFrame*)data = s->frame; |
11074 | 245 return buf_size; |
246 } | |
247 | |
248 static int decode_frame_byterun1(AVCodecContext *avctx, | |
249 void *data, int *data_size, | |
250 AVPacket *avpkt) | |
251 { | |
11175 | 252 IffContext *s = avctx->priv_data; |
11074 | 253 const uint8_t *buf = avpkt->data; |
11678
e1dd1ff1ab27
Revert r22974 int->unsigned parts that don't have any meaningful effect.
rbultje
parents:
11663
diff
changeset
|
254 int buf_size = avpkt->size; |
11074 | 255 const uint8_t *buf_end = buf+buf_size; |
11678
e1dd1ff1ab27
Revert r22974 int->unsigned parts that don't have any meaningful effect.
rbultje
parents:
11663
diff
changeset
|
256 int y, plane, x; |
11074 | 257 |
11175 | 258 if (avctx->reget_buffer(avctx, &s->frame) < 0){ |
11074 | 259 av_log(avctx, AV_LOG_ERROR, "get_buffer() failed\n"); |
260 return -1; | |
261 } | |
262 | |
11662
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
263 if (avctx->codec_tag == MKTAG('I','L','B','M')) { //interleaved |
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
264 if (avctx->pix_fmt == PIX_FMT_PAL8) { |
11663 | 265 for(y = 0; y < avctx->height ; y++ ) { |
266 uint8_t *row = &s->frame.data[0][ y*s->frame.linesize[0] ]; | |
267 memset(row, 0, avctx->width); | |
268 for (plane = 0; plane < avctx->bits_per_coded_sample; plane++) { | |
269 for(x = 0; x < s->planesize && buf < buf_end; ) { | |
270 int8_t value = *buf++; | |
271 unsigned length; | |
272 if (value >= 0) { | |
273 length = value + 1; | |
274 memcpy(s->planebuf + x, buf, FFMIN3(length, s->planesize - x, buf_end - buf)); | |
275 buf += length; | |
276 } else if (value > -128) { | |
277 length = -value + 1; | |
278 memset(s->planebuf + x, *buf++, FFMIN(length, s->planesize - x)); | |
279 } else { //noop | |
280 continue; | |
281 } | |
282 x += length; | |
11074 | 283 } |
11693
3ec57be57312
Remove "bps" parameter to decodeplane8/32(), it's unused.
rbultje
parents:
11692
diff
changeset
|
284 decodeplane8(row, s->planebuf, s->planesize, plane); |
11662
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
285 } |
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
286 } |
11663 | 287 } else { //PIX_FMT_BGR32 |
11662
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
288 for(y = 0; y < avctx->height ; y++ ) { |
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
289 uint8_t *row = &s->frame.data[0][y*s->frame.linesize[0]]; |
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
290 memset(row, 0, avctx->width << 2); |
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
291 for (plane = 0; plane < avctx->bits_per_coded_sample; plane++) { |
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
292 for(x = 0; x < s->planesize && buf < buf_end; ) { |
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
293 int8_t value = *buf++; |
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
294 unsigned length; |
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
295 if (value >= 0) { |
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
296 length = value + 1; |
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
297 memcpy(s->planebuf + x, buf, FFMIN3(length, s->planesize - x, buf_end - buf)); |
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
298 buf += length; |
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
299 } else if (value > -128) { |
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
300 length = -value + 1; |
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
301 memset(s->planebuf + x, *buf++, FFMIN(length, s->planesize - x)); |
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
302 } else { // noop |
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
303 continue; |
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
304 } |
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
305 x += length; |
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
306 } |
11693
3ec57be57312
Remove "bps" parameter to decodeplane8/32(), it's unused.
rbultje
parents:
11692
diff
changeset
|
307 decodeplane32((uint32_t *) row, s->planebuf, s->planesize, plane); |
11175 | 308 } |
11074 | 309 } |
11662
33e4b0d712c8
Move some branches outside looped code. Should improve the generated asm (and
rbultje
parents:
11661
diff
changeset
|
310 } |
11663 | 311 } else { |
312 for(y = 0; y < avctx->height ; y++ ) { | |
313 uint8_t *row = &s->frame.data[0][y*s->frame.linesize[0]]; | |
11074 | 314 for(x = 0; x < avctx->width && buf < buf_end; ) { |
11124
85a1b00a2413
Use int8_t instead of char, the signedness of char can differ between systems.
reimar
parents:
11074
diff
changeset
|
315 int8_t value = *buf++; |
11661
7a5f3c94b9ad
Switch some ints to unsigned (they can only have positive values, this allows
rbultje
parents:
11660
diff
changeset
|
316 unsigned length; |
11074 | 317 if (value >= 0) { |
318 length = value + 1; | |
319 memcpy(row + x, buf, FFMIN3(length, buf_end - buf, avctx->width - x)); | |
320 buf += length; | |
321 } else if (value > -128) { | |
322 length = -value + 1; | |
323 memset(row + x, *buf++, FFMIN(length, avctx->width - x)); | |
324 } else { //noop | |
325 continue; | |
326 } | |
327 x += length; | |
328 } | |
329 } | |
330 } | |
331 | |
332 *data_size = sizeof(AVFrame); | |
11175 | 333 *(AVFrame*)data = s->frame; |
11074 | 334 return buf_size; |
335 } | |
336 | |
337 static av_cold int decode_end(AVCodecContext *avctx) | |
338 { | |
11175 | 339 IffContext *s = avctx->priv_data; |
340 if (s->frame.data[0]) | |
341 avctx->release_buffer(avctx, &s->frame); | |
342 av_freep(&s->planebuf); | |
11074 | 343 return 0; |
344 } | |
345 | |
346 AVCodec iff_ilbm_decoder = { | |
347 "iff_ilbm", | |
11560
8a4984c5cacc
Define AVMediaType enum, and use it instead of enum CodecType, which
stefano
parents:
11480
diff
changeset
|
348 AVMEDIA_TYPE_VIDEO, |
11074 | 349 CODEC_ID_IFF_ILBM, |
11175 | 350 sizeof(IffContext), |
11074 | 351 decode_init, |
352 NULL, | |
353 decode_end, | |
354 decode_frame_ilbm, | |
355 CODEC_CAP_DR1, | |
356 .long_name = NULL_IF_CONFIG_SMALL("IFF ILBM"), | |
357 }; | |
358 | |
359 AVCodec iff_byterun1_decoder = { | |
360 "iff_byterun1", | |
11560
8a4984c5cacc
Define AVMediaType enum, and use it instead of enum CodecType, which
stefano
parents:
11480
diff
changeset
|
361 AVMEDIA_TYPE_VIDEO, |
11074 | 362 CODEC_ID_IFF_BYTERUN1, |
11175 | 363 sizeof(IffContext), |
11074 | 364 decode_init, |
365 NULL, | |
366 decode_end, | |
367 decode_frame_byterun1, | |
368 CODEC_CAP_DR1, | |
369 .long_name = NULL_IF_CONFIG_SMALL("IFF ByteRun1"), | |
370 }; |