Mercurial > libavcodec.hg
annotate dv.c @ 8159:b5e4cfdcf185 libavcodec
cosmetics: Group ppc-specific objects together.
author | diego |
---|---|
date | Mon, 17 Nov 2008 16:38:50 +0000 |
parents | c30bdda1adb1 |
children | e1a094cabfc3 |
rev | line source |
---|---|
723 | 1 /* |
2 * DV decoder | |
3 * Copyright (c) 2002 Fabrice Bellard. | |
1905
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
4 * Copyright (c) 2004 Roman Shaposhnik. |
723 | 5 * |
2967 | 6 * DV encoder |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
7 * Copyright (c) 2003 Roman Shaposhnik. |
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
8 * |
3167 | 9 * 50 Mbps (DVCPRO50) support |
10 * Copyright (c) 2006 Daniel Maas <dmaas@maasdigital.com> | |
11 * | |
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
12 * 100 Mbps (DVCPRO HD) support |
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
13 * Initial code by Daniel Maas <dmaas@maasdigital.com> (funded by BBC R&D) |
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
14 * Final code by Roman Shaposhnik |
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
15 * |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
16 * Many thanks to Dan Dennedy <dan@dennedy.org> for providing wealth |
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
17 * of DV technical info. |
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
18 * |
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3806
diff
changeset
|
19 * This file is part of FFmpeg. |
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3806
diff
changeset
|
20 * |
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3806
diff
changeset
|
21 * FFmpeg is free software; you can redistribute it and/or |
723 | 22 * modify it under the terms of the GNU Lesser General Public |
23 * License as published by the Free Software Foundation; either | |
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3806
diff
changeset
|
24 * version 2.1 of the License, or (at your option) any later version. |
723 | 25 * |
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3806
diff
changeset
|
26 * FFmpeg is distributed in the hope that it will be useful, |
723 | 27 * but WITHOUT ANY WARRANTY; without even the implied warranty of |
28 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU | |
29 * Lesser General Public License for more details. | |
30 * | |
31 * You should have received a copy of the GNU Lesser General Public | |
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3806
diff
changeset
|
32 * License along with FFmpeg; if not, write to the Free Software |
3036
0b546eab515d
Update licensing information: The FSF changed postal address.
diego
parents:
3016
diff
changeset
|
33 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
723 | 34 */ |
1106 | 35 |
36 /** | |
37 * @file dv.c | |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
38 * DV codec. |
1106 | 39 */ |
3649 | 40 #define ALT_BITSTREAM_READER |
723 | 41 #include "avcodec.h" |
42 #include "dsputil.h" | |
6450 | 43 #include "bitstream.h" |
723 | 44 #include "simple_idct.h" |
1489
337d13aee605
* DV handling was streamlined for both muxing/demuxing and
romansh
parents:
1416
diff
changeset
|
45 #include "dvdata.h" |
723 | 46 |
2847 | 47 //#undef NDEBUG |
48 //#include <assert.h> | |
49 | |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
50 typedef struct DVVideoContext { |
8051 | 51 const DVprofile *sys; |
52 AVFrame picture; | |
53 AVCodecContext *avctx; | |
54 uint8_t *buf; | |
2967 | 55 |
8051 | 56 uint8_t dv_zigzag[2][64]; |
7536
910087e97750
Coalescing the un-weighting and de-quantization steps for faster
romansh
parents:
7240
diff
changeset
|
57 uint32_t dv_idct_factor[2][2][22][64]; |
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
58 uint32_t dv100_idct_factor[4][4][16][64]; |
2967 | 59 |
1489
337d13aee605
* DV handling was streamlined for both muxing/demuxing and
romansh
parents:
1416
diff
changeset
|
60 void (*get_pixels)(DCTELEM *block, const uint8_t *pixels, int line_size); |
1567 | 61 void (*fdct[2])(DCTELEM *block); |
62 void (*idct_put[2])(uint8_t *dest, int line_size, DCTELEM *block); | |
3016
97e6c0f82182
Moving dv_anchor back to the global scope. This creates a tiny memory
romansh
parents:
2991
diff
changeset
|
63 } DVVideoContext; |
2991
d377b0788381
Fix DV memory leak and allow multiple instances patch by (Burkhard Plaum?)
michael
parents:
2979
diff
changeset
|
64 |
1489
337d13aee605
* DV handling was streamlined for both muxing/demuxing and
romansh
parents:
1416
diff
changeset
|
65 #define TEX_VLC_BITS 9 |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
66 |
8088
728e0e4fcb95
renaming macro in order to conform with the rest of libavcodec
romansh
parents:
8051
diff
changeset
|
67 #if ENABLE_SMALL |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
68 #define DV_VLC_MAP_RUN_SIZE 15 |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
69 #define DV_VLC_MAP_LEV_SIZE 23 |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
70 #else |
2967 | 71 #define DV_VLC_MAP_RUN_SIZE 64 |
2847 | 72 #define DV_VLC_MAP_LEV_SIZE 512 //FIXME sign was removed so this should be /2 but needs check |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
73 #endif |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
74 |
723 | 75 /* XXX: also include quantization */ |
4661 | 76 static RL_VLC_ELEM dv_rl_vlc[1184]; |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
77 /* VLC encoding lookup table */ |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
78 static struct dv_vlc_pair { |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
79 uint32_t vlc; |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
80 uint8_t size; |
4666 | 81 } dv_vlc_map[DV_VLC_MAP_RUN_SIZE][DV_VLC_MAP_LEV_SIZE]; |
723 | 82 |
8118
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
83 static inline int dv_work_pool_size(const DVprofile *d) |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
84 { |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
85 int size = d->n_difchan*d->difseg_size*27; |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
86 if (DV_PROFILE_IS_1080i50(d)) |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
87 size -= 3*27; |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
88 if (DV_PROFILE_IS_720p50(d)) |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
89 size -= 4*27; |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
90 return size; |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
91 } |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
92 |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
93 static int dv_init_dynamic_tables(const DVprofile *d) |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
94 { |
8131 | 95 int j,i,c,s,p,k; |
8118
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
96 |
8131 | 97 if (d->work_chunks[dv_work_pool_size(d)-1].buf_offset) |
8118
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
98 return 0; |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
99 |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
100 p = i = 0; |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
101 for (c=0; c<d->n_difchan; c++) { |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
102 for (s=0; s<d->difseg_size; s++) { |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
103 p += 6; |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
104 for (j=0; j<27; j++) { |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
105 p += !(j%3); |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
106 if (!(DV_PROFILE_IS_1080i50(d) && c != 0 && s == 11) && |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
107 !(DV_PROFILE_IS_720p50(d) && s > 9)) { |
8131 | 108 for (k=0; k<5; k++) |
109 d->work_chunks[i].mb_coordinates[k] = d->video_place[(c*d->difseg_size+s)*27*5 + j*5 + k]; | |
110 d->work_chunks[i++].buf_offset = p; | |
8118
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
111 } |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
112 p += 5; |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
113 } |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
114 } |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
115 } |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
116 return 0; |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
117 } |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
118 |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
119 static void dv_build_unquantize_tables(DVVideoContext *s, uint8_t* perm) |
723 | 120 { |
7536
910087e97750
Coalescing the un-weighting and de-quantization steps for faster
romansh
parents:
7240
diff
changeset
|
121 int i, q, a; |
723 | 122 |
123 /* NOTE: max left shift is 6 */ | |
8051 | 124 for (q = 0; q < 22; q++) { |
1567 | 125 /* 88DCT */ |
8051 | 126 i = 1; |
127 for (a = 0; a < 4; a++) { | |
128 for (; i < dv_quant_areas[a]; i++) { | |
7536
910087e97750
Coalescing the un-weighting and de-quantization steps for faster
romansh
parents:
7240
diff
changeset
|
129 /* 88 table */ |
8051 | 130 s->dv_idct_factor[0][0][q][i] = dv_iweight_88[i] << (dv_quant_shifts[q][a] + 1); |
131 s->dv_idct_factor[1][0][q][i] = s->dv_idct_factor[0][0][q][i] << 1; | |
2967 | 132 |
7536
910087e97750
Coalescing the un-weighting and de-quantization steps for faster
romansh
parents:
7240
diff
changeset
|
133 /* 248 table */ |
8051 | 134 s->dv_idct_factor[0][1][q][i] = dv_iweight_248[i] << (dv_quant_shifts[q][a] + 1); |
135 s->dv_idct_factor[1][1][q][i] = s->dv_idct_factor[0][1][q][i] << 1; | |
7536
910087e97750
Coalescing the un-weighting and de-quantization steps for faster
romansh
parents:
7240
diff
changeset
|
136 } |
723 | 137 } |
138 } | |
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
139 |
8051 | 140 for (a = 0; a < 4; a++) { |
141 for (q = 0; q < 16; q++) { | |
142 for (i = 1; i < 64; i++) { | |
143 s->dv100_idct_factor[0][a][q][i] = (dv100_qstep[q] << (a + 9)) * dv_iweight_1080_y[i]; | |
144 s->dv100_idct_factor[1][a][q][i] = (dv100_qstep[q] << (a + 9)) * dv_iweight_1080_c[i]; | |
145 s->dv100_idct_factor[2][a][q][i] = (dv100_qstep[q] << (a + 9)) * dv_iweight_720_y[i]; | |
146 s->dv100_idct_factor[3][a][q][i] = (dv100_qstep[q] << (a + 9)) * dv_iweight_720_c[i]; | |
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
147 } |
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
148 } |
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
149 } |
723 | 150 } |
151 | |
6517
48759bfbd073
Apply 'cold' attribute to init/uninit functions in libavcodec
zuxy
parents:
6450
diff
changeset
|
152 static av_cold int dvvideo_init(AVCodecContext *avctx) |
723 | 153 { |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
154 DVVideoContext *s = avctx->priv_data; |
1567 | 155 DSPContext dsp; |
8051 | 156 static int done = 0; |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
157 int i, j; |
723 | 158 |
159 if (!done) { | |
1489
337d13aee605
* DV handling was streamlined for both muxing/demuxing and
romansh
parents:
1416
diff
changeset
|
160 VLC dv_vlc; |
1905
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
161 uint16_t new_dv_vlc_bits[NB_DV_VLC*2]; |
8051 | 162 uint8_t new_dv_vlc_len[NB_DV_VLC*2]; |
163 uint8_t new_dv_vlc_run[NB_DV_VLC*2]; | |
164 int16_t new_dv_vlc_level[NB_DV_VLC*2]; | |
723 | 165 |
166 done = 1; | |
167 | |
2979 | 168 /* it's faster to include the sign bit in a generic VLC parsing scheme */ |
8051 | 169 for (i = 0, j = 0; i < NB_DV_VLC; i++, j++) { |
170 new_dv_vlc_bits[j] = dv_vlc_bits[i]; | |
171 new_dv_vlc_len[j] = dv_vlc_len[i]; | |
172 new_dv_vlc_run[j] = dv_vlc_run[i]; | |
2979 | 173 new_dv_vlc_level[j] = dv_vlc_level[i]; |
2967 | 174 |
2979 | 175 if (dv_vlc_level[i]) { |
176 new_dv_vlc_bits[j] <<= 1; | |
177 new_dv_vlc_len[j]++; | |
1905
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
178 |
2979 | 179 j++; |
8051 | 180 new_dv_vlc_bits[j] = (dv_vlc_bits[i] << 1) | 1; |
181 new_dv_vlc_len[j] = dv_vlc_len[i] + 1; | |
182 new_dv_vlc_run[j] = dv_vlc_run[i]; | |
2979 | 183 new_dv_vlc_level[j] = -dv_vlc_level[i]; |
184 } | |
185 } | |
2967 | 186 |
723 | 187 /* NOTE: as a trick, we use the fact that no codes are unused |
188 to accelerate the parsing of partial codes */ | |
2967 | 189 init_vlc(&dv_vlc, TEX_VLC_BITS, j, |
2370
26560d4fdb1f
Memory leak fix patch by (Burkhard Plaum <plaum >at< ipf.uni-stuttgart )dot( de>)
michael
parents:
2247
diff
changeset
|
190 new_dv_vlc_len, 1, 1, new_dv_vlc_bits, 2, 2, 0); |
4661 | 191 assert(dv_vlc.table_size == 1184); |
3016
97e6c0f82182
Moving dv_anchor back to the global scope. This creates a tiny memory
romansh
parents:
2991
diff
changeset
|
192 |
8051 | 193 for (i = 0; i < dv_vlc.table_size; i++){ |
194 int code = dv_vlc.table[i][0]; | |
195 int len = dv_vlc.table[i][1]; | |
723 | 196 int level, run; |
2967 | 197 |
8051 | 198 if (len < 0){ //more bits needed |
199 run = 0; | |
200 level = code; | |
723 | 201 } else { |
8051 | 202 run = new_dv_vlc_run [code] + 1; |
203 level = new_dv_vlc_level[code]; | |
723 | 204 } |
8051 | 205 dv_rl_vlc[i].len = len; |
1886
fbcf02596520
* DV decoder simplifications. Now it looks to be 6% faster. At least
romansh
parents:
1875
diff
changeset
|
206 dv_rl_vlc[i].level = level; |
8051 | 207 dv_rl_vlc[i].run = run; |
723 | 208 } |
2979 | 209 free_vlc(&dv_vlc); |
1489
337d13aee605
* DV handling was streamlined for both muxing/demuxing and
romansh
parents:
1416
diff
changeset
|
210 |
2979 | 211 for (i = 0; i < NB_DV_VLC - 1; i++) { |
2027
3a78447c3b53
oops, forgot to commit that change from the warning fixes by (Michael Roitzsch <mroi at users dot sourceforge dot net>)
michael
parents:
1994
diff
changeset
|
212 if (dv_vlc_run[i] >= DV_VLC_MAP_RUN_SIZE) |
2979 | 213 continue; |
8088
728e0e4fcb95
renaming macro in order to conform with the rest of libavcodec
romansh
parents:
8051
diff
changeset
|
214 #if ENABLE_SMALL |
2027
3a78447c3b53
oops, forgot to commit that change from the warning fixes by (Michael Roitzsch <mroi at users dot sourceforge dot net>)
michael
parents:
1994
diff
changeset
|
215 if (dv_vlc_level[i] >= DV_VLC_MAP_LEV_SIZE) |
2979 | 216 continue; |
2027
3a78447c3b53
oops, forgot to commit that change from the warning fixes by (Michael Roitzsch <mroi at users dot sourceforge dot net>)
michael
parents:
1994
diff
changeset
|
217 #endif |
2967 | 218 |
2979 | 219 if (dv_vlc_map[dv_vlc_run[i]][dv_vlc_level[i]].size != 0) |
220 continue; | |
2967 | 221 |
8051 | 222 dv_vlc_map[dv_vlc_run[i]][dv_vlc_level[i]].vlc = |
223 dv_vlc_bits[i] << (!!dv_vlc_level[i]); | |
224 dv_vlc_map[dv_vlc_run[i]][dv_vlc_level[i]].size = | |
225 dv_vlc_len[i] + (!!dv_vlc_level[i]); | |
2979 | 226 } |
227 for (i = 0; i < DV_VLC_MAP_RUN_SIZE; i++) { | |
8088
728e0e4fcb95
renaming macro in order to conform with the rest of libavcodec
romansh
parents:
8051
diff
changeset
|
228 #if ENABLE_SMALL |
2979 | 229 for (j = 1; j < DV_VLC_MAP_LEV_SIZE; j++) { |
230 if (dv_vlc_map[i][j].size == 0) { | |
231 dv_vlc_map[i][j].vlc = dv_vlc_map[0][j].vlc | | |
232 (dv_vlc_map[i-1][0].vlc << (dv_vlc_map[0][j].size)); | |
233 dv_vlc_map[i][j].size = dv_vlc_map[i-1][0].size + | |
234 dv_vlc_map[0][j].size; | |
235 } | |
236 } | |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
237 #else |
2979 | 238 for (j = 1; j < DV_VLC_MAP_LEV_SIZE/2; j++) { |
239 if (dv_vlc_map[i][j].size == 0) { | |
240 dv_vlc_map[i][j].vlc = dv_vlc_map[0][j].vlc | | |
241 (dv_vlc_map[i-1][0].vlc << (dv_vlc_map[0][j].size)); | |
242 dv_vlc_map[i][j].size = dv_vlc_map[i-1][0].size + | |
243 dv_vlc_map[0][j].size; | |
244 } | |
245 dv_vlc_map[i][((uint16_t)(-j))&0x1ff].vlc = | |
246 dv_vlc_map[i][j].vlc | 1; | |
247 dv_vlc_map[i][((uint16_t)(-j))&0x1ff].size = | |
248 dv_vlc_map[i][j].size; | |
249 } | |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
250 #endif |
2979 | 251 } |
723 | 252 } |
725 | 253 |
1567 | 254 /* Generic DSP setup */ |
255 dsputil_init(&dsp, avctx); | |
256 s->get_pixels = dsp.get_pixels; | |
725 | 257 |
1567 | 258 /* 88DCT setup */ |
8051 | 259 s->fdct[0] = dsp.fdct; |
1567 | 260 s->idct_put[0] = dsp.idct_put; |
8051 | 261 for (i = 0; i < 64; i++) |
1567 | 262 s->dv_zigzag[0][i] = dsp.idct_permutation[ff_zigzag_direct[i]]; |
725 | 263 |
1567 | 264 /* 248DCT setup */ |
8051 | 265 s->fdct[1] = dsp.fdct248; |
6001 | 266 s->idct_put[1] = ff_simple_idct248_put; // FIXME: need to add it to DSP |
8051 | 267 if (avctx->lowres){ |
268 for (i = 0; i < 64; i++){ | |
269 int j = ff_zigzag248_direct[i]; | |
270 s->dv_zigzag[1][i] = dsp.idct_permutation[(j & 7) + (j & 8) * 4 + (j & 48) / 2]; | |
2849 | 271 } |
272 }else | |
273 memcpy(s->dv_zigzag[1], ff_zigzag248_direct, 64); | |
725 | 274 |
723 | 275 /* XXX: do it only for constant case */ |
1567 | 276 dv_build_unquantize_tables(s, dsp.idct_permutation); |
1489
337d13aee605
* DV handling was streamlined for both muxing/demuxing and
romansh
parents:
1416
diff
changeset
|
277 |
1543
7542cb99b950
* providing MPEG codecs with a generic fields in AVFrame to use.
romansh
parents:
1540
diff
changeset
|
278 avctx->coded_frame = &s->picture; |
8051 | 279 s->avctx = avctx; |
2967 | 280 |
723 | 281 return 0; |
282 } | |
283 | |
1489
337d13aee605
* DV handling was streamlined for both muxing/demuxing and
romansh
parents:
1416
diff
changeset
|
284 // #define VLC_DEBUG |
1905
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
285 // #define printf(...) av_log(NULL, AV_LOG_ERROR, __VA_ARGS__) |
723 | 286 |
725 | 287 typedef struct BlockInfo { |
7536
910087e97750
Coalescing the un-weighting and de-quantization steps for faster
romansh
parents:
7240
diff
changeset
|
288 const uint32_t *factor_table; |
1064 | 289 const uint8_t *scan_table; |
290 uint8_t pos; /* position in block */ | |
7706 | 291 void (*idct_put)(uint8_t *dest, int line_size, DCTELEM *block); |
1064 | 292 uint8_t partial_bit_count; |
293 uint16_t partial_bit_buffer; | |
725 | 294 int shift_offset; |
295 } BlockInfo; | |
723 | 296 |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
297 /* bit budget for AC only in 5 MBs */ |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
298 static const int vs_total_ac_bits = (100 * 4 + 68*2) * 5; |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
299 /* see dv_88_areas and dv_248_areas for details */ |
2967 | 300 static const int mb_area_start[5] = { 1, 6, 21, 43, 64 }; |
723 | 301 |
1895
e5687117cc7f
* removing casualties of battle of the wits and English language
romansh
parents:
1887
diff
changeset
|
302 static inline int get_bits_left(GetBitContext *s) |
e5687117cc7f
* removing casualties of battle of the wits and English language
romansh
parents:
1887
diff
changeset
|
303 { |
e5687117cc7f
* removing casualties of battle of the wits and English language
romansh
parents:
1887
diff
changeset
|
304 return s->size_in_bits - get_bits_count(s); |
e5687117cc7f
* removing casualties of battle of the wits and English language
romansh
parents:
1887
diff
changeset
|
305 } |
e5687117cc7f
* removing casualties of battle of the wits and English language
romansh
parents:
1887
diff
changeset
|
306 |
e5687117cc7f
* removing casualties of battle of the wits and English language
romansh
parents:
1887
diff
changeset
|
307 static inline int put_bits_left(PutBitContext* s) |
e5687117cc7f
* removing casualties of battle of the wits and English language
romansh
parents:
1887
diff
changeset
|
308 { |
e5687117cc7f
* removing casualties of battle of the wits and English language
romansh
parents:
1887
diff
changeset
|
309 return (s->buf_end - s->buf) * 8 - put_bits_count(s); |
e5687117cc7f
* removing casualties of battle of the wits and English language
romansh
parents:
1887
diff
changeset
|
310 } |
e5687117cc7f
* removing casualties of battle of the wits and English language
romansh
parents:
1887
diff
changeset
|
311 |
7980 | 312 /* decode ac coefficients */ |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
313 static void dv_decode_ac(GetBitContext *gb, BlockInfo *mb, DCTELEM *block) |
723 | 314 { |
7039 | 315 int last_index = gb->size_in_bits; |
8051 | 316 const uint8_t *scan_table = mb->scan_table; |
7536
910087e97750
Coalescing the un-weighting and de-quantization steps for faster
romansh
parents:
7240
diff
changeset
|
317 const uint32_t *factor_table = mb->factor_table; |
8051 | 318 int pos = mb->pos; |
1905
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
319 int partial_bit_count = mb->partial_bit_count; |
7536
910087e97750
Coalescing the un-weighting and de-quantization steps for faster
romansh
parents:
7240
diff
changeset
|
320 int level, run, vlc_len, index; |
2967 | 321 |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
322 OPEN_READER(re, gb); |
1905
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
323 UPDATE_CACHE(re, gb); |
2967 | 324 |
723 | 325 /* if we must parse a partial vlc, we do it here */ |
326 if (partial_bit_count > 0) { | |
1905
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
327 re_cache = ((unsigned)re_cache >> partial_bit_count) | |
8051 | 328 (mb->partial_bit_buffer << (sizeof(re_cache) * 8 - partial_bit_count)); |
2979 | 329 re_index -= partial_bit_count; |
330 mb->partial_bit_count = 0; | |
723 | 331 } |
332 | |
333 /* get the AC coefficients until last_index is reached */ | |
8051 | 334 for (;;) { |
723 | 335 #ifdef VLC_DEBUG |
1905
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
336 printf("%2d: bits=%04x index=%d\n", pos, SHOW_UBITS(re, gb, 16), re_index); |
723 | 337 #endif |
1905
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
338 /* our own optimized GET_RL_VLC */ |
8051 | 339 index = NEG_USR32(re_cache, TEX_VLC_BITS); |
2979 | 340 vlc_len = dv_rl_vlc[index].len; |
1905
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
341 if (vlc_len < 0) { |
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
342 index = NEG_USR32((unsigned)re_cache << TEX_VLC_BITS, -vlc_len) + dv_rl_vlc[index].level; |
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
343 vlc_len = TEX_VLC_BITS - vlc_len; |
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
344 } |
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
345 level = dv_rl_vlc[index].level; |
8051 | 346 run = dv_rl_vlc[index].run; |
2967 | 347 |
2979 | 348 /* gotta check if we're still within gb boundaries */ |
349 if (re_index + vlc_len > last_index) { | |
350 /* should be < 16 bits otherwise a codeword could have been parsed */ | |
351 mb->partial_bit_count = last_index - re_index; | |
352 mb->partial_bit_buffer = NEG_USR32(re_cache, mb->partial_bit_count); | |
353 re_index = last_index; | |
354 break; | |
355 } | |
356 re_index += vlc_len; | |
1905
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
357 |
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
358 #ifdef VLC_DEBUG |
2979 | 359 printf("run=%d level=%d\n", run, level); |
1905
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
360 #endif |
2979 | 361 pos += run; |
362 if (pos >= 64) | |
363 break; | |
2967 | 364 |
8051 | 365 level = (level * factor_table[pos] + (1 << (dv_iweight_bits - 1))) >> dv_iweight_bits; |
7536
910087e97750
Coalescing the un-weighting and de-quantization steps for faster
romansh
parents:
7240
diff
changeset
|
366 block[scan_table[pos]] = level; |
1905
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
367 |
2761950695cc
* some significant clean-up of the dv_decode_ac (it looks real
romansh
parents:
1904
diff
changeset
|
368 UPDATE_CACHE(re, gb); |
723 | 369 } |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
370 CLOSE_READER(re, gb); |
725 | 371 mb->pos = pos; |
723 | 372 } |
373 | |
1886
fbcf02596520
* DV decoder simplifications. Now it looks to be 6% faster. At least
romansh
parents:
1875
diff
changeset
|
374 static inline void bit_copy(PutBitContext *pb, GetBitContext *gb) |
723 | 375 { |
1886
fbcf02596520
* DV decoder simplifications. Now it looks to be 6% faster. At least
romansh
parents:
1875
diff
changeset
|
376 int bits_left = get_bits_left(gb); |
2847 | 377 while (bits_left >= MIN_CACHE_BITS) { |
378 put_bits(pb, MIN_CACHE_BITS, get_bits(gb, MIN_CACHE_BITS)); | |
379 bits_left -= MIN_CACHE_BITS; | |
723 | 380 } |
381 if (bits_left > 0) { | |
382 put_bits(pb, bits_left, get_bits(gb, bits_left)); | |
383 } | |
384 } | |
385 | |
8131 | 386 static inline void dv_calculate_mb_xy(DVVideoContext *s, DVwork_chunk *work_chunk, int m, int *mb_x, int *mb_y) |
8118
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
387 { |
8131 | 388 *mb_x = work_chunk->mb_coordinates[m] & 0xff; |
389 *mb_y = work_chunk->mb_coordinates[m] >> 8; | |
8118
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
390 |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
391 /* We work with 720p frames split in half. The odd half-frame (chan==2,3) is displaced :-( */ |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
392 if (s->sys->height == 720 && !(s->buf[1]&0x0C)) { |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
393 *mb_y -= (*mb_y>17)?18:-72; /* shifting the Y coordinate down by 72/2 macro blocks */ |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
394 } |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
395 } |
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
396 |
723 | 397 /* mb_x and mb_y are in units of 8 pixels */ |
8131 | 398 static inline void dv_decode_video_segment(DVVideoContext *s, DVwork_chunk *work_chunk) |
723 | 399 { |
400 int quant, dc, dct_mode, class1, j; | |
8118
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
401 int mb_index, mb_x, mb_y, last_index; |
8011 | 402 int y_stride, linesize; |
723 | 403 DCTELEM *block, *block1; |
1886
fbcf02596520
* DV decoder simplifications. Now it looks to be 6% faster. At least
romansh
parents:
1875
diff
changeset
|
404 int c_offset; |
1064 | 405 uint8_t *y_ptr; |
6266 | 406 const uint8_t *buf_ptr; |
723 | 407 PutBitContext pb, vs_pb; |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
408 GetBitContext gb; |
7614
1afa1171b7b2
Introducing DV_MAX_BPM macro instead of a hardcoded value for the
romansh
parents:
7538
diff
changeset
|
409 BlockInfo mb_data[5 * DV_MAX_BPM], *mb, *mb1; |
1afa1171b7b2
Introducing DV_MAX_BPM macro instead of a hardcoded value for the
romansh
parents:
7538
diff
changeset
|
410 DECLARE_ALIGNED_16(DCTELEM, sblock[5*DV_MAX_BPM][64]); |
3089 | 411 DECLARE_ALIGNED_8(uint8_t, mb_bit_buffer[80 + 4]); /* allow some slack */ |
412 DECLARE_ALIGNED_8(uint8_t, vs_bit_buffer[5 * 80 + 4]); /* allow some slack */ | |
8051 | 413 const int log2_blocksize = 3-s->avctx->lowres; |
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
414 int is_field_mode[5]; |
2967 | 415 |
8051 | 416 assert((((int)mb_bit_buffer) & 7) == 0); |
417 assert((((int)vs_bit_buffer) & 7) == 0); | |
2967 | 418 |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
419 memset(sblock, 0, sizeof(sblock)); |
723 | 420 |
421 /* pass 1 : read DC and AC coefficients in blocks */ | |
8131 | 422 buf_ptr = &s->buf[work_chunk->buf_offset*80]; |
8051 | 423 block1 = &sblock[0][0]; |
424 mb1 = mb_data; | |
1522
79dddc5cd990
removed the obsolete and unused parameters of init_put_bits
alex
parents:
1507
diff
changeset
|
425 init_put_bits(&vs_pb, vs_bit_buffer, 5 * 80); |
8051 | 426 for (mb_index = 0; mb_index < 5; mb_index++, mb1 += s->sys->bpm, block1 += s->sys->bpm * 64) { |
723 | 427 /* skip header */ |
428 quant = buf_ptr[3] & 0x0f; | |
429 buf_ptr += 4; | |
1522
79dddc5cd990
removed the obsolete and unused parameters of init_put_bits
alex
parents:
1507
diff
changeset
|
430 init_put_bits(&pb, mb_bit_buffer, 80); |
8051 | 431 mb = mb1; |
723 | 432 block = block1; |
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
433 is_field_mode[mb_index] = 0; |
8051 | 434 for (j = 0; j < s->sys->bpm; j++) { |
7616
685ef77c9fe5
Making block size in bits variable and dependent on the DV spec
romansh
parents:
7615
diff
changeset
|
435 last_index = s->sys->block_sizes[j]; |
2979 | 436 init_get_bits(&gb, buf_ptr, last_index); |
2967 | 437 |
723 | 438 /* get the dc */ |
8051 | 439 dc = get_sbits(&gb, 9); |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
440 dct_mode = get_bits1(&gb); |
8051 | 441 class1 = get_bits(&gb, 2); |
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
442 if (DV_PROFILE_IS_HD(s->sys)) { |
8051 | 443 mb->idct_put = s->idct_put[0]; |
444 mb->scan_table = s->dv_zigzag[0]; | |
445 mb->factor_table = s->dv100_idct_factor[((s->sys->height == 720) << 1) | (j >= 4)][class1][quant]; | |
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
446 is_field_mode[mb_index] |= !j && dct_mode; |
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
447 } else { |
8051 | 448 mb->idct_put = s->idct_put[dct_mode && log2_blocksize == 3]; |
449 mb->scan_table = s->dv_zigzag[dct_mode]; | |
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
450 mb->factor_table = s->dv_idct_factor[class1 == 3][dct_mode] |
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
451 [quant + dv_quant_offset[class1]]; |
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
452 } |
723 | 453 dc = dc << 2; |
454 /* convert to unsigned because 128 is not added in the | |
455 standard IDCT */ | |
456 dc += 1024; | |
457 block[0] = dc; | |
458 buf_ptr += last_index >> 3; | |
8051 | 459 mb->pos = 0; |
725 | 460 mb->partial_bit_count = 0; |
723 | 461 |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
462 #ifdef VLC_DEBUG |
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
463 printf("MB block: %d, %d ", mb_index, j); |
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
464 #endif |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
465 dv_decode_ac(&gb, mb, block); |
723 | 466 |
467 /* write the remaining bits in a new buffer only if the | |
468 block is finished */ | |
1886
fbcf02596520
* DV decoder simplifications. Now it looks to be 6% faster. At least
romansh
parents:
1875
diff
changeset
|
469 if (mb->pos >= 64) |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
470 bit_copy(&pb, &gb); |
2967 | 471 |
723 | 472 block += 64; |
725 | 473 mb++; |
723 | 474 } |
2967 | 475 |
723 | 476 /* pass 2 : we can do it just after */ |
477 #ifdef VLC_DEBUG | |
1886
fbcf02596520
* DV decoder simplifications. Now it looks to be 6% faster. At least
romansh
parents:
1875
diff
changeset
|
478 printf("***pass 2 size=%d MB#=%d\n", put_bits_count(&pb), mb_index); |
723 | 479 #endif |
480 block = block1; | |
8051 | 481 mb = mb1; |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
482 init_get_bits(&gb, mb_bit_buffer, put_bits_count(&pb)); |
2979 | 483 flush_put_bits(&pb); |
8051 | 484 for (j = 0; j < s->sys->bpm; j++, block += 64, mb++) { |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
485 if (mb->pos < 64 && get_bits_left(&gb) > 0) { |
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
486 dv_decode_ac(&gb, mb, block); |
723 | 487 /* if still not finished, no need to parse other blocks */ |
1886
fbcf02596520
* DV decoder simplifications. Now it looks to be 6% faster. At least
romansh
parents:
1875
diff
changeset
|
488 if (mb->pos < 64) |
fbcf02596520
* DV decoder simplifications. Now it looks to be 6% faster. At least
romansh
parents:
1875
diff
changeset
|
489 break; |
723 | 490 } |
491 } | |
492 /* all blocks are finished, so the extra bytes can be used at | |
493 the video segment level */ | |
7615
290fd3ae1219
Making the number of blocks per macroblock dependent on the DV stream
romansh
parents:
7614
diff
changeset
|
494 if (j >= s->sys->bpm) |
2979 | 495 bit_copy(&vs_pb, &gb); |
723 | 496 } |
497 | |
498 /* we need a pass other the whole video segment */ | |
499 #ifdef VLC_DEBUG | |
1886
fbcf02596520
* DV decoder simplifications. Now it looks to be 6% faster. At least
romansh
parents:
1875
diff
changeset
|
500 printf("***pass 3 size=%d\n", put_bits_count(&vs_pb)); |
723 | 501 #endif |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
502 block = &sblock[0][0]; |
8051 | 503 mb = mb_data; |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
504 init_get_bits(&gb, vs_bit_buffer, put_bits_count(&vs_pb)); |
1886
fbcf02596520
* DV decoder simplifications. Now it looks to be 6% faster. At least
romansh
parents:
1875
diff
changeset
|
505 flush_put_bits(&vs_pb); |
8051 | 506 for (mb_index = 0; mb_index < 5; mb_index++) { |
507 for (j = 0; j < s->sys->bpm; j++) { | |
1886
fbcf02596520
* DV decoder simplifications. Now it looks to be 6% faster. At least
romansh
parents:
1875
diff
changeset
|
508 if (mb->pos < 64) { |
723 | 509 #ifdef VLC_DEBUG |
510 printf("start %d:%d\n", mb_index, j); | |
511 #endif | |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
512 dv_decode_ac(&gb, mb, block); |
723 | 513 } |
2979 | 514 if (mb->pos >= 64 && mb->pos < 127) |
515 av_log(NULL, AV_LOG_ERROR, "AC EOB marker is absent pos=%d\n", mb->pos); | |
723 | 516 block += 64; |
725 | 517 mb++; |
723 | 518 } |
519 } | |
2967 | 520 |
723 | 521 /* compute idct and place blocks */ |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
522 block = &sblock[0][0]; |
8051 | 523 mb = mb_data; |
524 for (mb_index = 0; mb_index < 5; mb_index++) { | |
8118
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
525 dv_calculate_mb_xy(s, work_chunk, mb_index, &mb_x, &mb_y); |
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
526 |
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
527 /* idct_put'ting luminance */ |
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
528 if ((s->sys->pix_fmt == PIX_FMT_YUV420P) || |
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
529 (s->sys->pix_fmt == PIX_FMT_YUV411P && mb_x >= (704 / 8)) || |
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
530 (s->sys->height >= 720 && mb_y != 134)) { |
8051 | 531 y_stride = (s->picture.linesize[0] << ((!is_field_mode[mb_index]) * log2_blocksize)); |
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
532 } else { |
8051 | 533 y_stride = (2 << log2_blocksize); |
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
534 } |
8051 | 535 y_ptr = s->picture.data[0] + ((mb_y * s->picture.linesize[0] + mb_x) << log2_blocksize); |
536 linesize = s->picture.linesize[0] << is_field_mode[mb_index]; | |
537 mb[0] .idct_put(y_ptr , linesize, block + 0*64); | |
8011 | 538 if (s->sys->video_stype == 4) { /* SD 422 */ |
8051 | 539 mb[2].idct_put(y_ptr + (1 << log2_blocksize) , linesize, block + 2*64); |
8011 | 540 } else { |
8051 | 541 mb[1].idct_put(y_ptr + (1 << log2_blocksize) , linesize, block + 1*64); |
542 mb[2].idct_put(y_ptr + y_stride, linesize, block + 2*64); | |
543 mb[3].idct_put(y_ptr + (1 << log2_blocksize) + y_stride, linesize, block + 3*64); | |
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
544 } |
8011 | 545 mb += 4; |
546 block += 4*64; | |
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
547 |
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
548 /* idct_put'ting chrominance */ |
8051 | 549 c_offset = (((mb_y >> (s->sys->pix_fmt == PIX_FMT_YUV420P)) * s->picture.linesize[1] + |
550 (mb_x >> ((s->sys->pix_fmt == PIX_FMT_YUV411P) ? 2 : 1))) << log2_blocksize); | |
551 for (j = 2; j; j--) { | |
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
552 uint8_t *c_ptr = s->picture.data[j] + c_offset; |
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
553 if (s->sys->pix_fmt == PIX_FMT_YUV411P && mb_x >= (704 / 8)) { |
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
554 uint64_t aligned_pixels[64/8]; |
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
555 uint8_t *pixels = (uint8_t*)aligned_pixels; |
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
556 uint8_t *c_ptr1, *ptr1; |
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
557 int x, y; |
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
558 mb->idct_put(pixels, 8, block); |
8051 | 559 for (y = 0; y < (1 << log2_blocksize); y++, c_ptr += s->picture.linesize[j], pixels += 8) { |
560 ptr1 = pixels + (1 << (log2_blocksize - 1)); | |
561 c_ptr1 = c_ptr + (s->picture.linesize[j] << log2_blocksize); | |
562 for (x = 0; x < (1 << (log2_blocksize - 1)); x++) { | |
563 c_ptr[x] = pixels[x]; | |
564 c_ptr1[x] = ptr1[x]; | |
7715
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
565 } |
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
566 } |
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
567 block += 64; mb++; |
e8f71784062e
Intial implementation of the DV100 (AKA DVCPRO HD) decoder and demuxer as
romansh
parents:
7708
diff
changeset
|
568 } else { |
8051 | 569 y_stride = (mb_y == 134) ? (1 << log2_blocksize) : |
570 s->picture.linesize[j] << ((!is_field_mode[mb_index]) * log2_blocksize); | |
571 linesize = s->picture.linesize[j] << is_field_mode[mb_index]; | |
572 (mb++)-> idct_put(c_ptr , linesize, block); block += 64; | |
8011 | 573 if (s->sys->bpm == 8) { |
8051 | 574 (mb++)->idct_put(c_ptr + y_stride, linesize, block); block += 64; |
8011 | 575 } |
723 | 576 } |
577 } | |
578 } | |
579 } | |
580 | |
8088
728e0e4fcb95
renaming macro in order to conform with the rest of libavcodec
romansh
parents:
8051
diff
changeset
|
581 #if ENABLE_SMALL |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
582 /* Converts run and level (where level != 0) pair into vlc, returning bit size */ |
4283
d6f83e2f8804
rename always_inline to av_always_inline and move to common.h
mru
parents:
4001
diff
changeset
|
583 static av_always_inline int dv_rl2vlc(int run, int level, int sign, uint32_t* vlc) |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
584 { |
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
585 int size; |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
586 if (run < DV_VLC_MAP_RUN_SIZE && level < DV_VLC_MAP_LEV_SIZE) { |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
587 *vlc = dv_vlc_map[run][level].vlc | sign; |
2979 | 588 size = dv_vlc_map[run][level].size; |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
589 } |
2967 | 590 else { |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
591 if (level < DV_VLC_MAP_LEV_SIZE) { |
2979 | 592 *vlc = dv_vlc_map[0][level].vlc | sign; |
593 size = dv_vlc_map[0][level].size; | |
594 } else { | |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
595 *vlc = 0xfe00 | (level << 1) | sign; |
2979 | 596 size = 16; |
597 } | |
598 if (run) { | |
599 *vlc |= ((run < 16) ? dv_vlc_map[run-1][0].vlc : | |
600 (0x1f80 | (run - 1))) << size; | |
8051 | 601 size += (run < 16) ? dv_vlc_map[run-1][0].size : 13; |
2979 | 602 } |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
603 } |
2967 | 604 |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
605 return size; |
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
606 } |
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
607 |
4283
d6f83e2f8804
rename always_inline to av_always_inline and move to common.h
mru
parents:
4001
diff
changeset
|
608 static av_always_inline int dv_rl2vlc_size(int run, int level) |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
609 { |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
610 int size; |
2967 | 611 |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
612 if (run < DV_VLC_MAP_RUN_SIZE && level < DV_VLC_MAP_LEV_SIZE) { |
2979 | 613 size = dv_vlc_map[run][level].size; |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
614 } |
2967 | 615 else { |
2979 | 616 size = (level < DV_VLC_MAP_LEV_SIZE) ? dv_vlc_map[0][level].size : 16; |
617 if (run) { | |
618 size += (run < 16) ? dv_vlc_map[run-1][0].size : 13; | |
619 } | |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
620 } |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
621 return size; |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
622 } |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
623 #else |
4283
d6f83e2f8804
rename always_inline to av_always_inline and move to common.h
mru
parents:
4001
diff
changeset
|
624 static av_always_inline int dv_rl2vlc(int run, int l, int sign, uint32_t* vlc) |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
625 { |
2847 | 626 *vlc = dv_vlc_map[run][l].vlc | sign; |
627 return dv_vlc_map[run][l].size; | |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
628 } |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
629 |
4283
d6f83e2f8804
rename always_inline to av_always_inline and move to common.h
mru
parents:
4001
diff
changeset
|
630 static av_always_inline int dv_rl2vlc_size(int run, int l) |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
631 { |
2847 | 632 return dv_vlc_map[run][l].size; |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
633 } |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
634 #endif |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
635 |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
636 typedef struct EncBlockInfo { |
8051 | 637 int area_q[4]; |
638 int bit_size[4]; | |
639 int prev[5]; | |
640 int cur_ac; | |
641 int cno; | |
642 int dct_mode; | |
643 DCTELEM mb[64]; | |
644 uint8_t next[64]; | |
645 uint8_t sign[64]; | |
646 uint8_t partial_bit_count; | |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
647 uint32_t partial_bit_buffer; /* we can't use uint16_t here */ |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
648 } EncBlockInfo; |
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
649 |
8051 | 650 static av_always_inline PutBitContext* dv_encode_ac(EncBlockInfo* bi, |
651 PutBitContext* pb_pool, | |
652 PutBitContext* pb_end) | |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
653 { |
8051 | 654 int prev, bits_left; |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
655 PutBitContext* pb = pb_pool; |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
656 int size = bi->partial_bit_count; |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
657 uint32_t vlc = bi->partial_bit_buffer; |
2847 | 658 |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
659 bi->partial_bit_count = bi->partial_bit_buffer = 0; |
8051 | 660 for (;;){ |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
661 /* Find suitable storage space */ |
1875
45a1592dadca
* moving some of the commonly used bit reading/writing functions
romansh
parents:
1726
diff
changeset
|
662 for (; size > (bits_left = put_bits_left(pb)); pb++) { |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
663 if (bits_left) { |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
664 size -= bits_left; |
2979 | 665 put_bits(pb, bits_left, vlc >> size); |
8051 | 666 vlc = vlc & ((1 << size) - 1); |
2979 | 667 } |
668 if (pb + 1 >= pb_end) { | |
8051 | 669 bi->partial_bit_count = size; |
2979 | 670 bi->partial_bit_buffer = vlc; |
671 return pb; | |
672 } | |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
673 } |
2967 | 674 |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
675 /* Store VLC */ |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
676 put_bits(pb, size, vlc); |
2967 | 677 |
8051 | 678 if (bi->cur_ac >= 64) |
2847 | 679 break; |
2967 | 680 |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
681 /* Construct the next VLC */ |
8051 | 682 prev = bi->cur_ac; |
2847 | 683 bi->cur_ac = bi->next[prev]; |
8051 | 684 if (bi->cur_ac < 64){ |
2847 | 685 size = dv_rl2vlc(bi->cur_ac - prev - 1, bi->mb[bi->cur_ac], bi->sign[bi->cur_ac], &vlc); |
686 } else { | |
687 size = 4; vlc = 6; /* End Of Block stamp */ | |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
688 } |
2847 | 689 } |
690 return pb; | |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
691 } |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
692 |
4283
d6f83e2f8804
rename always_inline to av_always_inline and move to common.h
mru
parents:
4001
diff
changeset
|
693 static av_always_inline void dv_set_class_number(DCTELEM* blk, EncBlockInfo* bi, |
8051 | 694 const uint8_t* zigzag_scan, |
695 const int *weight, int bias) | |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
696 { |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
697 int i, area; |
3152
28a087ad41d1
Assign class 2 to most macroblocks by default, instead of a more conservative
romansh
parents:
3150
diff
changeset
|
698 /* We offer two different methods for class number assignment: the |
28a087ad41d1
Assign class 2 to most macroblocks by default, instead of a more conservative
romansh
parents:
3150
diff
changeset
|
699 method suggested in SMPTE 314M Table 22, and an improved |
28a087ad41d1
Assign class 2 to most macroblocks by default, instead of a more conservative
romansh
parents:
3150
diff
changeset
|
700 method. The SMPTE method is very conservative; it assigns class |
28a087ad41d1
Assign class 2 to most macroblocks by default, instead of a more conservative
romansh
parents:
3150
diff
changeset
|
701 3 (i.e. severe quantization) to any block where the largest AC |
7980 | 702 component is greater than 36. FFmpeg's DV encoder tracks AC bit |
3152
28a087ad41d1
Assign class 2 to most macroblocks by default, instead of a more conservative
romansh
parents:
3150
diff
changeset
|
703 consumption precisely, so there is no need to bias most blocks |
28a087ad41d1
Assign class 2 to most macroblocks by default, instead of a more conservative
romansh
parents:
3150
diff
changeset
|
704 towards strongly lossy compression. Instead, we assign class 2 |
28a087ad41d1
Assign class 2 to most macroblocks by default, instead of a more conservative
romansh
parents:
3150
diff
changeset
|
705 to most blocks, and use class 3 only when strictly necessary |
28a087ad41d1
Assign class 2 to most macroblocks by default, instead of a more conservative
romansh
parents:
3150
diff
changeset
|
706 (for blocks whose largest AC component exceeds 255). */ |
28a087ad41d1
Assign class 2 to most macroblocks by default, instead of a more conservative
romansh
parents:
3150
diff
changeset
|
707 |
28a087ad41d1
Assign class 2 to most macroblocks by default, instead of a more conservative
romansh
parents:
3150
diff
changeset
|
708 #if 0 /* SMPTE spec method */ |
2847 | 709 static const int classes[] = {12, 24, 36, 0xffff}; |
7980 | 710 #else /* improved FFmpeg method */ |
3152
28a087ad41d1
Assign class 2 to most macroblocks by default, instead of a more conservative
romansh
parents:
3150
diff
changeset
|
711 static const int classes[] = {-1, -1, 255, 0xffff}; |
28a087ad41d1
Assign class 2 to most macroblocks by default, instead of a more conservative
romansh
parents:
3150
diff
changeset
|
712 #endif |
8051 | 713 int max = classes[0]; |
714 int prev = 0; | |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
715 |
2967 | 716 bi->mb[0] = blk[0]; |
717 | |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
718 for (area = 0; area < 4; area++) { |
8051 | 719 bi->prev[area] = prev; |
2847 | 720 bi->bit_size[area] = 1; // 4 areas 4 bits for EOB :) |
8051 | 721 for (i = mb_area_start[area]; i < mb_area_start[area+1]; i++) { |
2847 | 722 int level = blk[zigzag_scan[i]]; |
2967 | 723 |
8051 | 724 if (level + 15 > 30U) { |
725 bi->sign[i] = (level >> 31) & 1; | |
3149
2679184e8be0
AC coefficient weighing (per SMPTE 314M) for the DV encoder and decoder. The
romansh
parents:
3148
diff
changeset
|
726 /* weigh it and and shift down into range, adding for rounding */ |
2679184e8be0
AC coefficient weighing (per SMPTE 314M) for the DV encoder and decoder. The
romansh
parents:
3148
diff
changeset
|
727 /* the extra division by a factor of 2^4 reverses the 8x expansion of the DCT |
2679184e8be0
AC coefficient weighing (per SMPTE 314M) for the DV encoder and decoder. The
romansh
parents:
3148
diff
changeset
|
728 AND the 2x doubling of the weights */ |
8051 | 729 level = (FFABS(level) * weight[i] + (1 << (dv_weight_bits+3))) >> (dv_weight_bits+4); |
3149
2679184e8be0
AC coefficient weighing (per SMPTE 314M) for the DV encoder and decoder. The
romansh
parents:
3148
diff
changeset
|
730 bi->mb[i] = level; |
8051 | 731 if (level > max) |
732 max = level; | |
2847 | 733 bi->bit_size[area] += dv_rl2vlc_size(i - prev - 1, level); |
734 bi->next[prev]= i; | |
8051 | 735 prev = i; |
2847 | 736 } |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
737 } |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
738 } |
2847 | 739 bi->next[prev]= i; |
8051 | 740 for (bi->cno = 0; max > classes[bi->cno]; bi->cno++); |
2847 | 741 |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
742 bi->cno += bias; |
2967 | 743 |
2847 | 744 if (bi->cno >= 3) { |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
745 bi->cno = 3; |
8051 | 746 prev = 0; |
747 i = bi->next[prev]; | |
2847 | 748 for (area = 0; area < 4; area++) { |
8051 | 749 bi->prev[area] = prev; |
2847 | 750 bi->bit_size[area] = 1; // 4 areas 4 bits for EOB :) |
8051 | 751 for (; i < mb_area_start[area+1]; i = bi->next[i]) { |
752 bi->mb[i] >>= 1; | |
2967 | 753 |
2847 | 754 if (bi->mb[i]) { |
755 bi->bit_size[area] += dv_rl2vlc_size(i - prev - 1, bi->mb[i]); | |
756 bi->next[prev]= i; | |
8051 | 757 prev = i; |
2847 | 758 } |
759 } | |
760 } | |
761 bi->next[prev]= i; | |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
762 } |
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
763 } |
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
764 |
2847 | 765 //FIXME replace this by dsputil |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
766 #define SC(x, y) ((s[x] - s[y]) ^ ((s[x] - s[y]) >> 7)) |
4283
d6f83e2f8804
rename always_inline to av_always_inline and move to common.h
mru
parents:
4001
diff
changeset
|
767 static av_always_inline int dv_guess_dct_mode(DCTELEM *blk) { |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
768 DCTELEM *s; |
8051 | 769 int score88 = 0; |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
770 int score248 = 0; |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
771 int i; |
2967 | 772 |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
773 /* Compute 8-8 score (small values give a better chance for 8-8 DCT) */ |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
774 s = blk; |
8051 | 775 for (i = 0; i < 7; i++) { |
2967 | 776 score88 += SC(0, 8) + SC(1, 9) + SC(2, 10) + SC(3, 11) + |
2979 | 777 SC(4, 12) + SC(5,13) + SC(6, 14) + SC(7, 15); |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
778 s += 8; |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
779 } |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
780 /* Compute 2-4-8 score (small values give a better chance for 2-4-8 DCT) */ |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
781 s = blk; |
8051 | 782 for (i = 0; i < 6; i++) { |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
783 score248 += SC(0, 16) + SC(1,17) + SC(2, 18) + SC(3, 19) + |
2979 | 784 SC(4, 20) + SC(5,21) + SC(6, 22) + SC(7, 23); |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
785 s += 8; |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
786 } |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
787 |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
788 return (score88 - score248 > -10); |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
789 } |
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
790 |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
791 static inline void dv_guess_qnos(EncBlockInfo* blks, int* qnos) |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
792 { |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
793 int size[5]; |
3140 | 794 int i, j, k, a, prev, a2; |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
795 EncBlockInfo* b; |
2847 | 796 |
8051 | 797 size[0] = size[1] = size[2] = size[3] = size[4] = 1 << 24; |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
798 do { |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
799 b = blks; |
8051 | 800 for (i = 0; i < 5; i++) { |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
801 if (!qnos[i]) |
2979 | 802 continue; |
2967 | 803 |
2979 | 804 qnos[i]--; |
805 size[i] = 0; | |
8051 | 806 for (j = 0; j < 6; j++, b++) { |
807 for (a = 0; a < 4; a++) { | |
2979 | 808 if (b->area_q[a] != dv_quant_shifts[qnos[i] + dv_quant_offset[b->cno]][a]) { |
809 b->bit_size[a] = 1; // 4 areas 4 bits for EOB :) | |
810 b->area_q[a]++; | |
8051 | 811 prev = b->prev[a]; |
3147 | 812 assert(b->next[prev] >= mb_area_start[a+1] || b->mb[prev]); |
8051 | 813 for (k = b->next[prev] ; k < mb_area_start[a+1]; k = b->next[k]) { |
2979 | 814 b->mb[k] >>= 1; |
815 if (b->mb[k]) { | |
2847 | 816 b->bit_size[a] += dv_rl2vlc_size(k - prev - 1, b->mb[k]); |
8051 | 817 prev = k; |
2847 | 818 } else { |
8051 | 819 if (b->next[k] >= mb_area_start[a+1] && b->next[k]<64){ |
820 for (a2 = a + 1; b->next[k] >= mb_area_start[a2+1]; a2++) | |
3146
dcae1bde37ac
size[0-3] are not initialized (and can get random negative trash
michael
parents:
3143
diff
changeset
|
821 b->prev[a2] = prev; |
8051 | 822 assert(a2 < 4); |
3140 | 823 assert(b->mb[b->next[k]]); |
824 b->bit_size[a2] += dv_rl2vlc_size(b->next[k] - prev - 1, b->mb[b->next[k]]) | |
825 -dv_rl2vlc_size(b->next[k] - k - 1, b->mb[b->next[k]]); | |
8051 | 826 assert(b->prev[a2] == k && (a2 + 1 >= 4 || b->prev[a2+1] != k)); |
3147 | 827 b->prev[a2] = prev; |
3140 | 828 } |
2847 | 829 b->next[prev] = b->next[k]; |
830 } | |
2979 | 831 } |
2847 | 832 b->prev[a+1]= prev; |
2979 | 833 } |
834 size[i] += b->bit_size[a]; | |
835 } | |
836 } | |
8051 | 837 if (vs_total_ac_bits >= size[0] + size[1] + size[2] + size[3] + size[4]) |
3142 | 838 return; |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
839 } |
3140 | 840 } while (qnos[0]|qnos[1]|qnos[2]|qnos[3]|qnos[4]); |
841 | |
842 | |
8051 | 843 for (a = 2; a == 2 || vs_total_ac_bits < size[0]; a += a){ |
3140 | 844 b = blks; |
8051 | 845 size[0] = 5 * 6 * 4; //EOB |
846 for (j = 0; j < 6 *5; j++, b++) { | |
847 prev = b->prev[0]; | |
848 for (k = b->next[prev]; k < 64; k = b->next[k]) { | |
849 if (b->mb[k] < a && b->mb[k] > -a){ | |
3140 | 850 b->next[prev] = b->next[k]; |
851 }else{ | |
852 size[0] += dv_rl2vlc_size(k - prev - 1, b->mb[k]); | |
8051 | 853 prev = k; |
3140 | 854 } |
855 } | |
856 } | |
857 } | |
1567 | 858 } |
859 | |
8131 | 860 static inline void dv_encode_video_segment(DVVideoContext *s, DVwork_chunk *work_chunk) |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
861 { |
8118
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
862 int mb_index, i, j; |
2967 | 863 int mb_x, mb_y, c_offset, linesize; |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
864 uint8_t* y_ptr; |
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
865 uint8_t* data; |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
866 uint8_t* ptr; |
8118
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
867 uint8_t* dif; |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
868 int do_edge_wrap; |
4675
c23a5c8263bc
force 16-bytes alignement of block array, as needed by the implementation of ff_dct_sse2
gpoirier
parents:
4666
diff
changeset
|
869 DECLARE_ALIGNED_16(DCTELEM, block[64]); |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
870 EncBlockInfo enc_blks[5*6]; |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
871 PutBitContext pbs[5*6]; |
2967 | 872 PutBitContext* pb; |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
873 EncBlockInfo* enc_blk; |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
874 int vs_bit_size = 0; |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
875 int qnos[5]; |
2967 | 876 |
4675
c23a5c8263bc
force 16-bytes alignement of block array, as needed by the implementation of ff_dct_sse2
gpoirier
parents:
4666
diff
changeset
|
877 assert((((int)block) & 15) == 0); |
2967 | 878 |
8131 | 879 dif = &s->buf[work_chunk->buf_offset*80]; |
1567 | 880 enc_blk = &enc_blks[0]; |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
881 pb = &pbs[0]; |
8051 | 882 for (mb_index = 0; mb_index < 5; mb_index++) { |
8118
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
883 dv_calculate_mb_xy(s, work_chunk, mb_index, &mb_x, &mb_y); |
8051 | 884 y_ptr = s->picture.data[0] + ((mb_y * s->picture.linesize[0] + mb_x) << 3); |
885 c_offset = (((mb_y >> (s->sys->pix_fmt == PIX_FMT_YUV420P)) * s->picture.linesize[1] + | |
886 (mb_x >> ((s->sys->pix_fmt == PIX_FMT_YUV411P) ? 2 : 1))) << 3); | |
887 do_edge_wrap = 0; | |
2979 | 888 qnos[mb_index] = 15; /* No quantization */ |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
889 ptr = dif + mb_index*80 + 4; |
8051 | 890 for (j = 0; j < 6; j++) { |
3167 | 891 int dummy = 0; |
892 if (s->sys->pix_fmt == PIX_FMT_YUV422P) { /* 4:2:2 */ | |
893 if (j == 0 || j == 2) { | |
894 /* Y0 Y1 */ | |
8051 | 895 data = y_ptr + ((j >> 1) * 8); |
3167 | 896 linesize = s->picture.linesize[0]; |
897 } else if (j > 3) { | |
898 /* Cr Cb */ | |
8051 | 899 data = s->picture.data[6 - j] + c_offset; |
3167 | 900 linesize = s->picture.linesize[6 - j]; |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
901 } else { |
3167 | 902 /* j=1 and j=3 are "dummy" blocks, used for AC data only */ |
8051 | 903 data = 0; |
3167 | 904 linesize = 0; |
8051 | 905 dummy = 1; |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
906 } |
3167 | 907 } else { /* 4:1:1 or 4:2:0 */ |
908 if (j < 4) { /* Four Y blocks */ | |
909 /* NOTE: at end of line, the macroblock is handled as 420 */ | |
910 if (s->sys->pix_fmt == PIX_FMT_YUV411P && mb_x < (704 / 8)) { | |
911 data = y_ptr + (j * 8); | |
912 } else { | |
913 data = y_ptr + ((j & 1) * 8) + ((j >> 1) * 8 * s->picture.linesize[0]); | |
914 } | |
915 linesize = s->picture.linesize[0]; | |
916 } else { /* Cr and Cb blocks */ | |
917 /* don't ask Fabrice why they inverted Cb and Cr ! */ | |
8051 | 918 data = s->picture.data [6 - j] + c_offset; |
3167 | 919 linesize = s->picture.linesize[6 - j]; |
920 if (s->sys->pix_fmt == PIX_FMT_YUV411P && mb_x >= (704 / 8)) | |
921 do_edge_wrap = 1; | |
922 } | |
2979 | 923 } |
2967 | 924 |
2979 | 925 /* Everything is set up -- now just copy data -> DCT block */ |
926 if (do_edge_wrap) { /* Edge wrap copy: 4x16 -> 8x8 */ | |
927 uint8_t* d; | |
928 DCTELEM *b = block; | |
8051 | 929 for (i = 0; i < 8; i++) { |
2979 | 930 d = data + 8 * linesize; |
931 b[0] = data[0]; b[1] = data[1]; b[2] = data[2]; b[3] = data[3]; | |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
932 b[4] = d[0]; b[5] = d[1]; b[6] = d[2]; b[7] = d[3]; |
2979 | 933 data += linesize; |
934 b += 8; | |
935 } | |
936 } else { /* Simple copy: 8x8 -> 8x8 */ | |
3167 | 937 if (!dummy) |
938 s->get_pixels(block, data, linesize); | |
2979 | 939 } |
2967 | 940 |
8051 | 941 if (s->avctx->flags & CODEC_FLAG_INTERLACED_DCT) |
2847 | 942 enc_blk->dct_mode = dv_guess_dct_mode(block); |
943 else | |
944 enc_blk->dct_mode = 0; | |
2979 | 945 enc_blk->area_q[0] = enc_blk->area_q[1] = enc_blk->area_q[2] = enc_blk->area_q[3] = 0; |
946 enc_blk->partial_bit_count = 0; | |
947 enc_blk->partial_bit_buffer = 0; | |
948 enc_blk->cur_ac = 0; | |
2967 | 949 |
3167 | 950 if (dummy) { |
951 /* We rely on the fact that encoding all zeros leads to an immediate EOB, | |
952 which is precisely what the spec calls for in the "dummy" blocks. */ | |
953 memset(block, 0, sizeof(block)); | |
954 } else { | |
955 s->fdct[enc_blk->dct_mode](block); | |
956 } | |
2967 | 957 |
2979 | 958 dv_set_class_number(block, enc_blk, |
3149
2679184e8be0
AC coefficient weighing (per SMPTE 314M) for the DV encoder and decoder. The
romansh
parents:
3148
diff
changeset
|
959 enc_blk->dct_mode ? ff_zigzag248_direct : ff_zigzag_direct, |
2679184e8be0
AC coefficient weighing (per SMPTE 314M) for the DV encoder and decoder. The
romansh
parents:
3148
diff
changeset
|
960 enc_blk->dct_mode ? dv_weight_248 : dv_weight_88, |
2679184e8be0
AC coefficient weighing (per SMPTE 314M) for the DV encoder and decoder. The
romansh
parents:
3148
diff
changeset
|
961 j/4); |
2967 | 962 |
7616
685ef77c9fe5
Making block size in bits variable and dependent on the DV spec
romansh
parents:
7615
diff
changeset
|
963 init_put_bits(pb, ptr, s->sys->block_sizes[j]/8); |
2979 | 964 put_bits(pb, 9, (uint16_t)(((enc_blk->mb[0] >> 3) - 1024 + 2) >> 2)); |
965 put_bits(pb, 1, enc_blk->dct_mode); | |
966 put_bits(pb, 2, enc_blk->cno); | |
2967 | 967 |
2979 | 968 vs_bit_size += enc_blk->bit_size[0] + enc_blk->bit_size[1] + |
969 enc_blk->bit_size[2] + enc_blk->bit_size[3]; | |
970 ++enc_blk; | |
971 ++pb; | |
7616
685ef77c9fe5
Making block size in bits variable and dependent on the DV spec
romansh
parents:
7615
diff
changeset
|
972 ptr += s->sys->block_sizes[j]/8; |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
973 } |
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
974 } |
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
975 |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
976 if (vs_total_ac_bits < vs_bit_size) |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
977 dv_guess_qnos(&enc_blks[0], &qnos[0]); |
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
978 |
8051 | 979 for (i = 0; i < 5; i++) { |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
980 dif[i*80 + 3] = qnos[i]; |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
981 } |
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
982 |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
983 /* First pass over individual cells only */ |
8051 | 984 for (j = 0; j < 5 * 6; j++) |
2847 | 985 dv_encode_ac(&enc_blks[j], &pbs[j], &pbs[j+1]); |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
986 |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
987 /* Second pass over each MB space */ |
8051 | 988 for (j = 0; j < 5 * 6; j += 6) { |
989 pb = &pbs[j]; | |
990 for (i = 0; i < 6; i++) { | |
2847 | 991 if (enc_blks[i+j].partial_bit_count) |
8051 | 992 pb = dv_encode_ac(&enc_blks[i+j], pb, &pbs[j+6]); |
2847 | 993 } |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
994 } |
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
995 |
8050 | 996 /* Third and final pass over the whole video segment space */ |
8051 | 997 pb = &pbs[0]; |
998 for (j = 0; j < 5 * 6; j++) { | |
2847 | 999 if (enc_blks[j].partial_bit_count) |
8051 | 1000 pb = dv_encode_ac(&enc_blks[j], pb, &pbs[6*5]); |
3139
e58fb7ffbb4f
print a big warning if we mess up and run out of space ...
michael
parents:
3089
diff
changeset
|
1001 if (enc_blks[j].partial_bit_count) |
e58fb7ffbb4f
print a big warning if we mess up and run out of space ...
michael
parents:
3089
diff
changeset
|
1002 av_log(NULL, AV_LOG_ERROR, "ac bitstream overflow\n"); |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1003 } |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
1004 |
8051 | 1005 for (j = 0; j < 5 * 6; j++) |
1631
59f2fa833449
* 3x encoding speedup. Finally we seem to be on par with libdv
romansh
parents:
1598
diff
changeset
|
1006 flush_put_bits(&pbs[j]); |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1007 } |
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1008 |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1009 static int dv_decode_mt(AVCodecContext *avctx, void* sl) |
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1010 { |
8131 | 1011 dv_decode_video_segment((DVVideoContext *)avctx->priv_data, (DVwork_chunk*)sl); |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1012 return 0; |
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1013 } |
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1014 |
7239
6519374c5020
Make preprocessor condition more specific and useful by changing
diego
parents:
7040
diff
changeset
|
1015 #ifdef CONFIG_DVVIDEO_ENCODER |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1016 static int dv_encode_mt(AVCodecContext *avctx, void* sl) |
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1017 { |
8131 | 1018 dv_encode_video_segment((DVVideoContext *)avctx->priv_data, (DVwork_chunk*)sl); |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1019 return 0; |
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1020 } |
3777 | 1021 #endif |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1022 |
7776
dbcdd0165e55
Replace generic CONFIG_DECODERS preprocessor conditionals by more specific
diego
parents:
7715
diff
changeset
|
1023 #ifdef CONFIG_DVVIDEO_DECODER |
723 | 1024 /* NOTE: exactly one frame must be given (120000 bytes for NTSC, |
3167 | 1025 144000 bytes for PAL - or twice those for 50Mbps) */ |
2967 | 1026 static int dvvideo_decode_frame(AVCodecContext *avctx, |
723 | 1027 void *data, int *data_size, |
6218 | 1028 const uint8_t *buf, int buf_size) |
723 | 1029 { |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1030 DVVideoContext *s = avctx->priv_data; |
2967 | 1031 |
1489
337d13aee605
* DV handling was streamlined for both muxing/demuxing and
romansh
parents:
1416
diff
changeset
|
1032 s->sys = dv_frame_profile(buf); |
8118
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
1033 if (!s->sys || buf_size < s->sys->frame_size || dv_init_dynamic_tables(s->sys)) |
1489
337d13aee605
* DV handling was streamlined for both muxing/demuxing and
romansh
parents:
1416
diff
changeset
|
1034 return -1; /* NOTE: we only accept several full frames */ |
723 | 1035 |
8051 | 1036 if (s->picture.data[0]) |
1228 | 1037 avctx->release_buffer(avctx, &s->picture); |
2967 | 1038 |
1489
337d13aee605
* DV handling was streamlined for both muxing/demuxing and
romansh
parents:
1416
diff
changeset
|
1039 s->picture.reference = 0; |
2822
fdedaa2e6da4
DV video encoder/decoder doesn't set keyframe and picture type properties patch by (Edward Hervey:bilboed,gmail com)
michael
parents:
2661
diff
changeset
|
1040 s->picture.key_frame = 1; |
fdedaa2e6da4
DV video encoder/decoder doesn't set keyframe and picture type properties patch by (Edward Hervey:bilboed,gmail com)
michael
parents:
2661
diff
changeset
|
1041 s->picture.pict_type = FF_I_TYPE; |
8051 | 1042 avctx->pix_fmt = s->sys->pix_fmt; |
8014
07d8986fbea7
replacing frame_rate and frame_rate_base with an AVRational time_base
romansh
parents:
8011
diff
changeset
|
1043 avctx->time_base = s->sys->time_base; |
2849 | 1044 avcodec_set_dimensions(avctx, s->sys->width, s->sys->height); |
8051 | 1045 if (avctx->get_buffer(avctx, &s->picture) < 0) { |
1598
932d306bf1dc
av_log() patch by (Michel Bardiaux <mbardiaux at peaktime dot be>)
michael
parents:
1567
diff
changeset
|
1046 av_log(avctx, AV_LOG_ERROR, "get_buffer() failed\n"); |
903 | 1047 return -1; |
835 | 1048 } |
1543
7542cb99b950
* providing MPEG codecs with a generic fields in AVFrame to use.
romansh
parents:
1540
diff
changeset
|
1049 s->picture.interlaced_frame = 1; |
8051 | 1050 s->picture.top_field_first = 0; |
835 | 1051 |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1052 s->buf = buf; |
8118
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
1053 avctx->execute(avctx, dv_decode_mt, s->sys->work_chunks, NULL, |
8131 | 1054 dv_work_pool_size(s->sys), sizeof(DVwork_chunk)); |
2967 | 1055 |
734
2d6b3e3d6c6f
10l - MMX/FPU state was not restored, causing nonsense fpu behaviour in caller (mplayer)
arpi_esp
parents:
733
diff
changeset
|
1056 emms_c(); |
2d6b3e3d6c6f
10l - MMX/FPU state was not restored, causing nonsense fpu behaviour in caller (mplayer)
arpi_esp
parents:
733
diff
changeset
|
1057 |
723 | 1058 /* return image */ |
925 | 1059 *data_size = sizeof(AVFrame); |
8051 | 1060 *(AVFrame*)data = s->picture; |
2967 | 1061 |
1489
337d13aee605
* DV handling was streamlined for both muxing/demuxing and
romansh
parents:
1416
diff
changeset
|
1062 return s->sys->frame_size; |
723 | 1063 } |
7776
dbcdd0165e55
Replace generic CONFIG_DECODERS preprocessor conditionals by more specific
diego
parents:
7715
diff
changeset
|
1064 #endif /* CONFIG_DVVIDEO_DECODER */ |
723 | 1065 |
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1066 |
8051 | 1067 static inline int dv_write_pack(enum dv_pack_type pack_id, DVVideoContext *c, |
1068 uint8_t* buf) | |
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1069 { |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1070 /* |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1071 * Here's what SMPTE314M says about these two: |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1072 * (page 6) APTn, AP1n, AP2n, AP3n: These data shall be identical |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1073 * as track application IDs (APTn = 001, AP1n = |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1074 * 001, AP2n = 001, AP3n = 001), if the source signal |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1075 * comes from a digital VCR. If the signal source is |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1076 * unknown, all bits for these data shall be set to 1. |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1077 * (page 12) STYPE: STYPE defines a signal type of video signal |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1078 * 00000b = 4:1:1 compression |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1079 * 00100b = 4:2:2 compression |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1080 * XXXXXX = Reserved |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1081 * Now, I've got two problems with these statements: |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1082 * 1. it looks like APT == 111b should be a safe bet, but it isn't. |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1083 * It seems that for PAL as defined in IEC 61834 we have to set |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1084 * APT to 000 and for SMPTE314M to 001. |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1085 * 2. It is not at all clear what STYPE is used for 4:2:0 PAL |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1086 * compression scheme (if any). |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1087 */ |
8051 | 1088 int apt = (c->sys->pix_fmt == PIX_FMT_YUV420P ? 0 : 1); |
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1089 int stype = (c->sys->pix_fmt == PIX_FMT_YUV422P ? 4 : 0); |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1090 |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1091 uint8_t aspect = 0; |
8051 | 1092 if ((int)(av_q2d(c->avctx->sample_aspect_ratio) * c->avctx->width / c->avctx->height * 10) == 17) /* 16:9 */ |
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1093 aspect = 0x02; |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1094 |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1095 buf[0] = (uint8_t)pack_id; |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1096 switch (pack_id) { |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1097 case dv_header525: /* I can't imagine why these two weren't defined as real */ |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1098 case dv_header625: /* packs in SMPTE314M -- they definitely look like ones */ |
8051 | 1099 buf[1] = 0xf8 | /* reserved -- always 1 */ |
1100 (apt & 0x07); /* APT: Track application ID */ | |
1101 buf[2] = (0 << 7) | /* TF1: audio data is 0 - valid; 1 - invalid */ | |
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1102 (0x0f << 3) | /* reserved -- always 1 */ |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1103 (apt & 0x07); /* AP1: Audio application ID */ |
8051 | 1104 buf[3] = (0 << 7) | /* TF2: video data is 0 - valid; 1 - invalid */ |
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1105 (0x0f << 3) | /* reserved -- always 1 */ |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1106 (apt & 0x07); /* AP2: Video application ID */ |
8051 | 1107 buf[4] = (0 << 7) | /* TF3: subcode(SSYB) is 0 - valid; 1 - invalid */ |
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1108 (0x0f << 3) | /* reserved -- always 1 */ |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1109 (apt & 0x07); /* AP3: Subcode application ID */ |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1110 break; |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1111 case dv_video_source: |
8051 | 1112 buf[1] = 0xff; /* reserved -- always 1 */ |
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1113 buf[2] = (1 << 7) | /* B/W: 0 - b/w, 1 - color */ |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1114 (1 << 6) | /* following CLF is valid - 0, invalid - 1 */ |
8050 | 1115 (3 << 4) | /* CLF: color frames ID (see ITU-R BT.470-4) */ |
8051 | 1116 0xf; /* reserved -- always 1 */ |
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1117 buf[3] = (3 << 6) | /* reserved -- always 1 */ |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1118 (c->sys->dsf << 5) | /* system: 60fields/50fields */ |
8051 | 1119 stype; /* signal type video compression */ |
1120 buf[4] = 0xff; /* VISC: 0xff -- no information */ | |
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1121 break; |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1122 case dv_video_control: |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1123 buf[1] = (0 << 6) | /* Copy generation management (CGMS) 0 -- free */ |
8051 | 1124 0x3f; /* reserved -- always 1 */ |
1125 buf[2] = 0xc8 | /* reserved -- always b11001xxx */ | |
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1126 aspect; |
8050 | 1127 buf[3] = (1 << 7) | /* frame/field flag 1 -- frame, 0 -- field */ |
1128 (1 << 6) | /* first/second field flag 0 -- field 2, 1 -- field 1 */ | |
1129 (1 << 5) | /* frame change flag 0 -- same picture as before, 1 -- different */ | |
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1130 (1 << 4) | /* 1 - interlaced, 0 - noninterlaced */ |
8051 | 1131 0xc; /* reserved -- always b1100 */ |
1132 buf[4] = 0xff; /* reserved -- always 1 */ | |
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1133 break; |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1134 default: |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1135 buf[1] = buf[2] = buf[3] = buf[4] = 0xff; |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1136 } |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1137 return 5; |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1138 } |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1139 |
7240
2552555c8a92
Move #ifdef CONFIG_DVVIDEO_ENCODER up to cover all functions used for encoding.
diego
parents:
7239
diff
changeset
|
1140 #ifdef CONFIG_DVVIDEO_ENCODER |
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1141 static void dv_format_frame(DVVideoContext* c, uint8_t* buf) |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1142 { |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1143 int chan, i, j, k; |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1144 |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1145 for (chan = 0; chan < c->sys->n_difchan; chan++) { |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1146 for (i = 0; i < c->sys->difseg_size; i++) { |
8050 | 1147 memset(buf, 0xff, 80 * 6); /* first 6 DIF blocks are for control data */ |
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1148 |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1149 /* DV header: 1DIF */ |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1150 buf += dv_write_dif_id(dv_sect_header, chan, i, 0, buf); |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1151 buf += dv_write_pack((c->sys->dsf ? dv_header625 : dv_header525), c, buf); |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1152 buf += 72; /* unused bytes */ |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1153 |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1154 /* DV subcode: 2DIFs */ |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1155 for (j = 0; j < 2; j++) { |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1156 buf += dv_write_dif_id(dv_sect_subcode, chan, i, j, buf); |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1157 for (k = 0; k < 6; k++) |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1158 buf += dv_write_ssyb_id(k, (i < c->sys->difseg_size/2), buf) + 5; |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1159 buf += 29; /* unused bytes */ |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1160 } |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1161 |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1162 /* DV VAUX: 3DIFS */ |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1163 for (j = 0; j < 3; j++) { |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1164 buf += dv_write_dif_id(dv_sect_vaux, chan, i, j, buf); |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1165 buf += dv_write_pack(dv_video_source, c, buf); |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1166 buf += dv_write_pack(dv_video_control, c, buf); |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1167 buf += 7*5; |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1168 buf += dv_write_pack(dv_video_source, c, buf); |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1169 buf += dv_write_pack(dv_video_control, c, buf); |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1170 buf += 4*5 + 2; /* unused bytes */ |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1171 } |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1172 |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1173 /* DV Audio/Video: 135 Video DIFs + 9 Audio DIFs */ |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1174 for (j = 0; j < 135; j++) { |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1175 if (j%15 == 0) { |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1176 memset(buf, 0xff, 80); |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1177 buf += dv_write_dif_id(dv_sect_audio, chan, i, j/15, buf); |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1178 buf += 77; /* audio control & shuffled PCM audio */ |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1179 } |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1180 buf += dv_write_dif_id(dv_sect_video, chan, i, j, buf); |
7980 | 1181 buf += 77; /* 1 video macroblock: 1 bytes control |
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1182 4 * 14 bytes Y 8x8 data |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1183 10 bytes Cr 8x8 data |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1184 10 bytes Cb 8x8 data */ |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1185 } |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1186 } |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1187 } |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1188 } |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1189 |
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1190 |
2967 | 1191 static int dvvideo_encode_frame(AVCodecContext *c, uint8_t *buf, int buf_size, |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1192 void *data) |
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1193 { |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1194 DVVideoContext *s = c->priv_data; |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1195 |
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1196 s->sys = dv_codec_profile(c); |
8118
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
1197 if (!s->sys || buf_size < s->sys->frame_size || dv_init_dynamic_tables(s->sys)) |
2422 | 1198 return -1; |
1199 | |
8051 | 1200 c->pix_fmt = s->sys->pix_fmt; |
1201 s->picture = *((AVFrame *)data); | |
2822
fdedaa2e6da4
DV video encoder/decoder doesn't set keyframe and picture type properties patch by (Edward Hervey:bilboed,gmail com)
michael
parents:
2661
diff
changeset
|
1202 s->picture.key_frame = 1; |
fdedaa2e6da4
DV video encoder/decoder doesn't set keyframe and picture type properties patch by (Edward Hervey:bilboed,gmail com)
michael
parents:
2661
diff
changeset
|
1203 s->picture.pict_type = FF_I_TYPE; |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1204 |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1205 s->buf = buf; |
8118
890df98a7848
implementing more efficient (and direct) allocation of work for DV codec workers
romansh
parents:
8088
diff
changeset
|
1206 c->execute(c, dv_encode_mt, s->sys->work_chunks, NULL, |
8131 | 1207 dv_work_pool_size(s->sys), sizeof(DVwork_chunk)); |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1208 |
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1209 emms_c(); |
3167 | 1210 |
3671
18113845d891
* Restructuring the division of labor between DV codec and DV format
romansh
parents:
3649
diff
changeset
|
1211 dv_format_frame(s, buf); |
3167 | 1212 |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1213 return s->sys->frame_size; |
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1214 } |
3806 | 1215 #endif |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1216 |
2991
d377b0788381
Fix DV memory leak and allow multiple instances patch by (Burkhard Plaum?)
michael
parents:
2979
diff
changeset
|
1217 static int dvvideo_close(AVCodecContext *c) |
d377b0788381
Fix DV memory leak and allow multiple instances patch by (Burkhard Plaum?)
michael
parents:
2979
diff
changeset
|
1218 { |
4352
0ee71c12734e
* Fixing a bug with incorrect bits set in AAUX source pack
romansh
parents:
4283
diff
changeset
|
1219 DVVideoContext *s = c->priv_data; |
0ee71c12734e
* Fixing a bug with incorrect bits set in AAUX source pack
romansh
parents:
4283
diff
changeset
|
1220 |
8051 | 1221 if (s->picture.data[0]) |
4352
0ee71c12734e
* Fixing a bug with incorrect bits set in AAUX source pack
romansh
parents:
4283
diff
changeset
|
1222 c->release_buffer(c, &s->picture); |
2991
d377b0788381
Fix DV memory leak and allow multiple instances patch by (Burkhard Plaum?)
michael
parents:
2979
diff
changeset
|
1223 |
d377b0788381
Fix DV memory leak and allow multiple instances patch by (Burkhard Plaum?)
michael
parents:
2979
diff
changeset
|
1224 return 0; |
d377b0788381
Fix DV memory leak and allow multiple instances patch by (Burkhard Plaum?)
michael
parents:
2979
diff
changeset
|
1225 } |
d377b0788381
Fix DV memory leak and allow multiple instances patch by (Burkhard Plaum?)
michael
parents:
2979
diff
changeset
|
1226 |
d377b0788381
Fix DV memory leak and allow multiple instances patch by (Burkhard Plaum?)
michael
parents:
2979
diff
changeset
|
1227 |
2661
b2846918585c
a few #ifdef CONFIG_X_ENCODER, patch by (Roine Gustafsson <roine users.sourceforge net]
michael
parents:
2614
diff
changeset
|
1228 #ifdef CONFIG_DVVIDEO_ENCODER |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1229 AVCodec dvvideo_encoder = { |
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1230 "dvvideo", |
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1231 CODEC_TYPE_VIDEO, |
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1232 CODEC_ID_DVVIDEO, |
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1233 sizeof(DVVideoContext), |
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1234 dvvideo_init, |
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1235 dvvideo_encode_frame, |
8051 | 1236 .pix_fmts = (enum PixelFormat[]) {PIX_FMT_YUV411P, PIX_FMT_YUV422P, PIX_FMT_YUV420P, PIX_FMT_NONE}, |
7040
e943e1409077
Make AVCodec long_names definition conditional depending on CONFIG_SMALL.
stefano
parents:
7039
diff
changeset
|
1237 .long_name = NULL_IF_CONFIG_SMALL("DV (Digital Video)"), |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1238 }; |
2661
b2846918585c
a few #ifdef CONFIG_X_ENCODER, patch by (Roine Gustafsson <roine users.sourceforge net]
michael
parents:
2614
diff
changeset
|
1239 #endif // CONFIG_DVVIDEO_ENCODER |
723 | 1240 |
3777 | 1241 #ifdef CONFIG_DVVIDEO_DECODER |
723 | 1242 AVCodec dvvideo_decoder = { |
1243 "dvvideo", | |
1244 CODEC_TYPE_VIDEO, | |
1245 CODEC_ID_DVVIDEO, | |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1246 sizeof(DVVideoContext), |
1493
ad7e62df9962
* preAlpha DV encoding support -- there's still a truckload
romansh
parents:
1489
diff
changeset
|
1247 dvvideo_init, |
1887
85fe2f4633ec
* DV decoding/encoding now supports MultiThreading for up to 324 CPUs ;-)
romansh
parents:
1886
diff
changeset
|
1248 NULL, |
2991
d377b0788381
Fix DV memory leak and allow multiple instances patch by (Burkhard Plaum?)
michael
parents:
2979
diff
changeset
|
1249 dvvideo_close, |
723 | 1250 dvvideo_decode_frame, |
835 | 1251 CODEC_CAP_DR1, |
6717 | 1252 NULL, |
7040
e943e1409077
Make AVCodec long_names definition conditional depending on CONFIG_SMALL.
stefano
parents:
7039
diff
changeset
|
1253 .long_name = NULL_IF_CONFIG_SMALL("DV (Digital Video)"), |
723 | 1254 }; |
3777 | 1255 #endif |