Mercurial > libavcodec.hg
annotate arm/dsputil_arm.c @ 10292:01e6afd0aba6 libavcodec
Remove unneeded table lookup.
author | jbr |
---|---|
date | Sun, 27 Sep 2009 06:16:49 +0000 |
parents | 0905f8eed0a9 |
children | 48be79afc72d |
rev | line source |
---|---|
61 | 1 /* |
8359 | 2 * ARM optimized DSP utils |
8629
04423b2f6e0b
cosmetics: Remove pointless period after copyright statement non-sentences.
diego
parents:
8596
diff
changeset
|
3 * Copyright (c) 2001 Lionel Ulmer |
61 | 4 * |
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3769
diff
changeset
|
5 * This file is part of FFmpeg. |
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3769
diff
changeset
|
6 * |
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3769
diff
changeset
|
7 * FFmpeg is free software; you can redistribute it and/or |
429 | 8 * modify it under the terms of the GNU Lesser General Public |
9 * License as published by the Free Software Foundation; either | |
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3769
diff
changeset
|
10 * version 2.1 of the License, or (at your option) any later version. |
61 | 11 * |
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3769
diff
changeset
|
12 * FFmpeg is distributed in the hope that it will be useful, |
61 | 13 * but WITHOUT ANY WARRANTY; without even the implied warranty of |
429 | 14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
15 * Lesser General Public License for more details. | |
61 | 16 * |
429 | 17 * You should have received a copy of the GNU Lesser General Public |
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3769
diff
changeset
|
18 * License along with FFmpeg; if not, write to the Free Software |
3036
0b546eab515d
Update licensing information: The FSF changed postal address.
diego
parents:
2979
diff
changeset
|
19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
61 | 20 */ |
21 | |
6763 | 22 #include "libavcodec/dsputil.h" |
2734
aeea63c97878
Better ARM support for mplayer/ffmpeg, ported from atty fork
michael
parents:
1347
diff
changeset
|
23 |
8250 | 24 void dsputil_init_iwmmxt(DSPContext* c, AVCodecContext *avctx); |
25 void ff_float_init_arm_vfp(DSPContext* c, AVCodecContext *avctx); | |
8334 | 26 void ff_dsputil_init_neon(DSPContext *c, AVCodecContext *avctx); |
61 | 27 |
8250 | 28 void j_rev_dct_ARM(DCTELEM *data); |
29 void simple_idct_ARM(DCTELEM *data); | |
61 | 30 |
8250 | 31 void simple_idct_armv5te(DCTELEM *data); |
32 void simple_idct_put_armv5te(uint8_t *dest, int line_size, DCTELEM *data); | |
33 void simple_idct_add_armv5te(uint8_t *dest, int line_size, DCTELEM *data); | |
3769 | 34 |
8250 | 35 void ff_simple_idct_armv6(DCTELEM *data); |
36 void ff_simple_idct_put_armv6(uint8_t *dest, int line_size, DCTELEM *data); | |
37 void ff_simple_idct_add_armv6(uint8_t *dest, int line_size, DCTELEM *data); | |
4427 | 38 |
8335 | 39 void ff_simple_idct_neon(DCTELEM *data); |
40 void ff_simple_idct_put_neon(uint8_t *dest, int line_size, DCTELEM *data); | |
41 void ff_simple_idct_add_neon(uint8_t *dest, int line_size, DCTELEM *data); | |
42 | |
9916 | 43 void ff_vp3_idct_neon(DCTELEM *data); |
44 void ff_vp3_idct_put_neon(uint8_t *dest, int line_size, DCTELEM *data); | |
45 void ff_vp3_idct_add_neon(uint8_t *dest, int line_size, DCTELEM *data); | |
46 | |
1092 | 47 /* XXX: local hack */ |
48 static void (*ff_put_pixels_clamped)(const DCTELEM *block, uint8_t *pixels, int line_size); | |
49 static void (*ff_add_pixels_clamped)(const DCTELEM *block, uint8_t *pixels, int line_size); | |
50 | |
2734
aeea63c97878
Better ARM support for mplayer/ffmpeg, ported from atty fork
michael
parents:
1347
diff
changeset
|
51 void put_pixels8_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h); |
aeea63c97878
Better ARM support for mplayer/ffmpeg, ported from atty fork
michael
parents:
1347
diff
changeset
|
52 void put_pixels8_x2_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h); |
aeea63c97878
Better ARM support for mplayer/ffmpeg, ported from atty fork
michael
parents:
1347
diff
changeset
|
53 void put_pixels8_y2_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h); |
aeea63c97878
Better ARM support for mplayer/ffmpeg, ported from atty fork
michael
parents:
1347
diff
changeset
|
54 void put_pixels8_xy2_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h); |
aeea63c97878
Better ARM support for mplayer/ffmpeg, ported from atty fork
michael
parents:
1347
diff
changeset
|
55 |
aeea63c97878
Better ARM support for mplayer/ffmpeg, ported from atty fork
michael
parents:
1347
diff
changeset
|
56 void put_no_rnd_pixels8_x2_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h); |
aeea63c97878
Better ARM support for mplayer/ffmpeg, ported from atty fork
michael
parents:
1347
diff
changeset
|
57 void put_no_rnd_pixels8_y2_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h); |
aeea63c97878
Better ARM support for mplayer/ffmpeg, ported from atty fork
michael
parents:
1347
diff
changeset
|
58 void put_no_rnd_pixels8_xy2_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h); |
aeea63c97878
Better ARM support for mplayer/ffmpeg, ported from atty fork
michael
parents:
1347
diff
changeset
|
59 |
aeea63c97878
Better ARM support for mplayer/ffmpeg, ported from atty fork
michael
parents:
1347
diff
changeset
|
60 void put_pixels16_arm(uint8_t *block, const uint8_t *pixels, int line_size, int h); |
aeea63c97878
Better ARM support for mplayer/ffmpeg, ported from atty fork
michael
parents:
1347
diff
changeset
|
61 |
8250 | 62 void ff_prefetch_arm(void *mem, int stride, int h); |
8070 | 63 |
2735 | 64 CALL_2X_PIXELS(put_pixels16_x2_arm , put_pixels8_x2_arm , 8) |
65 CALL_2X_PIXELS(put_pixels16_y2_arm , put_pixels8_y2_arm , 8) | |
66 CALL_2X_PIXELS(put_pixels16_xy2_arm, put_pixels8_xy2_arm, 8) | |
67 CALL_2X_PIXELS(put_no_rnd_pixels16_x2_arm , put_no_rnd_pixels8_x2_arm , 8) | |
68 CALL_2X_PIXELS(put_no_rnd_pixels16_y2_arm , put_no_rnd_pixels8_y2_arm , 8) | |
69 CALL_2X_PIXELS(put_no_rnd_pixels16_xy2_arm, put_no_rnd_pixels8_xy2_arm, 8) | |
2734
aeea63c97878
Better ARM support for mplayer/ffmpeg, ported from atty fork
michael
parents:
1347
diff
changeset
|
70 |
8250 | 71 void ff_add_pixels_clamped_ARM(short *block, unsigned char *dest, |
8072 | 72 int line_size); |
2734
aeea63c97878
Better ARM support for mplayer/ffmpeg, ported from atty fork
michael
parents:
1347
diff
changeset
|
73 |
1092 | 74 /* XXX: those functions should be suppressed ASAP when all IDCTs are |
75 converted */ | |
1347
cca26199ab17
Optimized simple idct for arm by Frederic 'dilb' Boulay <dilb@handhelds.org>. Currently licensed under the GPLv2, but the author allowed to license it under the LGPL, feel free to change
al3x
parents:
1324
diff
changeset
|
76 static void j_rev_dct_ARM_put(uint8_t *dest, int line_size, DCTELEM *block) |
1092 | 77 { |
78 j_rev_dct_ARM (block); | |
79 ff_put_pixels_clamped(block, dest, line_size); | |
80 } | |
1347
cca26199ab17
Optimized simple idct for arm by Frederic 'dilb' Boulay <dilb@handhelds.org>. Currently licensed under the GPLv2, but the author allowed to license it under the LGPL, feel free to change
al3x
parents:
1324
diff
changeset
|
81 static void j_rev_dct_ARM_add(uint8_t *dest, int line_size, DCTELEM *block) |
61 | 82 { |
1092 | 83 j_rev_dct_ARM (block); |
84 ff_add_pixels_clamped(block, dest, line_size); | |
61 | 85 } |
1347
cca26199ab17
Optimized simple idct for arm by Frederic 'dilb' Boulay <dilb@handhelds.org>. Currently licensed under the GPLv2, but the author allowed to license it under the LGPL, feel free to change
al3x
parents:
1324
diff
changeset
|
86 static void simple_idct_ARM_put(uint8_t *dest, int line_size, DCTELEM *block) |
cca26199ab17
Optimized simple idct for arm by Frederic 'dilb' Boulay <dilb@handhelds.org>. Currently licensed under the GPLv2, but the author allowed to license it under the LGPL, feel free to change
al3x
parents:
1324
diff
changeset
|
87 { |
cca26199ab17
Optimized simple idct for arm by Frederic 'dilb' Boulay <dilb@handhelds.org>. Currently licensed under the GPLv2, but the author allowed to license it under the LGPL, feel free to change
al3x
parents:
1324
diff
changeset
|
88 simple_idct_ARM (block); |
cca26199ab17
Optimized simple idct for arm by Frederic 'dilb' Boulay <dilb@handhelds.org>. Currently licensed under the GPLv2, but the author allowed to license it under the LGPL, feel free to change
al3x
parents:
1324
diff
changeset
|
89 ff_put_pixels_clamped(block, dest, line_size); |
cca26199ab17
Optimized simple idct for arm by Frederic 'dilb' Boulay <dilb@handhelds.org>. Currently licensed under the GPLv2, but the author allowed to license it under the LGPL, feel free to change
al3x
parents:
1324
diff
changeset
|
90 } |
cca26199ab17
Optimized simple idct for arm by Frederic 'dilb' Boulay <dilb@handhelds.org>. Currently licensed under the GPLv2, but the author allowed to license it under the LGPL, feel free to change
al3x
parents:
1324
diff
changeset
|
91 static void simple_idct_ARM_add(uint8_t *dest, int line_size, DCTELEM *block) |
cca26199ab17
Optimized simple idct for arm by Frederic 'dilb' Boulay <dilb@handhelds.org>. Currently licensed under the GPLv2, but the author allowed to license it under the LGPL, feel free to change
al3x
parents:
1324
diff
changeset
|
92 { |
cca26199ab17
Optimized simple idct for arm by Frederic 'dilb' Boulay <dilb@handhelds.org>. Currently licensed under the GPLv2, but the author allowed to license it under the LGPL, feel free to change
al3x
parents:
1324
diff
changeset
|
93 simple_idct_ARM (block); |
cca26199ab17
Optimized simple idct for arm by Frederic 'dilb' Boulay <dilb@handhelds.org>. Currently licensed under the GPLv2, but the author allowed to license it under the LGPL, feel free to change
al3x
parents:
1324
diff
changeset
|
94 ff_add_pixels_clamped(block, dest, line_size); |
cca26199ab17
Optimized simple idct for arm by Frederic 'dilb' Boulay <dilb@handhelds.org>. Currently licensed under the GPLv2, but the author allowed to license it under the LGPL, feel free to change
al3x
parents:
1324
diff
changeset
|
95 } |
3726 | 96 |
7165 | 97 int mm_support(void) |
98 { | |
8596
68e959302527
replace all occurrence of ENABLE_ by the corresponding CONFIG_, HAVE_ or ARCH_
aurel
parents:
8590
diff
changeset
|
99 return HAVE_IWMMXT * FF_MM_IWMMXT; |
7165 | 100 } |
101 | |
8359 | 102 void dsputil_init_arm(DSPContext* c, AVCodecContext *avctx) |
1092 | 103 { |
3726 | 104 int idct_algo= avctx->idct_algo; |
1092 | 105 |
106 ff_put_pixels_clamped = c->put_pixels_clamped; | |
107 ff_add_pixels_clamped = c->add_pixels_clamped; | |
108 | |
6179 | 109 if (avctx->lowres == 0) { |
6180 | 110 if(idct_algo == FF_IDCT_AUTO){ |
10203 | 111 #if HAVE_NEON |
8335 | 112 idct_algo = FF_IDCT_SIMPLENEON; |
8590 | 113 #elif HAVE_ARMV6 |
6180 | 114 idct_algo = FF_IDCT_SIMPLEARMV6; |
8590 | 115 #elif HAVE_ARMV5TE |
6180 | 116 idct_algo = FF_IDCT_SIMPLEARMV5TE; |
2734
aeea63c97878
Better ARM support for mplayer/ffmpeg, ported from atty fork
michael
parents:
1347
diff
changeset
|
117 #else |
6180 | 118 idct_algo = FF_IDCT_ARM; |
2734
aeea63c97878
Better ARM support for mplayer/ffmpeg, ported from atty fork
michael
parents:
1347
diff
changeset
|
119 #endif |
6180 | 120 } |
3726 | 121 |
6180 | 122 if(idct_algo==FF_IDCT_ARM){ |
123 c->idct_put= j_rev_dct_ARM_put; | |
124 c->idct_add= j_rev_dct_ARM_add; | |
125 c->idct = j_rev_dct_ARM; | |
8267 | 126 c->idct_permutation_type= FF_LIBMPEG2_IDCT_PERM; |
6180 | 127 } else if (idct_algo==FF_IDCT_SIMPLEARM){ |
128 c->idct_put= simple_idct_ARM_put; | |
129 c->idct_add= simple_idct_ARM_add; | |
130 c->idct = simple_idct_ARM; | |
131 c->idct_permutation_type= FF_NO_IDCT_PERM; | |
8590 | 132 #if HAVE_ARMV6 |
6180 | 133 } else if (idct_algo==FF_IDCT_SIMPLEARMV6){ |
134 c->idct_put= ff_simple_idct_put_armv6; | |
135 c->idct_add= ff_simple_idct_add_armv6; | |
136 c->idct = ff_simple_idct_armv6; | |
137 c->idct_permutation_type= FF_LIBMPEG2_IDCT_PERM; | |
4427 | 138 #endif |
8590 | 139 #if HAVE_ARMV5TE |
6180 | 140 } else if (idct_algo==FF_IDCT_SIMPLEARMV5TE){ |
141 c->idct_put= simple_idct_put_armv5te; | |
142 c->idct_add= simple_idct_add_armv5te; | |
143 c->idct = simple_idct_armv5te; | |
144 c->idct_permutation_type = FF_NO_IDCT_PERM; | |
3769 | 145 #endif |
8590 | 146 #if HAVE_NEON |
8335 | 147 } else if (idct_algo==FF_IDCT_SIMPLENEON){ |
148 c->idct_put= ff_simple_idct_put_neon; | |
149 c->idct_add= ff_simple_idct_add_neon; | |
150 c->idct = ff_simple_idct_neon; | |
151 c->idct_permutation_type = FF_PARTTRANS_IDCT_PERM; | |
9975
d6d7e8d4a04d
Do not redundantly check for both CONFIG_THEORA_DECODER and CONFIG_VP3_DECODER.
diego
parents:
9916
diff
changeset
|
152 } else if ((CONFIG_VP3_DECODER || CONFIG_VP5_DECODER || CONFIG_VP6_DECODER) && |
9916 | 153 idct_algo==FF_IDCT_VP3){ |
154 c->idct_put= ff_vp3_idct_put_neon; | |
155 c->idct_add= ff_vp3_idct_add_neon; | |
156 c->idct = ff_vp3_idct_neon; | |
157 c->idct_permutation_type = FF_TRANSPOSE_IDCT_PERM; | |
8335 | 158 #endif |
6180 | 159 } |
6179 | 160 } |
2734
aeea63c97878
Better ARM support for mplayer/ffmpeg, ported from atty fork
michael
parents:
1347
diff
changeset
|
161 |
5641
1e93e637fa21
Fix put_*_xy2_arm bug and enable put_pixels16_arm and put_pixels8_y2_arm.
diego
parents:
5010
diff
changeset
|
162 c->put_pixels_tab[0][0] = put_pixels16_arm; |
8267 | 163 c->put_pixels_tab[0][1] = put_pixels16_x2_arm; |
164 c->put_pixels_tab[0][2] = put_pixels16_y2_arm; | |
5641
1e93e637fa21
Fix put_*_xy2_arm bug and enable put_pixels16_arm and put_pixels8_y2_arm.
diego
parents:
5010
diff
changeset
|
165 c->put_pixels_tab[0][3] = put_pixels16_xy2_arm; |
1e93e637fa21
Fix put_*_xy2_arm bug and enable put_pixels16_arm and put_pixels8_y2_arm.
diego
parents:
5010
diff
changeset
|
166 c->put_no_rnd_pixels_tab[0][0] = put_pixels16_arm; |
8267 | 167 c->put_no_rnd_pixels_tab[0][1] = put_no_rnd_pixels16_x2_arm; |
168 c->put_no_rnd_pixels_tab[0][2] = put_no_rnd_pixels16_y2_arm; | |
5641
1e93e637fa21
Fix put_*_xy2_arm bug and enable put_pixels16_arm and put_pixels8_y2_arm.
diego
parents:
5010
diff
changeset
|
169 c->put_no_rnd_pixels_tab[0][3] = put_no_rnd_pixels16_xy2_arm; |
8267 | 170 c->put_pixels_tab[1][0] = put_pixels8_arm; |
171 c->put_pixels_tab[1][1] = put_pixels8_x2_arm; | |
5641
1e93e637fa21
Fix put_*_xy2_arm bug and enable put_pixels16_arm and put_pixels8_y2_arm.
diego
parents:
5010
diff
changeset
|
172 c->put_pixels_tab[1][2] = put_pixels8_y2_arm; |
1e93e637fa21
Fix put_*_xy2_arm bug and enable put_pixels16_arm and put_pixels8_y2_arm.
diego
parents:
5010
diff
changeset
|
173 c->put_pixels_tab[1][3] = put_pixels8_xy2_arm; |
8267 | 174 c->put_no_rnd_pixels_tab[1][0] = put_pixels8_arm; |
175 c->put_no_rnd_pixels_tab[1][1] = put_no_rnd_pixels8_x2_arm; | |
176 c->put_no_rnd_pixels_tab[1][2] = put_no_rnd_pixels8_y2_arm; | |
5641
1e93e637fa21
Fix put_*_xy2_arm bug and enable put_pixels16_arm and put_pixels8_y2_arm.
diego
parents:
5010
diff
changeset
|
177 c->put_no_rnd_pixels_tab[1][3] = put_no_rnd_pixels8_xy2_arm; |
2734
aeea63c97878
Better ARM support for mplayer/ffmpeg, ported from atty fork
michael
parents:
1347
diff
changeset
|
178 |
8590 | 179 #if HAVE_ARMV5TE |
8070 | 180 c->prefetch = ff_prefetch_arm; |
7688
160d5c1ae60a
ARM: add prefetch function using ARMv5 PLD instruction
mru
parents:
7166
diff
changeset
|
181 #endif |
160d5c1ae60a
ARM: add prefetch function using ARMv5 PLD instruction
mru
parents:
7166
diff
changeset
|
182 |
8590 | 183 #if HAVE_IWMMXT |
2734
aeea63c97878
Better ARM support for mplayer/ffmpeg, ported from atty fork
michael
parents:
1347
diff
changeset
|
184 dsputil_init_iwmmxt(c, avctx); |
aeea63c97878
Better ARM support for mplayer/ffmpeg, ported from atty fork
michael
parents:
1347
diff
changeset
|
185 #endif |
8590 | 186 #if HAVE_ARMVFP |
6786
18084aaa277b
Add some initial optimizations for ARM VFP (floating
gpoirier
parents:
6763
diff
changeset
|
187 ff_float_init_arm_vfp(c, avctx); |
18084aaa277b
Add some initial optimizations for ARM VFP (floating
gpoirier
parents:
6763
diff
changeset
|
188 #endif |
8590 | 189 #if HAVE_NEON |
8334 | 190 ff_dsputil_init_neon(c, avctx); |
191 #endif | |
1092 | 192 } |