annotate arm/h264pred_init_arm.c @ 10902:1e41e6ab9a18 libavcodec

Apply last 2 optimizations to similar code i forgot.
author michael
date Sat, 16 Jan 2010 16:21:12 +0000
parents 8db678424a18
children 21566c95834c
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
10623
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
1 /*
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
2 * Copyright (c) 2009 Mans Rullgard <mans@mansr.com>
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
3 *
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
4 * This file is part of FFmpeg.
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
5 *
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
6 * FFmpeg is free software; you can redistribute it and/or
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
7 * modify it under the terms of the GNU Lesser General Public
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
8 * License as published by the Free Software Foundation; either
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
9 * version 2.1 of the License, or (at your option) any later version.
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
10 *
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
11 * FFmpeg is distributed in the hope that it will be useful,
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
14 * Lesser General Public License for more details.
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
15 *
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
16 * You should have received a copy of the GNU Lesser General Public
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
17 * License along with FFmpeg; if not, write to the Free Software
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
18 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
19 */
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
20
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
21 #include <stdint.h>
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
22
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
23 #include "libavcodec/h264pred.h"
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
24
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
25 void ff_pred16x16_vert_neon(uint8_t *src, int stride);
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
26 void ff_pred16x16_hor_neon(uint8_t *src, int stride);
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
27 void ff_pred16x16_plane_neon(uint8_t *src, int stride);
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
28 void ff_pred16x16_dc_neon(uint8_t *src, int stride);
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
29 void ff_pred16x16_128_dc_neon(uint8_t *src, int stride);
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
30 void ff_pred16x16_left_dc_neon(uint8_t *src, int stride);
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
31 void ff_pred16x16_top_dc_neon(uint8_t *src, int stride);
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
32
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
33 void ff_pred8x8_vert_neon(uint8_t *src, int stride);
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
34 void ff_pred8x8_hor_neon(uint8_t *src, int stride);
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
35 void ff_pred8x8_plane_neon(uint8_t *src, int stride);
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
36 void ff_pred8x8_dc_neon(uint8_t *src, int stride);
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
37 void ff_pred8x8_128_dc_neon(uint8_t *src, int stride);
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
38 void ff_pred8x8_left_dc_neon(uint8_t *src, int stride);
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
39 void ff_pred8x8_top_dc_neon(uint8_t *src, int stride);
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
40 void ff_pred8x8_l0t_dc_neon(uint8_t *src, int stride);
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
41 void ff_pred8x8_0lt_dc_neon(uint8_t *src, int stride);
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
42 void ff_pred8x8_l00_dc_neon(uint8_t *src, int stride);
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
43 void ff_pred8x8_0l0_dc_neon(uint8_t *src, int stride);
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
44
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
45 #if HAVE_NEON
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
46 static void ff_h264_pred_init_neon(H264PredContext *h, int codec_id)
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
47 {
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
48 h->pred8x8[VERT_PRED8x8 ] = ff_pred8x8_vert_neon;
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
49 h->pred8x8[HOR_PRED8x8 ] = ff_pred8x8_hor_neon;
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
50 h->pred8x8[PLANE_PRED8x8 ] = ff_pred8x8_plane_neon;
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
51 h->pred8x8[DC_128_PRED8x8 ] = ff_pred8x8_128_dc_neon;
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
52 if (codec_id != CODEC_ID_RV40) {
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
53 h->pred8x8[DC_PRED8x8 ] = ff_pred8x8_dc_neon;
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
54 h->pred8x8[LEFT_DC_PRED8x8] = ff_pred8x8_left_dc_neon;
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
55 h->pred8x8[TOP_DC_PRED8x8 ] = ff_pred8x8_top_dc_neon;
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
56 h->pred8x8[ALZHEIMER_DC_L0T_PRED8x8] = ff_pred8x8_l0t_dc_neon;
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
57 h->pred8x8[ALZHEIMER_DC_0LT_PRED8x8] = ff_pred8x8_0lt_dc_neon;
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
58 h->pred8x8[ALZHEIMER_DC_L00_PRED8x8] = ff_pred8x8_l00_dc_neon;
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
59 h->pred8x8[ALZHEIMER_DC_0L0_PRED8x8] = ff_pred8x8_0l0_dc_neon;
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
60 }
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
61
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
62 h->pred16x16[DC_PRED8x8 ] = ff_pred16x16_dc_neon;
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
63 h->pred16x16[VERT_PRED8x8 ] = ff_pred16x16_vert_neon;
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
64 h->pred16x16[HOR_PRED8x8 ] = ff_pred16x16_hor_neon;
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
65 h->pred16x16[LEFT_DC_PRED8x8] = ff_pred16x16_left_dc_neon;
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
66 h->pred16x16[TOP_DC_PRED8x8 ] = ff_pred16x16_top_dc_neon;
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
67 h->pred16x16[DC_128_PRED8x8 ] = ff_pred16x16_128_dc_neon;
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
68 if (codec_id != CODEC_ID_SVQ3 && codec_id != CODEC_ID_RV40)
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
69 h->pred16x16[PLANE_PRED8x8 ] = ff_pred16x16_plane_neon;
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
70 }
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
71 #endif
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
72
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
73 void ff_h264_pred_init_arm(H264PredContext *h, int codec_id)
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
74 {
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
75 if (HAVE_NEON) ff_h264_pred_init_neon(h, codec_id);
f52d07b169b4 ARM: NEON optimised H264 16x16, 8x8 pred
mru
parents:
diff changeset
76 }