annotate h264_loopfilter.c @ 11032:01bd040f8607 libavcodec

Unroll main loop so the edge==0 case is separate. This allows many things to be simplified away. The h264 decoder is overall 1% faster with an mbaff sample and 0.1% slower with the cathedral sample, probably because the slow loop filter code must be loaded into the code cache for the first MB of each row but isn't used for the following MBs.
author michael
date Thu, 28 Jan 2010 01:24:25 +0000
parents f5678fb91140
children b5577677b97d
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
1 /*
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
2 * H.26L/H.264/AVC/JVT/14496-10/... loop filter
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
3 * Copyright (c) 2003 Michael Niedermayer <michaelni@gmx.at>
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
4 *
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
5 * This file is part of FFmpeg.
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
6 *
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
7 * FFmpeg is free software; you can redistribute it and/or
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
8 * modify it under the terms of the GNU Lesser General Public
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
9 * License as published by the Free Software Foundation; either
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
10 * version 2.1 of the License, or (at your option) any later version.
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
11 *
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
12 * FFmpeg is distributed in the hope that it will be useful,
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
15 * Lesser General Public License for more details.
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
16 *
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
17 * You should have received a copy of the GNU Lesser General Public
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
18 * License along with FFmpeg; if not, write to the Free Software
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
20 */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
21
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
22 /**
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
23 * @file libavcodec/h264_loopfilter.c
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
24 * H.264 / AVC / MPEG4 part10 loop filter.
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
25 * @author Michael Niedermayer <michaelni@gmx.at>
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
26 */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
27
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
28 #include "internal.h"
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
29 #include "dsputil.h"
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
30 #include "avcodec.h"
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
31 #include "mpegvideo.h"
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
32 #include "h264.h"
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
33 #include "mathops.h"
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
34 #include "rectangle.h"
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
35
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
36 //#undef NDEBUG
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
37 #include <assert.h>
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
38
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
39 /* Deblocking filter (p153) */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
/*
 * Alpha threshold lookup for the deblocking filter.
 *
 * The table has 3 * 52 entries: 52 leading zeros, the 52 real values, then
 * 52 trailing copies of the last value (255). The filters in this file index
 * it with "qp + h->slice_alpha_c0_offset"; the padding presumably lets that
 * sum fall outside the middle section without explicit clamping -- confirm
 * against the code that sets the slice offsets.
 */
static const uint8_t alpha_table[52*3] = {
    /* low padding: 52 x 0 */
      0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,
      0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,
      0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,
      0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,
    /* the 52 real entries */
      0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,
      0,  0,  0,  4,  4,  5,  6,  7,  8,  9, 10, 12, 13,
     15, 17, 20, 22, 25, 28, 32, 36, 40, 45, 50, 56, 63,
     71, 80, 90,101,113,127,144,162,182,203,226,255,255,
    /* high padding: 52 x 255 */
    255,255,255,255,255,255,255,255,255,255,255,255,255,
    255,255,255,255,255,255,255,255,255,255,255,255,255,
    255,255,255,255,255,255,255,255,255,255,255,255,255,
    255,255,255,255,255,255,255,255,255,255,255,255,255,
};
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
/*
 * Beta threshold lookup for the deblocking filter.
 *
 * Same layout as the alpha table: 52 leading zeros, the 52 real values, then
 * 52 trailing copies of the last value (18). The filters in this file index
 * it with "qp + h->slice_beta_offset".
 */
static const uint8_t beta_table[52*3] = {
    /* low padding: 52 x 0 */
     0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,
     0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,
     0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,
     0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,
    /* the 52 real entries */
     0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,  0,
     0,  0,  0,  2,  2,  2,  3,  3,  3,  3,  4,  4,  4,
     6,  6,  7,  7,  8,  8,  9,  9, 10, 10, 11, 11, 12,
    12, 13, 13, 14, 14, 15, 15, 16, 16, 17, 17, 18, 18,
    /* high padding: 52 x 18 */
    18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18,
    18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18,
    18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18,
    18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18,
};
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
/*
 * tc0 clipping values, indexed as tc0_table[index_a][bS].
 *
 * Column 0 of every row is initialised with -1, which is stored as 255 in
 * the uint8_t element; the callers in this file that copy it into an int8_t
 * get -1 back. Columns 1..3 hold the values for bS 1..3.
 * Like the alpha/beta tables, the 52 real rows are surrounded by 52 rows of
 * padding on each side (copies of the first and last real row).
 */
static const uint8_t tc0_table[52*3][4] = {
    /* low padding: 52 rows */
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    /* the 52 real rows */
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 1 }, {-1, 0, 0, 1 }, {-1, 0, 0, 1 },
    {-1, 0, 0, 1 }, {-1, 0, 1, 1 }, {-1, 0, 1, 1 }, {-1, 1, 1, 1 },
    {-1, 1, 1, 1 }, {-1, 1, 1, 1 }, {-1, 1, 1, 1 }, {-1, 1, 1, 2 },
    {-1, 1, 1, 2 }, {-1, 1, 1, 2 }, {-1, 1, 1, 2 }, {-1, 1, 2, 3 },
    {-1, 1, 2, 3 }, {-1, 2, 2, 3 }, {-1, 2, 2, 4 }, {-1, 2, 3, 4 },
    {-1, 2, 3, 4 }, {-1, 3, 3, 5 }, {-1, 3, 4, 6 }, {-1, 3, 4, 6 },
    {-1, 4, 5, 7 }, {-1, 4, 5, 8 }, {-1, 4, 6, 9 }, {-1, 5, 7,10 },
    {-1, 6, 8,11 }, {-1, 6, 8,13 }, {-1, 7,10,14 }, {-1, 8,11,16 },
    {-1, 9,12,18 }, {-1,10,13,20 }, {-1,11,15,23 }, {-1,13,17,25 },
    /* high padding: 52 rows */
    {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 },
    {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 },
    {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 },
    {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 },
    {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 },
    {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 },
    {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 },
    {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 },
    {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 },
    {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 },
    {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 },
    {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 },
    {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 },
};
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
101
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
102 static void av_noinline filter_mb_edgev( uint8_t *pix, int stride, int16_t bS[4], unsigned int qp, H264Context *h) {
10979
776dba50775c Move +52 from the loop filter to the alpha/beta offsets in the context.
michael
parents: 10973
diff changeset
103 const unsigned int index_a = qp + h->slice_alpha_c0_offset;
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
104 const int alpha = alpha_table[index_a];
10979
776dba50775c Move +52 from the loop filter to the alpha/beta offsets in the context.
michael
parents: 10973
diff changeset
105 const int beta = beta_table[qp + h->slice_beta_offset];
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
106 if (alpha ==0 || beta == 0) return;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
107
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
108 if( bS[0] < 4 ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
109 int8_t tc[4];
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
110 tc[0] = tc0_table[index_a][bS[0]];
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
111 tc[1] = tc0_table[index_a][bS[1]];
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
112 tc[2] = tc0_table[index_a][bS[2]];
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
113 tc[3] = tc0_table[index_a][bS[3]];
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
114 h->s.dsp.h264_h_loop_filter_luma(pix, stride, alpha, beta, tc);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
115 } else {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
116 h->s.dsp.h264_h_loop_filter_luma_intra(pix, stride, alpha, beta);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
117 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
118 }
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
119 static void av_noinline filter_mb_edgecv( uint8_t *pix, int stride, int16_t bS[4], unsigned int qp, H264Context *h ) {
10979
776dba50775c Move +52 from the loop filter to the alpha/beta offsets in the context.
michael
parents: 10973
diff changeset
120 const unsigned int index_a = qp + h->slice_alpha_c0_offset;
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
121 const int alpha = alpha_table[index_a];
10979
776dba50775c Move +52 from the loop filter to the alpha/beta offsets in the context.
michael
parents: 10973
diff changeset
122 const int beta = beta_table[qp + h->slice_beta_offset];
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
123 if (alpha ==0 || beta == 0) return;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
124
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
125 if( bS[0] < 4 ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
126 int8_t tc[4];
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
127 tc[0] = tc0_table[index_a][bS[0]]+1;
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
128 tc[1] = tc0_table[index_a][bS[1]]+1;
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
129 tc[2] = tc0_table[index_a][bS[2]]+1;
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
130 tc[3] = tc0_table[index_a][bS[3]]+1;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
131 h->s.dsp.h264_h_loop_filter_chroma(pix, stride, alpha, beta, tc);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
132 } else {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
133 h->s.dsp.h264_h_loop_filter_chroma_intra(pix, stride, alpha, beta);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
134 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
135 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
136
10924
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
137 static void filter_mb_mbaff_edgev( H264Context *h, uint8_t *pix, int stride, int16_t bS[4], int bsi, int qp ) {
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
138 int i;
10970
eb5f0ccb6a98 Optimize filter_mb_mbaff_edge*()
michael
parents: 10969
diff changeset
139 int index_a = qp + h->slice_alpha_c0_offset;
10979
776dba50775c Move +52 from the loop filter to the alpha/beta offsets in the context.
michael
parents: 10973
diff changeset
140 int alpha = alpha_table[index_a];
776dba50775c Move +52 from the loop filter to the alpha/beta offsets in the context.
michael
parents: 10973
diff changeset
141 int beta = beta_table[qp + h->slice_beta_offset];
10924
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
142 for( i = 0; i < 8; i++, pix += stride) {
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
143 const int bS_index = (i >> 1) * bsi;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
144
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
145 if( bS[bS_index] == 0 ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
146 continue;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
147 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
148
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
149 if( bS[bS_index] < 4 ) {
10979
776dba50775c Move +52 from the loop filter to the alpha/beta offsets in the context.
michael
parents: 10973
diff changeset
150 const int tc0 = tc0_table[index_a][bS[bS_index]];
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
151 const int p0 = pix[-1];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
152 const int p1 = pix[-2];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
153 const int p2 = pix[-3];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
154 const int q0 = pix[0];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
155 const int q1 = pix[1];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
156 const int q2 = pix[2];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
157
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
158 if( FFABS( p0 - q0 ) < alpha &&
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
159 FFABS( p1 - p0 ) < beta &&
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
160 FFABS( q1 - q0 ) < beta ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
161 int tc = tc0;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
162 int i_delta;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
163
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
164 if( FFABS( p2 - p0 ) < beta ) {
10970
eb5f0ccb6a98 Optimize filter_mb_mbaff_edge*()
michael
parents: 10969
diff changeset
165 if(tc0)
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
166 pix[-2] = p1 + av_clip( ( p2 + ( ( p0 + q0 + 1 ) >> 1 ) - ( p1 << 1 ) ) >> 1, -tc0, tc0 );
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
167 tc++;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
168 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
169 if( FFABS( q2 - q0 ) < beta ) {
10970
eb5f0ccb6a98 Optimize filter_mb_mbaff_edge*()
michael
parents: 10969
diff changeset
170 if(tc0)
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
171 pix[1] = q1 + av_clip( ( q2 + ( ( p0 + q0 + 1 ) >> 1 ) - ( q1 << 1 ) ) >> 1, -tc0, tc0 );
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
172 tc++;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
173 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
174
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
175 i_delta = av_clip( (((q0 - p0 ) << 2) + (p1 - q1) + 4) >> 3, -tc, tc );
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
176 pix[-1] = av_clip_uint8( p0 + i_delta ); /* p0' */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
177 pix[0] = av_clip_uint8( q0 - i_delta ); /* q0' */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
178 tprintf(h->s.avctx, "filter_mb_mbaff_edgev i:%d, qp:%d, indexA:%d, alpha:%d, beta:%d, tc:%d\n# bS:%d -> [%02x, %02x, %02x, %02x, %02x, %02x] =>[%02x, %02x, %02x, %02x]\n", i, qp[qp_index], index_a, alpha, beta, tc, bS[bS_index], pix[-3], p1, p0, q0, q1, pix[2], p1, pix[-1], pix[0], q1);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
179 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
180 }else{
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
181 const int p0 = pix[-1];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
182 const int p1 = pix[-2];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
183 const int p2 = pix[-3];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
184
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
185 const int q0 = pix[0];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
186 const int q1 = pix[1];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
187 const int q2 = pix[2];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
188
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
189 if( FFABS( p0 - q0 ) < alpha &&
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
190 FFABS( p1 - p0 ) < beta &&
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
191 FFABS( q1 - q0 ) < beta ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
192
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
193 if(FFABS( p0 - q0 ) < (( alpha >> 2 ) + 2 )){
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
194 if( FFABS( p2 - p0 ) < beta)
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
195 {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
196 const int p3 = pix[-4];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
197 /* p0', p1', p2' */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
198 pix[-1] = ( p2 + 2*p1 + 2*p0 + 2*q0 + q1 + 4 ) >> 3;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
199 pix[-2] = ( p2 + p1 + p0 + q0 + 2 ) >> 2;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
200 pix[-3] = ( 2*p3 + 3*p2 + p1 + p0 + q0 + 4 ) >> 3;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
201 } else {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
202 /* p0' */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
203 pix[-1] = ( 2*p1 + p0 + q1 + 2 ) >> 2;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
204 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
205 if( FFABS( q2 - q0 ) < beta)
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
206 {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
207 const int q3 = pix[3];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
208 /* q0', q1', q2' */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
209 pix[0] = ( p1 + 2*p0 + 2*q0 + 2*q1 + q2 + 4 ) >> 3;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
210 pix[1] = ( p0 + q0 + q1 + q2 + 2 ) >> 2;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
211 pix[2] = ( 2*q3 + 3*q2 + q1 + q0 + p0 + 4 ) >> 3;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
212 } else {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
213 /* q0' */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
214 pix[0] = ( 2*q1 + q0 + p1 + 2 ) >> 2;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
215 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
216 }else{
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
217 /* p0', q0' */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
218 pix[-1] = ( 2*p1 + p0 + q1 + 2 ) >> 2;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
219 pix[ 0] = ( 2*q1 + q0 + p1 + 2 ) >> 2;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
220 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
221 tprintf(h->s.avctx, "filter_mb_mbaff_edgev i:%d, qp:%d, indexA:%d, alpha:%d, beta:%d\n# bS:4 -> [%02x, %02x, %02x, %02x, %02x, %02x] =>[%02x, %02x, %02x, %02x, %02x, %02x]\n", i, qp[qp_index], index_a, alpha, beta, p2, p1, p0, q0, q1, q2, pix[-3], pix[-2], pix[-1], pix[0], pix[1], pix[2]);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
222 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
223 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
224 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
225 }
10924
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
226 static void filter_mb_mbaff_edgecv( H264Context *h, uint8_t *pix, int stride, int16_t bS[4], int bsi, int qp ) {
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
227 int i;
10970
eb5f0ccb6a98 Optimize filter_mb_mbaff_edge*()
michael
parents: 10969
diff changeset
228 int index_a = qp + h->slice_alpha_c0_offset;
10979
776dba50775c Move +52 from the loop filter to the alpha/beta offsets in the context.
michael
parents: 10973
diff changeset
229 int alpha = alpha_table[index_a];
776dba50775c Move +52 from the loop filter to the alpha/beta offsets in the context.
michael
parents: 10973
diff changeset
230 int beta = beta_table[qp + h->slice_beta_offset];
10924
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
231 for( i = 0; i < 4; i++, pix += stride) {
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
232 const int bS_index = i*bsi;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
233
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
234 if( bS[bS_index] == 0 ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
235 continue;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
236 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
237
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
238 if( bS[bS_index] < 4 ) {
10979
776dba50775c Move +52 from the loop filter to the alpha/beta offsets in the context.
michael
parents: 10973
diff changeset
239 const int tc = tc0_table[index_a][bS[bS_index]] + 1;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
240 const int p0 = pix[-1];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
241 const int p1 = pix[-2];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
242 const int q0 = pix[0];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
243 const int q1 = pix[1];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
244
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
245 if( FFABS( p0 - q0 ) < alpha &&
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
246 FFABS( p1 - p0 ) < beta &&
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
247 FFABS( q1 - q0 ) < beta ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
248 const int i_delta = av_clip( (((q0 - p0 ) << 2) + (p1 - q1) + 4) >> 3, -tc, tc );
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
249
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
250 pix[-1] = av_clip_uint8( p0 + i_delta ); /* p0' */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
251 pix[0] = av_clip_uint8( q0 - i_delta ); /* q0' */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
252 tprintf(h->s.avctx, "filter_mb_mbaff_edgecv i:%d, qp:%d, indexA:%d, alpha:%d, beta:%d, tc:%d\n# bS:%d -> [%02x, %02x, %02x, %02x, %02x, %02x] =>[%02x, %02x, %02x, %02x]\n", i, qp[qp_index], index_a, alpha, beta, tc, bS[bS_index], pix[-3], p1, p0, q0, q1, pix[2], p1, pix[-1], pix[0], q1);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
253 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
254 }else{
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
255 const int p0 = pix[-1];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
256 const int p1 = pix[-2];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
257 const int q0 = pix[0];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
258 const int q1 = pix[1];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
259
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
260 if( FFABS( p0 - q0 ) < alpha &&
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
261 FFABS( p1 - p0 ) < beta &&
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
262 FFABS( q1 - q0 ) < beta ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
263
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
264 pix[-1] = ( 2*p1 + p0 + q1 + 2 ) >> 2; /* p0' */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
265 pix[0] = ( 2*q1 + q0 + p1 + 2 ) >> 2; /* q0' */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
266 tprintf(h->s.avctx, "filter_mb_mbaff_edgecv i:%d\n# bS:4 -> [%02x, %02x, %02x, %02x, %02x, %02x] =>[%02x, %02x, %02x, %02x, %02x, %02x]\n", i, pix[-3], p1, p0, q0, q1, pix[2], pix[-3], pix[-2], pix[-1], pix[0], pix[1], pix[2]);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
267 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
268 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
269 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
270 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
271
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
/*
 * Filter one luma edge through the DSP h264_v_loop_filter_luma* hooks.
 *
 * pix     pointer handed unchanged to the DSP hook
 * stride  stride handed unchanged to the DSP hook
 * bS      four strength values; bS[0] picks the filter variant and, in the
 *         non-intra case, all four index tc0_table
 * qp      QP to which the slice alpha/beta offsets from h are added before
 *         indexing alpha_table, beta_table and tc0_table
 * h       decoder context supplying the slice offsets and the DSP hooks
 *
 * Returns without touching pix when the looked-up alpha or beta is 0.
 */
272 static void av_noinline filter_mb_edgeh( uint8_t *pix, int stride, int16_t bS[4], unsigned int qp, H264Context *h ) {
10979
776dba50775c Move +52 from the loop filter to the alpha/beta offsets in the context.
michael
parents: 10973
diff changeset
273 const unsigned int index_a = qp + h->slice_alpha_c0_offset;
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
274 const int alpha = alpha_table[index_a];
10979
776dba50775c Move +52 from the loop filter to the alpha/beta offsets in the context.
michael
parents: 10973
diff changeset
275 const int beta = beta_table[qp + h->slice_beta_offset];
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
276 if (alpha ==0 || beta == 0) return;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
277
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
/* Only bS[0] decides between the normal and the intra filter.
 * NOTE(review): assumes bS[0] >= 4 implies the same for bS[1..3] - confirm with callers. */
278 if( bS[0] < 4 ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
279 int8_t tc[4];
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
280 tc[0] = tc0_table[index_a][bS[0]];
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
281 tc[1] = tc0_table[index_a][bS[1]];
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
282 tc[2] = tc0_table[index_a][bS[2]];
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
283 tc[3] = tc0_table[index_a][bS[3]];
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
284 h->s.dsp.h264_v_loop_filter_luma(pix, stride, alpha, beta, tc);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
285 } else {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
286 h->s.dsp.h264_v_loop_filter_luma_intra(pix, stride, alpha, beta);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
287 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
288 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
289
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
/*
 * Filter one chroma edge through the DSP h264_v_loop_filter_chroma* hooks.
 *
 * pix     pointer handed unchanged to the DSP hook
 * stride  stride handed unchanged to the DSP hook
 * bS      four strength values; bS[0] picks the filter variant and, in the
 *         non-intra case, all four index tc0_table
 * qp      QP to which the slice alpha/beta offsets from h are added before
 *         indexing alpha_table, beta_table and tc0_table
 * h       decoder context supplying the slice offsets and the DSP hooks
 *
 * Returns without touching pix when the looked-up alpha or beta is 0.
 */
290 static void av_noinline filter_mb_edgech( uint8_t *pix, int stride, int16_t bS[4], unsigned int qp, H264Context *h ) {
10979
776dba50775c Move +52 from the loop filter to the alpha/beta offsets in the context.
michael
parents: 10973
diff changeset
291 const unsigned int index_a = qp + h->slice_alpha_c0_offset;
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
292 const int alpha = alpha_table[index_a];
10979
776dba50775c Move +52 from the loop filter to the alpha/beta offsets in the context.
michael
parents: 10973
diff changeset
293 const int beta = beta_table[qp + h->slice_beta_offset];
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
294 if (alpha ==0 || beta == 0) return;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
295
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
/* Only bS[0] decides between the normal and the intra filter.
 * NOTE(review): assumes bS[0] >= 4 implies the same for bS[1..3] - confirm with callers. */
296 if( bS[0] < 4 ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
/* Unlike the luma variant, each tc value is the tc0_table entry plus one. */
297 int8_t tc[4];
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
298 tc[0] = tc0_table[index_a][bS[0]]+1;
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
299 tc[1] = tc0_table[index_a][bS[1]]+1;
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
300 tc[2] = tc0_table[index_a][bS[2]]+1;
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
301 tc[3] = tc0_table[index_a][bS[3]]+1;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
302 h->s.dsp.h264_v_loop_filter_chroma(pix, stride, alpha, beta, tc);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
303 } else {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
304 h->s.dsp.h264_v_loop_filter_chroma_intra(pix, stride, alpha, beta);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
305 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
306 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
307
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
/*
 * Fast-path loop filter for one macroblock.
 *
 * Delegates to ff_h264_filter_mb() when h->top_type or h->left_type[0] is
 * zero, when no dsp.h264_loop_filter_strength hook is set, or when
 * h->pps.chroma_qp_diff is non-zero. Otherwise it derives the strength
 * values itself and filters the luma and chroma edges through the
 * filter_mb_edge{v,h}() and filter_mb_edgec{v,h}() helpers.
 *
 * h                       decoder context; h->mb_xy selects the macroblock
 * mb_x, mb_y              only forwarded to ff_h264_filter_mb()
 * img_y, img_cb, img_cr   plane pointers for this macroblock; edges are
 *                         addressed relative to them
 * linesize, uvlinesize    luma / chroma strides handed to the edge helpers
 */
308 void ff_h264_filter_mb_fast( H264Context *h, int mb_x, int mb_y, uint8_t *img_y, uint8_t *img_cb, uint8_t *img_cr, unsigned int linesize, unsigned int uvlinesize) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
309 MpegEncContext * const s = &h->s;
11013
5e5d44c920b6 Simplify loop filter a little by using top/left_type.
michael
parents: 10984
diff changeset
310 int mb_xy;
5e5d44c920b6 Simplify loop filter a little by using top/left_type.
michael
parents: 10984
diff changeset
311 int mb_type;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
312 int qp, qp0, qp1, qpc, qpc0, qpc1, qp_thresh;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
313
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
314 mb_xy = h->mb_xy;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
315
11013
5e5d44c920b6 Simplify loop filter a little by using top/left_type.
michael
parents: 10984
diff changeset
/* Cases this fast path does not cover are handed to the general filter. */
316 if(!h->top_type || !h->left_type[0] || !s->dsp.h264_loop_filter_strength || h->pps.chroma_qp_diff) {
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
317 ff_h264_filter_mb(h, mb_x, mb_y, img_y, img_cb, img_cr, linesize, uvlinesize);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
318 return;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
319 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
320 assert(!FRAME_MBAFF);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
321
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
322 mb_type = s->current_picture.mb_type[mb_xy];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
323 qp = s->current_picture.qscale_table[mb_xy];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
/* qp0/qpc0 describe the macroblock at mb_xy-1, qp1/qpc1 the one at
 * h->top_mb_xy. After the chroma lookups each is replaced by the rounded-up
 * mean with the current macroblock's value. */
324 qp0 = s->current_picture.qscale_table[mb_xy-1];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
325 qp1 = s->current_picture.qscale_table[h->top_mb_xy];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
326 qpc = get_chroma_qp( h, 0, qp );
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
327 qpc0 = get_chroma_qp( h, 0, qp0 );
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
328 qpc1 = get_chroma_qp( h, 0, qp1 );
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
329 qp0 = (qp + qp0 + 1) >> 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
330 qp1 = (qp + qp1 + 1) >> 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
331 qpc0 = (qpc + qpc0 + 1) >> 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
332 qpc1 = (qpc + qpc1 + 1) >> 1;
10979
776dba50775c Move +52 from the loop filter to the alpha/beta offsets in the context.
michael
parents: 10973
diff changeset
/* Nothing is filtered when every QP is at or below this threshold.
 * NOTE(review): presumably alpha_table yields 0 up to that index, so the
 * edge helpers would return early anyway - confirm against the table. */
333 qp_thresh = 15+52 - h->slice_alpha_c0_offset;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
334 if(qp <= qp_thresh && qp0 <= qp_thresh && qp1 <= qp_thresh &&
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
335 qpc <= qp_thresh && qpc0 <= qp_thresh && qpc1 <= qp_thresh)
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
336 return;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
337
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
/* Intra macroblock: fixed strengths. The left edge 0 uses 4, the top edge 0
 * uses 4 (3 when FIELD_PICTURE), every inner edge uses 3. */
338 if( IS_INTRA(mb_type) ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
339 int16_t bS4[4] = {4,4,4,4};
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
340 int16_t bS3[4] = {3,3,3,3};
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
341 int16_t *bSH = FIELD_PICTURE ? bS3 : bS4;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
/* With IS_8x8DCT only luma edges 0 and 2 are filtered; otherwise all four. */
342 if( IS_8x8DCT(mb_type) ) {
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
343 filter_mb_edgev( &img_y[4*0], linesize, bS4, qp0, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
344 filter_mb_edgev( &img_y[4*2], linesize, bS3, qp, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
345 filter_mb_edgeh( &img_y[4*0*linesize], linesize, bSH, qp1, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
346 filter_mb_edgeh( &img_y[4*2*linesize], linesize, bS3, qp, h);
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
347 } else {
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
348 filter_mb_edgev( &img_y[4*0], linesize, bS4, qp0, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
349 filter_mb_edgev( &img_y[4*1], linesize, bS3, qp, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
350 filter_mb_edgev( &img_y[4*2], linesize, bS3, qp, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
351 filter_mb_edgev( &img_y[4*3], linesize, bS3, qp, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
352 filter_mb_edgeh( &img_y[4*0*linesize], linesize, bSH, qp1, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
353 filter_mb_edgeh( &img_y[4*1*linesize], linesize, bS3, qp, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
354 filter_mb_edgeh( &img_y[4*2*linesize], linesize, bS3, qp, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
355 filter_mb_edgeh( &img_y[4*3*linesize], linesize, bS3, qp, h);
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
356 }
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
/* Chroma: edges 0 and 2 only, applied to both img_cb and img_cr. */
357 filter_mb_edgecv( &img_cb[2*0], uvlinesize, bS4, qpc0, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
358 filter_mb_edgecv( &img_cb[2*2], uvlinesize, bS3, qpc, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
359 filter_mb_edgecv( &img_cr[2*0], uvlinesize, bS4, qpc0, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
360 filter_mb_edgecv( &img_cr[2*2], uvlinesize, bS3, qpc, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
361 filter_mb_edgech( &img_cb[2*0*uvlinesize], uvlinesize, bSH, qpc1, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
362 filter_mb_edgech( &img_cb[2*2*uvlinesize], uvlinesize, bS3, qpc, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
363 filter_mb_edgech( &img_cr[2*0*uvlinesize], uvlinesize, bSH, qpc1, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
364 filter_mb_edgech( &img_cr[2*2*uvlinesize], uvlinesize, bS3, qpc, h);
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
365 return;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
366 } else {
10961
34a65026fa06 Move array specifiers outside DECLARE_ALIGNED() invocations
mru
parents: 10960
diff changeset
/* bS is indexed [dir][edge][i]: dir 0 is used with the "v" helpers and dir 1
 * with the "h" helpers below. */
367 DECLARE_ALIGNED_8(int16_t, bS)[2][4][4];
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
/* bSv views each edge's four int16_t strengths as one 64-bit word so a whole
 * edge can be written or tested at once.
 * NOTE(review): this is type punning through a pointer cast; it presumably
 * relies on the alignment requested by DECLARE_ALIGNED_8 - confirm. */
368 uint64_t (*bSv)[4] = (uint64_t(*)[4])bS;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
369 int edges;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
/* IS_8x8DCT with (h->cbp&7)==7: strength 2 is stored for edges 0 and 2 in both
 * directions. Entries for edges 1 and 3 stay unset; the IS_8x8DCT dispatch
 * further down never reads them. */
370 if( IS_8x8DCT(mb_type) && (h->cbp&7) == 7 ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
371 edges = 4;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
372 bSv[0][0] = bSv[0][2] = bSv[1][0] = bSv[1][2] = 0x0002000200020002ULL;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
373 } else {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
374 int mask_edge1 = (mb_type & (MB_TYPE_16x16 | MB_TYPE_8x16)) ? 3 :
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
375 (mb_type & MB_TYPE_16x8) ? 1 : 0;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
376 int mask_edge0 = (mb_type & (MB_TYPE_16x16 | MB_TYPE_8x16))
11013
5e5d44c920b6 Simplify loop filter a little by using top/left_type.
michael
parents: 10984
diff changeset
377 && (h->left_type[0] & (MB_TYPE_16x16 | MB_TYPE_8x16))
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
378 ? 3 : 0;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
379 int step = IS_8x8DCT(mb_type) ? 2 : 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
/* A 16x16 macroblock with (h->cbp & 15) == 0 only needs edge 0. */
380 edges = (mb_type & MB_TYPE_16x16) && !(h->cbp & 15) ? 1 : 4;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
381 s->dsp.h264_loop_filter_strength( bS, h->non_zero_count_cache, h->ref_cache, h->mv_cache,
10984
541acd292c48 Remove all uses of slice_type* from the loop filter, also remove its
michael
parents: 10979
diff changeset
382 h->list_count==2, edges, step, mask_edge0, mask_edge1, FIELD_PICTURE);
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
383 }
11013
5e5d44c920b6 Simplify loop filter a little by using top/left_type.
michael
parents: 10984
diff changeset
/* Edge 0 towards an intra neighbour gets the intra strength, overriding
 * whatever was stored above (top edge: 3 instead of 4 when FIELD_PICTURE). */
384 if( IS_INTRA(h->left_type[0]) )
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
385 bSv[0][0] = 0x0004000400040004ULL;
11013
5e5d44c920b6 Simplify loop filter a little by using top/left_type.
michael
parents: 10984
diff changeset
386 if( IS_INTRA(h->top_type) )
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
387 bSv[1][0] = FIELD_PICTURE ? 0x0003000300030003ULL : 0x0004000400040004ULL;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
388
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
/* FILTER(hv,dir,edge): skip the edge when all four strengths are zero.
 * Otherwise filter luma and, for even edges, img_cb and img_cr as well.
 * Edge 0 uses the neighbour-averaged QP (qp<dir> / qpc<dir>, built by token
 * pasting); inner edges use the macroblock's own qp / qpc. */
389 #define FILTER(hv,dir,edge)\
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
390 if(bSv[dir][edge]) {\
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
391 filter_mb_edge##hv( &img_y[4*edge*(dir?linesize:1)], linesize, bS[dir][edge], edge ? qp : qp##dir, h );\
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
392 if(!(edge&1)) {\
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
393 filter_mb_edgec##hv( &img_cb[2*edge*(dir?uvlinesize:1)], uvlinesize, bS[dir][edge], edge ? qpc : qpc##dir, h );\
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
394 filter_mb_edgec##hv( &img_cr[2*edge*(dir?uvlinesize:1)], uvlinesize, bS[dir][edge], edge ? qpc : qpc##dir, h );\
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
395 }\
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
396 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
/* Dispatch: edge 0 only, edges 0 and 2 (IS_8x8DCT), or all four edges. */
397 if( edges == 1 ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
398 FILTER(v,0,0);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
399 FILTER(h,1,0);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
400 } else if( IS_8x8DCT(mb_type) ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
401 FILTER(v,0,0);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
402 FILTER(v,0,2);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
403 FILTER(h,1,0);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
404 FILTER(h,1,2);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
405 } else {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
406 FILTER(v,0,0);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
407 FILTER(v,0,1);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
408 FILTER(v,0,2);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
409 FILTER(v,0,3);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
410 FILTER(h,1,0);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
411 FILTER(h,1,1);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
412 FILTER(h,1,2);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
413 FILTER(h,1,3);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
414 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
415 #undef FILTER
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
416 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
417 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
418
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
419
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
420 static av_always_inline void filter_mb_dir(H264Context *h, int mb_x, int mb_y, uint8_t *img_y, uint8_t *img_cb, uint8_t *img_cr, unsigned int linesize, unsigned int uvlinesize, int mb_xy, int mb_type, int mvy_limit, int first_vertical_edge_done, int dir) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
421 MpegEncContext * const s = &h->s;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
422 int edge;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
423 const int mbm_xy = dir == 0 ? mb_xy -1 : h->top_mb_xy;
11013
5e5d44c920b6 Simplify loop filter a little by using top/left_type.
michael
parents: 10984
diff changeset
424 const int mbm_type = dir == 0 ? h->left_type[0] : h->top_type;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
425
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
426 // how often to recheck mv-based bS when iterating between edges
10958
304db572a69a Make calculation of mask_edge free of branches, faster of course but probably
michael
parents: 10950
diff changeset
427 static const uint8_t mask_edge_tab[2][8]={{0,3,3,3,1,1,1,1},
304db572a69a Make calculation of mask_edge free of branches, faster of course but probably
michael
parents: 10950
diff changeset
428 {0,3,1,1,3,3,3,3}};
304db572a69a Make calculation of mask_edge free of branches, faster of course but probably
michael
parents: 10950
diff changeset
429 const int mask_edge = mask_edge_tab[dir][(mb_type>>3)&7];
10973
214adf5e303b Set edges based on cbp and mv partitioning, not just skiped MBs.
michael
parents: 10970
diff changeset
430 const int edges = mask_edge== 3 && !(h->cbp&15) ? 1 : 4;
214adf5e303b Set edges based on cbp and mv partitioning, not just skiped MBs.
michael
parents: 10970
diff changeset
431
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
432 // how often to recheck mv-based bS when iterating along each edge
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
433 const int mask_par0 = mb_type & (MB_TYPE_16x16 | (MB_TYPE_8x16 >> dir));
10942
ee944149442f Sightly simplify initialization of int start.
michael
parents: 10939
diff changeset
434 int start = h->slice_table[mbm_xy] == 0xFFFF
ee944149442f Sightly simplify initialization of int start.
michael
parents: 10939
diff changeset
435 || first_vertical_edge_done
ee944149442f Sightly simplify initialization of int start.
michael
parents: 10939
diff changeset
436 || (h->deblocking_filter==2 && h->slice_table[mbm_xy] != h->slice_num);
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
437
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
438
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
439 if (FRAME_MBAFF && (dir == 1) && ((mb_y&1) == 0) && start == 0
10946
5a23fa01dec1 Merge multiple IS_* macro uses where possible.
michael
parents: 10945
diff changeset
440 && IS_INTERLACED(mbm_type&~mb_type)
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
441 ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
442 // This is a special case in the norm where the filtering must
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
443 // be done twice (one each of the field) even if we are in a
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
444 // frame macroblock.
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
445 //
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
446 unsigned int tmp_linesize = 2 * linesize;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
447 unsigned int tmp_uvlinesize = 2 * uvlinesize;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
448 int mbn_xy = mb_xy - 2 * s->mb_stride;
10949
4c9b8e3065ee Simplify/Optimize another of the mbaff loop filter cases.
michael
parents: 10948
diff changeset
449 int j;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
450
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
451 for(j=0; j<2; j++, mbn_xy += s->mb_stride){
10961
34a65026fa06 Move array specifiers outside DECLARE_ALIGNED() invocations
mru
parents: 10960
diff changeset
452 DECLARE_ALIGNED_8(int16_t, bS)[4];
10949
4c9b8e3065ee Simplify/Optimize another of the mbaff loop filter cases.
michael
parents: 10948
diff changeset
453 int qp;
10946
5a23fa01dec1 Merge multiple IS_* macro uses where possible.
michael
parents: 10945
diff changeset
454 if( IS_INTRA(mb_type|s->current_picture.mb_type[mbn_xy]) ) {
10947
df6bda2aa59a Set bS with 64bits at a time.
michael
parents: 10946
diff changeset
455 *(uint64_t*)bS= 0x0003000300030003ULL;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
456 } else {
10949
4c9b8e3065ee Simplify/Optimize another of the mbaff loop filter cases.
michael
parents: 10948
diff changeset
457 const uint8_t *mbn_nnz = h->non_zero_count[mbn_xy] + 4+3*8;
4c9b8e3065ee Simplify/Optimize another of the mbaff loop filter cases.
michael
parents: 10948
diff changeset
458 int i;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
459 for( i = 0; i < 4; i++ ) {
10949
4c9b8e3065ee Simplify/Optimize another of the mbaff loop filter cases.
michael
parents: 10948
diff changeset
460 bS[i] = 1 + !!(h->non_zero_count_cache[scan8[0]+i] | mbn_nnz[i]);
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
461 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
462 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
463 // Do not use s->qscale as luma quantizer because it has not the same
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
464 // value in IPCM macroblocks.
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
465 qp = ( s->current_picture.qscale_table[mb_xy] + s->current_picture.qscale_table[mbn_xy] + 1 ) >> 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
466 tprintf(s->avctx, "filter mb:%d/%d dir:%d edge:%d, QPy:%d ls:%d uvls:%d", mb_x, mb_y, dir, edge, qp, tmp_linesize, tmp_uvlinesize);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
467 { int i; for (i = 0; i < 4; i++) tprintf(s->avctx, " bS[%d]:%d", i, bS[i]); tprintf(s->avctx, "\n"); }
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
468 filter_mb_edgeh( &img_y[j*linesize], tmp_linesize, bS, qp, h );
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
469 filter_mb_edgech( &img_cb[j*uvlinesize], tmp_uvlinesize, bS,
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
470 ( h->chroma_qp[0] + get_chroma_qp( h, 0, s->current_picture.qscale_table[mbn_xy] ) + 1 ) >> 1, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
471 filter_mb_edgech( &img_cr[j*uvlinesize], tmp_uvlinesize, bS,
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
472 ( h->chroma_qp[1] + get_chroma_qp( h, 1, s->current_picture.qscale_table[mbn_xy] ) + 1 ) >> 1, h);
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
473 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
474
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
475 start = 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
476 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
477
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
478 /* Calculate bS */
11032
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
479 if(start==0) {
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
480 DECLARE_ALIGNED_8(int16_t, bS)[4];
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
481 int qp;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
482
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
483 if( IS_INTRA(mb_type|mbm_type)) {
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
484 *(uint64_t*)bS= 0x0003000300030003ULL;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
485 if ( (!IS_INTERLACED(mb_type|mbm_type))
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
486 || ((FRAME_MBAFF || (s->picture_structure != PICT_FRAME)) && (dir == 0))
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
487 )
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
488 *(uint64_t*)bS= 0x0004000400040004ULL;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
489 } else {
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
490 int i, l;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
491 int mv_done;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
492
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
493 if( FRAME_MBAFF && IS_INTERLACED(mb_type ^ mbm_type)) { //FIXME not posible left
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
494 *(uint64_t*)bS= 0x0001000100010001ULL;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
495 mv_done = 1;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
496 }
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
497 else if( mask_par0 && ((mbm_type & (MB_TYPE_16x16 | (MB_TYPE_8x16 >> dir)))) ) {
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
498 int b_idx= 8 + 4;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
499 int bn_idx= b_idx - (dir ? 8:1);
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
500 int v = 0;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
501
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
502 for( l = 0; !v && l < h->list_count; l++ ) {
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
503 v |= h->ref_cache[l][b_idx] != h->ref_cache[l][bn_idx] |
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
504 h->mv_cache[l][b_idx][0] - h->mv_cache[l][bn_idx][0] + 3 >= 7U |
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
505 FFABS( h->mv_cache[l][b_idx][1] - h->mv_cache[l][bn_idx][1] ) >= mvy_limit;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
506 }
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
507
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
508 if(h->list_count==2 && v){
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
509 v=0;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
510 for( l = 0; !v && l < 2; l++ ) {
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
511 int ln= 1-l;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
512 v |= h->ref_cache[l][b_idx] != h->ref_cache[ln][bn_idx] |
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
513 h->mv_cache[l][b_idx][0] - h->mv_cache[ln][bn_idx][0] + 3 >= 7U |
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
514 FFABS( h->mv_cache[l][b_idx][1] - h->mv_cache[ln][bn_idx][1] ) >= mvy_limit;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
515 }
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
516 }
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
517
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
518 bS[0] = bS[1] = bS[2] = bS[3] = v;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
519 mv_done = 1;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
520 }
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
521 else
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
522 mv_done = 0;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
523
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
524 for( i = 0; i < 4; i++ ) {
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
525 int x = dir == 0 ? 0 : i;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
526 int y = dir == 0 ? i : 0;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
527 int b_idx= 8 + 4 + x + 8*y;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
528 int bn_idx= b_idx - (dir ? 8:1);
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
529
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
530 if( h->non_zero_count_cache[b_idx] |
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
531 h->non_zero_count_cache[bn_idx] ) {
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
532 bS[i] = 2;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
533 }
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
534 else if(!mv_done)
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
535 {
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
536 bS[i] = 0;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
537 for( l = 0; l < h->list_count; l++ ) {
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
538 if( h->ref_cache[l][b_idx] != h->ref_cache[l][bn_idx] |
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
539 h->mv_cache[l][b_idx][0] - h->mv_cache[l][bn_idx][0] + 3 >= 7U |
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
540 FFABS( h->mv_cache[l][b_idx][1] - h->mv_cache[l][bn_idx][1] ) >= mvy_limit ) {
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
541 bS[i] = 1;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
542 break;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
543 }
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
544 }
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
545
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
546 if(h->list_count == 2 && bS[i]){
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
547 bS[i] = 0;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
548 for( l = 0; l < 2; l++ ) {
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
549 int ln= 1-l;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
550 if( h->ref_cache[l][b_idx] != h->ref_cache[ln][bn_idx] |
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
551 h->mv_cache[l][b_idx][0] - h->mv_cache[ln][bn_idx][0] + 3 >= 7U |
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
552 FFABS( h->mv_cache[l][b_idx][1] - h->mv_cache[ln][bn_idx][1] ) >= mvy_limit ) {
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
553 bS[i] = 1;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
554 break;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
555 }
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
556 }
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
557 }
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
558 }
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
559 }
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
560 }
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
561
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
562 /* Filter edge */
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
563 // Do not use s->qscale as the luma quantizer because it does not have the same
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
564 // value in IPCM macroblocks.
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
565 if(bS[0]+bS[1]+bS[2]+bS[3]){
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
566 qp = ( s->current_picture.qscale_table[mb_xy] + s->current_picture.qscale_table[mbm_xy] + 1 ) >> 1;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
567 //tprintf(s->avctx, "filter mb:%d/%d dir:%d edge:%d, QPy:%d, QPc:%d, QPcn:%d\n", mb_x, mb_y, dir, edge, qp, h->chroma_qp[0], s->current_picture.qscale_table[mbn_xy]);
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
568 tprintf(s->avctx, "filter mb:%d/%d dir:%d edge:%d, QPy:%d ls:%d uvls:%d", mb_x, mb_y, dir, edge, qp, linesize, uvlinesize);
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
569 //{ int i; for (i = 0; i < 4; i++) tprintf(s->avctx, " bS[%d]:%d", i, bS[i]); tprintf(s->avctx, "\n"); }
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
570 if( dir == 0 ) {
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
571 filter_mb_edgev( &img_y[0], linesize, bS, qp, h );
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
572 {
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
573 int qp= ( h->chroma_qp[0] + get_chroma_qp( h, 0, s->current_picture.qscale_table[mbm_xy] ) + 1 ) >> 1;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
574 filter_mb_edgecv( &img_cb[0], uvlinesize, bS, qp, h);
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
575 if(h->pps.chroma_qp_diff)
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
576 qp= ( h->chroma_qp[1] + get_chroma_qp( h, 1, s->current_picture.qscale_table[mbm_xy] ) + 1 ) >> 1;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
577 filter_mb_edgecv( &img_cr[0], uvlinesize, bS, qp, h);
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
578 }
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
579 } else {
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
580 filter_mb_edgeh( &img_y[0], linesize, bS, qp, h );
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
581 {
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
582 int qp= ( h->chroma_qp[0] + get_chroma_qp( h, 0, s->current_picture.qscale_table[mbm_xy] ) + 1 ) >> 1;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
583 filter_mb_edgech( &img_cb[0], uvlinesize, bS, qp, h);
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
584 if(h->pps.chroma_qp_diff)
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
585 qp= ( h->chroma_qp[1] + get_chroma_qp( h, 1, s->current_picture.qscale_table[mbm_xy] ) + 1 ) >> 1;
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
586 filter_mb_edgech( &img_cr[0], uvlinesize, bS, qp, h);
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
587 }
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
588 }
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
589 }
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
590 }
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
591 /* Calculate bS */
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
592 for( edge = 1; edge < edges; edge++ ) {
10961
34a65026fa06 Move array specifiers outside DECLARE_ALIGNED() invocations
mru
parents: 10960
diff changeset
593 DECLARE_ALIGNED_8(int16_t, bS)[4];
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
594 int qp;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
595
10969
2e8fbfc278d5 Optmize 8x8dct check used to skip some borders in the loop filter.
michael
parents: 10961
diff changeset
596 if( IS_8x8DCT(mb_type & (edge<<24)) ) // (edge&1) && IS_8x8DCT(mb_type)
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
597 continue;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
598
11032
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
599 if( IS_INTRA(mb_type)) {
10945
0d93bbc17950 Simplify and optimize intra code in h264_loopfilter.c
michael
parents: 10942
diff changeset
600 *(uint64_t*)bS= 0x0003000300030003ULL;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
601 } else {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
602 int i, l;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
603 int mv_done;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
604
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
605 if( edge & mask_edge ) {
10947
df6bda2aa59a Set bS with 64bits at a time.
michael
parents: 10946
diff changeset
606 *(uint64_t*)bS= 0;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
607 mv_done = 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
608 }
11032
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
609 else if( mask_par0 ) {
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
610 int b_idx= 8 + 4 + edge * (dir ? 8:1);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
611 int bn_idx= b_idx - (dir ? 8:1);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
612 int v = 0;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
613
10984
541acd292c48 Remove all uses of slice_type* from the loop filter, also remove its
michael
parents: 10979
diff changeset
614 for( l = 0; !v && l < h->list_count; l++ ) {
10913
497929e9d912 Perform reference remapping at fill_cache() time instead of in the
michael
parents: 10910
diff changeset
615 v |= h->ref_cache[l][b_idx] != h->ref_cache[l][bn_idx] |
10901
2a5c3d89201d Another microopt, 4 cpu cycles for avoidance of FFABS().
michael
parents: 10899
diff changeset
616 h->mv_cache[l][b_idx][0] - h->mv_cache[l][bn_idx][0] + 3 >= 7U |
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
617 FFABS( h->mv_cache[l][b_idx][1] - h->mv_cache[l][bn_idx][1] ) >= mvy_limit;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
618 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
619
10984
541acd292c48 Remove all uses of slice_type* from the loop filter, also remove its
michael
parents: 10979
diff changeset
620 if(h->list_count==2 && v){
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
621 v=0;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
622 for( l = 0; !v && l < 2; l++ ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
623 int ln= 1-l;
10913
497929e9d912 Perform reference remapping at fill_cache() time instead of in the
michael
parents: 10910
diff changeset
624 v |= h->ref_cache[l][b_idx] != h->ref_cache[ln][bn_idx] |
10901
2a5c3d89201d Another microopt, 4 cpu cycles for avoidance of FFABS().
michael
parents: 10899
diff changeset
625 h->mv_cache[l][b_idx][0] - h->mv_cache[ln][bn_idx][0] + 3 >= 7U |
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
626 FFABS( h->mv_cache[l][b_idx][1] - h->mv_cache[ln][bn_idx][1] ) >= mvy_limit;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
627 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
628 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
629
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
630 bS[0] = bS[1] = bS[2] = bS[3] = v;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
631 mv_done = 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
632 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
633 else
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
634 mv_done = 0;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
635
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
636 for( i = 0; i < 4; i++ ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
637 int x = dir == 0 ? edge : i;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
638 int y = dir == 0 ? i : edge;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
639 int b_idx= 8 + 4 + x + 8*y;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
640 int bn_idx= b_idx - (dir ? 8:1);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
641
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
642 if( h->non_zero_count_cache[b_idx] |
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
643 h->non_zero_count_cache[bn_idx] ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
644 bS[i] = 2;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
645 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
646 else if(!mv_done)
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
647 {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
648 bS[i] = 0;
10984
541acd292c48 Remove all uses of slice_type* from the loop filter, also remove its
michael
parents: 10979
diff changeset
649 for( l = 0; l < h->list_count; l++ ) {
10913
497929e9d912 Perform reference remapping at fill_cache() time instead of in the
michael
parents: 10910
diff changeset
650 if( h->ref_cache[l][b_idx] != h->ref_cache[l][bn_idx] |
10902
1e41e6ab9a18 Apply last 2 optimizations to similar code i forgot.
michael
parents: 10901
diff changeset
651 h->mv_cache[l][b_idx][0] - h->mv_cache[l][bn_idx][0] + 3 >= 7U |
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
652 FFABS( h->mv_cache[l][b_idx][1] - h->mv_cache[l][bn_idx][1] ) >= mvy_limit ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
653 bS[i] = 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
654 break;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
655 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
656 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
657
10984
541acd292c48 Remove all uses of slice_type* from the loop filter, also remove its
michael
parents: 10979
diff changeset
658 if(h->list_count == 2 && bS[i]){
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
659 bS[i] = 0;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
660 for( l = 0; l < 2; l++ ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
661 int ln= 1-l;
10913
497929e9d912 Perform reference remapping at fill_cache() time instead of in the
michael
parents: 10910
diff changeset
662 if( h->ref_cache[l][b_idx] != h->ref_cache[ln][bn_idx] |
10902
1e41e6ab9a18 Apply last 2 optimizations to similar code i forgot.
michael
parents: 10901
diff changeset
663 h->mv_cache[l][b_idx][0] - h->mv_cache[ln][bn_idx][0] + 3 >= 7U |
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
664 FFABS( h->mv_cache[l][b_idx][1] - h->mv_cache[ln][bn_idx][1] ) >= mvy_limit ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
665 bS[i] = 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
666 break;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
667 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
668 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
669 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
670 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
671 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
672
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
673 if(bS[0]+bS[1]+bS[2]+bS[3] == 0)
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
674 continue;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
675 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
676
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
677 /* Filter edge */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
678 // Do not use s->qscale as the luma quantizer because it does not have the same
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
679 // value in IPCM macroblocks.
11032
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
680 qp = s->current_picture.qscale_table[mb_xy];
10906
1b5fba731e24 Rearchitecturing the stiched up goose part 1
michael
parents: 10904
diff changeset
681 //tprintf(s->avctx, "filter mb:%d/%d dir:%d edge:%d, QPy:%d, QPc:%d, QPcn:%d\n", mb_x, mb_y, dir, edge, qp, h->chroma_qp[0], s->current_picture.qscale_table[mbn_xy]);
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
682 tprintf(s->avctx, "filter mb:%d/%d dir:%d edge:%d, QPy:%d ls:%d uvls:%d", mb_x, mb_y, dir, edge, qp, linesize, uvlinesize);
10904
b30aef0c693f Comment for() ; out
michael
parents: 10903
diff changeset
683 //{ int i; for (i = 0; i < 4; i++) tprintf(s->avctx, " bS[%d]:%d", i, bS[i]); tprintf(s->avctx, "\n"); }
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
684 if( dir == 0 ) {
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
685 filter_mb_edgev( &img_y[4*edge], linesize, bS, qp, h );
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
686 if( (edge&1) == 0 ) {
11032
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
687 filter_mb_edgecv( &img_cb[2*edge], uvlinesize, bS, h->chroma_qp[0], h);
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
688 filter_mb_edgecv( &img_cr[2*edge], uvlinesize, bS, h->chroma_qp[1], h);
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
689 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
690 } else {
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
691 filter_mb_edgeh( &img_y[4*edge*linesize], linesize, bS, qp, h );
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
692 if( (edge&1) == 0 ) {
11032
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
693 filter_mb_edgech( &img_cb[2*edge*uvlinesize], uvlinesize, bS, h->chroma_qp[0], h);
01bd040f8607 Unroll main loop so the edge==0 case is seperate.
michael
parents: 11026
diff changeset
694 filter_mb_edgech( &img_cr[2*edge*uvlinesize], uvlinesize, bS, h->chroma_qp[1], h);
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
695 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
696 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
697 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
698 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
699
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
700 void ff_h264_filter_mb( H264Context *h, int mb_x, int mb_y, uint8_t *img_y, uint8_t *img_cb, uint8_t *img_cr, unsigned int linesize, unsigned int uvlinesize) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
701 MpegEncContext * const s = &h->s;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
702 const int mb_xy= mb_x + mb_y*s->mb_stride;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
703 const int mb_type = s->current_picture.mb_type[mb_xy];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
704 const int mvy_limit = IS_INTERLACED(mb_type) ? 2 : 4;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
705 int first_vertical_edge_done = 0;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
706 av_unused int dir;
10906
1b5fba731e24 Rearchitecturing the stiched up goose part 1
michael
parents: 10904
diff changeset
707 int list;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
708
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
709 if (FRAME_MBAFF
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
710 // and current and left pair do not have the same interlaced type
11013
5e5d44c920b6 Simplify loop filter a little by using top/left_type.
michael
parents: 10984
diff changeset
711 && IS_INTERLACED(mb_type^h->left_type[0])
11026
f5678fb91140 Update comment.
michael
parents: 11025
diff changeset
712 // and the left mb is available to us
11013
5e5d44c920b6 Simplify loop filter a little by using top/left_type.
michael
parents: 10984
diff changeset
713 && h->left_type[0]) {
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
714 /* First vertical edge is different in MBAFF frames
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
715 * There are 8 different bS to compute and 2 different Qp
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
716 */
10961
34a65026fa06 Move array specifiers outside DECLARE_ALIGNED() invocations
mru
parents: 10960
diff changeset
717 DECLARE_ALIGNED_8(int16_t, bS)[8];
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
718 int qp[2];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
719 int bqp[2];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
720 int rqp[2];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
721 int mb_qp, mbn0_qp, mbn1_qp;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
722 int i;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
723 first_vertical_edge_done = 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
724
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
725 if( IS_INTRA(mb_type) )
10947
df6bda2aa59a Set bS with 64bits at a time.
michael
parents: 10946
diff changeset
726 *(uint64_t*)&bS[0]=
df6bda2aa59a Set bS with 64bits at a time.
michael
parents: 10946
diff changeset
727 *(uint64_t*)&bS[4]= 0x0004000400040004ULL;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
728 else {
11025
cd1f5f6a2e45 Use table to speedup access to non_zero_count in MBAFF with differing interlacing.
michael
parents: 11021
diff changeset
729 static const uint8_t offset[2][2][8]={
cd1f5f6a2e45 Use table to speedup access to non_zero_count in MBAFF with differing interlacing.
michael
parents: 11021
diff changeset
730 {
cd1f5f6a2e45 Use table to speedup access to non_zero_count in MBAFF with differing interlacing.
michael
parents: 11021
diff changeset
731 {7+8*0, 7+8*0, 7+8*0, 7+8*0, 7+8*1, 7+8*1, 7+8*1, 7+8*1},
cd1f5f6a2e45 Use table to speedup access to non_zero_count in MBAFF with differing interlacing.
michael
parents: 11021
diff changeset
732 {7+8*2, 7+8*2, 7+8*2, 7+8*2, 7+8*3, 7+8*3, 7+8*3, 7+8*3},
cd1f5f6a2e45 Use table to speedup access to non_zero_count in MBAFF with differing interlacing.
michael
parents: 11021
diff changeset
733 },{
cd1f5f6a2e45 Use table to speedup access to non_zero_count in MBAFF with differing interlacing.
michael
parents: 11021
diff changeset
734 {7+8*0, 7+8*1, 7+8*2, 7+8*3, 7+8*0, 7+8*1, 7+8*2, 7+8*3},
cd1f5f6a2e45 Use table to speedup access to non_zero_count in MBAFF with differing interlacing.
michael
parents: 11021
diff changeset
735 {7+8*0, 7+8*1, 7+8*2, 7+8*3, 7+8*0, 7+8*1, 7+8*2, 7+8*3},
cd1f5f6a2e45 Use table to speedup access to non_zero_count in MBAFF with differing interlacing.
michael
parents: 11021
diff changeset
736 }
cd1f5f6a2e45 Use table to speedup access to non_zero_count in MBAFF with differing interlacing.
michael
parents: 11021
diff changeset
737 };
cd1f5f6a2e45 Use table to speedup access to non_zero_count in MBAFF with differing interlacing.
michael
parents: 11021
diff changeset
738 const uint8_t *off= offset[MB_FIELD][mb_y&1];
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
739 for( i = 0; i < 8; i++ ) {
11021
2bc05f2fc993 Optimize loop filtering of the left edge in MBAFF.
michael
parents: 11016
diff changeset
740 int j= MB_FIELD ? i>>2 : i&1;
2bc05f2fc993 Optimize loop filtering of the left edge in MBAFF.
michael
parents: 11016
diff changeset
741 int mbn_xy = h->left_mb_xy[j];
2bc05f2fc993 Optimize loop filtering of the left edge in MBAFF.
michael
parents: 11016
diff changeset
742 int mbn_type= h->left_type[j];
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
743
11021
2bc05f2fc993 Optimize loop filtering of the left edge in MBAFF.
michael
parents: 11016
diff changeset
744 if( IS_INTRA( mbn_type ) )
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
745 bS[i] = 4;
11021
2bc05f2fc993 Optimize loop filtering of the left edge in MBAFF.
michael
parents: 11016
diff changeset
746 else{
2bc05f2fc993 Optimize loop filtering of the left edge in MBAFF.
michael
parents: 11016
diff changeset
747 bS[i] = 1 + !!(h->non_zero_count_cache[12+8*(i>>1)] |
2bc05f2fc993 Optimize loop filtering of the left edge in MBAFF.
michael
parents: 11016
diff changeset
748 ((!h->pps.cabac && IS_8x8DCT(mbn_type)) ?
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
749 (h->cbp_table[mbn_xy] & ((MB_FIELD ? (i&2) : (mb_y&1)) ? 8 : 2))
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
750 :
11025
cd1f5f6a2e45 Use table to speedup access to non_zero_count in MBAFF with differing interlacing.
michael
parents: 11021
diff changeset
751 h->non_zero_count[mbn_xy][ off[i] ]));
11021
2bc05f2fc993 Optimize loop filtering of the left edge in MBAFF.
michael
parents: 11016
diff changeset
752 }
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
753 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
754 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
755
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
756 mb_qp = s->current_picture.qscale_table[mb_xy];
11015
d844c58b985a Use left_mb_xy from fill_caches instead of recalculating it.
michael
parents: 11013
diff changeset
757 mbn0_qp = s->current_picture.qscale_table[h->left_mb_xy[0]];
d844c58b985a Use left_mb_xy from fill_caches instead of recalculating it.
michael
parents: 11013
diff changeset
758 mbn1_qp = s->current_picture.qscale_table[h->left_mb_xy[1]];
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
759 qp[0] = ( mb_qp + mbn0_qp + 1 ) >> 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
760 bqp[0] = ( get_chroma_qp( h, 0, mb_qp ) +
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
761 get_chroma_qp( h, 0, mbn0_qp ) + 1 ) >> 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
762 rqp[0] = ( get_chroma_qp( h, 1, mb_qp ) +
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
763 get_chroma_qp( h, 1, mbn0_qp ) + 1 ) >> 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
764 qp[1] = ( mb_qp + mbn1_qp + 1 ) >> 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
765 bqp[1] = ( get_chroma_qp( h, 0, mb_qp ) +
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
766 get_chroma_qp( h, 0, mbn1_qp ) + 1 ) >> 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
767 rqp[1] = ( get_chroma_qp( h, 1, mb_qp ) +
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
768 get_chroma_qp( h, 1, mbn1_qp ) + 1 ) >> 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
769
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
770 /* Filter edge */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
771 tprintf(s->avctx, "filter mb:%d/%d MBAFF, QPy:%d/%d, QPb:%d/%d QPr:%d/%d ls:%d uvls:%d", mb_x, mb_y, qp[0], qp[1], bqp[0], bqp[1], rqp[0], rqp[1], linesize, uvlinesize);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
772 { int i; for (i = 0; i < 8; i++) tprintf(s->avctx, " bS[%d]:%d", i, bS[i]); tprintf(s->avctx, "\n"); }
10924
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
773 if(MB_FIELD){
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
774 filter_mb_mbaff_edgev ( h, img_y , linesize, bS , 1, qp [0] );
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
775 filter_mb_mbaff_edgev ( h, img_y + 8* linesize, linesize, bS+4, 1, qp [1] );
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
776 filter_mb_mbaff_edgecv( h, img_cb, uvlinesize, bS , 1, bqp[0] );
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
777 filter_mb_mbaff_edgecv( h, img_cb + 4*uvlinesize, uvlinesize, bS+4, 1, bqp[1] );
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
778 filter_mb_mbaff_edgecv( h, img_cr, uvlinesize, bS , 1, rqp[0] );
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
779 filter_mb_mbaff_edgecv( h, img_cr + 4*uvlinesize, uvlinesize, bS+4, 1, rqp[1] );
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
780 }else{
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
781 filter_mb_mbaff_edgev ( h, img_y , 2* linesize, bS , 2, qp [0] );
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
782 filter_mb_mbaff_edgev ( h, img_y + linesize, 2* linesize, bS+1, 2, qp [1] );
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
783 filter_mb_mbaff_edgecv( h, img_cb, 2*uvlinesize, bS , 2, bqp[0] );
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
784 filter_mb_mbaff_edgecv( h, img_cb + uvlinesize, 2*uvlinesize, bS+1, 2, bqp[1] );
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
785 filter_mb_mbaff_edgecv( h, img_cr, 2*uvlinesize, bS , 2, rqp[0] );
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
786 filter_mb_mbaff_edgecv( h, img_cr + uvlinesize, 2*uvlinesize, bS+1, 2, rqp[1] );
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
787 }
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
788 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
789
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
790 #if CONFIG_SMALL
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
791 for( dir = 0; dir < 2; dir++ )
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
792 filter_mb_dir(h, mb_x, mb_y, img_y, img_cb, img_cr, linesize, uvlinesize, mb_xy, mb_type, mvy_limit, dir ? 0 : first_vertical_edge_done, dir);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
793 #else
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
794 filter_mb_dir(h, mb_x, mb_y, img_y, img_cb, img_cr, linesize, uvlinesize, mb_xy, mb_type, mvy_limit, first_vertical_edge_done, 0);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
795 filter_mb_dir(h, mb_x, mb_y, img_y, img_cb, img_cr, linesize, uvlinesize, mb_xy, mb_type, mvy_limit, 0, 1);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
796 #endif
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
797 }