annotate h264_loopfilter.c @ 10960:10759fd39860 libavcodec

Gcc idiocy fixes related to filter_mb_edge*. Change the order of operands, as gcc seems to use a hardcoded register per operand even for static functions; this reduces unneeded moves (the functions now try to pass the same argument in the same spot). Change signed int to unsigned int for array indexes, as signed requires sign extension while unsigned is free. Move the +52 up and merge it where it will end up as a lea instruction; otherwise gcc always splits the 52 out there, turning the free +52 into an expensive one. The changed code becomes a little faster.
author michael
date Fri, 22 Jan 2010 01:59:17 +0000
parents 304db572a69a
children 34a65026fa06
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
1 /*
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
2 * H.26L/H.264/AVC/JVT/14496-10/... loop filter
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
3 * Copyright (c) 2003 Michael Niedermayer <michaelni@gmx.at>
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
4 *
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
5 * This file is part of FFmpeg.
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
6 *
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
7 * FFmpeg is free software; you can redistribute it and/or
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
8 * modify it under the terms of the GNU Lesser General Public
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
9 * License as published by the Free Software Foundation; either
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
10 * version 2.1 of the License, or (at your option) any later version.
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
11 *
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
12 * FFmpeg is distributed in the hope that it will be useful,
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
15 * Lesser General Public License for more details.
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
16 *
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
17 * You should have received a copy of the GNU Lesser General Public
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
18 * License along with FFmpeg; if not, write to the Free Software
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
19 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
20 */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
21
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
22 /**
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
23 * @file libavcodec/h264_loopfilter.c
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
24 * H.264 / AVC / MPEG4 part10 loop filter.
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
25 * @author Michael Niedermayer <michaelni@gmx.at>
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
26 */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
27
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
28 #include "internal.h"
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
29 #include "dsputil.h"
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
30 #include "avcodec.h"
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
31 #include "mpegvideo.h"
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
32 #include "h264.h"
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
33 #include "mathops.h"
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
34 #include "rectangle.h"
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
35
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
36 //#undef NDEBUG
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
37 #include <assert.h>
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
38
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
39 /* Deblocking filter (p153) */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
/**
 * Alpha threshold lookup for the deblocking filter.
 *
 * The table is three 52-entry sections long: the filter functions in this
 * file index it with 52 + qp + slice offset, so the first and last sections
 * act as padding that repeats the lowest (0) and highest (255) threshold
 * when the offset pushes the sum outside 0..51.
 */
static const uint8_t alpha_table[52*3] = {
    /* lower padding: 52 entries, sum below 0 */
    0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,
    0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,
    /* sum 0..15: filtering disabled */
    0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,
    /* sum 16..27 */
      4,  4,  5,  6,  7,  8,  9, 10, 12, 13, 15, 17,
    /* sum 28..39 */
     20, 22, 25, 28, 32, 36, 40, 45, 50, 56, 63, 71,
    /* sum 40..51 */
     80, 90,101,113,127,144,162,182,203,226,255,255,
    /* upper padding: 52 entries, sum above 51 */
    255,255,255,255,255,255,255,255,255,255,255,255,255,
    255,255,255,255,255,255,255,255,255,255,255,255,255,
    255,255,255,255,255,255,255,255,255,255,255,255,255,
    255,255,255,255,255,255,255,255,255,255,255,255,255,
};
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
/**
 * Beta threshold lookup for the deblocking filter.
 *
 * Laid out like alpha_table: 52 padding entries holding the lowest value,
 * the 52 real thresholds, then 52 padding entries holding the highest
 * value, so that qp + slice offset may fall outside 0..51 once 52 is added.
 */
static const uint8_t beta_table[52*3] = {
    /* lower padding: 52 entries, sum below 0 */
    0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,
    0,0,0,0,0,0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,0,0,0,0,0,
    /* sum 0..15: filtering disabled */
    0,0,0,0,0,0,0,0, 0,0,0,0,0,0,0,0,
    /* sum 16..27 */
     2,  2,  2,  3,  3,  3,  3,  4,  4,  4,  6,  6,
    /* sum 28..39 */
     7,  7,  8,  8,  9,  9, 10, 10, 11, 11, 12, 12,
    /* sum 40..51 */
    13, 13, 14, 14, 15, 15, 16, 16, 17, 17, 18, 18,
    /* upper padding: 52 entries, sum above 51 */
    18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18,
    18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18,
    18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18,
    18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18, 18,
};
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
/**
 * tc0 clipping values, indexed as tc0_table[52 + qp + offset][bS].
 *
 * Column 0 holds -1, which is stored as 255 in a uint8_t. The first and
 * last 52 rows are padding that repeats the lowest and highest row.
 */
static const uint8_t tc0_table[52*3][4] = {
    /* lower padding: 52 rows */
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    /* sum 0..15 */
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 }, {-1, 0, 0, 0 },
    /* sum 16..31 */
    {-1, 0, 0, 0 }, {-1, 0, 0, 1 }, {-1, 0, 0, 1 }, {-1, 0, 0, 1 },
    {-1, 0, 0, 1 }, {-1, 0, 1, 1 }, {-1, 0, 1, 1 }, {-1, 1, 1, 1 },
    {-1, 1, 1, 1 }, {-1, 1, 1, 1 }, {-1, 1, 1, 1 }, {-1, 1, 1, 2 },
    {-1, 1, 1, 2 }, {-1, 1, 1, 2 }, {-1, 1, 1, 2 }, {-1, 1, 2, 3 },
    /* sum 32..47 */
    {-1, 1, 2, 3 }, {-1, 2, 2, 3 }, {-1, 2, 2, 4 }, {-1, 2, 3, 4 },
    {-1, 2, 3, 4 }, {-1, 3, 3, 5 }, {-1, 3, 4, 6 }, {-1, 3, 4, 6 },
    {-1, 4, 5, 7 }, {-1, 4, 5, 8 }, {-1, 4, 6, 9 }, {-1, 5, 7,10 },
    {-1, 6, 8,11 }, {-1, 6, 8,13 }, {-1, 7,10,14 }, {-1, 8,11,16 },
    /* sum 48..51 */
    {-1, 9,12,18 }, {-1,10,13,20 }, {-1,11,15,23 }, {-1,13,17,25 },
    /* upper padding: 52 rows */
    {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 },
    {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 },
    {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 },
    {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 },
    {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 },
    {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 },
    {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 },
    {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 },
    {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 },
    {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 },
    {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 },
    {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 },
    {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 }, {-1,13,17,25 },
};
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
101
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
102 static void av_noinline filter_mb_edgev( uint8_t *pix, int stride, int16_t bS[4], unsigned int qp, H264Context *h) {
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
103 const unsigned int index_a = 52 + qp + h->slice_alpha_c0_offset;
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
104 const int alpha = alpha_table[index_a];
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
105 const int beta = (beta_table+52)[qp + h->slice_beta_offset];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
106 if (alpha ==0 || beta == 0) return;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
107
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
108 if( bS[0] < 4 ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
109 int8_t tc[4];
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
110 tc[0] = tc0_table[index_a][bS[0]];
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
111 tc[1] = tc0_table[index_a][bS[1]];
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
112 tc[2] = tc0_table[index_a][bS[2]];
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
113 tc[3] = tc0_table[index_a][bS[3]];
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
114 h->s.dsp.h264_h_loop_filter_luma(pix, stride, alpha, beta, tc);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
115 } else {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
116 h->s.dsp.h264_h_loop_filter_luma_intra(pix, stride, alpha, beta);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
117 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
118 }
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
119 static void av_noinline filter_mb_edgecv( uint8_t *pix, int stride, int16_t bS[4], unsigned int qp, H264Context *h ) {
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
120 const unsigned int index_a = 52 + qp + h->slice_alpha_c0_offset;
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
121 const int alpha = alpha_table[index_a];
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
122 const int beta = (beta_table+52)[qp + h->slice_beta_offset];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
123 if (alpha ==0 || beta == 0) return;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
124
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
125 if( bS[0] < 4 ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
126 int8_t tc[4];
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
127 tc[0] = tc0_table[index_a][bS[0]]+1;
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
128 tc[1] = tc0_table[index_a][bS[1]]+1;
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
129 tc[2] = tc0_table[index_a][bS[2]]+1;
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
130 tc[3] = tc0_table[index_a][bS[3]]+1;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
131 h->s.dsp.h264_h_loop_filter_chroma(pix, stride, alpha, beta, tc);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
132 } else {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
133 h->s.dsp.h264_h_loop_filter_chroma_intra(pix, stride, alpha, beta);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
134 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
135 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
136
10924
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
137 static void filter_mb_mbaff_edgev( H264Context *h, uint8_t *pix, int stride, int16_t bS[4], int bsi, int qp ) {
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
138 int i;
10924
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
139 for( i = 0; i < 8; i++, pix += stride) {
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
140 int index_a;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
141 int alpha;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
142 int beta;
10924
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
143 const int bS_index = (i >> 1) * bsi;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
144
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
145 if( bS[bS_index] == 0 ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
146 continue;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
147 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
148
10924
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
149 index_a = qp + h->slice_alpha_c0_offset;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
150 alpha = (alpha_table+52)[index_a];
10924
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
151 beta = (beta_table+52)[qp + h->slice_beta_offset];
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
152
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
153 if( bS[bS_index] < 4 ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
154 const int tc0 = (tc0_table+52)[index_a][bS[bS_index]];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
155 const int p0 = pix[-1];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
156 const int p1 = pix[-2];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
157 const int p2 = pix[-3];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
158 const int q0 = pix[0];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
159 const int q1 = pix[1];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
160 const int q2 = pix[2];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
161
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
162 if( FFABS( p0 - q0 ) < alpha &&
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
163 FFABS( p1 - p0 ) < beta &&
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
164 FFABS( q1 - q0 ) < beta ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
165 int tc = tc0;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
166 int i_delta;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
167
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
168 if( FFABS( p2 - p0 ) < beta ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
169 pix[-2] = p1 + av_clip( ( p2 + ( ( p0 + q0 + 1 ) >> 1 ) - ( p1 << 1 ) ) >> 1, -tc0, tc0 );
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
170 tc++;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
171 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
172 if( FFABS( q2 - q0 ) < beta ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
173 pix[1] = q1 + av_clip( ( q2 + ( ( p0 + q0 + 1 ) >> 1 ) - ( q1 << 1 ) ) >> 1, -tc0, tc0 );
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
174 tc++;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
175 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
176
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
177 i_delta = av_clip( (((q0 - p0 ) << 2) + (p1 - q1) + 4) >> 3, -tc, tc );
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
178 pix[-1] = av_clip_uint8( p0 + i_delta ); /* p0' */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
179 pix[0] = av_clip_uint8( q0 - i_delta ); /* q0' */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
180 tprintf(h->s.avctx, "filter_mb_mbaff_edgev i:%d, qp:%d, indexA:%d, alpha:%d, beta:%d, tc:%d\n# bS:%d -> [%02x, %02x, %02x, %02x, %02x, %02x] =>[%02x, %02x, %02x, %02x]\n", i, qp[qp_index], index_a, alpha, beta, tc, bS[bS_index], pix[-3], p1, p0, q0, q1, pix[2], p1, pix[-1], pix[0], q1);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
181 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
182 }else{
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
183 const int p0 = pix[-1];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
184 const int p1 = pix[-2];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
185 const int p2 = pix[-3];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
186
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
187 const int q0 = pix[0];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
188 const int q1 = pix[1];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
189 const int q2 = pix[2];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
190
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
191 if( FFABS( p0 - q0 ) < alpha &&
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
192 FFABS( p1 - p0 ) < beta &&
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
193 FFABS( q1 - q0 ) < beta ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
194
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
195 if(FFABS( p0 - q0 ) < (( alpha >> 2 ) + 2 )){
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
196 if( FFABS( p2 - p0 ) < beta)
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
197 {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
198 const int p3 = pix[-4];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
199 /* p0', p1', p2' */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
200 pix[-1] = ( p2 + 2*p1 + 2*p0 + 2*q0 + q1 + 4 ) >> 3;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
201 pix[-2] = ( p2 + p1 + p0 + q0 + 2 ) >> 2;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
202 pix[-3] = ( 2*p3 + 3*p2 + p1 + p0 + q0 + 4 ) >> 3;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
203 } else {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
204 /* p0' */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
205 pix[-1] = ( 2*p1 + p0 + q1 + 2 ) >> 2;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
206 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
207 if( FFABS( q2 - q0 ) < beta)
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
208 {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
209 const int q3 = pix[3];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
210 /* q0', q1', q2' */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
211 pix[0] = ( p1 + 2*p0 + 2*q0 + 2*q1 + q2 + 4 ) >> 3;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
212 pix[1] = ( p0 + q0 + q1 + q2 + 2 ) >> 2;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
213 pix[2] = ( 2*q3 + 3*q2 + q1 + q0 + p0 + 4 ) >> 3;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
214 } else {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
215 /* q0' */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
216 pix[0] = ( 2*q1 + q0 + p1 + 2 ) >> 2;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
217 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
218 }else{
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
219 /* p0', q0' */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
220 pix[-1] = ( 2*p1 + p0 + q1 + 2 ) >> 2;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
221 pix[ 0] = ( 2*q1 + q0 + p1 + 2 ) >> 2;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
222 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
223 tprintf(h->s.avctx, "filter_mb_mbaff_edgev i:%d, qp:%d, indexA:%d, alpha:%d, beta:%d\n# bS:4 -> [%02x, %02x, %02x, %02x, %02x, %02x] =>[%02x, %02x, %02x, %02x, %02x, %02x]\n", i, qp[qp_index], index_a, alpha, beta, p2, p1, p0, q0, q1, q2, pix[-3], pix[-2], pix[-1], pix[0], pix[1], pix[2]);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
224 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
225 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
226 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
227 }
10924
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
228 static void filter_mb_mbaff_edgecv( H264Context *h, uint8_t *pix, int stride, int16_t bS[4], int bsi, int qp ) {
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
229 int i;
10924
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
230 for( i = 0; i < 4; i++, pix += stride) {
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
231 int index_a;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
232 int alpha;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
233 int beta;
10924
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
234 const int bS_index = i*bsi;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
235
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
236 if( bS[bS_index] == 0 ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
237 continue;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
238 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
239
10924
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
240 index_a = qp + h->slice_alpha_c0_offset;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
241 alpha = (alpha_table+52)[index_a];
10924
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
242 beta = (beta_table+52)[qp + h->slice_beta_offset];
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
243
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
244 if( bS[bS_index] < 4 ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
245 const int tc = (tc0_table+52)[index_a][bS[bS_index]] + 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
246 const int p0 = pix[-1];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
247 const int p1 = pix[-2];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
248 const int q0 = pix[0];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
249 const int q1 = pix[1];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
250
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
251 if( FFABS( p0 - q0 ) < alpha &&
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
252 FFABS( p1 - p0 ) < beta &&
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
253 FFABS( q1 - q0 ) < beta ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
254 const int i_delta = av_clip( (((q0 - p0 ) << 2) + (p1 - q1) + 4) >> 3, -tc, tc );
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
255
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
256 pix[-1] = av_clip_uint8( p0 + i_delta ); /* p0' */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
257 pix[0] = av_clip_uint8( q0 - i_delta ); /* q0' */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
258 tprintf(h->s.avctx, "filter_mb_mbaff_edgecv i:%d, qp:%d, indexA:%d, alpha:%d, beta:%d, tc:%d\n# bS:%d -> [%02x, %02x, %02x, %02x, %02x, %02x] =>[%02x, %02x, %02x, %02x]\n", i, qp[qp_index], index_a, alpha, beta, tc, bS[bS_index], pix[-3], p1, p0, q0, q1, pix[2], p1, pix[-1], pix[0], q1);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
259 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
260 }else{
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
261 const int p0 = pix[-1];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
262 const int p1 = pix[-2];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
263 const int q0 = pix[0];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
264 const int q1 = pix[1];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
265
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
266 if( FFABS( p0 - q0 ) < alpha &&
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
267 FFABS( p1 - p0 ) < beta &&
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
268 FFABS( q1 - q0 ) < beta ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
269
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
270 pix[-1] = ( 2*p1 + p0 + q1 + 2 ) >> 2; /* p0' */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
271 pix[0] = ( 2*q1 + q0 + p1 + 2 ) >> 2; /* q0' */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
272 tprintf(h->s.avctx, "filter_mb_mbaff_edgecv i:%d\n# bS:4 -> [%02x, %02x, %02x, %02x, %02x, %02x] =>[%02x, %02x, %02x, %02x, %02x, %02x]\n", i, pix[-3], p1, p0, q0, q1, pix[2], pix[-3], pix[-2], pix[-1], pix[0], pix[1], pix[2]);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
273 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
274 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
275 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
276 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
277
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
278 static void av_noinline filter_mb_edgeh( uint8_t *pix, int stride, int16_t bS[4], unsigned int qp, H264Context *h ) {
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
279 const unsigned int index_a = 52 + qp + h->slice_alpha_c0_offset;
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
280 const int alpha = alpha_table[index_a];
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
281 const int beta = (beta_table+52)[qp + h->slice_beta_offset];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
282 if (alpha ==0 || beta == 0) return;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
283
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
284 if( bS[0] < 4 ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
285 int8_t tc[4];
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
286 tc[0] = tc0_table[index_a][bS[0]];
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
287 tc[1] = tc0_table[index_a][bS[1]];
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
288 tc[2] = tc0_table[index_a][bS[2]];
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
289 tc[3] = tc0_table[index_a][bS[3]];
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
290 h->s.dsp.h264_v_loop_filter_luma(pix, stride, alpha, beta, tc);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
291 } else {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
292 h->s.dsp.h264_v_loop_filter_luma_intra(pix, stride, alpha, beta);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
293 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
294 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
295
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
296 static void av_noinline filter_mb_edgech( uint8_t *pix, int stride, int16_t bS[4], unsigned int qp, H264Context *h ) {
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
297 const unsigned int index_a = 52 + qp + h->slice_alpha_c0_offset;
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
298 const int alpha = alpha_table[index_a];
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
299 const int beta = (beta_table+52)[qp + h->slice_beta_offset];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
300 if (alpha ==0 || beta == 0) return;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
301
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
302 if( bS[0] < 4 ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
303 int8_t tc[4];
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
304 tc[0] = tc0_table[index_a][bS[0]]+1;
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
305 tc[1] = tc0_table[index_a][bS[1]]+1;
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
306 tc[2] = tc0_table[index_a][bS[2]]+1;
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
307 tc[3] = tc0_table[index_a][bS[3]]+1;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
308 h->s.dsp.h264_v_loop_filter_chroma(pix, stride, alpha, beta, tc);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
309 } else {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
310 h->s.dsp.h264_v_loop_filter_chroma_intra(pix, stride, alpha, beta);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
311 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
312 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
313
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
314 void ff_h264_filter_mb_fast( H264Context *h, int mb_x, int mb_y, uint8_t *img_y, uint8_t *img_cb, uint8_t *img_cr, unsigned int linesize, unsigned int uvlinesize) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
315 MpegEncContext * const s = &h->s;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
316 int mb_y_firstrow = s->picture_structure == PICT_BOTTOM_FIELD;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
317 int mb_xy, mb_type;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
318 int qp, qp0, qp1, qpc, qpc0, qpc1, qp_thresh;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
319
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
320 mb_xy = h->mb_xy;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
321
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
322 if(mb_x==0 || mb_y==mb_y_firstrow || !s->dsp.h264_loop_filter_strength || h->pps.chroma_qp_diff ||
10922
8945125b5ae6 Use h->slice_num where possible.
michael
parents: 10921
diff changeset
323 (h->deblocking_filter == 2 && (h->slice_num != h->slice_table[h->top_mb_xy] ||
8945125b5ae6 Use h->slice_num where possible.
michael
parents: 10921
diff changeset
324 h->slice_num != h->slice_table[mb_xy - 1]))) {
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
325 ff_h264_filter_mb(h, mb_x, mb_y, img_y, img_cb, img_cr, linesize, uvlinesize);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
326 return;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
327 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
328 assert(!FRAME_MBAFF);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
329
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
330 mb_type = s->current_picture.mb_type[mb_xy];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
331 qp = s->current_picture.qscale_table[mb_xy];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
332 qp0 = s->current_picture.qscale_table[mb_xy-1];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
333 qp1 = s->current_picture.qscale_table[h->top_mb_xy];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
334 qpc = get_chroma_qp( h, 0, qp );
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
335 qpc0 = get_chroma_qp( h, 0, qp0 );
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
336 qpc1 = get_chroma_qp( h, 0, qp1 );
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
337 qp0 = (qp + qp0 + 1) >> 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
338 qp1 = (qp + qp1 + 1) >> 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
339 qpc0 = (qpc + qpc0 + 1) >> 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
340 qpc1 = (qpc + qpc1 + 1) >> 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
341 qp_thresh = 15 - h->slice_alpha_c0_offset;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
342 if(qp <= qp_thresh && qp0 <= qp_thresh && qp1 <= qp_thresh &&
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
343 qpc <= qp_thresh && qpc0 <= qp_thresh && qpc1 <= qp_thresh)
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
344 return;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
345
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
346 if( IS_INTRA(mb_type) ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
347 int16_t bS4[4] = {4,4,4,4};
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
348 int16_t bS3[4] = {3,3,3,3};
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
349 int16_t *bSH = FIELD_PICTURE ? bS3 : bS4;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
350 if( IS_8x8DCT(mb_type) ) {
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
351 filter_mb_edgev( &img_y[4*0], linesize, bS4, qp0, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
352 filter_mb_edgev( &img_y[4*2], linesize, bS3, qp, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
353 filter_mb_edgeh( &img_y[4*0*linesize], linesize, bSH, qp1, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
354 filter_mb_edgeh( &img_y[4*2*linesize], linesize, bS3, qp, h);
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
355 } else {
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
356 filter_mb_edgev( &img_y[4*0], linesize, bS4, qp0, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
357 filter_mb_edgev( &img_y[4*1], linesize, bS3, qp, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
358 filter_mb_edgev( &img_y[4*2], linesize, bS3, qp, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
359 filter_mb_edgev( &img_y[4*3], linesize, bS3, qp, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
360 filter_mb_edgeh( &img_y[4*0*linesize], linesize, bSH, qp1, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
361 filter_mb_edgeh( &img_y[4*1*linesize], linesize, bS3, qp, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
362 filter_mb_edgeh( &img_y[4*2*linesize], linesize, bS3, qp, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
363 filter_mb_edgeh( &img_y[4*3*linesize], linesize, bS3, qp, h);
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
364 }
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
365 filter_mb_edgecv( &img_cb[2*0], uvlinesize, bS4, qpc0, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
366 filter_mb_edgecv( &img_cb[2*2], uvlinesize, bS3, qpc, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
367 filter_mb_edgecv( &img_cr[2*0], uvlinesize, bS4, qpc0, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
368 filter_mb_edgecv( &img_cr[2*2], uvlinesize, bS3, qpc, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
369 filter_mb_edgech( &img_cb[2*0*uvlinesize], uvlinesize, bSH, qpc1, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
370 filter_mb_edgech( &img_cb[2*2*uvlinesize], uvlinesize, bS3, qpc, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
371 filter_mb_edgech( &img_cr[2*0*uvlinesize], uvlinesize, bSH, qpc1, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
372 filter_mb_edgech( &img_cr[2*2*uvlinesize], uvlinesize, bS3, qpc, h);
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
373 return;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
374 } else {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
375 DECLARE_ALIGNED_8(int16_t, bS[2][4][4]);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
376 uint64_t (*bSv)[4] = (uint64_t(*)[4])bS;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
377 int edges;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
378 if( IS_8x8DCT(mb_type) && (h->cbp&7) == 7 ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
379 edges = 4;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
380 bSv[0][0] = bSv[0][2] = bSv[1][0] = bSv[1][2] = 0x0002000200020002ULL;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
381 } else {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
382 int mask_edge1 = (mb_type & (MB_TYPE_16x16 | MB_TYPE_8x16)) ? 3 :
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
383 (mb_type & MB_TYPE_16x8) ? 1 : 0;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
384 int mask_edge0 = (mb_type & (MB_TYPE_16x16 | MB_TYPE_8x16))
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
385 && (s->current_picture.mb_type[mb_xy-1] & (MB_TYPE_16x16 | MB_TYPE_8x16))
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
386 ? 3 : 0;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
387 int step = IS_8x8DCT(mb_type) ? 2 : 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
388 edges = (mb_type & MB_TYPE_16x16) && !(h->cbp & 15) ? 1 : 4;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
389 s->dsp.h264_loop_filter_strength( bS, h->non_zero_count_cache, h->ref_cache, h->mv_cache,
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
390 (h->slice_type_nos == FF_B_TYPE), edges, step, mask_edge0, mask_edge1, FIELD_PICTURE);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
391 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
392 if( IS_INTRA(s->current_picture.mb_type[mb_xy-1]) )
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
393 bSv[0][0] = 0x0004000400040004ULL;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
394 if( IS_INTRA(s->current_picture.mb_type[h->top_mb_xy]) )
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
395 bSv[1][0] = FIELD_PICTURE ? 0x0003000300030003ULL : 0x0004000400040004ULL;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
396
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
397 #define FILTER(hv,dir,edge)\
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
398 if(bSv[dir][edge]) {\
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
399 filter_mb_edge##hv( &img_y[4*edge*(dir?linesize:1)], linesize, bS[dir][edge], edge ? qp : qp##dir, h );\
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
400 if(!(edge&1)) {\
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
401 filter_mb_edgec##hv( &img_cb[2*edge*(dir?uvlinesize:1)], uvlinesize, bS[dir][edge], edge ? qpc : qpc##dir, h );\
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
402 filter_mb_edgec##hv( &img_cr[2*edge*(dir?uvlinesize:1)], uvlinesize, bS[dir][edge], edge ? qpc : qpc##dir, h );\
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
403 }\
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
404 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
405 if( edges == 1 ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
406 FILTER(v,0,0);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
407 FILTER(h,1,0);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
408 } else if( IS_8x8DCT(mb_type) ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
409 FILTER(v,0,0);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
410 FILTER(v,0,2);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
411 FILTER(h,1,0);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
412 FILTER(h,1,2);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
413 } else {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
414 FILTER(v,0,0);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
415 FILTER(v,0,1);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
416 FILTER(v,0,2);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
417 FILTER(v,0,3);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
418 FILTER(h,1,0);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
419 FILTER(h,1,1);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
420 FILTER(h,1,2);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
421 FILTER(h,1,3);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
422 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
423 #undef FILTER
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
424 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
425 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
426
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
427
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
428 static av_always_inline void filter_mb_dir(H264Context *h, int mb_x, int mb_y, uint8_t *img_y, uint8_t *img_cb, uint8_t *img_cr, unsigned int linesize, unsigned int uvlinesize, int mb_xy, int mb_type, int mvy_limit, int first_vertical_edge_done, int dir) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
429 MpegEncContext * const s = &h->s;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
430 int edge;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
431 const int mbm_xy = dir == 0 ? mb_xy -1 : h->top_mb_xy;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
432 const int mbm_type = s->current_picture.mb_type[mbm_xy];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
433
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
434 const int edges = (mb_type & (MB_TYPE_16x16|MB_TYPE_SKIP))
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
435 == (MB_TYPE_16x16|MB_TYPE_SKIP) ? 1 : 4;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
436 // how often to recheck mv-based bS when iterating between edges
10958
304db572a69a Make calculation of mask_edge free of branches, faster of course but probably
michael
parents: 10950
diff changeset
437 static const uint8_t mask_edge_tab[2][8]={{0,3,3,3,1,1,1,1},
304db572a69a Make calculation of mask_edge free of branches, faster of course but probably
michael
parents: 10950
diff changeset
438 {0,3,1,1,3,3,3,3}};
304db572a69a Make calculation of mask_edge free of branches, faster of course but probably
michael
parents: 10950
diff changeset
439 const int mask_edge = mask_edge_tab[dir][(mb_type>>3)&7];
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
440 // how often to recheck mv-based bS when iterating along each edge
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
441 const int mask_par0 = mb_type & (MB_TYPE_16x16 | (MB_TYPE_8x16 >> dir));
10942
ee944149442f Sightly simplify initialization of int start.
michael
parents: 10939
diff changeset
442 int start = h->slice_table[mbm_xy] == 0xFFFF
ee944149442f Sightly simplify initialization of int start.
michael
parents: 10939
diff changeset
443 || first_vertical_edge_done
ee944149442f Sightly simplify initialization of int start.
michael
parents: 10939
diff changeset
444 || (h->deblocking_filter==2 && h->slice_table[mbm_xy] != h->slice_num);
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
445
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
446
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
447 if (FRAME_MBAFF && (dir == 1) && ((mb_y&1) == 0) && start == 0
10946
5a23fa01dec1 Merge multiple IS_* macro uses where possible.
michael
parents: 10945
diff changeset
448 && IS_INTERLACED(mbm_type&~mb_type)
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
449 ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
450 // This is a special case in the norm where the filtering must
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
451 // be done twice (one each of the field) even if we are in a
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
452 // frame macroblock.
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
453 //
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
454 unsigned int tmp_linesize = 2 * linesize;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
455 unsigned int tmp_uvlinesize = 2 * uvlinesize;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
456 int mbn_xy = mb_xy - 2 * s->mb_stride;
10949
4c9b8e3065ee Simplify/Optimize another of the mbaff loop filter cases.
michael
parents: 10948
diff changeset
457 int j;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
458
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
459 for(j=0; j<2; j++, mbn_xy += s->mb_stride){
10950
4776a56132e1 H.264: Declare bS with DECLARE_ALIGNED_8 for uint64_t casts.
astrange
parents: 10949
diff changeset
460 DECLARE_ALIGNED_8(int16_t, bS[4]);
10949
4c9b8e3065ee Simplify/Optimize another of the mbaff loop filter cases.
michael
parents: 10948
diff changeset
461 int qp;
10946
5a23fa01dec1 Merge multiple IS_* macro uses where possible.
michael
parents: 10945
diff changeset
462 if( IS_INTRA(mb_type|s->current_picture.mb_type[mbn_xy]) ) {
10947
df6bda2aa59a Set bS with 64bits at a time.
michael
parents: 10946
diff changeset
463 *(uint64_t*)bS= 0x0003000300030003ULL;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
464 } else {
10949
4c9b8e3065ee Simplify/Optimize another of the mbaff loop filter cases.
michael
parents: 10948
diff changeset
465 const uint8_t *mbn_nnz = h->non_zero_count[mbn_xy] + 4+3*8;
4c9b8e3065ee Simplify/Optimize another of the mbaff loop filter cases.
michael
parents: 10948
diff changeset
466 int i;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
467 for( i = 0; i < 4; i++ ) {
10949
4c9b8e3065ee Simplify/Optimize another of the mbaff loop filter cases.
michael
parents: 10948
diff changeset
468 bS[i] = 1 + !!(h->non_zero_count_cache[scan8[0]+i] | mbn_nnz[i]);
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
469 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
470 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
471 // Do not use s->qscale as luma quantizer because it has not the same
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
472 // value in IPCM macroblocks.
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
473 qp = ( s->current_picture.qscale_table[mb_xy] + s->current_picture.qscale_table[mbn_xy] + 1 ) >> 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
474 tprintf(s->avctx, "filter mb:%d/%d dir:%d edge:%d, QPy:%d ls:%d uvls:%d", mb_x, mb_y, dir, edge, qp, tmp_linesize, tmp_uvlinesize);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
475 { int i; for (i = 0; i < 4; i++) tprintf(s->avctx, " bS[%d]:%d", i, bS[i]); tprintf(s->avctx, "\n"); }
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
476 filter_mb_edgeh( &img_y[j*linesize], tmp_linesize, bS, qp, h );
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
477 filter_mb_edgech( &img_cb[j*uvlinesize], tmp_uvlinesize, bS,
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
478 ( h->chroma_qp[0] + get_chroma_qp( h, 0, s->current_picture.qscale_table[mbn_xy] ) + 1 ) >> 1, h);
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
479 filter_mb_edgech( &img_cr[j*uvlinesize], tmp_uvlinesize, bS,
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
480 ( h->chroma_qp[1] + get_chroma_qp( h, 1, s->current_picture.qscale_table[mbn_xy] ) + 1 ) >> 1, h);
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
481 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
482
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
483 start = 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
484 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
485
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
486 /* Calculate bS */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
487 for( edge = start; edge < edges; edge++ ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
488 /* mbn_xy: neighbor macroblock */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
489 const int mbn_xy = edge > 0 ? mb_xy : mbm_xy;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
490 const int mbn_type = s->current_picture.mb_type[mbn_xy];
10950
4776a56132e1 H.264: Declare bS with DECLARE_ALIGNED_8 for uint64_t casts.
astrange
parents: 10949
diff changeset
491 DECLARE_ALIGNED_8(int16_t, bS[4]);
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
492 int qp;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
493
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
494 if( (edge&1) && IS_8x8DCT(mb_type) )
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
495 continue;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
496
10945
0d93bbc17950 Simplify and optimize intra code in h264_loopfilter.c
michael
parents: 10942
diff changeset
497 if( IS_INTRA(mb_type|mbn_type)) {
0d93bbc17950 Simplify and optimize intra code in h264_loopfilter.c
michael
parents: 10942
diff changeset
498 *(uint64_t*)bS= 0x0003000300030003ULL;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
499 if (edge == 0) {
10945
0d93bbc17950 Simplify and optimize intra code in h264_loopfilter.c
michael
parents: 10942
diff changeset
500 if ( (!IS_INTERLACED(mb_type|mbm_type))
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
501 || ((FRAME_MBAFF || (s->picture_structure != PICT_FRAME)) && (dir == 0))
10945
0d93bbc17950 Simplify and optimize intra code in h264_loopfilter.c
michael
parents: 10942
diff changeset
502 )
0d93bbc17950 Simplify and optimize intra code in h264_loopfilter.c
michael
parents: 10942
diff changeset
503 *(uint64_t*)bS= 0x0004000400040004ULL;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
504 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
505 } else {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
506 int i, l;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
507 int mv_done;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
508
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
509 if( edge & mask_edge ) {
10947
df6bda2aa59a Set bS with 64bits at a time.
michael
parents: 10946
diff changeset
510 *(uint64_t*)bS= 0;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
511 mv_done = 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
512 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
513 else if( FRAME_MBAFF && IS_INTERLACED(mb_type ^ mbn_type)) {
10947
df6bda2aa59a Set bS with 64bits at a time.
michael
parents: 10946
diff changeset
514 *(uint64_t*)bS= 0x0001000100010001ULL;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
515 mv_done = 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
516 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
517 else if( mask_par0 && (edge || (mbn_type & (MB_TYPE_16x16 | (MB_TYPE_8x16 >> dir)))) ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
518 int b_idx= 8 + 4 + edge * (dir ? 8:1);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
519 int bn_idx= b_idx - (dir ? 8:1);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
520 int v = 0;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
521
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
522 for( l = 0; !v && l < 1 + (h->slice_type_nos == FF_B_TYPE); l++ ) {
10913
497929e9d912 Perform reference remapping at fill_cache() time instead of in the
michael
parents: 10910
diff changeset
523 v |= h->ref_cache[l][b_idx] != h->ref_cache[l][bn_idx] |
10901
2a5c3d89201d Another microopt, 4 cpu cycles for avoidance of FFABS().
michael
parents: 10899
diff changeset
524 h->mv_cache[l][b_idx][0] - h->mv_cache[l][bn_idx][0] + 3 >= 7U |
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
525 FFABS( h->mv_cache[l][b_idx][1] - h->mv_cache[l][bn_idx][1] ) >= mvy_limit;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
526 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
527
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
528 if(h->slice_type_nos == FF_B_TYPE && v){
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
529 v=0;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
530 for( l = 0; !v && l < 2; l++ ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
531 int ln= 1-l;
10913
497929e9d912 Perform reference remapping at fill_cache() time instead of in the
michael
parents: 10910
diff changeset
532 v |= h->ref_cache[l][b_idx] != h->ref_cache[ln][bn_idx] |
10901
2a5c3d89201d Another microopt, 4 cpu cycles for avoidance of FFABS().
michael
parents: 10899
diff changeset
533 h->mv_cache[l][b_idx][0] - h->mv_cache[ln][bn_idx][0] + 3 >= 7U |
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
534 FFABS( h->mv_cache[l][b_idx][1] - h->mv_cache[ln][bn_idx][1] ) >= mvy_limit;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
535 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
536 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
537
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
538 bS[0] = bS[1] = bS[2] = bS[3] = v;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
539 mv_done = 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
540 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
541 else
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
542 mv_done = 0;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
543
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
544 for( i = 0; i < 4; i++ ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
545 int x = dir == 0 ? edge : i;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
546 int y = dir == 0 ? i : edge;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
547 int b_idx= 8 + 4 + x + 8*y;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
548 int bn_idx= b_idx - (dir ? 8:1);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
549
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
550 if( h->non_zero_count_cache[b_idx] |
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
551 h->non_zero_count_cache[bn_idx] ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
552 bS[i] = 2;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
553 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
554 else if(!mv_done)
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
555 {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
556 bS[i] = 0;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
557 for( l = 0; l < 1 + (h->slice_type_nos == FF_B_TYPE); l++ ) {
10913
497929e9d912 Perform reference remapping at fill_cache() time instead of in the
michael
parents: 10910
diff changeset
558 if( h->ref_cache[l][b_idx] != h->ref_cache[l][bn_idx] |
10902
1e41e6ab9a18 Apply last 2 optimizations to similar code i forgot.
michael
parents: 10901
diff changeset
559 h->mv_cache[l][b_idx][0] - h->mv_cache[l][bn_idx][0] + 3 >= 7U |
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
560 FFABS( h->mv_cache[l][b_idx][1] - h->mv_cache[l][bn_idx][1] ) >= mvy_limit ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
561 bS[i] = 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
562 break;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
563 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
564 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
565
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
566 if(h->slice_type_nos == FF_B_TYPE && bS[i]){
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
567 bS[i] = 0;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
568 for( l = 0; l < 2; l++ ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
569 int ln= 1-l;
10913
497929e9d912 Perform reference remapping at fill_cache() time instead of in the
michael
parents: 10910
diff changeset
570 if( h->ref_cache[l][b_idx] != h->ref_cache[ln][bn_idx] |
10902
1e41e6ab9a18 Apply last 2 optimizations to similar code i forgot.
michael
parents: 10901
diff changeset
571 h->mv_cache[l][b_idx][0] - h->mv_cache[ln][bn_idx][0] + 3 >= 7U |
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
572 FFABS( h->mv_cache[l][b_idx][1] - h->mv_cache[ln][bn_idx][1] ) >= mvy_limit ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
573 bS[i] = 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
574 break;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
575 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
576 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
577 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
578 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
579 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
580
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
581 if(bS[0]+bS[1]+bS[2]+bS[3] == 0)
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
582 continue;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
583 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
584
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
585 /* Filter edge */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
586 // Do not use s->qscale as luma quantizer because it has not the same
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
587 // value in IPCM macroblocks.
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
588 qp = ( s->current_picture.qscale_table[mb_xy] + s->current_picture.qscale_table[mbn_xy] + 1 ) >> 1;
10906
1b5fba731e24 Rearchitecturing the stiched up goose part 1
michael
parents: 10904
diff changeset
589 //tprintf(s->avctx, "filter mb:%d/%d dir:%d edge:%d, QPy:%d, QPc:%d, QPcn:%d\n", mb_x, mb_y, dir, edge, qp, h->chroma_qp[0], s->current_picture.qscale_table[mbn_xy]);
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
590 tprintf(s->avctx, "filter mb:%d/%d dir:%d edge:%d, QPy:%d ls:%d uvls:%d", mb_x, mb_y, dir, edge, qp, linesize, uvlinesize);
10904
b30aef0c693f Comment for() ; out
michael
parents: 10903
diff changeset
591 //{ int i; for (i = 0; i < 4; i++) tprintf(s->avctx, " bS[%d]:%d", i, bS[i]); tprintf(s->avctx, "\n"); }
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
592 if( dir == 0 ) {
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
593 filter_mb_edgev( &img_y[4*edge], linesize, bS, qp, h );
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
594 if( (edge&1) == 0 ) {
10948
c80f0dfbf47d Only calculate the second chroma qp if it differs from the firstin the main
michael
parents: 10947
diff changeset
595 int qp= ( h->chroma_qp[0] + get_chroma_qp( h, 0, s->current_picture.qscale_table[mbn_xy] ) + 1 ) >> 1;
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
596 filter_mb_edgecv( &img_cb[2*edge], uvlinesize, bS, qp, h);
10948
c80f0dfbf47d Only calculate the second chroma qp if it differs from the firstin the main
michael
parents: 10947
diff changeset
597 if(h->pps.chroma_qp_diff)
c80f0dfbf47d Only calculate the second chroma qp if it differs from the firstin the main
michael
parents: 10947
diff changeset
598 qp= ( h->chroma_qp[1] + get_chroma_qp( h, 1, s->current_picture.qscale_table[mbn_xy] ) + 1 ) >> 1;
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
599 filter_mb_edgecv( &img_cr[2*edge], uvlinesize, bS, qp, h);
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
600 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
601 } else {
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
602 filter_mb_edgeh( &img_y[4*edge*linesize], linesize, bS, qp, h );
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
603 if( (edge&1) == 0 ) {
10948
c80f0dfbf47d Only calculate the second chroma qp if it differs from the firstin the main
michael
parents: 10947
diff changeset
604 int qp= ( h->chroma_qp[0] + get_chroma_qp( h, 0, s->current_picture.qscale_table[mbn_xy] ) + 1 ) >> 1;
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
605 filter_mb_edgech( &img_cb[2*edge*uvlinesize], uvlinesize, bS, qp, h);
10948
c80f0dfbf47d Only calculate the second chroma qp if it differs from the firstin the main
michael
parents: 10947
diff changeset
606 if(h->pps.chroma_qp_diff)
c80f0dfbf47d Only calculate the second chroma qp if it differs from the firstin the main
michael
parents: 10947
diff changeset
607 qp= ( h->chroma_qp[1] + get_chroma_qp( h, 1, s->current_picture.qscale_table[mbn_xy] ) + 1 ) >> 1;
10960
10759fd39860 Gcc idiocy fixes related to filter_mb_edge*.
michael
parents: 10958
diff changeset
608 filter_mb_edgech( &img_cr[2*edge*uvlinesize], uvlinesize, bS, qp, h);
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
609 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
610 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
611 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
612 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
613
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
614 void ff_h264_filter_mb( H264Context *h, int mb_x, int mb_y, uint8_t *img_y, uint8_t *img_cb, uint8_t *img_cr, unsigned int linesize, unsigned int uvlinesize) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
615 MpegEncContext * const s = &h->s;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
616 const int mb_xy= mb_x + mb_y*s->mb_stride;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
617 const int mb_type = s->current_picture.mb_type[mb_xy];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
618 const int mvy_limit = IS_INTERLACED(mb_type) ? 2 : 4;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
619 int first_vertical_edge_done = 0;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
620 av_unused int dir;
10906
1b5fba731e24 Rearchitecturing the stiched up goose part 1
michael
parents: 10904
diff changeset
621 int list;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
622
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
623 if (FRAME_MBAFF
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
624 // left mb is in picture
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
625 && h->slice_table[mb_xy-1] != 0xFFFF
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
626 // and current and left pair do not have the same interlaced type
10946
5a23fa01dec1 Merge multiple IS_* macro uses where possible.
michael
parents: 10945
diff changeset
627 && IS_INTERLACED(mb_type^s->current_picture.mb_type[mb_xy-1])
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
628 // and left mb is in the same slice if deblocking_filter == 2
10922
8945125b5ae6 Use h->slice_num where possible.
michael
parents: 10921
diff changeset
629 && (h->deblocking_filter!=2 || h->slice_table[mb_xy-1] == h->slice_num)) {
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
630 /* First vertical edge is different in MBAFF frames
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
631 * There are 8 different bS to compute and 2 different Qp
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
632 */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
633 const int pair_xy = mb_x + (mb_y&~1)*s->mb_stride;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
634 const int left_mb_xy[2] = { pair_xy-1, pair_xy-1+s->mb_stride };
10950
4776a56132e1 H.264: Declare bS with DECLARE_ALIGNED_8 for uint64_t casts.
astrange
parents: 10949
diff changeset
635 DECLARE_ALIGNED_8(int16_t, bS[8]);
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
636 int qp[2];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
637 int bqp[2];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
638 int rqp[2];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
639 int mb_qp, mbn0_qp, mbn1_qp;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
640 int i;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
641 first_vertical_edge_done = 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
642
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
643 if( IS_INTRA(mb_type) )
10947
df6bda2aa59a Set bS with 64bits at a time.
michael
parents: 10946
diff changeset
644 *(uint64_t*)&bS[0]=
df6bda2aa59a Set bS with 64bits at a time.
michael
parents: 10946
diff changeset
645 *(uint64_t*)&bS[4]= 0x0004000400040004ULL;
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
646 else {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
647 for( i = 0; i < 8; i++ ) {
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
648 int mbn_xy = MB_FIELD ? left_mb_xy[i>>2] : left_mb_xy[i&1];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
649
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
650 if( IS_INTRA( s->current_picture.mb_type[mbn_xy] ) )
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
651 bS[i] = 4;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
652 else if( h->non_zero_count_cache[12+8*(i>>1)] != 0 ||
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
653 ((!h->pps.cabac && IS_8x8DCT(s->current_picture.mb_type[mbn_xy])) ?
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
654 (h->cbp_table[mbn_xy] & ((MB_FIELD ? (i&2) : (mb_y&1)) ? 8 : 2))
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
655 :
10909
f4cf3960b8c6 Reorganize how values are stored in h->non_zero_count.
michael
parents: 10906
diff changeset
656 h->non_zero_count[mbn_xy][7+(MB_FIELD ? (i&3) : (i>>2)+(mb_y&1)*2)*8]))
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
657 bS[i] = 2;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
658 else
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
659 bS[i] = 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
660 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
661 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
662
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
663 mb_qp = s->current_picture.qscale_table[mb_xy];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
664 mbn0_qp = s->current_picture.qscale_table[left_mb_xy[0]];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
665 mbn1_qp = s->current_picture.qscale_table[left_mb_xy[1]];
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
666 qp[0] = ( mb_qp + mbn0_qp + 1 ) >> 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
667 bqp[0] = ( get_chroma_qp( h, 0, mb_qp ) +
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
668 get_chroma_qp( h, 0, mbn0_qp ) + 1 ) >> 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
669 rqp[0] = ( get_chroma_qp( h, 1, mb_qp ) +
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
670 get_chroma_qp( h, 1, mbn0_qp ) + 1 ) >> 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
671 qp[1] = ( mb_qp + mbn1_qp + 1 ) >> 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
672 bqp[1] = ( get_chroma_qp( h, 0, mb_qp ) +
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
673 get_chroma_qp( h, 0, mbn1_qp ) + 1 ) >> 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
674 rqp[1] = ( get_chroma_qp( h, 1, mb_qp ) +
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
675 get_chroma_qp( h, 1, mbn1_qp ) + 1 ) >> 1;
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
676
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
677 /* Filter edge */
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
678 tprintf(s->avctx, "filter mb:%d/%d MBAFF, QPy:%d/%d, QPb:%d/%d QPr:%d/%d ls:%d uvls:%d", mb_x, mb_y, qp[0], qp[1], bqp[0], bqp[1], rqp[0], rqp[1], linesize, uvlinesize);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
679 { int i; for (i = 0; i < 8; i++) tprintf(s->avctx, " bS[%d]:%d", i, bS[i]); tprintf(s->avctx, "\n"); }
10924
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
680 if(MB_FIELD){
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
681 filter_mb_mbaff_edgev ( h, img_y , linesize, bS , 1, qp [0] );
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
682 filter_mb_mbaff_edgev ( h, img_y + 8* linesize, linesize, bS+4, 1, qp [1] );
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
683 filter_mb_mbaff_edgecv( h, img_cb, uvlinesize, bS , 1, bqp[0] );
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
684 filter_mb_mbaff_edgecv( h, img_cb + 4*uvlinesize, uvlinesize, bS+4, 1, bqp[1] );
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
685 filter_mb_mbaff_edgecv( h, img_cr, uvlinesize, bS , 1, rqp[0] );
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
686 filter_mb_mbaff_edgecv( h, img_cr + 4*uvlinesize, uvlinesize, bS+4, 1, rqp[1] );
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
687 }else{
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
688 filter_mb_mbaff_edgev ( h, img_y , 2* linesize, bS , 2, qp [0] );
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
689 filter_mb_mbaff_edgev ( h, img_y + linesize, 2* linesize, bS+1, 2, qp [1] );
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
690 filter_mb_mbaff_edgecv( h, img_cb, 2*uvlinesize, bS , 2, bqp[0] );
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
691 filter_mb_mbaff_edgecv( h, img_cb + uvlinesize, 2*uvlinesize, bS+1, 2, bqp[1] );
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
692 filter_mb_mbaff_edgecv( h, img_cr, 2*uvlinesize, bS , 2, rqp[0] );
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
693 filter_mb_mbaff_edgecv( h, img_cr + uvlinesize, 2*uvlinesize, bS+1, 2, rqp[1] );
fb0307a3355e Rather call filter_mb_mbaff_edge*v() more often than do extra calculations
michael
parents: 10922
diff changeset
694 }
10854
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
695 }
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
696
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
697 #if CONFIG_SMALL
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
698 for( dir = 0; dir < 2; dir++ )
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
699 filter_mb_dir(h, mb_x, mb_y, img_y, img_cb, img_cr, linesize, uvlinesize, mb_xy, mb_type, mvy_limit, dir ? 0 : first_vertical_edge_done, dir);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
700 #else
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
701 filter_mb_dir(h, mb_x, mb_y, img_y, img_cb, img_cr, linesize, uvlinesize, mb_xy, mb_type, mvy_limit, first_vertical_edge_done, 0);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
702 filter_mb_dir(h, mb_x, mb_y, img_y, img_cb, img_cr, linesize, uvlinesize, mb_xy, mb_type, mvy_limit, 0, 1);
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
703 #endif
f6fc6ace95e3 Split h264 loop filter off h264.c.
michael
parents:
diff changeset
704 }