annotate mathops.h @ 9672:15276eb66180 libavcodec

LGPL version of ac3_decode_transform_coeffs_ch, ~12.4% faster.
author darkshikari
date Tue, 19 May 2009 21:29:21 +0000
parents 005cf8ba225f
children f1f95c604b56
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
1 /*
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
2 * simple math operations
8629
04423b2f6e0b cosmetics: Remove pointless period after copyright statement non-sentences.
diego
parents: 8627
diff changeset
3 * Copyright (c) 2001, 2002 Fabrice Bellard
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
4 * Copyright (c) 2006 Michael Niedermayer <michaelni@gmx.at> et al
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
5 *
3947
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3733
diff changeset
6 * This file is part of FFmpeg.
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3733
diff changeset
7 *
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3733
diff changeset
8 * FFmpeg is free software; you can redistribute it and/or
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
9 * modify it under the terms of the GNU Lesser General Public
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
10 * License as published by the Free Software Foundation; either
3947
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3733
diff changeset
11 * version 2.1 of the License, or (at your option) any later version.
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
12 *
3947
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3733
diff changeset
13 * FFmpeg is distributed in the hope that it will be useful,
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
16 * Lesser General Public License for more details.
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
17 *
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
18 * You should have received a copy of the GNU Lesser General Public
3947
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3733
diff changeset
19 * License along with FFmpeg; if not, write to the Free Software
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
20 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
21 */
7760
c4a4495715dd Globally rename the header inclusion guard names.
stefano
parents: 7255
diff changeset
22 #ifndef AVCODEC_MATHOPS_H
c4a4495715dd Globally rename the header inclusion guard names.
stefano
parents: 7255
diff changeset
23 #define AVCODEC_MATHOPS_H
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
24
6763
f7cbb7733146 Use full path for #includes from another directory.
diego
parents: 6500
diff changeset
25 #include "libavutil/common.h"
5162
4394344397d8 include all prerequisites in header files
mru
parents: 4283
diff changeset
26
8759
4cea2f47219a re-enable mid_pred asm on x86_64. (broke in r16681)
lorenm
parents: 8629
diff changeset
27 #if ARCH_X86
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
28
8430
7768bdfd4f7b Rename libavcodec/i386/ --> libavcodec/x86/.
diego
parents: 8359
diff changeset
29 #include "x86/mathops.h"
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
30
8590
7a463923ecd1 Change semantic of CONFIG_*, HAVE_* and ARCH_*.
aurel
parents: 8496
diff changeset
31 #elif ARCH_ARM
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
32
8359
9281a8a9387a ARM: replace "armv4l" with "arm"
mru
parents: 8201
diff changeset
33 #include "arm/mathops.h"
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
34
8590
7a463923ecd1 Change semantic of CONFIG_*, HAVE_* and ARCH_*.
aurel
parents: 8496
diff changeset
35 #elif ARCH_PPC
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
36
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
37 #include "ppc/mathops.h"
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
38
8590
7a463923ecd1 Change semantic of CONFIG_*, HAVE_* and ARCH_*.
aurel
parents: 8496
diff changeset
39 #elif ARCH_BFIN
5615
7ffc96c9ab1a Hooking bfin/mathops.h
mhoffman
parents: 5162
diff changeset
40
7ffc96c9ab1a Hooking bfin/mathops.h
mhoffman
parents: 5162
diff changeset
41 #include "bfin/mathops.h"
7ffc96c9ab1a Hooking bfin/mathops.h
mhoffman
parents: 5162
diff changeset
42
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
43 #endif
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
44
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
45 /* generic implementation */
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
46
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
/*
 * Generic MULL: multiply a by b as 64-bit signed integers, then shift the
 * product right by s. Only defined here when no earlier definition of MULL
 * exists.
 */
#ifndef MULL
#define MULL(a, b, s) \
    (((int64_t)(a) * (int64_t)(b)) >> (s))
#endif
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
50
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
51 #ifndef MULH
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
52 //gcc 3.4 creates an incredibly bloated mess out of this
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
53 //# define MULH(a,b) (((int64_t)(a) * (int64_t)(b))>>32)
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
54
4283
d6f83e2f8804 rename always_inline to av_always_inline and move to common.h
mru
parents: 4112
diff changeset
55 static av_always_inline int MULH(int a, int b){
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
56 return ((int64_t)(a) * (int64_t)(b))>>32;
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
57 }
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
58 #endif
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
59
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
/* 64-bit signed product: both operands are converted to int64_t first. */
#ifndef MUL64
#define MUL64(a, b) ((int64_t)(a) * (int64_t)(b))
#endif

/* Multiply-accumulate: d += MUL64(a, b); the expression yields the new d. */
#ifndef MAC64
#define MAC64(d, a, b) ((d) += MUL64(a, b))
#endif

/* Multiply-subtract: d -= MUL64(a, b); the expression yields the new d. */
#ifndef MLS64
#define MLS64(d, a, b) ((d) -= MUL64(a, b))
#endif
84dd52687931 mathops: add MAC64, MLS64, and MLS16
mru
parents: 6763
diff changeset
71
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
/*
 * signed 16x16 -> 32 multiply add accumulate
 *
 * Generic version: rt += ra * rb. Both the target and the whole expansion
 * are parenthesized so the macro stays a single expression wherever it is
 * used (inside a larger expression, as a ?: operand, ...).
 */
#ifndef MAC16
#   define MAC16(rt, ra, rb) ((rt) += (ra) * (rb))
#endif
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
76
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
/*
 * signed 16x16 -> 32 multiply
 *
 * Generic version: a plain C multiplication of the two (parenthesized)
 * operands, with no narrowing casts applied.
 */
#ifndef MUL16
#define MUL16(ra, rb) ((ra) * (rb))
#endif
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
81
7255
84dd52687931 mathops: add MAC64, MLS64, and MLS16
mru
parents: 6763
diff changeset
/* Multiply-subtract: rt -= ra * rb; the expression yields the new rt. */
#ifndef MLS16
#define MLS16(rt, ra, rb) ((rt) -= (ra) * (rb))
#endif
84dd52687931 mathops: add MAC64, MLS64, and MLS16
mru
parents: 6763
diff changeset
85
8627
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
86 /* median of 3 */
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
87 #ifndef mid_pred
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
88 #define mid_pred mid_pred
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
89 static inline av_const int mid_pred(int a, int b, int c)
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
90 {
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
91 #if 0
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
92 int t= (a-b)&((a-b)>>31);
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
93 a-=t;
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
94 b+=t;
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
95 b-= (b-c)&((b-c)>>31);
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
96 b+= (a-b)&((a-b)>>31);
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
97
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
98 return b;
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
99 #else
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
100 if(a>b){
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
101 if(c>b){
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
102 if(c>a) b=a;
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
103 else b=c;
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
104 }
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
105 }else{
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
106 if(b>c){
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
107 if(c>a) b=c;
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
108 else b=a;
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
109 }
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
110 }
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
111 return b;
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
112 #endif
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
113 }
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
114 #endif
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
115
9096
005cf8ba225f Add sign_extend() function to mathops.h
mru
parents: 8759
diff changeset
116 #ifndef sign_extend
005cf8ba225f Add sign_extend() function to mathops.h
mru
parents: 8759
diff changeset
117 static inline av_const int sign_extend(int val, unsigned bits)
005cf8ba225f Add sign_extend() function to mathops.h
mru
parents: 8759
diff changeset
118 {
005cf8ba225f Add sign_extend() function to mathops.h
mru
parents: 8759
diff changeset
119 return (val << (INT_BIT - bits)) >> (INT_BIT - bits);
005cf8ba225f Add sign_extend() function to mathops.h
mru
parents: 8759
diff changeset
120 }
005cf8ba225f Add sign_extend() function to mathops.h
mru
parents: 8759
diff changeset
121 #endif
005cf8ba225f Add sign_extend() function to mathops.h
mru
parents: 8759
diff changeset
122
7760
c4a4495715dd Globally rename the header inclusion guard names.
stefano
parents: 7255
diff changeset
123 #endif /* AVCODEC_MATHOPS_H */
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
124