annotate mathops.h @ 9473:e38284cd69dc libavcodec

Use memcpy instead of the very inefficient bytecopy where both are correct (i.e. no overlap of src and dst is possible).
author reimar
date Fri, 17 Apr 2009 17:20:48 +0000
parents 005cf8ba225f
children f1f95c604b56
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
1 /*
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
2 * simple math operations
8629
04423b2f6e0b cosmetics: Remove pointless period after copyright statement non-sentences.
diego
parents: 8627
diff changeset
3 * Copyright (c) 2001, 2002 Fabrice Bellard
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
4 * Copyright (c) 2006 Michael Niedermayer <michaelni@gmx.at> et al
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
5 *
3947
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3733
diff changeset
6 * This file is part of FFmpeg.
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3733
diff changeset
7 *
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3733
diff changeset
8 * FFmpeg is free software; you can redistribute it and/or
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
9 * modify it under the terms of the GNU Lesser General Public
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
10 * License as published by the Free Software Foundation; either
3947
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3733
diff changeset
11 * version 2.1 of the License, or (at your option) any later version.
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
12 *
3947
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3733
diff changeset
13 * FFmpeg is distributed in the hope that it will be useful,
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
16 * Lesser General Public License for more details.
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
17 *
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
18 * You should have received a copy of the GNU Lesser General Public
3947
c8c591fe26f8 Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents: 3733
diff changeset
19 * License along with FFmpeg; if not, write to the Free Software
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
20 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
21 */
7760
c4a4495715dd Globally rename the header inclusion guard names.
stefano
parents: 7255
diff changeset
22 #ifndef AVCODEC_MATHOPS_H
c4a4495715dd Globally rename the header inclusion guard names.
stefano
parents: 7255
diff changeset
23 #define AVCODEC_MATHOPS_H
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
24
6763
f7cbb7733146 Use full path for #includes from another directory.
diego
parents: 6500
diff changeset
25 #include "libavutil/common.h"
5162
4394344397d8 include all prerequisites in header files
mru
parents: 4283
diff changeset
26
8759
4cea2f47219a re-enable mid_pred asm on x86_64. (broke in r16681)
lorenm
parents: 8629
diff changeset
27 #if ARCH_X86
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
28
8430
7768bdfd4f7b Rename libavcodec/i386/ --> libavcodec/x86/.
diego
parents: 8359
diff changeset
29 #include "x86/mathops.h"
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
30
8590
7a463923ecd1 Change semantic of CONFIG_*, HAVE_* and ARCH_*.
aurel
parents: 8496
diff changeset
31 #elif ARCH_ARM
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
32
8359
9281a8a9387a ARM: replace "armv4l" with "arm"
mru
parents: 8201
diff changeset
33 #include "arm/mathops.h"
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
34
8590
7a463923ecd1 Change semantic of CONFIG_*, HAVE_* and ARCH_*.
aurel
parents: 8496
diff changeset
35 #elif ARCH_PPC
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
36
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
37 #include "ppc/mathops.h"
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
38
8590
7a463923ecd1 Change semantic of CONFIG_*, HAVE_* and ARCH_*.
aurel
parents: 8496
diff changeset
39 #elif ARCH_BFIN
5615
7ffc96c9ab1a Hooking bfin/mathops.h
mhoffman
parents: 5162
diff changeset
40
7ffc96c9ab1a Hooking bfin/mathops.h
mhoffman
parents: 5162
diff changeset
41 #include "bfin/mathops.h"
7ffc96c9ab1a Hooking bfin/mathops.h
mhoffman
parents: 5162
diff changeset
42
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
43 #endif
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
44
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
45 /* generic implementation */
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
46
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
47 #ifndef MULL
8201
c6e2ffef3797 Add shift argument to MULL() macro
mru
parents: 7760
diff changeset
48 # define MULL(a,b,s) (((int64_t)(a) * (int64_t)(b)) >> (s))
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
49 #endif
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
50
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
51 #ifndef MULH
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
52 //gcc 3.4 creates an incredibly bloated mess out of this
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
53 //# define MULH(a,b) (((int64_t)(a) * (int64_t)(b))>>32)
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
54
4283
d6f83e2f8804 rename always_inline to av_always_inline and move to common.h
mru
parents: 4112
diff changeset
55 static av_always_inline int MULH(int a, int b){
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
56 return ((int64_t)(a) * (int64_t)(b))>>32;
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
57 }
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
58 #endif
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
59
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
60 #ifndef MUL64
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
61 # define MUL64(a,b) ((int64_t)(a) * (int64_t)(b))
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
62 #endif
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
63
7255
84dd52687931 mathops: add MAC64, MLS64, and MLS16
mru
parents: 6763
diff changeset
64 #ifndef MAC64
84dd52687931 mathops: add MAC64, MLS64, and MLS16
mru
parents: 6763
diff changeset
65 # define MAC64(d, a, b) ((d) += MUL64(a, b))
84dd52687931 mathops: add MAC64, MLS64, and MLS16
mru
parents: 6763
diff changeset
66 #endif
84dd52687931 mathops: add MAC64, MLS64, and MLS16
mru
parents: 6763
diff changeset
67
84dd52687931 mathops: add MAC64, MLS64, and MLS16
mru
parents: 6763
diff changeset
68 #ifndef MLS64
84dd52687931 mathops: add MAC64, MLS64, and MLS16
mru
parents: 6763
diff changeset
69 # define MLS64(d, a, b) ((d) -= MUL64(a, b))
84dd52687931 mathops: add MAC64, MLS64, and MLS16
mru
parents: 6763
diff changeset
70 #endif
84dd52687931 mathops: add MAC64, MLS64, and MLS16
mru
parents: 6763
diff changeset
71
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
72 /* signed 16x16 -> 32 multiply add accumulate */
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
73 #ifndef MAC16
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
74 # define MAC16(rt, ra, rb) rt += (ra) * (rb)
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
75 #endif
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
76
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
77 /* signed 16x16 -> 32 multiply */
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
78 #ifndef MUL16
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
79 # define MUL16(ra, rb) ((ra) * (rb))
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
80 #endif
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
81
7255
84dd52687931 mathops: add MAC64, MLS64, and MLS16
mru
parents: 6763
diff changeset
82 #ifndef MLS16
84dd52687931 mathops: add MAC64, MLS64, and MLS16
mru
parents: 6763
diff changeset
83 # define MLS16(rt, ra, rb) ((rt) -= (ra) * (rb))
84dd52687931 mathops: add MAC64, MLS64, and MLS16
mru
parents: 6763
diff changeset
84 #endif
84dd52687931 mathops: add MAC64, MLS64, and MLS16
mru
parents: 6763
diff changeset
85
8627
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
86 /* median of 3 */
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
87 #ifndef mid_pred
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
88 #define mid_pred mid_pred
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
89 static inline av_const int mid_pred(int a, int b, int c)
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
90 {
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
91 #if 0
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
92 int t= (a-b)&((a-b)>>31);
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
93 a-=t;
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
94 b+=t;
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
95 b-= (b-c)&((b-c)>>31);
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
96 b+= (a-b)&((a-b)>>31);
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
97
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
98 return b;
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
99 #else
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
100 if(a>b){
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
101 if(c>b){
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
102 if(c>a) b=a;
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
103 else b=c;
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
104 }
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
105 }else{
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
106 if(b>c){
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
107 if(c>a) b=c;
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
108 else b=a;
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
109 }
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
110 }
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
111 return b;
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
112 #endif
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
113 }
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
114 #endif
d6bab465b82c moves mid_pred() into mathops.h (with arch specific code split by directory)
aurel
parents: 8590
diff changeset
115
9096
005cf8ba225f Add sign_extend() function to mathops.h
mru
parents: 8759
diff changeset
116 #ifndef sign_extend
005cf8ba225f Add sign_extend() function to mathops.h
mru
parents: 8759
diff changeset
117 static inline av_const int sign_extend(int val, unsigned bits)
005cf8ba225f Add sign_extend() function to mathops.h
mru
parents: 8759
diff changeset
118 {
005cf8ba225f Add sign_extend() function to mathops.h
mru
parents: 8759
diff changeset
119 return (val << (INT_BIT - bits)) >> (INT_BIT - bits);
005cf8ba225f Add sign_extend() function to mathops.h
mru
parents: 8759
diff changeset
120 }
005cf8ba225f Add sign_extend() function to mathops.h
mru
parents: 8759
diff changeset
121 #endif
005cf8ba225f Add sign_extend() function to mathops.h
mru
parents: 8759
diff changeset
122
7760
c4a4495715dd Globally rename the header inclusion guard names.
stefano
parents: 7255
diff changeset
123 #endif /* AVCODEC_MATHOPS_H */
3733
d1b5acd0b680 New single instruction math operation header
lu_zero
parents:
diff changeset
124