Mercurial > libavcodec.hg
annotate i386/cputest.c @ 4961:3e8e345084cb libavcodec
sse2 version of fdct_col.
k8: 72->61 cycles, core2: 51->26 cycles.
author | lorenm |
---|---|
date | Thu, 10 May 2007 03:13:41 +0000 |
parents | f9325f2bc762 |
children | d5ba514e3f4a |
rev | line source |
---|---|
3699
c537a97eec66
Add official LGPL license headers to the files that were missing them.
diego
parents:
3279
diff
changeset
|
1 /* |
c537a97eec66
Add official LGPL license headers to the files that were missing them.
diego
parents:
3279
diff
changeset
|
2 * CPU detection code, extracted from mmx.h |
c537a97eec66
Add official LGPL license headers to the files that were missing them.
diego
parents:
3279
diff
changeset
|
3 * (c)1997-99 by H. Dietz and R. Fisher |
c537a97eec66
Add official LGPL license headers to the files that were missing them.
diego
parents:
3279
diff
changeset
|
4 * Converted to C and improved by Fabrice Bellard. |
c537a97eec66
Add official LGPL license headers to the files that were missing them.
diego
parents:
3279
diff
changeset
|
5 * |
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3944
diff
changeset
|
6 * This file is part of FFmpeg. |
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3944
diff
changeset
|
7 * |
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3944
diff
changeset
|
8 * FFmpeg is free software; you can redistribute it and/or |
3699
c537a97eec66
Add official LGPL license headers to the files that were missing them.
diego
parents:
3279
diff
changeset
|
9 * modify it under the terms of the GNU Lesser General Public |
c537a97eec66
Add official LGPL license headers to the files that were missing them.
diego
parents:
3279
diff
changeset
|
10 * License as published by the Free Software Foundation; either |
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3944
diff
changeset
|
11 * version 2.1 of the License, or (at your option) any later version. |
3699
c537a97eec66
Add official LGPL license headers to the files that were missing them.
diego
parents:
3279
diff
changeset
|
12 * |
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3944
diff
changeset
|
13 * FFmpeg is distributed in the hope that it will be useful, |
3699
c537a97eec66
Add official LGPL license headers to the files that were missing them.
diego
parents:
3279
diff
changeset
|
14 * but WITHOUT ANY WARRANTY; without even the implied warranty of |
c537a97eec66
Add official LGPL license headers to the files that were missing them.
diego
parents:
3279
diff
changeset
|
15 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
c537a97eec66
Add official LGPL license headers to the files that were missing them.
diego
parents:
3279
diff
changeset
|
16 * Lesser General Public License for more details. |
c537a97eec66
Add official LGPL license headers to the files that were missing them.
diego
parents:
3279
diff
changeset
|
17 * |
c537a97eec66
Add official LGPL license headers to the files that were missing them.
diego
parents:
3279
diff
changeset
|
18 * You should have received a copy of the GNU Lesser General Public |
3947
c8c591fe26f8
Change license headers to say 'FFmpeg' instead of 'this program/this library'
diego
parents:
3944
diff
changeset
|
19 * License along with FFmpeg; if not, write to the Free Software |
3699
c537a97eec66
Add official LGPL license headers to the files that were missing them.
diego
parents:
3279
diff
changeset
|
20 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA |
c537a97eec66
Add official LGPL license headers to the files that were missing them.
diego
parents:
3279
diff
changeset
|
21 */ |
0 | 22 |
23 #include <stdlib.h> | |
24 #include "../dsputil.h" | |
25 | |
3944
edacbbf46a19
Compilation fix, printf gets redefined to please_use_av_log.
diego
parents:
3699
diff
changeset
|
26 #undef printf |
edacbbf46a19
Compilation fix, printf gets redefined to please_use_av_log.
diego
parents:
3699
diff
changeset
|
27 |
2293
15cfba1b97b5
adapting existing mmx/mmx2/sse/3dnow optimizations so they work on x86_64 patch by (Aurelien Jacobs <aurel at gnuage dot org>)
michael
parents:
2129
diff
changeset
|
/*
 * Register names pasted into the inline-assembly templates below:
 * the 64-bit names when ARCH_X86_64 is defined, the 32-bit names otherwise.
 */
#ifndef ARCH_X86_64
#  define REG_b "ebx"
#  define REG_S "esi"
#else
#  define REG_b "rbx"
#  define REG_S "rsi"
#endif
15cfba1b97b5
adapting existing mmx/mmx2/sse/3dnow optimizations so they work on x86_64 patch by (Aurelien Jacobs <aurel at gnuage dot org>)
michael
parents:
2129
diff
changeset
|
35 |
22
c31fb57d17a6
Suppressing external gas stuff to improve portability to Win32
nickols_k
parents:
16
diff
changeset
|
/*
 * Execute the CPUID instruction with `index` loaded into the a register and
 * store the resulting a, b, c and d register values in the lvalues
 * eax, ebx, ecx and edx.
 *
 * Saving the b register is necessary for PIC, and gcc seems unable to see
 * that by itself. The register is therefore copied to the S register before
 * CPUID; the xchg afterwards restores it and leaves CPUID's b result in the
 * S register, which is what the "=S" output operand reads.
 *
 * The expansion has no trailing semicolon: the caller writes it, so that
 * cpuid(...); is exactly one statement.
 */
#define cpuid(index,eax,ebx,ecx,edx)\
    __asm__ __volatile__\
        ("mov %%"REG_b", %%"REG_S"\n\t"\
         "cpuid\n\t"\
         "xchg %%"REG_b", %%"REG_S\
         : "=a" (eax), "=S" (ebx),\
           "=c" (ecx), "=d" (edx)\
         : "0" (index))
0 | 45 |
46 /* Function to test if multimedia instructions are supported... */ | |
47 int mm_support(void) | |
48 { | |
2377
9214c91cdfb7
detect sse on athlon-xp patch by (matthieu castet <castet >.< matthieu >at< free >.< fr>)
michael
parents:
2300
diff
changeset
|
49 int rval = 0; |
0 | 50 int eax, ebx, ecx, edx; |
2388 | 51 int max_std_level, max_ext_level, std_caps=0, ext_caps=0; |
2300
40542ea560d5
gcc 3.4.3 preversions do not appreciate invalid instruction and operand combinations anymore patch by (Aurelien Jacobs <aurel at gnuage dot org>)
michael
parents:
2293
diff
changeset
|
52 long a, c; |
2967 | 53 |
0 | 54 __asm__ __volatile__ ( |
55 /* See if CPUID instruction is supported ... */ | |
56 /* ... Get copies of EFLAGS into eax and ecx */ | |
57 "pushf\n\t" | |
2293
15cfba1b97b5
adapting existing mmx/mmx2/sse/3dnow optimizations so they work on x86_64 patch by (Aurelien Jacobs <aurel at gnuage dot org>)
michael
parents:
2129
diff
changeset
|
58 "pop %0\n\t" |
2300
40542ea560d5
gcc 3.4.3 preversions do not appreciate invalid instruction and operand combinations anymore patch by (Aurelien Jacobs <aurel at gnuage dot org>)
michael
parents:
2293
diff
changeset
|
59 "mov %0, %1\n\t" |
2967 | 60 |
0 | 61 /* ... Toggle the ID bit in one copy and store */ |
62 /* to the EFLAGS reg */ | |
2300
40542ea560d5
gcc 3.4.3 preversions do not appreciate invalid instruction and operand combinations anymore patch by (Aurelien Jacobs <aurel at gnuage dot org>)
michael
parents:
2293
diff
changeset
|
63 "xor $0x200000, %0\n\t" |
0 | 64 "push %0\n\t" |
65 "popf\n\t" | |
2967 | 66 |
0 | 67 /* ... Get the (hopefully modified) EFLAGS */ |
68 "pushf\n\t" | |
2293
15cfba1b97b5
adapting existing mmx/mmx2/sse/3dnow optimizations so they work on x86_64 patch by (Aurelien Jacobs <aurel at gnuage dot org>)
michael
parents:
2129
diff
changeset
|
69 "pop %0\n\t" |
2300
40542ea560d5
gcc 3.4.3 preversions do not appreciate invalid instruction and operand combinations anymore patch by (Aurelien Jacobs <aurel at gnuage dot org>)
michael
parents:
2293
diff
changeset
|
70 : "=a" (a), "=c" (c) |
0 | 71 : |
2967 | 72 : "cc" |
0 | 73 ); |
2967 | 74 |
2300
40542ea560d5
gcc 3.4.3 preversions do not appreciate invalid instruction and operand combinations anymore patch by (Aurelien Jacobs <aurel at gnuage dot org>)
michael
parents:
2293
diff
changeset
|
75 if (a == c) |
0 | 76 return 0; /* CPUID not supported */ |
2388 | 77 |
78 cpuid(0, max_std_level, ebx, ecx, edx); | |
79 | |
80 if(max_std_level >= 1){ | |
81 cpuid(1, eax, ebx, ecx, std_caps); | |
82 if (std_caps & (1<<23)) | |
83 rval |= MM_MMX; | |
2967 | 84 if (std_caps & (1<<25)) |
2388 | 85 rval |= MM_MMXEXT | MM_SSE; |
2967 | 86 if (std_caps & (1<<26)) |
2388 | 87 rval |= MM_SSE2; |
3279
647a677c00a4
Remove unused and unsupported Cyrix's "Extended MMX",
gpoirier
parents:
2979
diff
changeset
|
88 if (ecx & 1) |
647a677c00a4
Remove unused and unsupported Cyrix's "Extended MMX",
gpoirier
parents:
2979
diff
changeset
|
89 rval |= MM_SSE3; |
4311
f9325f2bc762
Add SSSE3 (Core2 aka Conroe/Merom/Woodcrester new instructions) detection
gpoirier
parents:
3947
diff
changeset
|
90 if (ecx & 0x00000200 ) |
f9325f2bc762
Add SSSE3 (Core2 aka Conroe/Merom/Woodcrester new instructions) detection
gpoirier
parents:
3947
diff
changeset
|
91 rval |= MM_SSSE3; |
2388 | 92 } |
0 | 93 |
2388 | 94 cpuid(0x80000000, max_ext_level, ebx, ecx, edx); |
95 | |
96 if(max_ext_level >= 0x80000001){ | |
97 cpuid(0x80000001, eax, ebx, ecx, ext_caps); | |
98 if (ext_caps & (1<<31)) | |
99 rval |= MM_3DNOW; | |
100 if (ext_caps & (1<<30)) | |
101 rval |= MM_3DNOWEXT; | |
102 if (ext_caps & (1<<23)) | |
103 rval |= MM_MMX; | |
3279
647a677c00a4
Remove unused and unsupported Cyrix's "Extended MMX",
gpoirier
parents:
2979
diff
changeset
|
104 if (ext_caps & (1<<22)) |
647a677c00a4
Remove unused and unsupported Cyrix's "Extended MMX",
gpoirier
parents:
2979
diff
changeset
|
105 rval |= MM_MMXEXT; |
2388 | 106 } |
107 | |
108 #if 0 | |
4311
f9325f2bc762
Add SSSE3 (Core2 aka Conroe/Merom/Woodcrester new instructions) detection
gpoirier
parents:
3947
diff
changeset
|
109 av_log(NULL, AV_LOG_DEBUG, "%s%s%s%s%s%s%s%s\n", |
2967 | 110 (rval&MM_MMX) ? "MMX ":"", |
111 (rval&MM_MMXEXT) ? "MMX2 ":"", | |
112 (rval&MM_SSE) ? "SSE ":"", | |
113 (rval&MM_SSE2) ? "SSE2 ":"", | |
4311
f9325f2bc762
Add SSSE3 (Core2 aka Conroe/Merom/Woodcrester new instructions) detection
gpoirier
parents:
3947
diff
changeset
|
114 (rval&MM_SSE3) ? "SSE3 ":"", |
f9325f2bc762
Add SSSE3 (Core2 aka Conroe/Merom/Woodcrester new instructions) detection
gpoirier
parents:
3947
diff
changeset
|
115 (rval&MM_SSSE3) ? "SSSE3 ":"", |
2967 | 116 (rval&MM_3DNOW) ? "3DNow ":"", |
2388 | 117 (rval&MM_3DNOWEXT) ? "3DNowExt ":""); |
118 #endif | |
119 return rval; | |
0 | 120 } |
43 | 121 |
#ifdef __TEST__
/* Stand-alone test program: print the flag word returned by mm_support(). */
int main ( void )
{
    int mm_flags = mm_support();

    /* %X expects an unsigned int, so convert the flag word explicitly. */
    printf("mm_support = 0x%08X\n", (unsigned int)mm_flags);
    return 0;
}
#endif