annotate ppc/check_altivec.c @ 12253:112b3a0db187 libavcodec

Decode DCT tokens by branching to a different code path for each branch on the huffman tree, instead of traversing the tree in a while loop. Based on the similar optimization in libvpx's detokenize.c 10% faster at normal bitrates, and 30% faster for high-bitrate intra-only
author conrad
date Fri, 23 Jul 2010 21:46:17 +0000
parents fdafbcef52f5
children 06abedae2906
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
5750
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
1 /*
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
2 * This file is part of FFmpeg.
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
3 *
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
4 * FFmpeg is free software; you can redistribute it and/or
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
5 * modify it under the terms of the GNU Lesser General Public
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
6 * License as published by the Free Software Foundation; either
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
7 * version 2.1 of the License, or (at your option) any later version.
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
8 *
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
9 * FFmpeg is distributed in the hope that it will be useful,
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
11 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
12 * Lesser General Public License for more details.
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
13 *
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
14 * You should have received a copy of the GNU Lesser General Public
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
15 * License along with FFmpeg; if not, write to the Free Software
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
16 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
17 */
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
18
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
19
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
20 /**
11644
7dd2a45249a9 Remove explicit filename from Doxygen @file commands.
diego
parents: 11407
diff changeset
21 * @file
12024
fdafbcef52f5 Fix grammar errors in documentation
mru
parents: 11644
diff changeset
22 * Check for AltiVec presence.
5750
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
23 */
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
24
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
25 #ifdef __APPLE__
7852
0d60b8b7f30b Fix compilation on Mac OS X 10.4: Defining _POSIX_C_SOURCE hides the u_char &
diego
parents: 6750
diff changeset
26 #undef _POSIX_C_SOURCE
5750
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
27 #include <sys/sysctl.h>
8699
450a1c5bab22 Use '#if defined()' for OS-specific preprocessor checks.
diego
parents: 8031
diff changeset
28 #elif defined(__OpenBSD__)
7904
47717d5239fa AltiVec detection support for OpenBSD, patch by Brad, brad comstyle com.
diego
parents: 7852
diff changeset
29 #include <sys/param.h>
47717d5239fa AltiVec detection support for OpenBSD, patch by Brad, brad comstyle com.
diego
parents: 7852
diff changeset
30 #include <sys/sysctl.h>
47717d5239fa AltiVec detection support for OpenBSD, patch by Brad, brad comstyle com.
diego
parents: 7852
diff changeset
31 #include <machine/cpu.h>
8699
450a1c5bab22 Use '#if defined()' for OS-specific preprocessor checks.
diego
parents: 8031
diff changeset
32 #elif defined(__AMIGAOS4__)
5750
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
33 #include <exec/exec.h>
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
34 #include <interfaces/exec.h>
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
35 #include <proto/exec.h>
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
36 #endif /* __APPLE__ */
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
37
11407
fb94047e23d2 Move the local includes below the system includes
mstorsjo
parents: 11382
diff changeset
38 #include "config.h"
fb94047e23d2 Move the local includes below the system includes
mstorsjo
parents: 11382
diff changeset
39 #include "dsputil_altivec.h"
fb94047e23d2 Move the local includes below the system includes
mstorsjo
parents: 11382
diff changeset
40
5750
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
41 /**
7905
ae410599f388 spelling cosmetics
diego
parents: 7904
diff changeset
42 * This function MAY rely on signal() or fork() in order to make sure AltiVec
ae410599f388 spelling cosmetics
diego
parents: 7904
diff changeset
43 * is present.
5750
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
44 */
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
45
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
46 int has_altivec(void)
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
47 {
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
48 #ifdef __AMIGAOS4__
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
49 ULONG result = 0;
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
50 extern struct ExecIFace *IExec;
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
51
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
52 IExec->GetCPUInfoTags(GCIT_VectorUnit, &result, TAG_DONE);
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
53 if (result == VECTORTYPE_ALTIVEC) return 1;
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
54 return 0;
7904
47717d5239fa AltiVec detection support for OpenBSD, patch by Brad, brad comstyle com.
diego
parents: 7852
diff changeset
55 #elif defined(__APPLE__) || defined(__OpenBSD__)
47717d5239fa AltiVec detection support for OpenBSD, patch by Brad, brad comstyle com.
diego
parents: 7852
diff changeset
56 #ifdef __OpenBSD__
47717d5239fa AltiVec detection support for OpenBSD, patch by Brad, brad comstyle com.
diego
parents: 7852
diff changeset
57 int sels[2] = {CTL_MACHDEP, CPU_ALTIVEC};
47717d5239fa AltiVec detection support for OpenBSD, patch by Brad, brad comstyle com.
diego
parents: 7852
diff changeset
58 #else
5750
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
59 int sels[2] = {CTL_HW, HW_VECTORUNIT};
7904
47717d5239fa AltiVec detection support for OpenBSD, patch by Brad, brad comstyle com.
diego
parents: 7852
diff changeset
60 #endif
5750
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
61 int has_vu = 0;
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
62 size_t len = sizeof(has_vu);
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
63 int err;
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
64
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
65 err = sysctl(sels, 2, &has_vu, &len, NULL, 0);
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
66
6750
c93570aeb3eb Remove unnecessary parentheses from return calls.
diego
parents: 6159
diff changeset
67 if (err == 0) return has_vu != 0;
5750
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
68 return 0;
9361
53e5c6a453e9 configure: Add --enable-runtime-cpudetect
ramiro
parents: 8718
diff changeset
69 #elif CONFIG_RUNTIME_CPUDETECT
6159
eb2e3c3b7f78 Add mfspr-based AltiVec detection code.
reimar
parents: 5757
diff changeset
70 int proc_ver;
7905
ae410599f388 spelling cosmetics
diego
parents: 7904
diff changeset
71 // Support of mfspr PVR emulation added in Linux 2.6.17.
8031
eebc7209c47f Convert asm keyword into __asm__.
flameeyes
parents: 7905
diff changeset
72 __asm__ volatile("mfspr %0, 287" : "=r" (proc_ver));
6159
eb2e3c3b7f78 Add mfspr-based AltiVec detection code.
reimar
parents: 5757
diff changeset
73 proc_ver >>= 16;
eb2e3c3b7f78 Add mfspr-based AltiVec detection code.
reimar
parents: 5757
diff changeset
74 if (proc_ver & 0x8000 ||
eb2e3c3b7f78 Add mfspr-based AltiVec detection code.
reimar
parents: 5757
diff changeset
75 proc_ver == 0x000c ||
eb2e3c3b7f78 Add mfspr-based AltiVec detection code.
reimar
parents: 5757
diff changeset
76 proc_ver == 0x0039 || proc_ver == 0x003c ||
eb2e3c3b7f78 Add mfspr-based AltiVec detection code.
reimar
parents: 5757
diff changeset
77 proc_ver == 0x0044 || proc_ver == 0x0045 ||
eb2e3c3b7f78 Add mfspr-based AltiVec detection code.
reimar
parents: 5757
diff changeset
78 proc_ver == 0x0070)
eb2e3c3b7f78 Add mfspr-based AltiVec detection code.
reimar
parents: 5757
diff changeset
79 return 1;
eb2e3c3b7f78 Add mfspr-based AltiVec detection code.
reimar
parents: 5757
diff changeset
80 return 0;
5750
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
81 #else
7905
ae410599f388 spelling cosmetics
diego
parents: 7904
diff changeset
82 // Since we were compiled for AltiVec, just assume we have it
5757
ace63c809071 Remove uses of SIGILL for CPU extension detection, that method is not acceptable
reimar
parents: 5750
diff changeset
83 // until someone comes up with a proper way (not involving signal hacks).
ace63c809071 Remove uses of SIGILL for CPU extension detection, that method is not acceptable
reimar
parents: 5750
diff changeset
84 return 1;
5750
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
85 #endif /* __AMIGAOS4__ */
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
86 }
09f99af1db40 Sanitize altivec code so it can be built with runtime check properly
lu_zero
parents:
diff changeset
87