annotate arm/asm.S @ 10644:5da7180afadf libavcodec

refactor and optimize scalarproduct 29-105% faster apply_filter, 6-90% faster ape decoding on core2 (Any x86 other than core2 probably gets much less, since this is mostly due to ssse3 cachesplit avoidance and I haven't written the full gamut of other cachesplit modes.) 9-123% faster ape decoding on G4.
author lorenm
date Sat, 05 Dec 2009 15:09:10 +0000
parents c44205b868dc
children 361a5fcb4393
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
8068
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
1 /*
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
2 * Copyright (c) 2008 Mans Rullgard <mans@mansr.com>
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
3 *
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
4 * This file is part of FFmpeg.
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
5 *
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
6 * FFmpeg is free software; you can redistribute it and/or
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
7 * modify it under the terms of the GNU Lesser General Public
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
8 * License as published by the Free Software Foundation; either
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
9 * version 2.1 of the License, or (at your option) any later version.
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
10 *
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
11 * FFmpeg is distributed in the hope that it will be useful,
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
14 * Lesser General Public License for more details.
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
15 *
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
16 * You should have received a copy of the GNU Lesser General Public
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
17 * License along with FFmpeg; if not, write to the Free Software
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
18 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
19 */
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
20
8507
779a9c93bf61 ARM: work around linker bug with movw/movt relocations in shared libs
mru
parents: 8359
diff changeset
21 #include "config.h"
779a9c93bf61 ARM: work around linker bug with movw/movt relocations in shared libs
mru
parents: 8359
diff changeset
22
9991
c50957bfd553 ARM: cleaner selection of ELF-spefic assembler directives
mru
parents: 9989
diff changeset
23 #ifdef __ELF__
c50957bfd553 ARM: cleaner selection of ELF-spefic assembler directives
mru
parents: 9989
diff changeset
24 # define ELF
c50957bfd553 ARM: cleaner selection of ELF-spefic assembler directives
mru
parents: 9989
diff changeset
25 #else
c50957bfd553 ARM: cleaner selection of ELF-spefic assembler directives
mru
parents: 9989
diff changeset
26 # define ELF @
c50957bfd553 ARM: cleaner selection of ELF-spefic assembler directives
mru
parents: 9989
diff changeset
27 #endif
c50957bfd553 ARM: cleaner selection of ELF-spefic assembler directives
mru
parents: 9989
diff changeset
28
8068
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
29 .macro require8, val=1
9991
c50957bfd553 ARM: cleaner selection of ELF-spefic assembler directives
mru
parents: 9989
diff changeset
30 ELF .eabi_attribute 24, \val
8068
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
31 .endm
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
32
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
33 .macro preserve8, val=1
9991
c50957bfd553 ARM: cleaner selection of ELF-spefic assembler directives
mru
parents: 9989
diff changeset
34 ELF .eabi_attribute 25, \val
8068
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
35 .endm
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
36
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
37 .macro function name, export=0
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
38 .if \export
10346
f12b7ea2df2a ARM: apply extern symbol prefix where needed
mru
parents: 10182
diff changeset
39 .global EXTERN_ASM\name
f12b7ea2df2a ARM: apply extern symbol prefix where needed
mru
parents: 10182
diff changeset
40 EXTERN_ASM\name:
8068
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
41 .endif
9991
c50957bfd553 ARM: cleaner selection of ELF-spefic assembler directives
mru
parents: 9989
diff changeset
42 ELF .type \name, %function
8068
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
43 .func \name
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
44 \name:
923c713c0c48 ARM: add some assembler convenience macros
mru
parents:
diff changeset
45 .endm
8507
779a9c93bf61 ARM: work around linker bug with movw/movt relocations in shared libs
mru
parents: 8359
diff changeset
46
779a9c93bf61 ARM: work around linker bug with movw/movt relocations in shared libs
mru
parents: 8359
diff changeset
47 .macro movrel rd, val
10384
c44205b868dc ARM: simplify movrel definition as CONFIG_PIC is now set for shared libs
mru
parents: 10346
diff changeset
48 #if HAVE_ARMV6T2 && !CONFIG_PIC
8507
779a9c93bf61 ARM: work around linker bug with movw/movt relocations in shared libs
mru
parents: 8359
diff changeset
49 movw \rd, #:lower16:\val
779a9c93bf61 ARM: work around linker bug with movw/movt relocations in shared libs
mru
parents: 8359
diff changeset
50 movt \rd, #:upper16:\val
779a9c93bf61 ARM: work around linker bug with movw/movt relocations in shared libs
mru
parents: 8359
diff changeset
51 #else
779a9c93bf61 ARM: work around linker bug with movw/movt relocations in shared libs
mru
parents: 8359
diff changeset
52 ldr \rd, =\val
779a9c93bf61 ARM: work around linker bug with movw/movt relocations in shared libs
mru
parents: 8359
diff changeset
53 #endif
779a9c93bf61 ARM: work around linker bug with movw/movt relocations in shared libs
mru
parents: 8359
diff changeset
54 .endm
9968
93c52263ff74 ARM: check for VFP register arguments
mru
parents: 8590
diff changeset
55
93c52263ff74 ARM: check for VFP register arguments
mru
parents: 8590
diff changeset
56 #if HAVE_VFP_ARGS
93c52263ff74 ARM: check for VFP register arguments
mru
parents: 8590
diff changeset
57 .eabi_attribute 28, 1
93c52263ff74 ARM: check for VFP register arguments
mru
parents: 8590
diff changeset
58 # define VFP
93c52263ff74 ARM: check for VFP register arguments
mru
parents: 8590
diff changeset
59 # define NOVFP @
93c52263ff74 ARM: check for VFP register arguments
mru
parents: 8590
diff changeset
60 #else
93c52263ff74 ARM: check for VFP register arguments
mru
parents: 8590
diff changeset
61 # define VFP @
93c52263ff74 ARM: check for VFP register arguments
mru
parents: 8590
diff changeset
62 # define NOVFP
93c52263ff74 ARM: check for VFP register arguments
mru
parents: 8590
diff changeset
63 #endif
10346
f12b7ea2df2a ARM: apply extern symbol prefix where needed
mru
parents: 10182
diff changeset
64
f12b7ea2df2a ARM: apply extern symbol prefix where needed
mru
parents: 10182
diff changeset
65 #define GLUE(a, b) a ## b
f12b7ea2df2a ARM: apply extern symbol prefix where needed
mru
parents: 10182
diff changeset
66 #define JOIN(a, b) GLUE(a, b)
f12b7ea2df2a ARM: apply extern symbol prefix where needed
mru
parents: 10182
diff changeset
67 #define X(s) JOIN(EXTERN_ASM, s)