annotate ppc/intreadwrite.h @ 729:753953ed8ff0 libavutil

PPC asm for AV_RL*() PPC is normally big endian but has special little endian load/store instructions. Using these avoids a separate byteswap. This makes the vorbis decoder about 5% faster. Not much else uses little-endian read/write extensively. GCC generates horrible PPC code for the default AV_[RW]B64 (which uses a packed struct), so we override it with a plain pointer cast.
author mru
date Sat, 18 Apr 2009 00:00:31 +0000
parents
children eff5131d6a33
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
729
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
1 /*
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
2 * Copyright (c) 2008 Mans Rullgard <mans@mansr.com>
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
3 *
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
4 * This file is part of FFmpeg.
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
5 *
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
6 * FFmpeg is free software; you can redistribute it and/or
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
7 * modify it under the terms of the GNU Lesser General Public
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
8 * License as published by the Free Software Foundation; either
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
9 * version 2.1 of the License, or (at your option) any later version.
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
10 *
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
11 * FFmpeg is distributed in the hope that it will be useful,
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
12 * but WITHOUT ANY WARRANTY; without even the implied warranty of
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
13 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
14 * Lesser General Public License for more details.
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
15 *
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
16 * You should have received a copy of the GNU Lesser General Public
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
17 * License along with FFmpeg; if not, write to the Free Software
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
18 * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
19 */
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
20
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
21 #ifndef AVUTIL_PPC_INTREADWRITE_H
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
22 #define AVUTIL_PPC_INTREADWRITE_H
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
23
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
24 #include <stdint.h>
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
25 #include "config.h"
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
26
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
27 #define AV_RL16 AV_RL16
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
28 static inline uint16_t AV_RL16(const void *p)
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
29 {
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
30 uint16_t v;
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
31 __asm__ ("lhbrx %0, %y1" : "=r"(v) : "Z"(*(const uint16_t*)p));
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
32 return v;
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
33 }
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
34
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
35 #define AV_WL16 AV_WL16
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
36 static inline void AV_WL16(void *p, uint16_t v)
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
37 {
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
38 __asm__ ("sthbrx %1, %y0" : "=Z"(*(uint16_t*)p) : "r"(v));
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
39 }
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
40
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
41 #define AV_RL32 AV_RL32
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
42 static inline uint32_t AV_RL32(const void *p)
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
43 {
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
44 uint32_t v;
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
45 __asm__ ("lwbrx %0, %y1" : "=r"(v) : "Z"(*(const uint32_t*)p));
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
46 return v;
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
47 }
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
48
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
49 #define AV_WL32 AV_WL32
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
50 static inline void AV_WL32(void *p, uint32_t v)
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
51 {
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
52 __asm__ ("stwbrx %1, %y0" : "=Z"(*(uint32_t*)p) : "r"(v));
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
53 }
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
54
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
55 #if HAVE_LDBRX
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
56
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
57 #define AV_RL64 AV_RL64
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
58 static inline uint64_t AV_RL64(const void *p)
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
59 {
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
60 uint64_t v;
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
61 __asm__ ("ldbrx %0, %y1" : "=r"(v) : "Z"(*(const uint64_t*)p));
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
62 return v;
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
63 }
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
64
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
65 #define AV_WL64 AV_WL64
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
66 static inline void AV_WL64(void *p, uint64_t v)
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
67 {
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
68 __asm__ ("stdbrx %1, %y0" : "=Z"(*(uint64_t*)p) : "r"(v));
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
69 }
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
70
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
71 #else
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
72
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
73 #define AV_RL64 AV_RL64
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
74 static inline uint64_t AV_RL64(const void *p)
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
75 {
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
76 union { uint64_t v; uint32_t hl[2]; } v;
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
77 __asm__ ("lwbrx %0, %y2 \n\t"
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
78 "lwbrx %1, %y3 \n\t"
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
79 : "=r"(v.hl[1]), "=r"(v.hl[0])
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
80 : "Z"(*(const uint32_t*)p), "Z"(*((const uint32_t*)p+1)));
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
81 return v.v;
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
82 }
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
83
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
84 #define AV_WL64 AV_WL64
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
85 static inline void AV_WL64(void *p, uint64_t v)
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
86 {
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
87 union { uint64_t v; uint32_t hl[2]; } vv = { v };
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
88 __asm__ ("stwbrx %2, %y0 \n\t"
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
89 "stwbrx %3, %y1 \n\t"
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
90 : "=Z"(*(uint32_t*)p), "=Z"(*((uint32_t*)p+1))
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
91 : "r"(vv.hl[1]), "r"(vv.hl[0]));
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
92 }
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
93
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
94 #endif /* HAVE_LDBRX */
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
95
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
96 /*
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
97 * GCC fails miserably on the packed struct version which is used by
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
98 * default, so we override it here.
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
99 */
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
100
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
101 #define AV_RB64(p) (*(const uint64_t *)(p))
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
102 #define AV_WB64(p, v) (*(uint64_t *)(p) = (v))
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
103
753953ed8ff0 PPC asm for AV_RL*()
mru
parents:
diff changeset
104 #endif /* AVUTIL_PPC_INTREADWRITE_H */