changeset 8678:6c256fc075e3 libavcodec

ARM: change alignment of loops in put_pixels*_arm to 32 bytes (.align 8 -> .align 5)
author mru
date Tue, 27 Jan 2009 16:06:41 +0000
parents 3c484b73ca73
children 9c1ea156d893
files arm/dsputil_arm_s.S
diffstat 1 files changed, 33 insertions(+), 38 deletions(-) [+]
line wrap: on
line diff
--- a/arm/dsputil_arm_s.S	Tue Jan 27 16:06:38 2009 +0000
+++ b/arm/dsputil_arm_s.S	Tue Jan 27 16:06:41 2009 +0000
@@ -91,7 +91,7 @@
 .endm
 
 @ ----------------------------------------------------------------
-        .align 8
+        .align 5
 function put_pixels16_arm, export=1
         @ void func(uint8_t *block, const uint8_t *pixels, int line_size, int h)
         @ block = word aligned, pixles = unaligned
@@ -111,7 +111,7 @@
         add r0, r0, r2
         bne 1b
         ldmfd sp!, {r4-r11, pc}
-        .align 8
+        .align 5
 2:
         ldmia r1, {r4-r8}
         add r1, r1, r2
@@ -122,7 +122,7 @@
         add r0, r0, r2
         bne 2b
         ldmfd sp!, {r4-r11, pc}
-        .align 8
+        .align 5
 3:
         ldmia r1, {r4-r8}
         add r1, r1, r2
@@ -133,7 +133,7 @@
         add r0, r0, r2
         bne 3b
         ldmfd sp!, {r4-r11, pc}
-        .align 8
+        .align 5
 4:
         ldmia r1, {r4-r8}
         add r1, r1, r2
@@ -144,7 +144,6 @@
         add r0, r0, r2
         bne 4b
         ldmfd sp!, {r4-r11,pc}
-        .align 8
 5:
         .word 1b
         .word 2b
@@ -153,7 +152,7 @@
         .endfunc
 
 @ ----------------------------------------------------------------
-        .align 8
+        .align 5
 function put_pixels8_arm, export=1
         @ void func(uint8_t *block, const uint8_t *pixels, int line_size, int h)
         @ block = word aligned, pixles = unaligned
@@ -173,7 +172,7 @@
         add r0, r0, r2
         bne 1b
         ldmfd sp!, {r4-r5,pc}
-        .align 8
+        .align 5
 2:
         ldmia r1, {r4-r5, r12}
         add r1, r1, r2
@@ -184,7 +183,7 @@
         add r0, r0, r2
         bne 2b
         ldmfd sp!, {r4-r5,pc}
-        .align 8
+        .align 5
 3:
         ldmia r1, {r4-r5, r12}
         add r1, r1, r2
@@ -195,7 +194,7 @@
         add r0, r0, r2
         bne 3b
         ldmfd sp!, {r4-r5,pc}
-        .align 8
+        .align 5
 4:
         ldmia r1, {r4-r5, r12}
         add r1, r1, r2
@@ -206,7 +205,6 @@
         add r0, r0, r2
         bne 4b
         ldmfd sp!, {r4-r5,pc}
-        .align 8
 5:
         .word 1b
         .word 2b
@@ -215,7 +213,7 @@
         .endfunc
 
 @ ----------------------------------------------------------------
-        .align 8
+        .align 5
 function put_pixels8_x2_arm, export=1
         @ void func(uint8_t *block, const uint8_t *pixels, int line_size, int h)
         @ block = word aligned, pixles = unaligned
@@ -238,7 +236,7 @@
         add r0, r0, r2
         bne 1b
         ldmfd sp!, {r4-r10,pc}
-        .align 8
+        .align 5
 2:
         ldmia r1, {r4-r5, r10}
         add r1, r1, r2
@@ -251,7 +249,7 @@
         add r0, r0, r2
         bne 2b
         ldmfd sp!, {r4-r10,pc}
-        .align 8
+        .align 5
 3:
         ldmia r1, {r4-r5, r10}
         add r1, r1, r2
@@ -264,7 +262,7 @@
         add r0, r0, r2
         bne 3b
         ldmfd sp!, {r4-r10,pc}
-        .align 8
+        .align 5
 4:
         ldmia r1, {r4-r5, r10}
         add r1, r1, r2
@@ -276,7 +274,6 @@
         add r0, r0, r2
         bne 4b
         ldmfd sp!, {r4-r10,pc} @@ update PC with LR content.
-        .align 8
 5:
         .word 0xFEFEFEFE
         .word 2b
@@ -284,7 +281,7 @@
         .word 4b
         .endfunc
 
-        .align 8
+        .align 5
 function put_no_rnd_pixels8_x2_arm, export=1
         @ void func(uint8_t *block, const uint8_t *pixels, int line_size, int h)
         @ block = word aligned, pixles = unaligned
@@ -307,7 +304,7 @@
         add r0, r0, r2
         bne 1b
         ldmfd sp!, {r4-r10,pc}
-        .align 8
+        .align 5
 2:
         ldmia r1, {r4-r5, r10}
         add r1, r1, r2
@@ -320,7 +317,7 @@
         add r0, r0, r2
         bne 2b
         ldmfd sp!, {r4-r10,pc}
-        .align 8
+        .align 5
 3:
         ldmia r1, {r4-r5, r10}
         add r1, r1, r2
@@ -333,7 +330,7 @@
         add r0, r0, r2
         bne 3b
         ldmfd sp!, {r4-r10,pc}
-        .align 8
+        .align 5
 4:
         ldmia r1, {r4-r5, r10}
         add r1, r1, r2
@@ -345,7 +342,6 @@
         add r0, r0, r2
         bne 4b
         ldmfd sp!, {r4-r10,pc} @@ update PC with LR content.
-        .align 8
 5:
         .word 0xFEFEFEFE
         .word 2b
@@ -355,7 +351,7 @@
 
 
 @ ----------------------------------------------------------------
-        .align 8
+        .align 5
 function put_pixels8_y2_arm, export=1
         @ void func(uint8_t *block, const uint8_t *pixels, int line_size, int h)
         @ block = word aligned, pixles = unaligned
@@ -386,7 +382,7 @@
         add r0, r0, r2
         bne 6b
         ldmfd sp!, {r4-r11,pc}
-        .align 8
+        .align 5
 2:
         ldmia r1, {r4-r6}
         add r1, r1, r2
@@ -409,7 +405,7 @@
         add r0, r0, r2
         bne 6b
         ldmfd sp!, {r4-r11,pc}
-        .align 8
+        .align 5
 3:
         ldmia r1, {r4-r6}
         add r1, r1, r2
@@ -432,7 +428,7 @@
         add r0, r0, r2
         bne 6b
         ldmfd sp!, {r4-r11,pc}
-        .align 8
+        .align 5
 4:
         ldmia r1, {r4-r6}
         add r1, r1, r2
@@ -456,7 +452,6 @@
         bne 6b
         ldmfd sp!, {r4-r11,pc}
 
-        .align 8
 5:
         .word 0xFEFEFEFE
         .word 2b
@@ -464,7 +459,7 @@
         .word 4b
         .endfunc
 
-        .align 8
+        .align 5
 function put_no_rnd_pixels8_y2_arm, export=1
         @ void func(uint8_t *block, const uint8_t *pixels, int line_size, int h)
         @ block = word aligned, pixles = unaligned
@@ -495,7 +490,7 @@
         add r0, r0, r2
         bne 6b
         ldmfd sp!, {r4-r11,pc}
-        .align 8
+        .align 5
 2:
         ldmia r1, {r4-r6}
         add r1, r1, r2
@@ -518,7 +513,7 @@
         add r0, r0, r2
         bne 6b
         ldmfd sp!, {r4-r11,pc}
-        .align 8
+        .align 5
 3:
         ldmia r1, {r4-r6}
         add r1, r1, r2
@@ -541,7 +536,7 @@
         add r0, r0, r2
         bne 6b
         ldmfd sp!, {r4-r11,pc}
-        .align 8
+        .align 5
 4:
         ldmia r1, {r4-r6}
         add r1, r1, r2
@@ -564,7 +559,6 @@
         add r0, r0, r2
         bne 6b
         ldmfd sp!, {r4-r11,pc}
-        .align 8
 5:
         .word 0xFEFEFEFE
         .word 2b
@@ -637,7 +631,7 @@
         ldmfd sp!, {r4-r11,pc}
 .endm
 
-        .align 8
+        .align 5
 function put_pixels8_xy2_arm, export=1
         @ void func(uint8_t *block, const uint8_t *pixels, int line_size, int h)
         @ block = word aligned, pixles = unaligned
@@ -651,15 +645,15 @@
 1:
         RND_XY2_EXPAND 0
 
-        .align 8
+        .align 5
 2:
         RND_XY2_EXPAND 1
 
-        .align 8
+        .align 5
 3:
         RND_XY2_EXPAND 2
 
-        .align 8
+        .align 5
 4:
         RND_XY2_EXPAND 3
 
@@ -673,7 +667,7 @@
         .word 0x0F0F0F0F
         .endfunc
 
-        .align 8
+        .align 5
 function put_no_rnd_pixels8_xy2_arm, export=1
         @ void func(uint8_t *block, const uint8_t *pixels, int line_size, int h)
         @ block = word aligned, pixles = unaligned
@@ -687,15 +681,15 @@
 1:
         RND_XY2_EXPAND 0
 
-        .align 8
+        .align 5
 2:
         RND_XY2_EXPAND 1
 
-        .align 8
+        .align 5
 3:
         RND_XY2_EXPAND 2
 
-        .align 8
+        .align 5
 4:
         RND_XY2_EXPAND 3
 
@@ -709,6 +703,7 @@
         .word 0x0F0F0F0F
         .endfunc
 
+        .align 5
 @ void ff_add_pixels_clamped_ARM(int16_t *block, uint8_t *dest, int stride)
 function ff_add_pixels_clamped_ARM, export=1
         push            {r4-r10}