Mercurial > mplayer.hg
changeset 25350:2095f98cf0fa
cosmetics: Remove ugly and inconsistent uppercasing from filenames.
author | diego |
---|---|
date | Wed, 12 Dec 2007 08:50:54 +0000 |
parents | b257a1967539 |
children | f46e91c64b39 |
files | mp3lib/Makefile mp3lib/dct64_MMX.c mp3lib/dct64_mmx.c mp3lib/dct64_sse.c mp3lib/decode_MMX.c mp3lib/decode_mmx.c |
diffstat | 6 files changed, 1359 insertions(+), 1359 deletions(-) [+] |
line wrap: on
line diff
--- a/mp3lib/Makefile Wed Dec 12 08:45:05 2007 +0000 +++ b/mp3lib/Makefile Wed Dec 12 08:50:54 2007 +0000 @@ -3,11 +3,11 @@ LIBNAME_COMMON = libmp3.a SRCS_COMMON = sr1.c -SRCS_COMMON-$(HAVE_MMX) += decode_MMX.c +SRCS_COMMON-$(HAVE_MMX) += decode_mmx.c SRCS_COMMON-$(HAVE_SSE) += dct64_sse.c ifeq ($(ARCH_X86_32),yes) SRCS_COMMON += decode_i586.c -SRCS_COMMON-$(HAVE_MMX) += dct64_MMX.c +SRCS_COMMON-$(HAVE_MMX) += dct64_mmx.c SRCS_COMMON-$(HAVE_3DNOW) += dct36_3dnow.c dct64_3dnow.c SRCS_COMMON-$(HAVE_3DNOWEX) += dct36_k7.c dct64_k7.c endif
--- a/mp3lib/dct64_MMX.c Wed Dec 12 08:45:05 2007 +0000 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,985 +0,0 @@ -/* -* This code was taken from http://www.mpg123.org -* See ChangeLog of mpg123-0.59s-pre.1 for detail -* Applied to mplayer by Nick Kurshev <nickols_k@mail.ru> -*/ -#include "mangle.h" -#define real float /* ugly - but only way */ - -void dct64_MMX(short *a,short *b,real *c) -{ - char tmp[256]; - __asm __volatile( -" movl %2,%%eax\n\t" -/* Phase 1*/ -" flds (%%eax)\n\t" -" leal 128+%3,%%edx\n\t" -" fadds 124(%%eax)\n\t" -" movl %0,%%esi\n\t" -" fstps (%%edx)\n\t" -" movl %1,%%edi\n\t" - -" flds 4(%%eax)\n\t" -" movl $"MANGLE(costab_mmx)",%%ebx\n\t" -" fadds 120(%%eax)\n\t" -" orl %%ecx,%%ecx\n\t" -" fstps 4(%%edx)\n\t" - -" flds (%%eax)\n\t" -" leal %3,%%ecx\n\t" -" fsubs 124(%%eax)\n\t" -" fmuls (%%ebx)\n\t" -" fstps 124(%%edx)\n\t" - -" flds 4(%%eax)\n\t" -" fsubs 120(%%eax)\n\t" -" fmuls 4(%%ebx)\n\t" -" fstps 120(%%edx)\n\t" - -" flds 8(%%eax)\n\t" -" fadds 116(%%eax)\n\t" -" fstps 8(%%edx)\n\t" - -" flds 12(%%eax)\n\t" -" fadds 112(%%eax)\n\t" -" fstps 12(%%edx)\n\t" - -" flds 8(%%eax)\n\t" -" fsubs 116(%%eax)\n\t" -" fmuls 8(%%ebx)\n\t" -" fstps 116(%%edx)\n\t" - -" flds 12(%%eax)\n\t" -" fsubs 112(%%eax)\n\t" -" fmuls 12(%%ebx)\n\t" -" fstps 112(%%edx)\n\t" - -" flds 16(%%eax)\n\t" -" fadds 108(%%eax)\n\t" -" fstps 16(%%edx)\n\t" - -" flds 20(%%eax)\n\t" -" fadds 104(%%eax)\n\t" -" fstps 20(%%edx)\n\t" - -" flds 16(%%eax)\n\t" -" fsubs 108(%%eax)\n\t" -" fmuls 16(%%ebx)\n\t" -" fstps 108(%%edx)\n\t" - -" flds 20(%%eax)\n\t" -" fsubs 104(%%eax)\n\t" -" fmuls 20(%%ebx)\n\t" -" fstps 104(%%edx)\n\t" - -" flds 24(%%eax)\n\t" -" fadds 100(%%eax)\n\t" -" fstps 24(%%edx)\n\t" - -" flds 28(%%eax)\n\t" -" fadds 96(%%eax)\n\t" -" fstps 28(%%edx)\n\t" - -" flds 24(%%eax)\n\t" -" fsubs 100(%%eax)\n\t" -" fmuls 24(%%ebx)\n\t" -" fstps 100(%%edx)\n\t" - -" flds 28(%%eax)\n\t" -" fsubs 96(%%eax)\n\t" -" fmuls 28(%%ebx)\n\t" -" fstps 96(%%edx)\n\t" - -" flds 32(%%eax)\n\t" -" fadds 92(%%eax)\n\t" -" fstps 32(%%edx)\n\t" - -" flds 36(%%eax)\n\t" -" fadds 88(%%eax)\n\t" -" fstps 36(%%edx)\n\t" - -" flds 32(%%eax)\n\t" -" fsubs 92(%%eax)\n\t" -" fmuls 32(%%ebx)\n\t" -" fstps 92(%%edx)\n\t" - -" flds 36(%%eax)\n\t" -" fsubs 88(%%eax)\n\t" -" fmuls 36(%%ebx)\n\t" -" fstps 88(%%edx)\n\t" - -" flds 40(%%eax)\n\t" -" fadds 84(%%eax)\n\t" -" fstps 40(%%edx)\n\t" - -" flds 44(%%eax)\n\t" -" fadds 80(%%eax)\n\t" -" fstps 44(%%edx)\n\t" - -" flds 40(%%eax)\n\t" -" fsubs 84(%%eax)\n\t" -" fmuls 40(%%ebx)\n\t" -" fstps 84(%%edx)\n\t" - -" flds 44(%%eax)\n\t" -" fsubs 80(%%eax)\n\t" -" fmuls 44(%%ebx)\n\t" -" fstps 80(%%edx)\n\t" - -" flds 48(%%eax)\n\t" -" fadds 76(%%eax)\n\t" -" fstps 48(%%edx)\n\t" - -" flds 52(%%eax)\n\t" -" fadds 72(%%eax)\n\t" -" fstps 52(%%edx)\n\t" - -" flds 48(%%eax)\n\t" -" fsubs 76(%%eax)\n\t" -" fmuls 48(%%ebx)\n\t" -" fstps 76(%%edx)\n\t" - -" flds 52(%%eax)\n\t" -" fsubs 72(%%eax)\n\t" -" fmuls 52(%%ebx)\n\t" -" fstps 72(%%edx)\n\t" - -" flds 56(%%eax)\n\t" -" fadds 68(%%eax)\n\t" -" fstps 56(%%edx)\n\t" - -" flds 60(%%eax)\n\t" -" fadds 64(%%eax)\n\t" -" fstps 60(%%edx)\n\t" - -" flds 56(%%eax)\n\t" -" fsubs 68(%%eax)\n\t" -" fmuls 56(%%ebx)\n\t" -" fstps 68(%%edx)\n\t" - -" flds 60(%%eax)\n\t" -" fsubs 64(%%eax)\n\t" -" fmuls 60(%%ebx)\n\t" -" fstps 64(%%edx)\n\t" - -/* Phase 2*/ - -" flds (%%edx)\n\t" -" fadds 60(%%edx)\n\t" -" fstps (%%ecx)\n\t" - -" flds 4(%%edx)\n\t" -" fadds 56(%%edx)\n\t" -" fstps 4(%%ecx)\n\t" - -" flds (%%edx)\n\t" -" fsubs 60(%%edx)\n\t" -" fmuls 64(%%ebx)\n\t" -" fstps 60(%%ecx)\n\t" - -" flds 4(%%edx)\n\t" -" fsubs 56(%%edx)\n\t" -" fmuls 68(%%ebx)\n\t" -" fstps 56(%%ecx)\n\t" - -" flds 8(%%edx)\n\t" -" fadds 52(%%edx)\n\t" -" fstps 8(%%ecx)\n\t" - -" flds 12(%%edx)\n\t" -" fadds 48(%%edx)\n\t" -" fstps 12(%%ecx)\n\t" - -" flds 8(%%edx)\n\t" -" fsubs 52(%%edx)\n\t" -" fmuls 72(%%ebx)\n\t" -" fstps 52(%%ecx)\n\t" - -" flds 12(%%edx)\n\t" -" fsubs 48(%%edx)\n\t" -" fmuls 76(%%ebx)\n\t" -" fstps 48(%%ecx)\n\t" - -" flds 16(%%edx)\n\t" -" fadds 44(%%edx)\n\t" -" fstps 16(%%ecx)\n\t" - -" flds 20(%%edx)\n\t" -" fadds 40(%%edx)\n\t" -" fstps 20(%%ecx)\n\t" - -" flds 16(%%edx)\n\t" -" fsubs 44(%%edx)\n\t" -" fmuls 80(%%ebx)\n\t" -" fstps 44(%%ecx)\n\t" - -" flds 20(%%edx)\n\t" -" fsubs 40(%%edx)\n\t" -" fmuls 84(%%ebx)\n\t" -" fstps 40(%%ecx)\n\t" - -" flds 24(%%edx)\n\t" -" fadds 36(%%edx)\n\t" -" fstps 24(%%ecx)\n\t" - -" flds 28(%%edx)\n\t" -" fadds 32(%%edx)\n\t" -" fstps 28(%%ecx)\n\t" - -" flds 24(%%edx)\n\t" -" fsubs 36(%%edx)\n\t" -" fmuls 88(%%ebx)\n\t" -" fstps 36(%%ecx)\n\t" - -" flds 28(%%edx)\n\t" -" fsubs 32(%%edx)\n\t" -" fmuls 92(%%ebx)\n\t" -" fstps 32(%%ecx)\n\t" - -/* Phase 3*/ - -" flds 64(%%edx)\n\t" -" fadds 124(%%edx)\n\t" -" fstps 64(%%ecx)\n\t" - -" flds 68(%%edx)\n\t" -" fadds 120(%%edx)\n\t" -" fstps 68(%%ecx)\n\t" - -" flds 124(%%edx)\n\t" -" fsubs 64(%%edx)\n\t" -" fmuls 64(%%ebx)\n\t" -" fstps 124(%%ecx)\n\t" - -" flds 120(%%edx)\n\t" -" fsubs 68(%%edx)\n\t" -" fmuls 68(%%ebx)\n\t" -" fstps 120(%%ecx)\n\t" - -" flds 72(%%edx)\n\t" -" fadds 116(%%edx)\n\t" -" fstps 72(%%ecx)\n\t" - -" flds 76(%%edx)\n\t" -" fadds 112(%%edx)\n\t" -" fstps 76(%%ecx)\n\t" - -" flds 116(%%edx)\n\t" -" fsubs 72(%%edx)\n\t" -" fmuls 72(%%ebx)\n\t" -" fstps 116(%%ecx)\n\t" - -" flds 112(%%edx)\n\t" -" fsubs 76(%%edx)\n\t" -" fmuls 76(%%ebx)\n\t" -" fstps 112(%%ecx)\n\t" - -" flds 80(%%edx)\n\t" -" fadds 108(%%edx)\n\t" -" fstps 80(%%ecx)\n\t" - -" flds 84(%%edx)\n\t" -" fadds 104(%%edx)\n\t" -" fstps 84(%%ecx)\n\t" - -" flds 108(%%edx)\n\t" -" fsubs 80(%%edx)\n\t" -" fmuls 80(%%ebx)\n\t" -" fstps 108(%%ecx)\n\t" - -" flds 104(%%edx)\n\t" -" fsubs 84(%%edx)\n\t" -" fmuls 84(%%ebx)\n\t" -" fstps 104(%%ecx)\n\t" - -" flds 88(%%edx)\n\t" -" fadds 100(%%edx)\n\t" -" fstps 88(%%ecx)\n\t" - -" flds 92(%%edx)\n\t" -" fadds 96(%%edx)\n\t" -" fstps 92(%%ecx)\n\t" - -" flds 100(%%edx)\n\t" -" fsubs 88(%%edx)\n\t" -" fmuls 88(%%ebx)\n\t" -" fstps 100(%%ecx)\n\t" - -" flds 96(%%edx)\n\t" -" fsubs 92(%%edx)\n\t" -" fmuls 92(%%ebx)\n\t" -" fstps 96(%%ecx)\n\t" - -/* Phase 4*/ - -" flds (%%ecx)\n\t" -" fadds 28(%%ecx)\n\t" -" fstps (%%edx)\n\t" - -" flds (%%ecx)\n\t" -" fsubs 28(%%ecx)\n\t" -" fmuls 96(%%ebx)\n\t" -" fstps 28(%%edx)\n\t" - -" flds 4(%%ecx)\n\t" -" fadds 24(%%ecx)\n\t" -" fstps 4(%%edx)\n\t" - -" flds 4(%%ecx)\n\t" -" fsubs 24(%%ecx)\n\t" -" fmuls 100(%%ebx)\n\t" -" fstps 24(%%edx)\n\t" - -" flds 8(%%ecx)\n\t" -" fadds 20(%%ecx)\n\t" -" fstps 8(%%edx)\n\t" - -" flds 8(%%ecx)\n\t" -" fsubs 20(%%ecx)\n\t" -" fmuls 104(%%ebx)\n\t" -" fstps 20(%%edx)\n\t" - -" flds 12(%%ecx)\n\t" -" fadds 16(%%ecx)\n\t" -" fstps 12(%%edx)\n\t" - -" flds 12(%%ecx)\n\t" -" fsubs 16(%%ecx)\n\t" -" fmuls 108(%%ebx)\n\t" -" fstps 16(%%edx)\n\t" - -" flds 32(%%ecx)\n\t" -" fadds 60(%%ecx)\n\t" -" fstps 32(%%edx)\n\t" - -" flds 60(%%ecx)\n\t" -" fsubs 32(%%ecx)\n\t" -" fmuls 96(%%ebx)\n\t" -" fstps 60(%%edx)\n\t" - -" flds 36(%%ecx)\n\t" -" fadds 56(%%ecx)\n\t" -" fstps 36(%%edx)\n\t" - -" flds 56(%%ecx)\n\t" -" fsubs 36(%%ecx)\n\t" -" fmuls 100(%%ebx)\n\t" -" fstps 56(%%edx)\n\t" - -" flds 40(%%ecx)\n\t" -" fadds 52(%%ecx)\n\t" -" fstps 40(%%edx)\n\t" - -" flds 52(%%ecx)\n\t" -" fsubs 40(%%ecx)\n\t" -" fmuls 104(%%ebx)\n\t" -" fstps 52(%%edx)\n\t" - -" flds 44(%%ecx)\n\t" -" fadds 48(%%ecx)\n\t" -" fstps 44(%%edx)\n\t" - -" flds 48(%%ecx)\n\t" -" fsubs 44(%%ecx)\n\t" -" fmuls 108(%%ebx)\n\t" -" fstps 48(%%edx)\n\t" - -" flds 64(%%ecx)\n\t" -" fadds 92(%%ecx)\n\t" -" fstps 64(%%edx)\n\t" - -" flds 64(%%ecx)\n\t" -" fsubs 92(%%ecx)\n\t" -" fmuls 96(%%ebx)\n\t" -" fstps 92(%%edx)\n\t" - -" flds 68(%%ecx)\n\t" -" fadds 88(%%ecx)\n\t" -" fstps 68(%%edx)\n\t" - -" flds 68(%%ecx)\n\t" -" fsubs 88(%%ecx)\n\t" -" fmuls 100(%%ebx)\n\t" -" fstps 88(%%edx)\n\t" - -" flds 72(%%ecx)\n\t" -" fadds 84(%%ecx)\n\t" -" fstps 72(%%edx)\n\t" - -" flds 72(%%ecx)\n\t" -" fsubs 84(%%ecx)\n\t" -" fmuls 104(%%ebx)\n\t" -" fstps 84(%%edx)\n\t" - -" flds 76(%%ecx)\n\t" -" fadds 80(%%ecx)\n\t" -" fstps 76(%%edx)\n\t" - -" flds 76(%%ecx)\n\t" -" fsubs 80(%%ecx)\n\t" -" fmuls 108(%%ebx)\n\t" -" fstps 80(%%edx)\n\t" - -" flds 96(%%ecx)\n\t" -" fadds 124(%%ecx)\n\t" -" fstps 96(%%edx)\n\t" - -" flds 124(%%ecx)\n\t" -" fsubs 96(%%ecx)\n\t" -" fmuls 96(%%ebx)\n\t" -" fstps 124(%%edx)\n\t" - -" flds 100(%%ecx)\n\t" -" fadds 120(%%ecx)\n\t" -" fstps 100(%%edx)\n\t" - -" flds 120(%%ecx)\n\t" -" fsubs 100(%%ecx)\n\t" -" fmuls 100(%%ebx)\n\t" -" fstps 120(%%edx)\n\t" - -" flds 104(%%ecx)\n\t" -" fadds 116(%%ecx)\n\t" -" fstps 104(%%edx)\n\t" - -" flds 116(%%ecx)\n\t" -" fsubs 104(%%ecx)\n\t" -" fmuls 104(%%ebx)\n\t" -" fstps 116(%%edx)\n\t" - -" flds 108(%%ecx)\n\t" -" fadds 112(%%ecx)\n\t" -" fstps 108(%%edx)\n\t" - -" flds 112(%%ecx)\n\t" -" fsubs 108(%%ecx)\n\t" -" fmuls 108(%%ebx)\n\t" -" fstps 112(%%edx)\n\t" - -" flds (%%edx)\n\t" -" fadds 12(%%edx)\n\t" -" fstps (%%ecx)\n\t" - -" flds (%%edx)\n\t" -" fsubs 12(%%edx)\n\t" -" fmuls 112(%%ebx)\n\t" -" fstps 12(%%ecx)\n\t" - -" flds 4(%%edx)\n\t" -" fadds 8(%%edx)\n\t" -" fstps 4(%%ecx)\n\t" - -" flds 4(%%edx)\n\t" -" fsubs 8(%%edx)\n\t" -" fmuls 116(%%ebx)\n\t" -" fstps 8(%%ecx)\n\t" - -" flds 16(%%edx)\n\t" -" fadds 28(%%edx)\n\t" -" fstps 16(%%ecx)\n\t" - -" flds 28(%%edx)\n\t" -" fsubs 16(%%edx)\n\t" -" fmuls 112(%%ebx)\n\t" -" fstps 28(%%ecx)\n\t" - -" flds 20(%%edx)\n\t" -" fadds 24(%%edx)\n\t" -" fstps 20(%%ecx)\n\t" - -" flds 24(%%edx)\n\t" -" fsubs 20(%%edx)\n\t" -" fmuls 116(%%ebx)\n\t" -" fstps 24(%%ecx)\n\t" - -" flds 32(%%edx)\n\t" -" fadds 44(%%edx)\n\t" -" fstps 32(%%ecx)\n\t" - -" flds 32(%%edx)\n\t" -" fsubs 44(%%edx)\n\t" -" fmuls 112(%%ebx)\n\t" -" fstps 44(%%ecx)\n\t" - -" flds 36(%%edx)\n\t" -" fadds 40(%%edx)\n\t" -" fstps 36(%%ecx)\n\t" - -" flds 36(%%edx)\n\t" -" fsubs 40(%%edx)\n\t" -" fmuls 116(%%ebx)\n\t" -" fstps 40(%%ecx)\n\t" - -" flds 48(%%edx)\n\t" -" fadds 60(%%edx)\n\t" -" fstps 48(%%ecx)\n\t" - -" flds 60(%%edx)\n\t" -" fsubs 48(%%edx)\n\t" -" fmuls 112(%%ebx)\n\t" -" fstps 60(%%ecx)\n\t" - -" flds 52(%%edx)\n\t" -" fadds 56(%%edx)\n\t" -" fstps 52(%%ecx)\n\t" - -" flds 56(%%edx)\n\t" -" fsubs 52(%%edx)\n\t" -" fmuls 116(%%ebx)\n\t" -" fstps 56(%%ecx)\n\t" - -" flds 64(%%edx)\n\t" -" fadds 76(%%edx)\n\t" -" fstps 64(%%ecx)\n\t" - -" flds 64(%%edx)\n\t" -" fsubs 76(%%edx)\n\t" -" fmuls 112(%%ebx)\n\t" -" fstps 76(%%ecx)\n\t" - -" flds 68(%%edx)\n\t" -" fadds 72(%%edx)\n\t" -" fstps 68(%%ecx)\n\t" - -" flds 68(%%edx)\n\t" -" fsubs 72(%%edx)\n\t" -" fmuls 116(%%ebx)\n\t" -" fstps 72(%%ecx)\n\t" - -" flds 80(%%edx)\n\t" -" fadds 92(%%edx)\n\t" -" fstps 80(%%ecx)\n\t" - -" flds 92(%%edx)\n\t" -" fsubs 80(%%edx)\n\t" -" fmuls 112(%%ebx)\n\t" -" fstps 92(%%ecx)\n\t" - -" flds 84(%%edx)\n\t" -" fadds 88(%%edx)\n\t" -" fstps 84(%%ecx)\n\t" - -" flds 88(%%edx)\n\t" -" fsubs 84(%%edx)\n\t" -" fmuls 116(%%ebx)\n\t" -" fstps 88(%%ecx)\n\t" - -" flds 96(%%edx)\n\t" -" fadds 108(%%edx)\n\t" -" fstps 96(%%ecx)\n\t" - -" flds 96(%%edx)\n\t" -" fsubs 108(%%edx)\n\t" -" fmuls 112(%%ebx)\n\t" -" fstps 108(%%ecx)\n\t" - -" flds 100(%%edx)\n\t" -" fadds 104(%%edx)\n\t" -" fstps 100(%%ecx)\n\t" - -" flds 100(%%edx)\n\t" -" fsubs 104(%%edx)\n\t" -" fmuls 116(%%ebx)\n\t" -" fstps 104(%%ecx)\n\t" - -" flds 112(%%edx)\n\t" -" fadds 124(%%edx)\n\t" -" fstps 112(%%ecx)\n\t" - -" flds 124(%%edx)\n\t" -" fsubs 112(%%edx)\n\t" -" fmuls 112(%%ebx)\n\t" -" fstps 124(%%ecx)\n\t" - -" flds 116(%%edx)\n\t" -" fadds 120(%%edx)\n\t" -" fstps 116(%%ecx)\n\t" - -" flds 120(%%edx)\n\t" -" fsubs 116(%%edx)\n\t" -" fmuls 116(%%ebx)\n\t" -" fstps 120(%%ecx)\n\t" - -/* Phase 5*/ - -" flds 32(%%ecx)\n\t" -" fadds 36(%%ecx)\n\t" -" fstps 32(%%edx)\n\t" - -" flds 32(%%ecx)\n\t" -" fsubs 36(%%ecx)\n\t" -" fmuls 120(%%ebx)\n\t" -" fstps 36(%%edx)\n\t" - -" flds 44(%%ecx)\n\t" -" fsubs 40(%%ecx)\n\t" -" fmuls 120(%%ebx)\n\t" -" fsts 44(%%edx)\n\t" -" fadds 40(%%ecx)\n\t" -" fadds 44(%%ecx)\n\t" -" fstps 40(%%edx)\n\t" - -" flds 48(%%ecx)\n\t" -" fsubs 52(%%ecx)\n\t" -" fmuls 120(%%ebx)\n\t" - -" flds 60(%%ecx)\n\t" -" fsubs 56(%%ecx)\n\t" -" fmuls 120(%%ebx)\n\t" -" fld %%st(0)\n\t" -" fadds 56(%%ecx)\n\t" -" fadds 60(%%ecx)\n\t" -" fld %%st(0)\n\t" -" fadds 48(%%ecx)\n\t" -" fadds 52(%%ecx)\n\t" -" fstps 48(%%edx)\n\t" -" fadd %%st(2)\n\t" -" fstps 56(%%edx)\n\t" -" fsts 60(%%edx)\n\t" -" faddp %%st(1)\n\t" -" fstps 52(%%edx)\n\t" - -" flds 64(%%ecx)\n\t" -" fadds 68(%%ecx)\n\t" -" fstps 64(%%edx)\n\t" - -" flds 64(%%ecx)\n\t" -" fsubs 68(%%ecx)\n\t" -" fmuls 120(%%ebx)\n\t" -" fstps 68(%%edx)\n\t" - -" flds 76(%%ecx)\n\t" -" fsubs 72(%%ecx)\n\t" -" fmuls 120(%%ebx)\n\t" -" fsts 76(%%edx)\n\t" -" fadds 72(%%ecx)\n\t" -" fadds 76(%%ecx)\n\t" -" fstps 72(%%edx)\n\t" - -" flds 92(%%ecx)\n\t" -" fsubs 88(%%ecx)\n\t" -" fmuls 120(%%ebx)\n\t" -" fsts 92(%%edx)\n\t" -" fadds 92(%%ecx)\n\t" -" fadds 88(%%ecx)\n\t" -" fld %%st(0)\n\t" -" fadds 80(%%ecx)\n\t" -" fadds 84(%%ecx)\n\t" -" fstps 80(%%edx)\n\t" - -" flds 80(%%ecx)\n\t" -" fsubs 84(%%ecx)\n\t" -" fmuls 120(%%ebx)\n\t" -" fadd %%st(0), %%st(1)\n\t" -" fadds 92(%%edx)\n\t" -" fstps 84(%%edx)\n\t" -" fstps 88(%%edx)\n\t" - -" flds 96(%%ecx)\n\t" -" fadds 100(%%ecx)\n\t" -" fstps 96(%%edx)\n\t" - -" flds 96(%%ecx)\n\t" -" fsubs 100(%%ecx)\n\t" -" fmuls 120(%%ebx)\n\t" -" fstps 100(%%edx)\n\t" - -" flds 108(%%ecx)\n\t" -" fsubs 104(%%ecx)\n\t" -" fmuls 120(%%ebx)\n\t" -" fsts 108(%%edx)\n\t" -" fadds 104(%%ecx)\n\t" -" fadds 108(%%ecx)\n\t" -" fstps 104(%%edx)\n\t" - -" flds 124(%%ecx)\n\t" -" fsubs 120(%%ecx)\n\t" -" fmuls 120(%%ebx)\n\t" -" fsts 124(%%edx)\n\t" -" fadds 120(%%ecx)\n\t" -" fadds 124(%%ecx)\n\t" -" fld %%st(0)\n\t" -" fadds 112(%%ecx)\n\t" -" fadds 116(%%ecx)\n\t" -" fstps 112(%%edx)\n\t" - -" flds 112(%%ecx)\n\t" -" fsubs 116(%%ecx)\n\t" -" fmuls 120(%%ebx)\n\t" -" fadd %%st(0),%%st(1)\n\t" -" fadds 124(%%edx)\n\t" -" fstps 116(%%edx)\n\t" -" fstps 120(%%edx)\n\t" -" jnz .L01\n\t" - -/* Phase 6*/ - -" flds (%%ecx)\n\t" -" fadds 4(%%ecx)\n\t" -" fstps 1024(%%esi)\n\t" - -" flds (%%ecx)\n\t" -" fsubs 4(%%ecx)\n\t" -" fmuls 120(%%ebx)\n\t" -" fsts (%%esi)\n\t" -" fstps (%%edi)\n\t" - -" flds 12(%%ecx)\n\t" -" fsubs 8(%%ecx)\n\t" -" fmuls 120(%%ebx)\n\t" -" fsts 512(%%edi)\n\t" -" fadds 12(%%ecx)\n\t" -" fadds 8(%%ecx)\n\t" -" fstps 512(%%esi)\n\t" - -" flds 16(%%ecx)\n\t" -" fsubs 20(%%ecx)\n\t" -" fmuls 120(%%ebx)\n\t" - -" flds 28(%%ecx)\n\t" -" fsubs 24(%%ecx)\n\t" -" fmuls 120(%%ebx)\n\t" -" fsts 768(%%edi)\n\t" -" fld %%st(0)\n\t" -" fadds 24(%%ecx)\n\t" -" fadds 28(%%ecx)\n\t" -" fld %%st(0)\n\t" -" fadds 16(%%ecx)\n\t" -" fadds 20(%%ecx)\n\t" -" fstps 768(%%esi)\n\t" -" fadd %%st(2)\n\t" -" fstps 256(%%esi)\n\t" -" faddp %%st(1)\n\t" -" fstps 256(%%edi)\n\t" - -/* Phase 7*/ - -" flds 32(%%edx)\n\t" -" fadds 48(%%edx)\n\t" -" fstps 896(%%esi)\n\t" - -" flds 48(%%edx)\n\t" -" fadds 40(%%edx)\n\t" -" fstps 640(%%esi)\n\t" - -" flds 40(%%edx)\n\t" -" fadds 56(%%edx)\n\t" -" fstps 384(%%esi)\n\t" - -" flds 56(%%edx)\n\t" -" fadds 36(%%edx)\n\t" -" fstps 128(%%esi)\n\t" - -" flds 36(%%edx)\n\t" -" fadds 52(%%edx)\n\t" -" fstps 128(%%edi)\n\t" - -" flds 52(%%edx)\n\t" -" fadds 44(%%edx)\n\t" -" fstps 384(%%edi)\n\t" - -" flds 60(%%edx)\n\t" -" fsts 896(%%edi)\n\t" -" fadds 44(%%edx)\n\t" -" fstps 640(%%edi)\n\t" - -" flds 96(%%edx)\n\t" -" fadds 112(%%edx)\n\t" -" fld %%st(0)\n\t" -" fadds 64(%%edx)\n\t" -" fstps 960(%%esi)\n\t" -" fadds 80(%%edx)\n\t" -" fstps 832(%%esi)\n\t" - -" flds 112(%%edx)\n\t" -" fadds 104(%%edx)\n\t" -" fld %%st(0)\n\t" -" fadds 80(%%edx)\n\t" -" fstps 704(%%esi)\n\t" -" fadds 72(%%edx)\n\t" -" fstps 576(%%esi)\n\t" - -" flds 104(%%edx)\n\t" -" fadds 120(%%edx)\n\t" -" fld %%st(0)\n\t" -" fadds 72(%%edx)\n\t" -" fstps 448(%%esi)\n\t" -" fadds 88(%%edx)\n\t" -" fstps 320(%%esi)\n\t" - -" flds 120(%%edx)\n\t" -" fadds 100(%%edx)\n\t" -" fld %%st(0)\n\t" -" fadds 88(%%edx)\n\t" -" fstps 192(%%esi)\n\t" -" fadds 68(%%edx)\n\t" -" fstps 64(%%esi)\n\t" - -" flds 100(%%edx)\n\t" -" fadds 116(%%edx)\n\t" -" fld %%st(0)\n\t" -" fadds 68(%%edx)\n\t" -" fstps 64(%%edi)\n\t" -" fadds 84(%%edx)\n\t" -" fstps 192(%%edi)\n\t" - -" flds 116(%%edx)\n\t" -" fadds 108(%%edx)\n\t" -" fld %%st(0)\n\t" -" fadds 84(%%edx)\n\t" -" fstps 320(%%edi)\n\t" -" fadds 76(%%edx)\n\t" -" fstps 448(%%edi)\n\t" - -" flds 108(%%edx)\n\t" -" fadds 124(%%edx)\n\t" -" fld %%st(0)\n\t" -" fadds 76(%%edx)\n\t" -" fstps 576(%%edi)\n\t" -" fadds 92(%%edx)\n\t" -" fstps 704(%%edi)\n\t" - -" flds 124(%%edx)\n\t" -" fsts 960(%%edi)\n\t" -" fadds 92(%%edx)\n\t" -" fstps 832(%%edi)\n\t" -" jmp .L_bye\n\t" -".L01:\n\t" -/* Phase 8*/ - -" flds (%%ecx)\n\t" -" fadds 4(%%ecx)\n\t" -" fistp 512(%%esi)\n\t" - -" flds (%%ecx)\n\t" -" fsubs 4(%%ecx)\n\t" -" fmuls 120(%%ebx)\n\t" - -" fistp (%%esi)\n\t" - - -" flds 12(%%ecx)\n\t" -" fsubs 8(%%ecx)\n\t" -" fmuls 120(%%ebx)\n\t" -" fist 256(%%edi)\n\t" -" fadds 12(%%ecx)\n\t" -" fadds 8(%%ecx)\n\t" -" fistp 256(%%esi)\n\t" - -" flds 16(%%ecx)\n\t" -" fsubs 20(%%ecx)\n\t" -" fmuls 120(%%ebx)\n\t" - -" flds 28(%%ecx)\n\t" -" fsubs 24(%%ecx)\n\t" -" fmuls 120(%%ebx)\n\t" -" fist 384(%%edi)\n\t" -" fld %%st(0)\n\t" -" fadds 24(%%ecx)\n\t" -" fadds 28(%%ecx)\n\t" -" fld %%st(0)\n\t" -" fadds 16(%%ecx)\n\t" -" fadds 20(%%ecx)\n\t" -" fistp 384(%%esi)\n\t" -" fadd %%st(2)\n\t" -" fistp 128(%%esi)\n\t" -" faddp %%st(1)\n\t" -" fistp 128(%%edi)\n\t" - -/* Phase 9*/ - -" flds 32(%%edx)\n\t" -" fadds 48(%%edx)\n\t" -" fistp 448(%%esi)\n\t" - -" flds 48(%%edx)\n\t" -" fadds 40(%%edx)\n\t" -" fistp 320(%%esi)\n\t" - -" flds 40(%%edx)\n\t" -" fadds 56(%%edx)\n\t" -" fistp 192(%%esi)\n\t" - -" flds 56(%%edx)\n\t" -" fadds 36(%%edx)\n\t" -" fistp 64(%%esi)\n\t" - -" flds 36(%%edx)\n\t" -" fadds 52(%%edx)\n\t" -" fistp 64(%%edi)\n\t" - -" flds 52(%%edx)\n\t" -" fadds 44(%%edx)\n\t" -" fistp 192(%%edi)\n\t" - -" flds 60(%%edx)\n\t" -" fist 448(%%edi)\n\t" -" fadds 44(%%edx)\n\t" -" fistp 320(%%edi)\n\t" - -" flds 96(%%edx)\n\t" -" fadds 112(%%edx)\n\t" -" fld %%st(0)\n\t" -" fadds 64(%%edx)\n\t" -" fistp 480(%%esi)\n\t" -" fadds 80(%%edx)\n\t" -" fistp 416(%%esi)\n\t" - -" flds 112(%%edx)\n\t" -" fadds 104(%%edx)\n\t" -" fld %%st(0)\n\t" -" fadds 80(%%edx)\n\t" -" fistp 352(%%esi)\n\t" -" fadds 72(%%edx)\n\t" -" fistp 288(%%esi)\n\t" - -" flds 104(%%edx)\n\t" -" fadds 120(%%edx)\n\t" -" fld %%st(0)\n\t" -" fadds 72(%%edx)\n\t" -" fistp 224(%%esi)\n\t" -" fadds 88(%%edx)\n\t" -" fistp 160(%%esi)\n\t" - -" flds 120(%%edx)\n\t" -" fadds 100(%%edx)\n\t" -" fld %%st(0)\n\t" -" fadds 88(%%edx)\n\t" -" fistp 96(%%esi)\n\t" -" fadds 68(%%edx)\n\t" -" fistp 32(%%esi)\n\t" - -" flds 100(%%edx)\n\t" -" fadds 116(%%edx)\n\t" -" fld %%st(0)\n\t" -" fadds 68(%%edx)\n\t" -" fistp 32(%%edi)\n\t" -" fadds 84(%%edx)\n\t" -" fistp 96(%%edi)\n\t" - -" flds 116(%%edx)\n\t" -" fadds 108(%%edx)\n\t" -" fld %%st(0)\n\t" -" fadds 84(%%edx)\n\t" -" fistp 160(%%edi)\n\t" -" fadds 76(%%edx)\n\t" -" fistp 224(%%edi)\n\t" - -" flds 108(%%edx)\n\t" -" fadds 124(%%edx)\n\t" -" fld %%st(0)\n\t" -" fadds 76(%%edx)\n\t" -" fistp 288(%%edi)\n\t" -" fadds 92(%%edx)\n\t" -" fistp 352(%%edi)\n\t" - -" flds 124(%%edx)\n\t" -" fist 480(%%edi)\n\t" -" fadds 92(%%edx)\n\t" -" fistp 416(%%edi)\n\t" -" movsw\n\t" -".L_bye:" - : - :"m"(a),"m"(b),"m"(c),"m"(tmp[0]) - :"memory","%eax","%ebx","%ecx","%edx","%esi","%edi"); -}
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/mp3lib/dct64_mmx.c Wed Dec 12 08:50:54 2007 +0000 @@ -0,0 +1,985 @@ +/* +* This code was taken from http://www.mpg123.org +* See ChangeLog of mpg123-0.59s-pre.1 for detail +* Applied to mplayer by Nick Kurshev <nickols_k@mail.ru> +*/ +#include "mangle.h" +#define real float /* ugly - but only way */ + +void dct64_MMX(short *a,short *b,real *c) +{ + char tmp[256]; + __asm __volatile( +" movl %2,%%eax\n\t" +/* Phase 1*/ +" flds (%%eax)\n\t" +" leal 128+%3,%%edx\n\t" +" fadds 124(%%eax)\n\t" +" movl %0,%%esi\n\t" +" fstps (%%edx)\n\t" +" movl %1,%%edi\n\t" + +" flds 4(%%eax)\n\t" +" movl $"MANGLE(costab_mmx)",%%ebx\n\t" +" fadds 120(%%eax)\n\t" +" orl %%ecx,%%ecx\n\t" +" fstps 4(%%edx)\n\t" + +" flds (%%eax)\n\t" +" leal %3,%%ecx\n\t" +" fsubs 124(%%eax)\n\t" +" fmuls (%%ebx)\n\t" +" fstps 124(%%edx)\n\t" + +" flds 4(%%eax)\n\t" +" fsubs 120(%%eax)\n\t" +" fmuls 4(%%ebx)\n\t" +" fstps 120(%%edx)\n\t" + +" flds 8(%%eax)\n\t" +" fadds 116(%%eax)\n\t" +" fstps 8(%%edx)\n\t" + +" flds 12(%%eax)\n\t" +" fadds 112(%%eax)\n\t" +" fstps 12(%%edx)\n\t" + +" flds 8(%%eax)\n\t" +" fsubs 116(%%eax)\n\t" +" fmuls 8(%%ebx)\n\t" +" fstps 116(%%edx)\n\t" + +" flds 12(%%eax)\n\t" +" fsubs 112(%%eax)\n\t" +" fmuls 12(%%ebx)\n\t" +" fstps 112(%%edx)\n\t" + +" flds 16(%%eax)\n\t" +" fadds 108(%%eax)\n\t" +" fstps 16(%%edx)\n\t" + +" flds 20(%%eax)\n\t" +" fadds 104(%%eax)\n\t" +" fstps 20(%%edx)\n\t" + +" flds 16(%%eax)\n\t" +" fsubs 108(%%eax)\n\t" +" fmuls 16(%%ebx)\n\t" +" fstps 108(%%edx)\n\t" + +" flds 20(%%eax)\n\t" +" fsubs 104(%%eax)\n\t" +" fmuls 20(%%ebx)\n\t" +" fstps 104(%%edx)\n\t" + +" flds 24(%%eax)\n\t" +" fadds 100(%%eax)\n\t" +" fstps 24(%%edx)\n\t" + +" flds 28(%%eax)\n\t" +" fadds 96(%%eax)\n\t" +" fstps 28(%%edx)\n\t" + +" flds 24(%%eax)\n\t" +" fsubs 100(%%eax)\n\t" +" fmuls 24(%%ebx)\n\t" +" fstps 100(%%edx)\n\t" + +" flds 28(%%eax)\n\t" +" fsubs 96(%%eax)\n\t" +" fmuls 28(%%ebx)\n\t" +" fstps 96(%%edx)\n\t" + +" flds 32(%%eax)\n\t" +" fadds 92(%%eax)\n\t" +" fstps 32(%%edx)\n\t" + +" flds 36(%%eax)\n\t" +" fadds 88(%%eax)\n\t" +" fstps 36(%%edx)\n\t" + +" flds 32(%%eax)\n\t" +" fsubs 92(%%eax)\n\t" +" fmuls 32(%%ebx)\n\t" +" fstps 92(%%edx)\n\t" + +" flds 36(%%eax)\n\t" +" fsubs 88(%%eax)\n\t" +" fmuls 36(%%ebx)\n\t" +" fstps 88(%%edx)\n\t" + +" flds 40(%%eax)\n\t" +" fadds 84(%%eax)\n\t" +" fstps 40(%%edx)\n\t" + +" flds 44(%%eax)\n\t" +" fadds 80(%%eax)\n\t" +" fstps 44(%%edx)\n\t" + +" flds 40(%%eax)\n\t" +" fsubs 84(%%eax)\n\t" +" fmuls 40(%%ebx)\n\t" +" fstps 84(%%edx)\n\t" + +" flds 44(%%eax)\n\t" +" fsubs 80(%%eax)\n\t" +" fmuls 44(%%ebx)\n\t" +" fstps 80(%%edx)\n\t" + +" flds 48(%%eax)\n\t" +" fadds 76(%%eax)\n\t" +" fstps 48(%%edx)\n\t" + +" flds 52(%%eax)\n\t" +" fadds 72(%%eax)\n\t" +" fstps 52(%%edx)\n\t" + +" flds 48(%%eax)\n\t" +" fsubs 76(%%eax)\n\t" +" fmuls 48(%%ebx)\n\t" +" fstps 76(%%edx)\n\t" + +" flds 52(%%eax)\n\t" +" fsubs 72(%%eax)\n\t" +" fmuls 52(%%ebx)\n\t" +" fstps 72(%%edx)\n\t" + +" flds 56(%%eax)\n\t" +" fadds 68(%%eax)\n\t" +" fstps 56(%%edx)\n\t" + +" flds 60(%%eax)\n\t" +" fadds 64(%%eax)\n\t" +" fstps 60(%%edx)\n\t" + +" flds 56(%%eax)\n\t" +" fsubs 68(%%eax)\n\t" +" fmuls 56(%%ebx)\n\t" +" fstps 68(%%edx)\n\t" + +" flds 60(%%eax)\n\t" +" fsubs 64(%%eax)\n\t" +" fmuls 60(%%ebx)\n\t" +" fstps 64(%%edx)\n\t" + +/* Phase 2*/ + +" flds (%%edx)\n\t" +" fadds 60(%%edx)\n\t" +" fstps (%%ecx)\n\t" + +" flds 4(%%edx)\n\t" +" fadds 56(%%edx)\n\t" +" fstps 4(%%ecx)\n\t" + +" flds (%%edx)\n\t" +" fsubs 60(%%edx)\n\t" +" fmuls 64(%%ebx)\n\t" +" fstps 60(%%ecx)\n\t" + +" flds 4(%%edx)\n\t" +" fsubs 56(%%edx)\n\t" +" fmuls 68(%%ebx)\n\t" +" fstps 56(%%ecx)\n\t" + +" flds 8(%%edx)\n\t" +" fadds 52(%%edx)\n\t" +" fstps 8(%%ecx)\n\t" + +" flds 12(%%edx)\n\t" +" fadds 48(%%edx)\n\t" +" fstps 12(%%ecx)\n\t" + +" flds 8(%%edx)\n\t" +" fsubs 52(%%edx)\n\t" +" fmuls 72(%%ebx)\n\t" +" fstps 52(%%ecx)\n\t" + +" flds 12(%%edx)\n\t" +" fsubs 48(%%edx)\n\t" +" fmuls 76(%%ebx)\n\t" +" fstps 48(%%ecx)\n\t" + +" flds 16(%%edx)\n\t" +" fadds 44(%%edx)\n\t" +" fstps 16(%%ecx)\n\t" + +" flds 20(%%edx)\n\t" +" fadds 40(%%edx)\n\t" +" fstps 20(%%ecx)\n\t" + +" flds 16(%%edx)\n\t" +" fsubs 44(%%edx)\n\t" +" fmuls 80(%%ebx)\n\t" +" fstps 44(%%ecx)\n\t" + +" flds 20(%%edx)\n\t" +" fsubs 40(%%edx)\n\t" +" fmuls 84(%%ebx)\n\t" +" fstps 40(%%ecx)\n\t" + +" flds 24(%%edx)\n\t" +" fadds 36(%%edx)\n\t" +" fstps 24(%%ecx)\n\t" + +" flds 28(%%edx)\n\t" +" fadds 32(%%edx)\n\t" +" fstps 28(%%ecx)\n\t" + +" flds 24(%%edx)\n\t" +" fsubs 36(%%edx)\n\t" +" fmuls 88(%%ebx)\n\t" +" fstps 36(%%ecx)\n\t" + +" flds 28(%%edx)\n\t" +" fsubs 32(%%edx)\n\t" +" fmuls 92(%%ebx)\n\t" +" fstps 32(%%ecx)\n\t" + +/* Phase 3*/ + +" flds 64(%%edx)\n\t" +" fadds 124(%%edx)\n\t" +" fstps 64(%%ecx)\n\t" + +" flds 68(%%edx)\n\t" +" fadds 120(%%edx)\n\t" +" fstps 68(%%ecx)\n\t" + +" flds 124(%%edx)\n\t" +" fsubs 64(%%edx)\n\t" +" fmuls 64(%%ebx)\n\t" +" fstps 124(%%ecx)\n\t" + +" flds 120(%%edx)\n\t" +" fsubs 68(%%edx)\n\t" +" fmuls 68(%%ebx)\n\t" +" fstps 120(%%ecx)\n\t" + +" flds 72(%%edx)\n\t" +" fadds 116(%%edx)\n\t" +" fstps 72(%%ecx)\n\t" + +" flds 76(%%edx)\n\t" +" fadds 112(%%edx)\n\t" +" fstps 76(%%ecx)\n\t" + +" flds 116(%%edx)\n\t" +" fsubs 72(%%edx)\n\t" +" fmuls 72(%%ebx)\n\t" +" fstps 116(%%ecx)\n\t" + +" flds 112(%%edx)\n\t" +" fsubs 76(%%edx)\n\t" +" fmuls 76(%%ebx)\n\t" +" fstps 112(%%ecx)\n\t" + +" flds 80(%%edx)\n\t" +" fadds 108(%%edx)\n\t" +" fstps 80(%%ecx)\n\t" + +" flds 84(%%edx)\n\t" +" fadds 104(%%edx)\n\t" +" fstps 84(%%ecx)\n\t" + +" flds 108(%%edx)\n\t" +" fsubs 80(%%edx)\n\t" +" fmuls 80(%%ebx)\n\t" +" fstps 108(%%ecx)\n\t" + +" flds 104(%%edx)\n\t" +" fsubs 84(%%edx)\n\t" +" fmuls 84(%%ebx)\n\t" +" fstps 104(%%ecx)\n\t" + +" flds 88(%%edx)\n\t" +" fadds 100(%%edx)\n\t" +" fstps 88(%%ecx)\n\t" + +" flds 92(%%edx)\n\t" +" fadds 96(%%edx)\n\t" +" fstps 92(%%ecx)\n\t" + +" flds 100(%%edx)\n\t" +" fsubs 88(%%edx)\n\t" +" fmuls 88(%%ebx)\n\t" +" fstps 100(%%ecx)\n\t" + +" flds 96(%%edx)\n\t" +" fsubs 92(%%edx)\n\t" +" fmuls 92(%%ebx)\n\t" +" fstps 96(%%ecx)\n\t" + +/* Phase 4*/ + +" flds (%%ecx)\n\t" +" fadds 28(%%ecx)\n\t" +" fstps (%%edx)\n\t" + +" flds (%%ecx)\n\t" +" fsubs 28(%%ecx)\n\t" +" fmuls 96(%%ebx)\n\t" +" fstps 28(%%edx)\n\t" + +" flds 4(%%ecx)\n\t" +" fadds 24(%%ecx)\n\t" +" fstps 4(%%edx)\n\t" + +" flds 4(%%ecx)\n\t" +" fsubs 24(%%ecx)\n\t" +" fmuls 100(%%ebx)\n\t" +" fstps 24(%%edx)\n\t" + +" flds 8(%%ecx)\n\t" +" fadds 20(%%ecx)\n\t" +" fstps 8(%%edx)\n\t" + +" flds 8(%%ecx)\n\t" +" fsubs 20(%%ecx)\n\t" +" fmuls 104(%%ebx)\n\t" +" fstps 20(%%edx)\n\t" + +" flds 12(%%ecx)\n\t" +" fadds 16(%%ecx)\n\t" +" fstps 12(%%edx)\n\t" + +" flds 12(%%ecx)\n\t" +" fsubs 16(%%ecx)\n\t" +" fmuls 108(%%ebx)\n\t" +" fstps 16(%%edx)\n\t" + +" flds 32(%%ecx)\n\t" +" fadds 60(%%ecx)\n\t" +" fstps 32(%%edx)\n\t" + +" flds 60(%%ecx)\n\t" +" fsubs 32(%%ecx)\n\t" +" fmuls 96(%%ebx)\n\t" +" fstps 60(%%edx)\n\t" + +" flds 36(%%ecx)\n\t" +" fadds 56(%%ecx)\n\t" +" fstps 36(%%edx)\n\t" + +" flds 56(%%ecx)\n\t" +" fsubs 36(%%ecx)\n\t" +" fmuls 100(%%ebx)\n\t" +" fstps 56(%%edx)\n\t" + +" flds 40(%%ecx)\n\t" +" fadds 52(%%ecx)\n\t" +" fstps 40(%%edx)\n\t" + +" flds 52(%%ecx)\n\t" +" fsubs 40(%%ecx)\n\t" +" fmuls 104(%%ebx)\n\t" +" fstps 52(%%edx)\n\t" + +" flds 44(%%ecx)\n\t" +" fadds 48(%%ecx)\n\t" +" fstps 44(%%edx)\n\t" + +" flds 48(%%ecx)\n\t" +" fsubs 44(%%ecx)\n\t" +" fmuls 108(%%ebx)\n\t" +" fstps 48(%%edx)\n\t" + +" flds 64(%%ecx)\n\t" +" fadds 92(%%ecx)\n\t" +" fstps 64(%%edx)\n\t" + +" flds 64(%%ecx)\n\t" +" fsubs 92(%%ecx)\n\t" +" fmuls 96(%%ebx)\n\t" +" fstps 92(%%edx)\n\t" + +" flds 68(%%ecx)\n\t" +" fadds 88(%%ecx)\n\t" +" fstps 68(%%edx)\n\t" + +" flds 68(%%ecx)\n\t" +" fsubs 88(%%ecx)\n\t" +" fmuls 100(%%ebx)\n\t" +" fstps 88(%%edx)\n\t" + +" flds 72(%%ecx)\n\t" +" fadds 84(%%ecx)\n\t" +" fstps 72(%%edx)\n\t" + +" flds 72(%%ecx)\n\t" +" fsubs 84(%%ecx)\n\t" +" fmuls 104(%%ebx)\n\t" +" fstps 84(%%edx)\n\t" + +" flds 76(%%ecx)\n\t" +" fadds 80(%%ecx)\n\t" +" fstps 76(%%edx)\n\t" + +" flds 76(%%ecx)\n\t" +" fsubs 80(%%ecx)\n\t" +" fmuls 108(%%ebx)\n\t" +" fstps 80(%%edx)\n\t" + +" flds 96(%%ecx)\n\t" +" fadds 124(%%ecx)\n\t" +" fstps 96(%%edx)\n\t" + +" flds 124(%%ecx)\n\t" +" fsubs 96(%%ecx)\n\t" +" fmuls 96(%%ebx)\n\t" +" fstps 124(%%edx)\n\t" + +" flds 100(%%ecx)\n\t" +" fadds 120(%%ecx)\n\t" +" fstps 100(%%edx)\n\t" + +" flds 120(%%ecx)\n\t" +" fsubs 100(%%ecx)\n\t" +" fmuls 100(%%ebx)\n\t" +" fstps 120(%%edx)\n\t" + +" flds 104(%%ecx)\n\t" +" fadds 116(%%ecx)\n\t" +" fstps 104(%%edx)\n\t" + +" flds 116(%%ecx)\n\t" +" fsubs 104(%%ecx)\n\t" +" fmuls 104(%%ebx)\n\t" +" fstps 116(%%edx)\n\t" + +" flds 108(%%ecx)\n\t" +" fadds 112(%%ecx)\n\t" +" fstps 108(%%edx)\n\t" + +" flds 112(%%ecx)\n\t" +" fsubs 108(%%ecx)\n\t" +" fmuls 108(%%ebx)\n\t" +" fstps 112(%%edx)\n\t" + +" flds (%%edx)\n\t" +" fadds 12(%%edx)\n\t" +" fstps (%%ecx)\n\t" + +" flds (%%edx)\n\t" +" fsubs 12(%%edx)\n\t" +" fmuls 112(%%ebx)\n\t" +" fstps 12(%%ecx)\n\t" + +" flds 4(%%edx)\n\t" +" fadds 8(%%edx)\n\t" +" fstps 4(%%ecx)\n\t" + +" flds 4(%%edx)\n\t" +" fsubs 8(%%edx)\n\t" +" fmuls 116(%%ebx)\n\t" +" fstps 8(%%ecx)\n\t" + +" flds 16(%%edx)\n\t" +" fadds 28(%%edx)\n\t" +" fstps 16(%%ecx)\n\t" + +" flds 28(%%edx)\n\t" +" fsubs 16(%%edx)\n\t" +" fmuls 112(%%ebx)\n\t" +" fstps 28(%%ecx)\n\t" + +" flds 20(%%edx)\n\t" +" fadds 24(%%edx)\n\t" +" fstps 20(%%ecx)\n\t" + +" flds 24(%%edx)\n\t" +" fsubs 20(%%edx)\n\t" +" fmuls 116(%%ebx)\n\t" +" fstps 24(%%ecx)\n\t" + +" flds 32(%%edx)\n\t" +" fadds 44(%%edx)\n\t" +" fstps 32(%%ecx)\n\t" + +" flds 32(%%edx)\n\t" +" fsubs 44(%%edx)\n\t" +" fmuls 112(%%ebx)\n\t" +" fstps 44(%%ecx)\n\t" + +" flds 36(%%edx)\n\t" +" fadds 40(%%edx)\n\t" +" fstps 36(%%ecx)\n\t" + +" flds 36(%%edx)\n\t" +" fsubs 40(%%edx)\n\t" +" fmuls 116(%%ebx)\n\t" +" fstps 40(%%ecx)\n\t" + +" flds 48(%%edx)\n\t" +" fadds 60(%%edx)\n\t" +" fstps 48(%%ecx)\n\t" + +" flds 60(%%edx)\n\t" +" fsubs 48(%%edx)\n\t" +" fmuls 112(%%ebx)\n\t" +" fstps 60(%%ecx)\n\t" + +" flds 52(%%edx)\n\t" +" fadds 56(%%edx)\n\t" +" fstps 52(%%ecx)\n\t" + +" flds 56(%%edx)\n\t" +" fsubs 52(%%edx)\n\t" +" fmuls 116(%%ebx)\n\t" +" fstps 56(%%ecx)\n\t" + +" flds 64(%%edx)\n\t" +" fadds 76(%%edx)\n\t" +" fstps 64(%%ecx)\n\t" + +" flds 64(%%edx)\n\t" +" fsubs 76(%%edx)\n\t" +" fmuls 112(%%ebx)\n\t" +" fstps 76(%%ecx)\n\t" + +" flds 68(%%edx)\n\t" +" fadds 72(%%edx)\n\t" +" fstps 68(%%ecx)\n\t" + +" flds 68(%%edx)\n\t" +" fsubs 72(%%edx)\n\t" +" fmuls 116(%%ebx)\n\t" +" fstps 72(%%ecx)\n\t" + +" flds 80(%%edx)\n\t" +" fadds 92(%%edx)\n\t" +" fstps 80(%%ecx)\n\t" + +" flds 92(%%edx)\n\t" +" fsubs 80(%%edx)\n\t" +" fmuls 112(%%ebx)\n\t" +" fstps 92(%%ecx)\n\t" + +" flds 84(%%edx)\n\t" +" fadds 88(%%edx)\n\t" +" fstps 84(%%ecx)\n\t" + +" flds 88(%%edx)\n\t" +" fsubs 84(%%edx)\n\t" +" fmuls 116(%%ebx)\n\t" +" fstps 88(%%ecx)\n\t" + +" flds 96(%%edx)\n\t" +" fadds 108(%%edx)\n\t" +" fstps 96(%%ecx)\n\t" + +" flds 96(%%edx)\n\t" +" fsubs 108(%%edx)\n\t" +" fmuls 112(%%ebx)\n\t" +" fstps 108(%%ecx)\n\t" + +" flds 100(%%edx)\n\t" +" fadds 104(%%edx)\n\t" +" fstps 100(%%ecx)\n\t" + +" flds 100(%%edx)\n\t" +" fsubs 104(%%edx)\n\t" +" fmuls 116(%%ebx)\n\t" +" fstps 104(%%ecx)\n\t" + +" flds 112(%%edx)\n\t" +" fadds 124(%%edx)\n\t" +" fstps 112(%%ecx)\n\t" + +" flds 124(%%edx)\n\t" +" fsubs 112(%%edx)\n\t" +" fmuls 112(%%ebx)\n\t" +" fstps 124(%%ecx)\n\t" + +" flds 116(%%edx)\n\t" +" fadds 120(%%edx)\n\t" +" fstps 116(%%ecx)\n\t" + +" flds 120(%%edx)\n\t" +" fsubs 116(%%edx)\n\t" +" fmuls 116(%%ebx)\n\t" +" fstps 120(%%ecx)\n\t" + +/* Phase 5*/ + +" flds 32(%%ecx)\n\t" +" fadds 36(%%ecx)\n\t" +" fstps 32(%%edx)\n\t" + +" flds 32(%%ecx)\n\t" +" fsubs 36(%%ecx)\n\t" +" fmuls 120(%%ebx)\n\t" +" fstps 36(%%edx)\n\t" + +" flds 44(%%ecx)\n\t" +" fsubs 40(%%ecx)\n\t" +" fmuls 120(%%ebx)\n\t" +" fsts 44(%%edx)\n\t" +" fadds 40(%%ecx)\n\t" +" fadds 44(%%ecx)\n\t" +" fstps 40(%%edx)\n\t" + +" flds 48(%%ecx)\n\t" +" fsubs 52(%%ecx)\n\t" +" fmuls 120(%%ebx)\n\t" + +" flds 60(%%ecx)\n\t" +" fsubs 56(%%ecx)\n\t" +" fmuls 120(%%ebx)\n\t" +" fld %%st(0)\n\t" +" fadds 56(%%ecx)\n\t" +" fadds 60(%%ecx)\n\t" +" fld %%st(0)\n\t" +" fadds 48(%%ecx)\n\t" +" fadds 52(%%ecx)\n\t" +" fstps 48(%%edx)\n\t" +" fadd %%st(2)\n\t" +" fstps 56(%%edx)\n\t" +" fsts 60(%%edx)\n\t" +" faddp %%st(1)\n\t" +" fstps 52(%%edx)\n\t" + +" flds 64(%%ecx)\n\t" +" fadds 68(%%ecx)\n\t" +" fstps 64(%%edx)\n\t" + +" flds 64(%%ecx)\n\t" +" fsubs 68(%%ecx)\n\t" +" fmuls 120(%%ebx)\n\t" +" fstps 68(%%edx)\n\t" + +" flds 76(%%ecx)\n\t" +" fsubs 72(%%ecx)\n\t" +" fmuls 120(%%ebx)\n\t" +" fsts 76(%%edx)\n\t" +" fadds 72(%%ecx)\n\t" +" fadds 76(%%ecx)\n\t" +" fstps 72(%%edx)\n\t" + +" flds 92(%%ecx)\n\t" +" fsubs 88(%%ecx)\n\t" +" fmuls 120(%%ebx)\n\t" +" fsts 92(%%edx)\n\t" +" fadds 92(%%ecx)\n\t" +" fadds 88(%%ecx)\n\t" +" fld %%st(0)\n\t" +" fadds 80(%%ecx)\n\t" +" fadds 84(%%ecx)\n\t" +" fstps 80(%%edx)\n\t" + +" flds 80(%%ecx)\n\t" +" fsubs 84(%%ecx)\n\t" +" fmuls 120(%%ebx)\n\t" +" fadd %%st(0), %%st(1)\n\t" +" fadds 92(%%edx)\n\t" +" fstps 84(%%edx)\n\t" +" fstps 88(%%edx)\n\t" + +" flds 96(%%ecx)\n\t" +" fadds 100(%%ecx)\n\t" +" fstps 96(%%edx)\n\t" + +" flds 96(%%ecx)\n\t" +" fsubs 100(%%ecx)\n\t" +" fmuls 120(%%ebx)\n\t" +" fstps 100(%%edx)\n\t" + +" flds 108(%%ecx)\n\t" +" fsubs 104(%%ecx)\n\t" +" fmuls 120(%%ebx)\n\t" +" fsts 108(%%edx)\n\t" +" fadds 104(%%ecx)\n\t" +" fadds 108(%%ecx)\n\t" +" fstps 104(%%edx)\n\t" + +" flds 124(%%ecx)\n\t" +" fsubs 120(%%ecx)\n\t" +" fmuls 120(%%ebx)\n\t" +" fsts 124(%%edx)\n\t" +" fadds 120(%%ecx)\n\t" +" fadds 124(%%ecx)\n\t" +" fld %%st(0)\n\t" +" fadds 112(%%ecx)\n\t" +" fadds 116(%%ecx)\n\t" +" fstps 112(%%edx)\n\t" + +" flds 112(%%ecx)\n\t" +" fsubs 116(%%ecx)\n\t" +" fmuls 120(%%ebx)\n\t" +" fadd %%st(0),%%st(1)\n\t" +" fadds 124(%%edx)\n\t" +" fstps 116(%%edx)\n\t" +" fstps 120(%%edx)\n\t" +" jnz .L01\n\t" + +/* Phase 6*/ + +" flds (%%ecx)\n\t" +" fadds 4(%%ecx)\n\t" +" fstps 1024(%%esi)\n\t" + +" flds (%%ecx)\n\t" +" fsubs 4(%%ecx)\n\t" +" fmuls 120(%%ebx)\n\t" +" fsts (%%esi)\n\t" +" fstps (%%edi)\n\t" + +" flds 12(%%ecx)\n\t" +" fsubs 8(%%ecx)\n\t" +" fmuls 120(%%ebx)\n\t" +" fsts 512(%%edi)\n\t" +" fadds 12(%%ecx)\n\t" +" fadds 8(%%ecx)\n\t" +" fstps 512(%%esi)\n\t" + +" flds 16(%%ecx)\n\t" +" fsubs 20(%%ecx)\n\t" +" fmuls 120(%%ebx)\n\t" + +" flds 28(%%ecx)\n\t" +" fsubs 24(%%ecx)\n\t" +" fmuls 120(%%ebx)\n\t" +" fsts 768(%%edi)\n\t" +" fld %%st(0)\n\t" +" fadds 24(%%ecx)\n\t" +" fadds 28(%%ecx)\n\t" +" fld %%st(0)\n\t" +" fadds 16(%%ecx)\n\t" +" fadds 20(%%ecx)\n\t" +" fstps 768(%%esi)\n\t" +" fadd %%st(2)\n\t" +" fstps 256(%%esi)\n\t" +" faddp %%st(1)\n\t" +" fstps 256(%%edi)\n\t" + +/* Phase 7*/ + +" flds 32(%%edx)\n\t" +" fadds 48(%%edx)\n\t" +" fstps 896(%%esi)\n\t" + +" flds 48(%%edx)\n\t" +" fadds 40(%%edx)\n\t" +" fstps 640(%%esi)\n\t" + +" flds 40(%%edx)\n\t" +" fadds 56(%%edx)\n\t" +" fstps 384(%%esi)\n\t" + +" flds 56(%%edx)\n\t" +" fadds 36(%%edx)\n\t" +" fstps 128(%%esi)\n\t" + +" flds 36(%%edx)\n\t" +" fadds 52(%%edx)\n\t" +" fstps 128(%%edi)\n\t" + +" flds 52(%%edx)\n\t" +" fadds 44(%%edx)\n\t" +" fstps 384(%%edi)\n\t" + +" flds 60(%%edx)\n\t" +" fsts 896(%%edi)\n\t" +" fadds 44(%%edx)\n\t" +" fstps 640(%%edi)\n\t" + +" flds 96(%%edx)\n\t" +" fadds 112(%%edx)\n\t" +" fld %%st(0)\n\t" +" fadds 64(%%edx)\n\t" +" fstps 960(%%esi)\n\t" +" fadds 80(%%edx)\n\t" +" fstps 832(%%esi)\n\t" + +" flds 112(%%edx)\n\t" +" fadds 104(%%edx)\n\t" +" fld %%st(0)\n\t" +" fadds 80(%%edx)\n\t" +" fstps 704(%%esi)\n\t" +" fadds 72(%%edx)\n\t" +" fstps 576(%%esi)\n\t" + +" flds 104(%%edx)\n\t" +" fadds 120(%%edx)\n\t" +" fld %%st(0)\n\t" +" fadds 72(%%edx)\n\t" +" fstps 448(%%esi)\n\t" +" fadds 88(%%edx)\n\t" +" fstps 320(%%esi)\n\t" + +" flds 120(%%edx)\n\t" +" fadds 100(%%edx)\n\t" +" fld %%st(0)\n\t" +" fadds 88(%%edx)\n\t" +" fstps 192(%%esi)\n\t" +" fadds 68(%%edx)\n\t" +" fstps 64(%%esi)\n\t" + +" flds 100(%%edx)\n\t" +" fadds 116(%%edx)\n\t" +" fld %%st(0)\n\t" +" fadds 68(%%edx)\n\t" +" fstps 64(%%edi)\n\t" +" fadds 84(%%edx)\n\t" +" fstps 192(%%edi)\n\t" + +" flds 116(%%edx)\n\t" +" fadds 108(%%edx)\n\t" +" fld %%st(0)\n\t" +" fadds 84(%%edx)\n\t" +" fstps 320(%%edi)\n\t" +" fadds 76(%%edx)\n\t" +" fstps 448(%%edi)\n\t" + +" flds 108(%%edx)\n\t" +" fadds 124(%%edx)\n\t" +" fld %%st(0)\n\t" +" fadds 76(%%edx)\n\t" +" fstps 576(%%edi)\n\t" +" fadds 92(%%edx)\n\t" +" fstps 704(%%edi)\n\t" + +" flds 124(%%edx)\n\t" +" fsts 960(%%edi)\n\t" +" fadds 92(%%edx)\n\t" +" fstps 832(%%edi)\n\t" +" jmp .L_bye\n\t" +".L01:\n\t" +/* Phase 8*/ + +" flds (%%ecx)\n\t" +" fadds 4(%%ecx)\n\t" +" fistp 512(%%esi)\n\t" + +" flds (%%ecx)\n\t" +" fsubs 4(%%ecx)\n\t" +" fmuls 120(%%ebx)\n\t" + +" fistp (%%esi)\n\t" + + +" flds 12(%%ecx)\n\t" +" fsubs 8(%%ecx)\n\t" +" fmuls 120(%%ebx)\n\t" +" fist 256(%%edi)\n\t" +" fadds 12(%%ecx)\n\t" +" fadds 8(%%ecx)\n\t" +" fistp 256(%%esi)\n\t" + +" flds 16(%%ecx)\n\t" +" fsubs 20(%%ecx)\n\t" +" fmuls 120(%%ebx)\n\t" + +" flds 28(%%ecx)\n\t" +" fsubs 24(%%ecx)\n\t" +" fmuls 120(%%ebx)\n\t" +" fist 384(%%edi)\n\t" +" fld %%st(0)\n\t" +" fadds 24(%%ecx)\n\t" +" fadds 28(%%ecx)\n\t" +" fld %%st(0)\n\t" +" fadds 16(%%ecx)\n\t" +" fadds 20(%%ecx)\n\t" +" fistp 384(%%esi)\n\t" +" fadd %%st(2)\n\t" +" fistp 128(%%esi)\n\t" +" faddp %%st(1)\n\t" +" fistp 128(%%edi)\n\t" + +/* Phase 9*/ + +" flds 32(%%edx)\n\t" +" fadds 48(%%edx)\n\t" +" fistp 448(%%esi)\n\t" + +" flds 48(%%edx)\n\t" +" fadds 40(%%edx)\n\t" +" fistp 320(%%esi)\n\t" + +" flds 40(%%edx)\n\t" +" fadds 56(%%edx)\n\t" +" fistp 192(%%esi)\n\t" + +" flds 56(%%edx)\n\t" +" fadds 36(%%edx)\n\t" +" fistp 64(%%esi)\n\t" + +" flds 36(%%edx)\n\t" +" fadds 52(%%edx)\n\t" +" fistp 64(%%edi)\n\t" + +" flds 52(%%edx)\n\t" +" fadds 44(%%edx)\n\t" +" fistp 192(%%edi)\n\t" + +" flds 60(%%edx)\n\t" +" fist 448(%%edi)\n\t" +" fadds 44(%%edx)\n\t" +" fistp 320(%%edi)\n\t" + +" flds 96(%%edx)\n\t" +" fadds 112(%%edx)\n\t" +" fld %%st(0)\n\t" +" fadds 64(%%edx)\n\t" +" fistp 480(%%esi)\n\t" +" fadds 80(%%edx)\n\t" +" fistp 416(%%esi)\n\t" + +" flds 112(%%edx)\n\t" +" fadds 104(%%edx)\n\t" +" fld %%st(0)\n\t" +" fadds 80(%%edx)\n\t" +" fistp 352(%%esi)\n\t" +" fadds 72(%%edx)\n\t" +" fistp 288(%%esi)\n\t" + +" flds 104(%%edx)\n\t" +" fadds 120(%%edx)\n\t" +" fld %%st(0)\n\t" +" fadds 72(%%edx)\n\t" +" fistp 224(%%esi)\n\t" +" fadds 88(%%edx)\n\t" +" fistp 160(%%esi)\n\t" + +" flds 120(%%edx)\n\t" +" fadds 100(%%edx)\n\t" +" fld %%st(0)\n\t" +" fadds 88(%%edx)\n\t" +" fistp 96(%%esi)\n\t" +" fadds 68(%%edx)\n\t" +" fistp 32(%%esi)\n\t" + +" flds 100(%%edx)\n\t" +" fadds 116(%%edx)\n\t" +" fld %%st(0)\n\t" +" fadds 68(%%edx)\n\t" +" fistp 32(%%edi)\n\t" +" fadds 84(%%edx)\n\t" +" fistp 96(%%edi)\n\t" + +" flds 116(%%edx)\n\t" +" fadds 108(%%edx)\n\t" +" fld %%st(0)\n\t" +" fadds 84(%%edx)\n\t" +" fistp 160(%%edi)\n\t" +" fadds 76(%%edx)\n\t" +" fistp 224(%%edi)\n\t" + +" flds 108(%%edx)\n\t" +" fadds 124(%%edx)\n\t" +" fld %%st(0)\n\t" +" fadds 76(%%edx)\n\t" +" fistp 288(%%edi)\n\t" +" fadds 92(%%edx)\n\t" +" fistp 352(%%edi)\n\t" + +" flds 124(%%edx)\n\t" +" fist 480(%%edi)\n\t" +" fadds 92(%%edx)\n\t" +" fistp 416(%%edi)\n\t" +" movsw\n\t" +".L_bye:" + : + :"m"(a),"m"(b),"m"(c),"m"(tmp[0]) + :"memory","%eax","%ebx","%ecx","%edx","%esi","%edi"); +}
--- a/mp3lib/dct64_sse.c Wed Dec 12 08:45:05 2007 +0000 +++ b/mp3lib/dct64_sse.c Wed Dec 12 08:50:54 2007 +0000 @@ -2,7 +2,7 @@ * Discrete Cosine Tansform (DCT) for SSE * Copyright (c) 2006 Zuxy MENG <zuxy.meng@gmail.com> * based upon code from mp3lib/dct64.c, mp3lib/dct64_altivec.c - * and mp3lib/dct64_MMX.c + * and mp3lib/dct64_mmx.c */ #include <libavutil/mem.h>
--- a/mp3lib/decode_MMX.c Wed Dec 12 08:45:05 2007 +0000 +++ /dev/null Thu Jan 01 00:00:00 1970 +0000 @@ -1,371 +0,0 @@ -/* - * this code comes under GPL - * This code was taken from http://www.mpg123.org - * See ChangeLog of mpg123-0.59s-pre.1 for detail - * Applied to mplayer by Nick Kurshev <nickols_k@mail.ru> - * - * Local ChangeLog: - * - Partial loops unrolling and removing MOVW insn from loops -*/ -#include "config.h" -#include "mangle.h" -#define real float /* ugly - but only way */ - -extern void (*dct64_MMX_func)(short*, short*, real*); -static unsigned long long attribute_used __attribute__((aligned(8))) null_one = 0x0000ffff0000ffffULL; -static unsigned long long attribute_used __attribute__((aligned(8))) one_null = 0xffff0000ffff0000ULL; -unsigned int __attribute__((aligned(16))) costab_mmx[] = -{ - 1056974725, - 1057056395, - 1057223771, - 1057485416, - 1057855544, - 1058356026, - 1059019886, - 1059897405, - 1061067246, - 1062657950, - 1064892987, - 1066774581, - 1069414683, - 1073984175, - 1079645762, - 1092815430, - 1057005197, - 1057342072, - 1058087743, - 1059427869, - 1061799040, - 1065862217, - 1071413542, - 1084439708, - 1057128951, - 1058664893, - 1063675095, - 1076102863, - 1057655764, - 1067924853, - 1060439283, -}; - -/** - This array of magic numbers were calculated by the pure function - make_decode_tables_MMX(32768), which had been implemented in (deleted since - r23383) tabinit_MMX.c. - */ -static short __attribute__((aligned(8))) mp3lib_decwins[] = -{ - 0, 7, 54, 114, 510, 1288, 1644, 9372, - 18760, -9373, 1644, -1289, 510, -115, 54, -8, - 0, 7, 54, 114, 510, 1288, 1644, 9372, - 18760, -9373, 1644, -1289, 510, -115, 54, -8, - 0, 7, 55, 129, 500, 1379, 1490, 9834, - 18748, -8910, 1784, -1197, 516, -101, 52, -7, - 0, 7, 55, 129, 500, 1379, 1490, 9834, - 18748, -8910, 1784, -1197, 516, -101, 52, -7, - 0, 8, 56, 145, 488, 1469, 1322, 10294, - 18714, -8448, 1910, -1107, 520, -87, 51, -6, - 0, 8, 56, 145, 488, 1469, 1322, 10294, - 18714, -8448, 1910, -1107, 520, -87, 51, -6, - 0, 9, 57, 161, 474, 1559, 1141, 10751, - 18658, -7987, 2023, -1016, 522, -74, 49, -6, - 0, 9, 57, 161, 474, 1559, 1141, 10751, - 18658, -7987, 2023, -1016, 522, -74, 49, -6, - 0, 10, 57, 177, 456, 1647, 944, 11205, - 18579, -7528, 2123, -927, 522, -61, 48, -5, - 0, 10, 57, 177, 456, 1647, 944, 11205, - 18579, -7528, 2123, -927, 522, -61, 48, -5, - 0, 11, 57, 194, 435, 1733, 734, 11654, - 18477, -7073, 2210, -838, 519, -50, 46, -5, - 0, 11, 57, 194, 435, 1733, 734, 11654, - 18477, -7073, 2210, -838, 519, -50, 46, -5, - 0, 12, 57, 212, 411, 1817, 510, 12097, - 18354, -6621, 2285, -751, 515, -39, 44, -4, - 0, 12, 57, 212, 411, 1817, 510, 12097, - 18354, -6621, 2285, -751, 515, -39, 44, -4, - 0, 13, 57, 229, 384, 1899, 271, 12534, - 18209, -6174, 2348, -666, 508, -28, 43, -4, - 0, 13, 57, 229, 384, 1899, 271, 12534, - 18209, -6174, 2348, -666, 508, -28, 43, -4, - 0, 14, 56, 247, 354, 1977, 18, 12963, - 18043, -5733, 2398, -583, 501, -18, 41, -4, - 0, 14, 56, 247, 354, 1977, 18, 12963, - 18043, -5733, 2398, -583, 501, -18, 41, -4, - 0, 15, 56, 266, 320, 2052, -249, 13383, - 17855, -5298, 2438, -502, 491, -9, 39, -3, - 0, 15, 56, 266, 320, 2052, -249, 13383, - 17855, -5298, 2438, -502, 491, -9, 39, -3, - 0, 17, 54, 284, 283, 2122, -530, 13794, - 17648, -4870, 2466, -423, 480, -1, 37, -3, - 0, 17, 54, 284, 283, 2122, -530, 13794, - 17648, -4870, 2466, -423, 480, -1, 37, -3, - 0, 18, 52, 302, 243, 2188, -825, 14194, - 17420, -4450, 2484, -347, 468, 7, 35, -3, - 0, 18, 52, 302, 243, 2188, -825, 14194, - 17420, -4450, 2484, -347, 468, 7, 35, -3, - 0, 19, 50, 320, 199, 2249, -1133, 14583, - 17173, -4039, 2492, -274, 455, 14, 33, -2, - 0, 19, 50, 320, 199, 2249, -1133, 14583, - 17173, -4039, 2492, -274, 455, 14, 33, -2, - -1, 21, 48, 339, 152, 2304, -1454, 14959, - 16908, -3637, 2490, -204, 440, 20, 32, -2, - -1, 21, 48, 339, 152, 2304, -1454, 14959, - 16908, -3637, 2490, -204, 440, 20, 32, -2, - -1, 22, 45, 357, 101, 2354, -1788, 15322, - 16624, -3245, 2479, -137, 425, 26, 30, -2, - -1, 22, 45, 357, 101, 2354, -1788, 15322, - 16624, -3245, 2479, -137, 425, 26, 30, -2, - -1, 24, 41, 374, 47, 2396, -2135, 15671, - 16323, -2864, 2460, -72, 409, 31, 28, -2, - -1, 24, 41, 374, 47, 2396, -2135, 15671, - 16323, -2864, 2460, -72, 409, 31, 28, -2, - -1, 26, 37, 391, -11, 2431, -2493, 16004, - 16005, -2494, 2432, -12, 392, 36, 26, -2, - -1, 26, 37, 391, -11, 2431, -2493, 16004, - 16005, -2494, 2432, -12, 392, 36, 26, -2, - -2, -28, 31, -409, -72, -2460, -2864, -16323, - 15671, 2135, 2396, -47, 374, -41, 24, 1, - -2, -28, 31, -409, -72, -2460, -2864, -16323, - 15671, 2135, 2396, -47, 374, -41, 24, 1, - -2, -30, 26, -425, -137, -2479, -3245, -16624, - 15322, 1788, 2354, -101, 357, -45, 22, 1, - -2, -30, 26, -425, -137, -2479, -3245, -16624, - 15322, 1788, 2354, -101, 357, -45, 22, 1, - -2, -32, 20, -440, -204, -2490, -3637, -16908, - 14959, 1454, 2304, -152, 339, -48, 21, 1, - -2, -32, 20, -440, -204, -2490, -3637, -16908, - 14959, 1454, 2304, -152, 339, -48, 21, 1, - -2, -33, 14, -455, -274, -2492, -4039, -17173, - 14583, 1133, 2249, -199, 320, -50, 19, 0, - -2, -33, 14, -455, -274, -2492, -4039, -17173, - 14583, 1133, 2249, -199, 320, -50, 19, 0, - -3, -35, 7, -468, -347, -2484, -4450, -17420, - 14194, 825, 2188, -243, 302, -52, 18, 0, - -3, -35, 7, -468, -347, -2484, -4450, -17420, - 14194, 825, 2188, -243, 302, -52, 18, 0, - -3, -37, -1, -480, -423, -2466, -4870, -17648, - 13794, 530, 2122, -283, 284, -54, 17, 0, - -3, -37, -1, -480, -423, -2466, -4870, -17648, - 13794, 530, 2122, -283, 284, -54, 17, 0, - -3, -39, -9, -491, -502, -2438, -5298, -17855, - 13383, 249, 2052, -320, 266, -56, 15, 0, - -3, -39, -9, -491, -502, -2438, -5298, -17855, - 13383, 249, 2052, -320, 266, -56, 15, 0, - -4, -41, -18, -501, -583, -2398, -5733, -18043, - 12963, -18, 1977, -354, 247, -56, 14, 0, - -4, -41, -18, -501, -583, -2398, -5733, -18043, - 12963, -18, 1977, -354, 247, -56, 14, 0, - -4, -43, -28, -508, -666, -2348, -6174, -18209, - 12534, -271, 1899, -384, 229, -57, 13, 0, - -4, -43, -28, -508, -666, -2348, -6174, -18209, - 12534, -271, 1899, -384, 229, -57, 13, 0, - -4, -44, -39, -515, -751, -2285, -6621, -18354, - 12097, -510, 1817, -411, 212, -57, 12, 0, - -4, -44, -39, -515, -751, -2285, -6621, -18354, - 12097, -510, 1817, -411, 212, -57, 12, 0, - -5, -46, -50, -519, -838, -2210, -7073, -18477, - 11654, -734, 1733, -435, 194, -57, 11, 0, - -5, -46, -50, -519, -838, -2210, -7073, -18477, - 11654, -734, 1733, -435, 194, -57, 11, 0, - -5, -48, -61, -522, -927, -2123, -7528, -18579, - 11205, -944, 1647, -456, 177, -57, 10, 0, - -5, -48, -61, -522, -927, -2123, -7528, -18579, - 11205, -944, 1647, -456, 177, -57, 10, 0, - -6, -49, -74, -522, -1016, -2023, -7987, -18658, - 10751, -1141, 1559, -474, 161, -57, 9, 0, - -6, -49, -74, -522, -1016, -2023, -7987, -18658, - 10751, -1141, 1559, -474, 161, -57, 9, 0, - -6, -51, -87, -520, -1107, -1910, -8448, -18714, - 10294, -1322, 1469, -488, 145, -56, 8, 0, - -6, -51, -87, -520, -1107, -1910, -8448, -18714, - 10294, -1322, 1469, -488, 145, -56, 8, 0, - -7, -52, -101, -516, -1197, -1784, -8910, -18748, - 9834, -1490, 1379, -500, 129, -55, 7, 0, - -7, -52, -101, -516, -1197, -1784, -8910, -18748, - 9834, -1490, 1379, -500, 129, -55, 7, 0, -}; - -int synth_1to1_MMX(real *bandPtr, int channel, short *samples) -{ - static short buffs[2][2][0x110] __attribute__((aligned(8))); - static int bo = 1; - short *b0, (*buf)[0x110], *a, *b; - short* window; - int bo1, i = 8; - - if (channel == 0) { - bo = (bo - 1) & 0xf; - buf = buffs[1]; - } else { - samples++; - buf = buffs[0]; - } - - if (bo & 1) { - b0 = buf[1]; - bo1 = bo + 1; - a = buf[0] + bo; - b = buf[1] + ((bo + 1) & 0xf); - } else { - b0 = buf[0]; - bo1 = bo; - b = buf[0] + bo; - a = buf[1] + ((bo + 1) & 0xf); - } - - dct64_MMX_func(a, b, bandPtr); - window = mp3lib_decwins + 16 - bo1; - //printf("DEBUG: channel %d, bo %d, off %d\n", channel, bo, 16 - bo1); -__asm __volatile( -ASMALIGN(4) -".L03:\n\t" - "movq (%1),%%mm0\n\t" - "movq 64(%1),%%mm4\n\t" - "pmaddwd (%2),%%mm0\n\t" - "pmaddwd 32(%2),%%mm4\n\t" - "movq 8(%1),%%mm1\n\t" - "movq 72(%1),%%mm5\n\t" - "pmaddwd 8(%2),%%mm1\n\t" - "pmaddwd 40(%2),%%mm5\n\t" - "movq 16(%1),%%mm2\n\t" - "movq 80(%1),%%mm6\n\t" - "pmaddwd 16(%2),%%mm2\n\t" - "pmaddwd 48(%2),%%mm6\n\t" - "movq 24(%1),%%mm3\n\t" - "movq 88(%1),%%mm7\n\t" - "pmaddwd 24(%2),%%mm3\n\t" - "pmaddwd 56(%2),%%mm7\n\t" - "paddd %%mm1,%%mm0\n\t" - "paddd %%mm5,%%mm4\n\t" - "paddd %%mm2,%%mm0\n\t" - "paddd %%mm6,%%mm4\n\t" - "paddd %%mm3,%%mm0\n\t" - "paddd %%mm7,%%mm4\n\t" - "movq %%mm0,%%mm1\n\t" - "movq %%mm4,%%mm5\n\t" - "psrlq $32,%%mm1\n\t" - "psrlq $32,%%mm5\n\t" - "paddd %%mm1,%%mm0\n\t" - "paddd %%mm5,%%mm4\n\t" - "psrad $13,%%mm0\n\t" - "psrad $13,%%mm4\n\t" - "packssdw %%mm0,%%mm0\n\t" - "packssdw %%mm4,%%mm4\n\t" - - "movq (%3), %%mm1\n\t" - "punpckldq %%mm4, %%mm0\n\t" - "pand "MANGLE(one_null)", %%mm1\n\t" - "pand "MANGLE(null_one)", %%mm0\n\t" - "por %%mm0, %%mm1\n\t" - "movq %%mm1,(%3)\n\t" - - "add $64,%2\n\t" - "add $128,%1\n\t" - "add $8,%3\n\t" - - "decl %0\n\t" - "jnz .L03\n\t" - - "movq (%1),%%mm0\n\t" - "pmaddwd (%2),%%mm0\n\t" - "movq 8(%1),%%mm1\n\t" - "pmaddwd 8(%2),%%mm1\n\t" - "movq 16(%1),%%mm2\n\t" - "pmaddwd 16(%2),%%mm2\n\t" - "movq 24(%1),%%mm3\n\t" - "pmaddwd 24(%2),%%mm3\n\t" - "paddd %%mm1,%%mm0\n\t" - "paddd %%mm2,%%mm0\n\t" - "paddd %%mm3,%%mm0\n\t" - "movq %%mm0,%%mm1\n\t" - "psrlq $32,%%mm1\n\t" - "paddd %%mm1,%%mm0\n\t" - "psrad $13,%%mm0\n\t" - "packssdw %%mm0,%%mm0\n\t" - "movd %%mm0,%%eax\n\t" - "movw %%ax, (%3)\n\t" - "sub $32,%2\n\t" - "add $64,%1\n\t" - "add $4,%3\n\t" - - "movl $7,%0\n\t" -ASMALIGN(4) -".L04:\n\t" - "movq (%1),%%mm0\n\t" - "movq 64(%1),%%mm4\n\t" - "pmaddwd (%2),%%mm0\n\t" - "pmaddwd -32(%2),%%mm4\n\t" - "movq 8(%1),%%mm1\n\t" - "movq 72(%1),%%mm5\n\t" - "pmaddwd 8(%2),%%mm1\n\t" - "pmaddwd -24(%2),%%mm5\n\t" - "movq 16(%1),%%mm2\n\t" - "movq 80(%1),%%mm6\n\t" - "pmaddwd 16(%2),%%mm2\n\t" - "pmaddwd -16(%2),%%mm6\n\t" - "movq 24(%1),%%mm3\n\t" - "movq 88(%1),%%mm7\n\t" - "pmaddwd 24(%2),%%mm3\n\t" - "pmaddwd -8(%2),%%mm7\n\t" - "paddd %%mm1,%%mm0\n\t" - "paddd %%mm5,%%mm4\n\t" - "paddd %%mm2,%%mm0\n\t" - "paddd %%mm6,%%mm4\n\t" - "paddd %%mm3,%%mm0\n\t" - "paddd %%mm7,%%mm4\n\t" - "movq %%mm0,%%mm1\n\t" - "movq %%mm4,%%mm5\n\t" - "psrlq $32,%%mm1\n\t" - "psrlq $32,%%mm5\n\t" - "paddd %%mm0,%%mm1\n\t" - "paddd %%mm4,%%mm5\n\t" - "psrad $13,%%mm1\n\t" - "psrad $13,%%mm5\n\t" - "packssdw %%mm1,%%mm1\n\t" - "packssdw %%mm5,%%mm5\n\t" - "psubd %%mm0,%%mm0\n\t" - "psubd %%mm4,%%mm4\n\t" - "psubsw %%mm1,%%mm0\n\t" - "psubsw %%mm5,%%mm4\n\t" - - "movq (%3), %%mm1\n\t" - "punpckldq %%mm4, %%mm0\n\t" - "pand "MANGLE(one_null)", %%mm1\n\t" - "pand "MANGLE(null_one)", %%mm0\n\t" - "por %%mm0, %%mm1\n\t" - "movq %%mm1,(%3)\n\t" - - "sub $64,%2\n\t" - "add $128,%1\n\t" - "add $8,%3\n\t" - "decl %0\n\t" - "jnz .L04\n\t" - - "movq (%1),%%mm0\n\t" - "pmaddwd (%2),%%mm0\n\t" - "movq 8(%1),%%mm1\n\t" - "pmaddwd 8(%2),%%mm1\n\t" - "movq 16(%1),%%mm2\n\t" - "pmaddwd 16(%2),%%mm2\n\t" - "movq 24(%1),%%mm3\n\t" - "pmaddwd 24(%2),%%mm3\n\t" - "paddd %%mm1,%%mm0\n\t" - "paddd %%mm2,%%mm0\n\t" - "paddd %%mm3,%%mm0\n\t" - "movq %%mm0,%%mm1\n\t" - "psrlq $32,%%mm1\n\t" - "paddd %%mm0,%%mm1\n\t" - "psrad $13,%%mm1\n\t" - "packssdw %%mm1,%%mm1\n\t" - "psubd %%mm0,%%mm0\n\t" - "psubsw %%mm1,%%mm0\n\t" - "movd %%mm0,%%eax\n\t" - "movw %%ax,(%3)\n\t" - "emms\n\t" - :"+r"(i), "+r"(window), "+r"(b0), "+r"(samples) - : - :"memory", "%eax"); - return 0; -} -
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/mp3lib/decode_mmx.c Wed Dec 12 08:50:54 2007 +0000 @@ -0,0 +1,371 @@ +/* + * this code comes under GPL + * This code was taken from http://www.mpg123.org + * See ChangeLog of mpg123-0.59s-pre.1 for detail + * Applied to mplayer by Nick Kurshev <nickols_k@mail.ru> + * + * Local ChangeLog: + * - Partial loops unrolling and removing MOVW insn from loops +*/ +#include "config.h" +#include "mangle.h" +#define real float /* ugly - but only way */ + +extern void (*dct64_MMX_func)(short*, short*, real*); +static unsigned long long attribute_used __attribute__((aligned(8))) null_one = 0x0000ffff0000ffffULL; +static unsigned long long attribute_used __attribute__((aligned(8))) one_null = 0xffff0000ffff0000ULL; +unsigned int __attribute__((aligned(16))) costab_mmx[] = +{ + 1056974725, + 1057056395, + 1057223771, + 1057485416, + 1057855544, + 1058356026, + 1059019886, + 1059897405, + 1061067246, + 1062657950, + 1064892987, + 1066774581, + 1069414683, + 1073984175, + 1079645762, + 1092815430, + 1057005197, + 1057342072, + 1058087743, + 1059427869, + 1061799040, + 1065862217, + 1071413542, + 1084439708, + 1057128951, + 1058664893, + 1063675095, + 1076102863, + 1057655764, + 1067924853, + 1060439283, +}; + +/** + This array of magic numbers were calculated by the pure function + make_decode_tables_MMX(32768), which had been implemented in (deleted since + r23383) tabinit_MMX.c. + */ +static short __attribute__((aligned(8))) mp3lib_decwins[] = +{ + 0, 7, 54, 114, 510, 1288, 1644, 9372, + 18760, -9373, 1644, -1289, 510, -115, 54, -8, + 0, 7, 54, 114, 510, 1288, 1644, 9372, + 18760, -9373, 1644, -1289, 510, -115, 54, -8, + 0, 7, 55, 129, 500, 1379, 1490, 9834, + 18748, -8910, 1784, -1197, 516, -101, 52, -7, + 0, 7, 55, 129, 500, 1379, 1490, 9834, + 18748, -8910, 1784, -1197, 516, -101, 52, -7, + 0, 8, 56, 145, 488, 1469, 1322, 10294, + 18714, -8448, 1910, -1107, 520, -87, 51, -6, + 0, 8, 56, 145, 488, 1469, 1322, 10294, + 18714, -8448, 1910, -1107, 520, -87, 51, -6, + 0, 9, 57, 161, 474, 1559, 1141, 10751, + 18658, -7987, 2023, -1016, 522, -74, 49, -6, + 0, 9, 57, 161, 474, 1559, 1141, 10751, + 18658, -7987, 2023, -1016, 522, -74, 49, -6, + 0, 10, 57, 177, 456, 1647, 944, 11205, + 18579, -7528, 2123, -927, 522, -61, 48, -5, + 0, 10, 57, 177, 456, 1647, 944, 11205, + 18579, -7528, 2123, -927, 522, -61, 48, -5, + 0, 11, 57, 194, 435, 1733, 734, 11654, + 18477, -7073, 2210, -838, 519, -50, 46, -5, + 0, 11, 57, 194, 435, 1733, 734, 11654, + 18477, -7073, 2210, -838, 519, -50, 46, -5, + 0, 12, 57, 212, 411, 1817, 510, 12097, + 18354, -6621, 2285, -751, 515, -39, 44, -4, + 0, 12, 57, 212, 411, 1817, 510, 12097, + 18354, -6621, 2285, -751, 515, -39, 44, -4, + 0, 13, 57, 229, 384, 1899, 271, 12534, + 18209, -6174, 2348, -666, 508, -28, 43, -4, + 0, 13, 57, 229, 384, 1899, 271, 12534, + 18209, -6174, 2348, -666, 508, -28, 43, -4, + 0, 14, 56, 247, 354, 1977, 18, 12963, + 18043, -5733, 2398, -583, 501, -18, 41, -4, + 0, 14, 56, 247, 354, 1977, 18, 12963, + 18043, -5733, 2398, -583, 501, -18, 41, -4, + 0, 15, 56, 266, 320, 2052, -249, 13383, + 17855, -5298, 2438, -502, 491, -9, 39, -3, + 0, 15, 56, 266, 320, 2052, -249, 13383, + 17855, -5298, 2438, -502, 491, -9, 39, -3, + 0, 17, 54, 284, 283, 2122, -530, 13794, + 17648, -4870, 2466, -423, 480, -1, 37, -3, + 0, 17, 54, 284, 283, 2122, -530, 13794, + 17648, -4870, 2466, -423, 480, -1, 37, -3, + 0, 18, 52, 302, 243, 2188, -825, 14194, + 17420, -4450, 2484, -347, 468, 7, 35, -3, + 0, 18, 52, 302, 243, 2188, -825, 14194, + 17420, -4450, 2484, -347, 468, 7, 35, -3, + 0, 19, 50, 320, 199, 2249, -1133, 14583, + 17173, -4039, 2492, -274, 455, 14, 33, -2, + 0, 19, 50, 320, 199, 2249, -1133, 14583, + 17173, -4039, 2492, -274, 455, 14, 33, -2, + -1, 21, 48, 339, 152, 2304, -1454, 14959, + 16908, -3637, 2490, -204, 440, 20, 32, -2, + -1, 21, 48, 339, 152, 2304, -1454, 14959, + 16908, -3637, 2490, -204, 440, 20, 32, -2, + -1, 22, 45, 357, 101, 2354, -1788, 15322, + 16624, -3245, 2479, -137, 425, 26, 30, -2, + -1, 22, 45, 357, 101, 2354, -1788, 15322, + 16624, -3245, 2479, -137, 425, 26, 30, -2, + -1, 24, 41, 374, 47, 2396, -2135, 15671, + 16323, -2864, 2460, -72, 409, 31, 28, -2, + -1, 24, 41, 374, 47, 2396, -2135, 15671, + 16323, -2864, 2460, -72, 409, 31, 28, -2, + -1, 26, 37, 391, -11, 2431, -2493, 16004, + 16005, -2494, 2432, -12, 392, 36, 26, -2, + -1, 26, 37, 391, -11, 2431, -2493, 16004, + 16005, -2494, 2432, -12, 392, 36, 26, -2, + -2, -28, 31, -409, -72, -2460, -2864, -16323, + 15671, 2135, 2396, -47, 374, -41, 24, 1, + -2, -28, 31, -409, -72, -2460, -2864, -16323, + 15671, 2135, 2396, -47, 374, -41, 24, 1, + -2, -30, 26, -425, -137, -2479, -3245, -16624, + 15322, 1788, 2354, -101, 357, -45, 22, 1, + -2, -30, 26, -425, -137, -2479, -3245, -16624, + 15322, 1788, 2354, -101, 357, -45, 22, 1, + -2, -32, 20, -440, -204, -2490, -3637, -16908, + 14959, 1454, 2304, -152, 339, -48, 21, 1, + -2, -32, 20, -440, -204, -2490, -3637, -16908, + 14959, 1454, 2304, -152, 339, -48, 21, 1, + -2, -33, 14, -455, -274, -2492, -4039, -17173, + 14583, 1133, 2249, -199, 320, -50, 19, 0, + -2, -33, 14, -455, -274, -2492, -4039, -17173, + 14583, 1133, 2249, -199, 320, -50, 19, 0, + -3, -35, 7, -468, -347, -2484, -4450, -17420, + 14194, 825, 2188, -243, 302, -52, 18, 0, + -3, -35, 7, -468, -347, -2484, -4450, -17420, + 14194, 825, 2188, -243, 302, -52, 18, 0, + -3, -37, -1, -480, -423, -2466, -4870, -17648, + 13794, 530, 2122, -283, 284, -54, 17, 0, + -3, -37, -1, -480, -423, -2466, -4870, -17648, + 13794, 530, 2122, -283, 284, -54, 17, 0, + -3, -39, -9, -491, -502, -2438, -5298, -17855, + 13383, 249, 2052, -320, 266, -56, 15, 0, + -3, -39, -9, -491, -502, -2438, -5298, -17855, + 13383, 249, 2052, -320, 266, -56, 15, 0, + -4, -41, -18, -501, -583, -2398, -5733, -18043, + 12963, -18, 1977, -354, 247, -56, 14, 0, + -4, -41, -18, -501, -583, -2398, -5733, -18043, + 12963, -18, 1977, -354, 247, -56, 14, 0, + -4, -43, -28, -508, -666, -2348, -6174, -18209, + 12534, -271, 1899, -384, 229, -57, 13, 0, + -4, -43, -28, -508, -666, -2348, -6174, -18209, + 12534, -271, 1899, -384, 229, -57, 13, 0, + -4, -44, -39, -515, -751, -2285, -6621, -18354, + 12097, -510, 1817, -411, 212, -57, 12, 0, + -4, -44, -39, -515, -751, -2285, -6621, -18354, + 12097, -510, 1817, -411, 212, -57, 12, 0, + -5, -46, -50, -519, -838, -2210, -7073, -18477, + 11654, -734, 1733, -435, 194, -57, 11, 0, + -5, -46, -50, -519, -838, -2210, -7073, -18477, + 11654, -734, 1733, -435, 194, -57, 11, 0, + -5, -48, -61, -522, -927, -2123, -7528, -18579, + 11205, -944, 1647, -456, 177, -57, 10, 0, + -5, -48, -61, -522, -927, -2123, -7528, -18579, + 11205, -944, 1647, -456, 177, -57, 10, 0, + -6, -49, -74, -522, -1016, -2023, -7987, -18658, + 10751, -1141, 1559, -474, 161, -57, 9, 0, + -6, -49, -74, -522, -1016, -2023, -7987, -18658, + 10751, -1141, 1559, -474, 161, -57, 9, 0, + -6, -51, -87, -520, -1107, -1910, -8448, -18714, + 10294, -1322, 1469, -488, 145, -56, 8, 0, + -6, -51, -87, -520, -1107, -1910, -8448, -18714, + 10294, -1322, 1469, -488, 145, -56, 8, 0, + -7, -52, -101, -516, -1197, -1784, -8910, -18748, + 9834, -1490, 1379, -500, 129, -55, 7, 0, + -7, -52, -101, -516, -1197, -1784, -8910, -18748, + 9834, -1490, 1379, -500, 129, -55, 7, 0, +}; + +int synth_1to1_MMX(real *bandPtr, int channel, short *samples) +{ + static short buffs[2][2][0x110] __attribute__((aligned(8))); + static int bo = 1; + short *b0, (*buf)[0x110], *a, *b; + short* window; + int bo1, i = 8; + + if (channel == 0) { + bo = (bo - 1) & 0xf; + buf = buffs[1]; + } else { + samples++; + buf = buffs[0]; + } + + if (bo & 1) { + b0 = buf[1]; + bo1 = bo + 1; + a = buf[0] + bo; + b = buf[1] + ((bo + 1) & 0xf); + } else { + b0 = buf[0]; + bo1 = bo; + b = buf[0] + bo; + a = buf[1] + ((bo + 1) & 0xf); + } + + dct64_MMX_func(a, b, bandPtr); + window = mp3lib_decwins + 16 - bo1; + //printf("DEBUG: channel %d, bo %d, off %d\n", channel, bo, 16 - bo1); +__asm __volatile( +ASMALIGN(4) +".L03:\n\t" + "movq (%1),%%mm0\n\t" + "movq 64(%1),%%mm4\n\t" + "pmaddwd (%2),%%mm0\n\t" + "pmaddwd 32(%2),%%mm4\n\t" + "movq 8(%1),%%mm1\n\t" + "movq 72(%1),%%mm5\n\t" + "pmaddwd 8(%2),%%mm1\n\t" + "pmaddwd 40(%2),%%mm5\n\t" + "movq 16(%1),%%mm2\n\t" + "movq 80(%1),%%mm6\n\t" + "pmaddwd 16(%2),%%mm2\n\t" + "pmaddwd 48(%2),%%mm6\n\t" + "movq 24(%1),%%mm3\n\t" + "movq 88(%1),%%mm7\n\t" + "pmaddwd 24(%2),%%mm3\n\t" + "pmaddwd 56(%2),%%mm7\n\t" + "paddd %%mm1,%%mm0\n\t" + "paddd %%mm5,%%mm4\n\t" + "paddd %%mm2,%%mm0\n\t" + "paddd %%mm6,%%mm4\n\t" + "paddd %%mm3,%%mm0\n\t" + "paddd %%mm7,%%mm4\n\t" + "movq %%mm0,%%mm1\n\t" + "movq %%mm4,%%mm5\n\t" + "psrlq $32,%%mm1\n\t" + "psrlq $32,%%mm5\n\t" + "paddd %%mm1,%%mm0\n\t" + "paddd %%mm5,%%mm4\n\t" + "psrad $13,%%mm0\n\t" + "psrad $13,%%mm4\n\t" + "packssdw %%mm0,%%mm0\n\t" + "packssdw %%mm4,%%mm4\n\t" + + "movq (%3), %%mm1\n\t" + "punpckldq %%mm4, %%mm0\n\t" + "pand "MANGLE(one_null)", %%mm1\n\t" + "pand "MANGLE(null_one)", %%mm0\n\t" + "por %%mm0, %%mm1\n\t" + "movq %%mm1,(%3)\n\t" + + "add $64,%2\n\t" + "add $128,%1\n\t" + "add $8,%3\n\t" + + "decl %0\n\t" + "jnz .L03\n\t" + + "movq (%1),%%mm0\n\t" + "pmaddwd (%2),%%mm0\n\t" + "movq 8(%1),%%mm1\n\t" + "pmaddwd 8(%2),%%mm1\n\t" + "movq 16(%1),%%mm2\n\t" + "pmaddwd 16(%2),%%mm2\n\t" + "movq 24(%1),%%mm3\n\t" + "pmaddwd 24(%2),%%mm3\n\t" + "paddd %%mm1,%%mm0\n\t" + "paddd %%mm2,%%mm0\n\t" + "paddd %%mm3,%%mm0\n\t" + "movq %%mm0,%%mm1\n\t" + "psrlq $32,%%mm1\n\t" + "paddd %%mm1,%%mm0\n\t" + "psrad $13,%%mm0\n\t" + "packssdw %%mm0,%%mm0\n\t" + "movd %%mm0,%%eax\n\t" + "movw %%ax, (%3)\n\t" + "sub $32,%2\n\t" + "add $64,%1\n\t" + "add $4,%3\n\t" + + "movl $7,%0\n\t" +ASMALIGN(4) +".L04:\n\t" + "movq (%1),%%mm0\n\t" + "movq 64(%1),%%mm4\n\t" + "pmaddwd (%2),%%mm0\n\t" + "pmaddwd -32(%2),%%mm4\n\t" + "movq 8(%1),%%mm1\n\t" + "movq 72(%1),%%mm5\n\t" + "pmaddwd 8(%2),%%mm1\n\t" + "pmaddwd -24(%2),%%mm5\n\t" + "movq 16(%1),%%mm2\n\t" + "movq 80(%1),%%mm6\n\t" + "pmaddwd 16(%2),%%mm2\n\t" + "pmaddwd -16(%2),%%mm6\n\t" + "movq 24(%1),%%mm3\n\t" + "movq 88(%1),%%mm7\n\t" + "pmaddwd 24(%2),%%mm3\n\t" + "pmaddwd -8(%2),%%mm7\n\t" + "paddd %%mm1,%%mm0\n\t" + "paddd %%mm5,%%mm4\n\t" + "paddd %%mm2,%%mm0\n\t" + "paddd %%mm6,%%mm4\n\t" + "paddd %%mm3,%%mm0\n\t" + "paddd %%mm7,%%mm4\n\t" + "movq %%mm0,%%mm1\n\t" + "movq %%mm4,%%mm5\n\t" + "psrlq $32,%%mm1\n\t" + "psrlq $32,%%mm5\n\t" + "paddd %%mm0,%%mm1\n\t" + "paddd %%mm4,%%mm5\n\t" + "psrad $13,%%mm1\n\t" + "psrad $13,%%mm5\n\t" + "packssdw %%mm1,%%mm1\n\t" + "packssdw %%mm5,%%mm5\n\t" + "psubd %%mm0,%%mm0\n\t" + "psubd %%mm4,%%mm4\n\t" + "psubsw %%mm1,%%mm0\n\t" + "psubsw %%mm5,%%mm4\n\t" + + "movq (%3), %%mm1\n\t" + "punpckldq %%mm4, %%mm0\n\t" + "pand "MANGLE(one_null)", %%mm1\n\t" + "pand "MANGLE(null_one)", %%mm0\n\t" + "por %%mm0, %%mm1\n\t" + "movq %%mm1,(%3)\n\t" + + "sub $64,%2\n\t" + "add $128,%1\n\t" + "add $8,%3\n\t" + "decl %0\n\t" + "jnz .L04\n\t" + + "movq (%1),%%mm0\n\t" + "pmaddwd (%2),%%mm0\n\t" + "movq 8(%1),%%mm1\n\t" + "pmaddwd 8(%2),%%mm1\n\t" + "movq 16(%1),%%mm2\n\t" + "pmaddwd 16(%2),%%mm2\n\t" + "movq 24(%1),%%mm3\n\t" + "pmaddwd 24(%2),%%mm3\n\t" + "paddd %%mm1,%%mm0\n\t" + "paddd %%mm2,%%mm0\n\t" + "paddd %%mm3,%%mm0\n\t" + "movq %%mm0,%%mm1\n\t" + "psrlq $32,%%mm1\n\t" + "paddd %%mm0,%%mm1\n\t" + "psrad $13,%%mm1\n\t" + "packssdw %%mm1,%%mm1\n\t" + "psubd %%mm0,%%mm0\n\t" + "psubsw %%mm1,%%mm0\n\t" + "movd %%mm0,%%eax\n\t" + "movw %%ax,(%3)\n\t" + "emms\n\t" + :"+r"(i), "+r"(window), "+r"(b0), "+r"(samples) + : + :"memory", "%eax"); + return 0; +} +