annotate mp3lib/dct64_sse.s @ 2316:bcb229557e9b

Fixed alignment (static variables were sometimes not 8-byte aligned); added half uv interpolation support; added prefetch; BGR15 support in MMX (untested) (so BGR15, 16, 24, 32 are supported); special unscaled height version (not much faster, but it doesn't interpolate uv vertically).
author michael
date Sat, 20 Oct 2001 21:12:09 +0000
parents d9e3f91d6da9
children 8312f4bc8dab
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
1394
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1 # This code is a translation of dct64_k7.s from MPlayer.
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2 # Coded by Felix Buenemann <atmosfear at users.sourceforge.net>
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
3 #
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
4 # TODO: - fix phases 4 and 5 (sse)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
5 # - optimize scalar FPU code? (interleave with sse code)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
6 #
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
8 //.data
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
9 // .align 8
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
10 //x_plus_minus_3dnow: .long 0x00000000, 0x80000000
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
11 //plus_1f: .float 1.0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
12
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
13 .text
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
14
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
15 .align 16
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
16
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
17 .global dct64_MMX_sse
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
18
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
19 dct64_MMX_sse:
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
20 pushl %ebx
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
21 pushl %esi
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
22 pushl %edi
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
23 subl $256,%esp
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
24 movl 280(%esp),%eax
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
25
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
26 leal 128(%esp),%edx
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
27 movl 272(%esp),%esi
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
28 movl 276(%esp),%edi
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
29 movl $costab_mmx,%ebx
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
30 orl %ecx,%ecx
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
31 movl %esp,%ecx
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
32
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
33 /* Phase 1 (complete, worx) */
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
34
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
35 // [1] Process Block A1 (16 Bytes)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
36 / movq (%eax), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
37 / movq 8(%eax), %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
38 movups (%eax), %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
39
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
40 // Copy A1 to another register A2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
41 / movq %mm0, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
42 / movq %mm4, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
43 movaps %xmm0, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
44
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
45 // Process Block B1 (last 16 bytes)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
46 / movq 120(%eax), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
47 / movq 112(%eax), %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
48 movups 112(%eax), %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
49
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
50 /* The PSWAPD instruction swaps or reverses the upper and lower
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
51 * doublewords of the source operand. PSWAPD mmreg1, mmreg2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
52 * performs the following operations:
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
53 * temp = mmreg2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
54 * mmreg1[63:32] = temp[31:0 ]
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
55 * mmreg1[31:0 ] = temp[63:32]
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
56 */
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
57 / pswapd %mm1, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
58 / pswapd %mm5, %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
59 // shufps $177 would exchange a,b,c,d to b,a,d,c in xmm1 (pairwise swap, like pswapd); the active shufps $27 below reverses a,b,c,d to d,c,b,a (desc ia32-ref p.752)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
60 //// shufps $177, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
61 shufps $27, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
62
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
63 // Add B1 to A1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
64 / pfadd %mm1, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
65 / pfadd %mm5, %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
66 addps %xmm1, %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
67
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
68 // Save Block A1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
69 / movq %mm0, (%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
70 / movq %mm4, 8(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
71 movups %xmm0, (%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
72
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
73 // Sub B1 from A2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
74 / pfsub %mm1, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
75 / pfsub %mm5, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
76 subps %xmm1, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
77
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
78 // Mul mem with A2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
79 / pfmul (%ebx), %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
80 / pfmul 8(%ebx), %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
81 movups (%ebx), %xmm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
82 mulps %xmm7, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
83
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
84 // Shuffle A2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
85 / pswapd %mm3, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
86 / pswapd %mm7, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
87 // I do a,b,c,d -> d,c,b,a to suit order when writing to mem (saves one shufps)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
88 shufps $27, %xmm2, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
89
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
90 // Save A2 to mem (end)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
91 / movq %mm3, 120(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
92 / movq %mm7, 112(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
93 movups %xmm2, 112(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
94
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
95 // [2] Process next data block
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
96 / movq 16(%eax), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
97 / movq 24(%eax), %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
98 movups 16(%eax), %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
99
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
100 / movq %mm0, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
101 / movq %mm4, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
102 movaps %xmm0, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
103
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
104 / movq 104(%eax), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
105 / movq 96(%eax), %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
106 movups 96(%eax), %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
107
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
108 / pswapd %mm1, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
109 / pswapd %mm5, %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
110 //// shufps $177, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
111 shufps $27, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
112
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
113 / pfadd %mm1, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
114 / pfadd %mm5, %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
115 addps %xmm1, %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
116
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
117 / movq %mm0, 16(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
118 / movq %mm4, 24(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
119 movups %xmm0, 16(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
120
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
121 / pfsub %mm1, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
122 / pfsub %mm5, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
123 subps %xmm1, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
124
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
125 / pfmul 16(%ebx), %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
126 / pfmul 24(%ebx), %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
127 movups 16(%ebx), %xmm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
128 mulps %xmm7, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
129
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
130 / pswapd %mm3, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
131 / pswapd %mm7, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
132 shufps $27, %xmm2, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
133
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
134 / movq %mm3, 104(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
135 / movq %mm7, 96(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
136 movups %xmm2, 96(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
137
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
138 // [3]
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
139 / movq 32(%eax), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
140 / movq 40(%eax), %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
141 movups 32(%eax), %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
142
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
143 / movq %mm0, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
144 / movq %mm4, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
145 movaps %xmm0, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
146
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
147 / movq 88(%eax), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
148 / movq 80(%eax), %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
149 movups 80(%eax), %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
150
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
151 / pswapd %mm1, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
152 / pswapd %mm5, %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
153 //// shufps $177, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
154 shufps $27, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
155
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
156 / pfadd %mm1, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
157 / pfadd %mm5, %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
158 addps %xmm1, %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
159
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
160 / movq %mm0, 32(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
161 / movq %mm4, 40(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
162 movups %xmm0, 32(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
163
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
164 / pfsub %mm1, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
165 / pfsub %mm5, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
166 subps %xmm1, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
167
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
168 / pfmul 32(%ebx), %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
169 / pfmul 40(%ebx), %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
170 movups 32(%ebx), %xmm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
171 mulps %xmm7, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
172
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
173 / pswapd %mm3, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
174 / pswapd %mm7, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
175 shufps $27, %xmm2, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
176
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
177 / movq %mm3, 88(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
178 / movq %mm7, 80(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
179 movups %xmm2, 80(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
180
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
181 // [4]
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
182 / movq 48(%eax), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
183 / movq 56(%eax), %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
184 movups 48(%eax), %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
185
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
186 / movq %mm0, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
187 / movq %mm4, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
188 movaps %xmm0, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
189
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
190 / movq 72(%eax), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
191 / movq 64(%eax), %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
192 movups 64(%eax), %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
193
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
194 / pswapd %mm1, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
195 / pswapd %mm5, %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
196 //// shufps $177, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
197 shufps $27, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
198
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
199 / pfadd %mm1, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
200 / pfadd %mm5, %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
201 addps %xmm1, %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
202
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
203 / movq %mm0, 48(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
204 / movq %mm4, 56(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
205 movups %xmm0, 48(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
206
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
207 / pfsub %mm1, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
208 / pfsub %mm5, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
209 subps %xmm1, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
210
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
211 / pfmul 48(%ebx), %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
212 / pfmul 56(%ebx), %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
213 movups 48(%ebx), %xmm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
214 mulps %xmm7, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
215
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
216 / pswapd %mm3, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
217 / pswapd %mm7, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
218 shufps $27, %xmm2, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
219
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
220 / movq %mm3, 72(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
221 / movq %mm7, 64(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
222 movups %xmm2, 64(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
223
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
224
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
225 // phase 1 fpu code
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
226 /* Phase 1*/
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
227 /*
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
228 flds (%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
229 leal 128(%esp),%edx
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
230 fadds 124(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
231 movl 272(%esp),%esi
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
232 fstps (%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
233 movl 276(%esp),%edi
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
234
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
235 flds 4(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
236 movl $costab_mmx,%ebx
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
237 fadds 120(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
238 orl %ecx,%ecx
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
239 fstps 4(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
240
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
241 flds (%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
242 movl %esp,%ecx
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
243 fsubs 124(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
244 fmuls (%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
245 fstps 124(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
246
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
247 flds 4(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
248 fsubs 120(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
249 fmuls 4(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
250 fstps 120(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
251
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
252 flds 8(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
253 fadds 116(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
254 fstps 8(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
255
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
256 flds 12(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
257 fadds 112(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
258 fstps 12(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
259
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
260 flds 8(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
261 fsubs 116(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
262 fmuls 8(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
263 fstps 116(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
264
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
265 flds 12(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
266 fsubs 112(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
267 fmuls 12(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
268 fstps 112(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
269
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
270 flds 16(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
271 fadds 108(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
272 fstps 16(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
273
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
274 flds 20(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
275 fadds 104(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
276 fstps 20(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
277
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
278 flds 16(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
279 fsubs 108(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
280 fmuls 16(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
281 fstps 108(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
282
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
283 flds 20(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
284 fsubs 104(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
285 fmuls 20(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
286 fstps 104(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
287
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
288 flds 24(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
289 fadds 100(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
290 fstps 24(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
291
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
292 flds 28(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
293 fadds 96(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
294 fstps 28(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
295
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
296 flds 24(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
297 fsubs 100(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
298 fmuls 24(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
299 fstps 100(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
300
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
301 flds 28(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
302 fsubs 96(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
303 fmuls 28(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
304 fstps 96(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
305
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
306 flds 32(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
307 fadds 92(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
308 fstps 32(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
309
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
310 flds 36(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
311 fadds 88(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
312 fstps 36(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
313
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
314 flds 32(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
315 fsubs 92(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
316 fmuls 32(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
317 fstps 92(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
318
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
319 flds 36(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
320 fsubs 88(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
321 fmuls 36(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
322 fstps 88(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
323
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
324 flds 40(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
325 fadds 84(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
326 fstps 40(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
327
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
328 flds 44(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
329 fadds 80(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
330 fstps 44(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
331
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
332 flds 40(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
333 fsubs 84(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
334 fmuls 40(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
335 fstps 84(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
336
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
337 flds 44(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
338 fsubs 80(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
339 fmuls 44(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
340 fstps 80(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
341
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
342 flds 48(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
343 fadds 76(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
344 fstps 48(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
345
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
346 flds 52(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
347 fadds 72(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
348 fstps 52(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
349
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
350 flds 48(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
351 fsubs 76(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
352 fmuls 48(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
353 fstps 76(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
354
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
355 flds 52(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
356 fsubs 72(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
357 fmuls 52(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
358 fstps 72(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
359
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
360 flds 56(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
361 fadds 68(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
362 fstps 56(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
363
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
364 flds 60(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
365 fadds 64(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
366 fstps 60(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
367
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
368 flds 56(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
369 fsubs 68(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
370 fmuls 56(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
371 fstps 68(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
372
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
373 flds 60(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
374 fsubs 64(%eax)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
375 fmuls 60(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
376 fstps 64(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
377 */
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
378 // end phase 1 fpu code
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
379
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
380 /* Phase 2 (completed, works) */
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
381
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
382 / movq (%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
383 / movq 8(%edx), %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
384 movups (%edx), %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
385
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
386 / movq %mm0, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
387 / movq %mm4, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
388 movaps %xmm0, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
389
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
390 / movq 56(%edx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
391 / movq 48(%edx), %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
392 movups 48(%edx), %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
393
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
394 / pswapd %mm1, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
395 / pswapd %mm5, %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
396 //// shufps $177, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
397 shufps $27, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
398
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
399 / pfadd %mm1, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
400 / pfadd %mm5, %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
401 addps %xmm1, %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
402
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
403 / movq %mm0, (%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
404 / movq %mm4, 8(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
405 movups %xmm0, (%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
406
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
407 / pfsub %mm1, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
408 / pfsub %mm5, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
409 subps %xmm1, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
410
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
411 / pfmul 64(%ebx), %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
412 / pfmul 72(%ebx), %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
413 movups 64(%ebx), %xmm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
414 mulps %xmm7, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
415
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
416 / pswapd %mm3, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
417 / pswapd %mm7, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
418 shufps $27, %xmm2, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
419
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
420 / movq %mm3, 56(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
421 / movq %mm7, 48(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
422 movups %xmm2, 48(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
423
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
424 / movq 16(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
425 / movq 24(%edx), %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
426 movups 16(%edx), %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
427
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
428 / movq %mm0, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
429 / movq %mm4, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
430 movaps %xmm0, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
431
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
432 / movq 40(%edx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
433 / movq 32(%edx), %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
434 movups 32(%edx), %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
435
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
436 / pswapd %mm1, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
437 / pswapd %mm5, %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
438 //// shufps $177, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
439 shufps $27, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
440
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
441 / pfadd %mm1, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
442 / pfadd %mm5, %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
443 addps %xmm1, %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
444
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
445 / movq %mm0, 16(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
446 / movq %mm4, 24(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
447 movups %xmm0, 16(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
448
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
449 / pfsub %mm1, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
450 / pfsub %mm5, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
451 subps %xmm1, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
452
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
453 / pfmul 80(%ebx), %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
454 / pfmul 88(%ebx), %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
455 movups 80(%ebx), %xmm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
456 mulps %xmm7, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
457
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
458 / pswapd %mm3, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
459 / pswapd %mm7, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
460 shufps $27, %xmm2, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
461
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
462 / movq %mm3, 40(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
463 / movq %mm7, 32(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
464 movups %xmm2, 32(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
465
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
466
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
467 // phase 2 fpu
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
468 /* Phase 2*/
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
469 /*
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
470 flds (%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
471 fadds 60(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
472 fstps (%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
473
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
474 flds 4(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
475 fadds 56(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
476 fstps 4(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
477
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
478 flds (%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
479 fsubs 60(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
480 fmuls 64(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
481 fstps 60(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
482
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
483 flds 4(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
484 fsubs 56(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
485 fmuls 68(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
486 fstps 56(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
487
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
488 flds 8(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
489 fadds 52(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
490 fstps 8(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
491
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
492 flds 12(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
493 fadds 48(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
494 fstps 12(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
495
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
496 flds 8(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
497 fsubs 52(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
498 fmuls 72(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
499 fstps 52(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
500
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
501 flds 12(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
502 fsubs 48(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
503 fmuls 76(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
504 fstps 48(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
505
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
506 flds 16(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
507 fadds 44(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
508 fstps 16(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
509
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
510 flds 20(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
511 fadds 40(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
512 fstps 20(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
513
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
514 flds 16(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
515 fsubs 44(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
516 fmuls 80(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
517 fstps 44(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
518
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
519 flds 20(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
520 fsubs 40(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
521 fmuls 84(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
522 fstps 40(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
523
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
524 flds 24(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
525 fadds 36(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
526 fstps 24(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
527
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
528 flds 28(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
529 fadds 32(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
530 fstps 28(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
531
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
532 flds 24(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
533 fsubs 36(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
534 fmuls 88(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
535 fstps 36(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
536
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
537 flds 28(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
538 fsubs 32(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
539 fmuls 92(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
540 fstps 32(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
541 */
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
542 // end phase 2 fpu
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
543
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
544 /* Phase 3 (completed, working) */
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
545
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
546 / movq 64(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
547 / movq 72(%edx), %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
548 movups 64(%edx), %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
549
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
550 / movq %mm0, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
551 / movq %mm4, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
552 movaps %xmm0, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
553
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
554 / movq 120(%edx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
555 / movq 112(%edx), %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
556 movups 112(%edx), %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
557
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
558 / pswapd %mm1, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
559 / pswapd %mm5, %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
560 //// shufps $177, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
561 shufps $27, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
562
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
563 / pfadd %mm1, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
564 / pfadd %mm5, %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
565 addps %xmm1, %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
566
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
567 / movq %mm0, 64(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
568 / movq %mm4, 72(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
569 movups %xmm0, 64(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
570
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
571 / pfsubr %mm1, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
572 / pfsubr %mm5, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
573 // optimized (xmm1<->xmm2)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
574 subps %xmm2, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
575
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
576 / pfmul 64(%ebx), %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
577 / pfmul 72(%ebx), %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
578 movups 64(%ebx), %xmm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
579 mulps %xmm7, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
580
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
581 / pswapd %mm3, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
582 / pswapd %mm7, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
583 shufps $27, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
584
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
585 / movq %mm3, 120(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
586 / movq %mm7, 112(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
587 movups %xmm1, 112(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
588
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
589
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
590 / movq 80(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
591 / movq 88(%edx), %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
592 movups 80(%edx), %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
593
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
594 / movq %mm0, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
595 / movq %mm4, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
596 movaps %xmm0, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
597
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
598 / movq 104(%edx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
599 / movq 96(%edx), %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
600 movups 96(%edx), %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
601
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
602 / pswapd %mm1, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
603 / pswapd %mm5, %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
604 //// shufps $177, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
605 shufps $27, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
606
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
607 / pfadd %mm1, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
608 / pfadd %mm5, %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
609 addps %xmm1, %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
610
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
611 / movq %mm0, 80(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
612 / movq %mm4, 88(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
613 movups %xmm0, 80(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
614
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
615 / pfsubr %mm1, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
616 / pfsubr %mm5, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
617 // optimized (xmm1<->xmm2)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
618 subps %xmm2, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
619
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
620 / pfmul 80(%ebx), %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
621 / pfmul 88(%ebx), %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
622 movups 80(%ebx), %xmm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
623 mulps %xmm7, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
624
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
625 / pswapd %mm3, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
626 / pswapd %mm7, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
627 shufps $27, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
628
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
629 / movq %mm3, 104(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
630 / movq %mm7, 96(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
631 movups %xmm1, 96(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
632
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
633
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
634 // phase 3 fpu
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
635 /* Phase 3*/
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
636 /*
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
637 flds 64(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
638 fadds 124(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
639 fstps 64(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
640
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
641 flds 68(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
642 fadds 120(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
643 fstps 68(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
644
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
645 flds 124(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
646 fsubs 64(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
647 fmuls 64(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
648 fstps 124(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
649
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
650 flds 120(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
651 fsubs 68(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
652 fmuls 68(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
653 fstps 120(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
654
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
655 flds 72(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
656 fadds 116(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
657 fstps 72(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
658
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
659 flds 76(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
660 fadds 112(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
661 fstps 76(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
662
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
663 flds 116(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
664 fsubs 72(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
665 fmuls 72(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
666 fstps 116(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
667
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
668 flds 112(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
669 fsubs 76(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
670 fmuls 76(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
671 fstps 112(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
672
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
673 flds 80(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
674 fadds 108(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
675 fstps 80(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
676
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
677 flds 84(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
678 fadds 104(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
679 fstps 84(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
680
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
681 flds 108(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
682 fsubs 80(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
683 fmuls 80(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
684 fstps 108(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
685
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
686 flds 104(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
687 fsubs 84(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
688 fmuls 84(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
689 fstps 104(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
690
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
691 flds 88(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
692 fadds 100(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
693 fstps 88(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
694
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
695 flds 92(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
696 fadds 96(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
697 fstps 92(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
698
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
699 flds 100(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
700 fsubs 88(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
701 fmuls 88(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
702 fstps 100(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
703
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
704 flds 96(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
705 fsubs 92(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
706 fmuls 92(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
707 fstps 96(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
708 */
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
709 // end phase 3 fpu
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
710
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
711
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
712 /* Phase 4 (completed, buggy) */
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
713 /*
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
714 / movq 96(%ebx), %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
715 / movq 104(%ebx), %mm6
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
716 movups 96(%ebx), %xmm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
717
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
718
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
719 / movq (%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
720 / movq 8(%ecx), %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
721 movups (%ecx), %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
722
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
723 / movq %mm0, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
724 / movq %mm4, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
725 movaps %xmm0, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
726
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
727 / movq 24(%ecx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
728 / movq 16(%ecx), %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
729 movups 16(%ecx), %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
730
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
731 / pswapd %mm1, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
732 / pswapd %mm5, %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
733 //// shufps $177, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
734 shufps $27, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
735
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
736 / pfadd %mm1, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
737 / pfadd %mm5, %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
738 addps %xmm1, %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
739
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
740 / movq %mm0, (%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
741 / movq %mm4, 8(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
742 movups %xmm0, (%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
743
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
744 / pfsub %mm1, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
745 / pfsub %mm5, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
746 subps %xmm1, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
747
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
748 / pfmul %mm2, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
749 / pfmul %mm6, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
750 mulps %xmm4, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
751
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
752 / pswapd %mm3, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
753 / pswapd %mm7, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
754 shufps $27, %xmm2, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
755
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
756 / movq %mm3, 24(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
757 / movq %mm7, 16(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
758 movups %xmm2, 16(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
759
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
760 / movq 32(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
761 / movq 40(%ecx), %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
762 movups 32(%ecx), %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
763
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
764 / movq %mm0, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
765 / movq %mm4, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
766 movaps %xmm0, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
767
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
768 / movq 56(%ecx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
769 / movq 48(%ecx), %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
770 movups 48(%ecx), %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
771
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
772 / pswapd %mm1, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
773 / pswapd %mm5, %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
774 //// shufps $177, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
775 shufps $27, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
776
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
777 / pfadd %mm1, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
778 / pfadd %mm5, %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
779 addps %xmm1, %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
780
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
781 / movq %mm0, 32(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
782 / movq %mm4, 40(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
783 movups %xmm0, 32(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
784
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
785 / pfsubr %mm1, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
786 / pfsubr %mm5, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
787 // SSE has no reverse subtract like pfsubr; luckily we can swap the operand roles instead (xmm1<->xmm2): subps leaves xmm1 - xmm2 in xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
788 subps %xmm2, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
789
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
790 / pfmul %mm2, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
791 / pfmul %mm6, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
792 mulps %xmm4, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
793
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
794 / pswapd %mm3, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
795 / pswapd %mm7, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
796 shufps $27, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
797
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
798 / movq %mm3, 56(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
799 / movq %mm7, 48(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
800 movups %xmm1, 48(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
801
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
802
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
803 / movq 64(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
804 / movq 72(%ecx), %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
805 movups 64(%ecx), %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
806
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
807 / movq %mm0, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
808 / movq %mm4, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
809 movaps %xmm0, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
810
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
811 / movq 88(%ecx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
812 / movq 80(%ecx), %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
813 movups 80(%ecx), %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
814
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
815 / pswapd %mm1, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
816 / pswapd %mm5, %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
817 //// shufps $177, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
818 shufps $27, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
819
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
820 / pfadd %mm1, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
821 / pfadd %mm5, %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
822 addps %xmm1, %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
823
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
824 / movq %mm0, 64(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
825 / movq %mm4, 72(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
826 movups %xmm0, 64(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
827
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
828 / pfsub %mm1, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
829 / pfsub %mm5, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
830 subps %xmm1, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
831
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
832 / pfmul %mm2, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
833 / pfmul %mm6, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
834 mulps %xmm4, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
835
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
836 / pswapd %mm3, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
837 / pswapd %mm7, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
838 shufps $27, %xmm2, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
839
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
840 / movq %mm3, 88(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
841 / movq %mm7, 80(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
842 movups %xmm2, 80(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
843
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
844
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
845 / movq 96(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
846 / movq 104(%ecx), %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
847 movups 96(%ecx), %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
848
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
849 / movq %mm0, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
850 / movq %mm4, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
851 movaps %xmm0, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
852
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
853 / movq 120(%ecx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
854 / movq 112(%ecx), %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
855 movups 112(%ecx), %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
856
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
857 / pswapd %mm1, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
858 / pswapd %mm5, %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
859 //// shufps $177, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
860 shufps $27, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
861
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
862 / pfadd %mm1, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
863 / pfadd %mm5, %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
864 addps %xmm1, %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
865
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
866 / movq %mm0, 96(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
867 / movq %mm4, 104(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
868 movups %xmm0, 96(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
869
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
870 / pfsubr %mm1, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
871 / pfsubr %mm5, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
872 // pfsubr replacement with operand roles swapped: subps leaves xmm1 - xmm2 in xmm1, so xmm1 takes the place of xmm2 for the rest of this group
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
873 subps %xmm2, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
874
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
875 / pfmul %mm2, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
876 / pfmul %mm6, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
877 mulps %xmm4, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
878
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
879 / pswapd %mm3, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
880 / pswapd %mm7, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
881 shufps $27, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
882
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
883 / movq %mm3, 120(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
884 / movq %mm7, 112(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
885 movups %xmm1, 112(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
886 */
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
887
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
888 // phase 4 fpu code
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
889 /* Phase 4*/
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
890
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
891 flds (%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
892 fadds 28(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
893 fstps (%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
894
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
895 flds (%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
896 fsubs 28(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
897 fmuls 96(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
898 fstps 28(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
899
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
900 flds 4(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
901 fadds 24(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
902 fstps 4(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
903
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
904 flds 4(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
905 fsubs 24(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
906 fmuls 100(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
907 fstps 24(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
908
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
909 flds 8(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
910 fadds 20(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
911 fstps 8(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
912
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
913 flds 8(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
914 fsubs 20(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
915 fmuls 104(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
916 fstps 20(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
917
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
918 flds 12(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
919 fadds 16(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
920 fstps 12(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
921
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
922 flds 12(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
923 fsubs 16(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
924 fmuls 108(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
925 fstps 16(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
926
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
927 flds 32(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
928 fadds 60(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
929 fstps 32(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
930
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
931 flds 60(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
932 fsubs 32(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
933 fmuls 96(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
934 fstps 60(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
935
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
936 flds 36(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
937 fadds 56(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
938 fstps 36(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
939
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
940 flds 56(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
941 fsubs 36(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
942 fmuls 100(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
943 fstps 56(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
944
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
945 flds 40(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
946 fadds 52(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
947 fstps 40(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
948
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
949 flds 52(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
950 fsubs 40(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
951 fmuls 104(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
952 fstps 52(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
953
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
954 flds 44(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
955 fadds 48(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
956 fstps 44(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
957
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
958 flds 48(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
959 fsubs 44(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
960 fmuls 108(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
961 fstps 48(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
962
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
963 flds 64(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
964 fadds 92(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
965 fstps 64(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
966
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
967 flds 64(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
968 fsubs 92(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
969 fmuls 96(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
970 fstps 92(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
971
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
972 flds 68(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
973 fadds 88(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
974 fstps 68(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
975
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
976 flds 68(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
977 fsubs 88(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
978 fmuls 100(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
979 fstps 88(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
980
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
981 flds 72(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
982 fadds 84(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
983 fstps 72(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
984
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
985 flds 72(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
986 fsubs 84(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
987 fmuls 104(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
988 fstps 84(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
989
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
990 flds 76(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
991 fadds 80(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
992 fstps 76(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
993
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
994 flds 76(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
995 fsubs 80(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
996 fmuls 108(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
997 fstps 80(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
998
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
999 flds 96(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1000 fadds 124(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1001 fstps 96(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1002
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1003 flds 124(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1004 fsubs 96(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1005 fmuls 96(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1006 fstps 124(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1007
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1008 flds 100(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1009 fadds 120(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1010 fstps 100(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1011
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1012 flds 120(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1013 fsubs 100(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1014 fmuls 100(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1015 fstps 120(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1016
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1017 flds 104(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1018 fadds 116(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1019 fstps 104(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1020
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1021 flds 116(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1022 fsubs 104(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1023 fmuls 104(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1024 fstps 116(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1025
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1026 flds 108(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1027 fadds 112(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1028 fstps 108(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1029
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1030 flds 112(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1031 fsubs 108(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1032 fmuls 108(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1033 fstps 112(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1034
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1035 flds (%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1036 fadds 12(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1037 fstps (%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1038
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1039 flds (%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1040 fsubs 12(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1041 fmuls 112(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1042 fstps 12(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1043
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1044 flds 4(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1045 fadds 8(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1046 fstps 4(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1047
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1048 flds 4(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1049 fsubs 8(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1050 fmuls 116(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1051 fstps 8(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1052
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1053 flds 16(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1054 fadds 28(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1055 fstps 16(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1056
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1057 flds 28(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1058 fsubs 16(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1059 fmuls 112(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1060 fstps 28(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1061
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1062 flds 20(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1063 fadds 24(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1064 fstps 20(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1065
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1066 flds 24(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1067 fsubs 20(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1068 fmuls 116(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1069 fstps 24(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1070
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1071 flds 32(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1072 fadds 44(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1073 fstps 32(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1074
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1075 flds 32(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1076 fsubs 44(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1077 fmuls 112(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1078 fstps 44(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1079
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1080 flds 36(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1081 fadds 40(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1082 fstps 36(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1083
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1084 flds 36(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1085 fsubs 40(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1086 fmuls 116(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1087 fstps 40(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1088
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1089 flds 48(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1090 fadds 60(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1091 fstps 48(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1092
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1093 flds 60(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1094 fsubs 48(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1095 fmuls 112(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1096 fstps 60(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1097
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1098 flds 52(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1099 fadds 56(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1100 fstps 52(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1101
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1102 flds 56(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1103 fsubs 52(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1104 fmuls 116(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1105 fstps 56(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1106
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1107 flds 64(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1108 fadds 76(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1109 fstps 64(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1110
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1111 flds 64(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1112 fsubs 76(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1113 fmuls 112(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1114 fstps 76(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1115
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1116 flds 68(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1117 fadds 72(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1118 fstps 68(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1119
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1120 flds 68(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1121 fsubs 72(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1122 fmuls 116(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1123 fstps 72(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1124
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1125 flds 80(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1126 fadds 92(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1127 fstps 80(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1128
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1129 flds 92(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1130 fsubs 80(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1131 fmuls 112(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1132 fstps 92(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1133
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1134 flds 84(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1135 fadds 88(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1136 fstps 84(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1137
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1138 flds 88(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1139 fsubs 84(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1140 fmuls 116(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1141 fstps 88(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1142
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1143 flds 96(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1144 fadds 108(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1145 fstps 96(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1146
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1147 flds 96(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1148 fsubs 108(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1149 fmuls 112(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1150 fstps 108(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1151
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1152 flds 100(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1153 fadds 104(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1154 fstps 100(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1155
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1156 flds 100(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1157 fsubs 104(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1158 fmuls 116(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1159 fstps 104(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1160
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1161 flds 112(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1162 fadds 124(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1163 fstps 112(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1164
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1165 flds 124(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1166 fsubs 112(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1167 fmuls 112(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1168 fstps 124(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1169
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1170 flds 116(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1171 fadds 120(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1172 fstps 116(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1173
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1174 flds 120(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1175 fsubs 116(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1176 fmuls 116(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1177 fstps 120(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1178
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1179 // end of phase 4 fpu
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1180
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1181 // The code below still needs to be finished; the FPU code is used for now.
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1182 /* Phase 5 (completed, crashing) */
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1183 /*
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1184 / movq 112(%ebx), %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1185 // move 8 bytes of data into the low quadword (copied to the high quadword below) - check this! atmos
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1186 movlps 112(%ebx), %xmm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1187 // maybe I need movhlps too to get data into correct quadword
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1188 movlhps %xmm4, %xmm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1189
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1190 / movq (%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1191 / movq 16(%edx), %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1192 movups (%edx), %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1193
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1194 / movq %mm0, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1195 / movq %mm4, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1196 movaps %xmm0, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1197
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1198 // hmm? this is strange
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1199 / movq 8(%edx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1200 / movq 24(%edx), %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1201 movlps 8(%edx), %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1202 movhps 24(%edx), %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1203
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1204 / pswapd %mm1, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1205 / pswapd %mm5, %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1206 pshufd $177, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1207
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1208 / pfadd %mm1, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1209 / pfadd %mm5, %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1210 addps %xmm1, %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1211
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1212 / movq %mm0, (%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1213 / movq %mm4, 16(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1214 movlps %xmm0, (%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1215 movhps %xmm0, 16(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1216
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1217 / pfsub %mm1, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1218 / pfsubr %mm5, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1219 // I need to emulate pfsubr here
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1220 movaps %xmm1, %xmm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1221 subps %xmm2, %xmm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1222 subps %xmm1, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1223 // now move correct quadword from reverse subtraction in xmm3 to correct
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1224 // quadword in xmm2 and leave other quadword with non-reversed subtraction untouched
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1225 /// shufpd $2, %xmm3, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1226 // (or $1?) (see ia32-ref p.749)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1227 // optimize
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1228 movq %xmm2, %xmm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1229 movaps %xmm3, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1230
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1231 / pfmul %mm2, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1232 / pfmul %mm2, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1233 mulps %xmm4, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1234
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1235 / pswapd %mm3, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1236 / pswapd %mm7, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1237 shufps $177, %xmm2, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1238
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1239 / movq %mm3, 8(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1240 / movq %mm7, 24(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1241 movlps %xmm2, 8(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1242 movhps %xmm2, 24(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1243
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1244 / movq 32(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1245 / movq 48(%edx), %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1246 movlps 32(%edx), %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1247 movhps 48(%edx), %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1248
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1249 / movq %mm0, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1250 / movq %mm4, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1251 movaps %xmm0, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1252
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1253 / movq 40(%edx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1254 / movq 56(%edx), %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1255 movlps 40(%edx), %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1256 movhps 56(%edx), %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1257
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1258 / pswapd %mm1, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1259 / pswapd %mm5, %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1260 shufps $177, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1261
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1262 / pfadd %mm1, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1263 / pfadd %mm5, %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1264 addps %xmm1, %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1265
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1266 / movq %mm0, 32(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1267 / movq %mm4, 48(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1268 movlps %xmm0, 32(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1269 movhps %xmm0, 48(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1270
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1271 / pfsub %mm1, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1272 / pfsubr %mm5, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1273 movaps %xmm1, %xmm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1274 subps %xmm2, %xmm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1275 subps %xmm1, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1276 /// shufpd $2, %xmm3, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1277 // (or $1?)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1278 // optimize
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1279 movq %xmm2, %xmm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1280 movaps %xmm3, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1281
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1282 / pfmul %mm2, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1283 / pfmul %mm2, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1284 mulps %xmm4, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1285
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1286 / pswapd %mm3, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1287 / pswapd %mm7, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1288 shufps $177, %xmm2, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1289
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1290 / movq %mm3, 40(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1291 / movq %mm7, 56(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1292 movlps %xmm2, 40(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1293 movhps %xmm2, 56(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1294
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1295
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1296 / movq 64(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1297 / movq 80(%edx), %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1298 movlps 64(%edx), %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1299 movhps 80(%edx), %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1300
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1301 / movq %mm0, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1302 / movq %mm4, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1303 movaps %xmm0, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1304
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1305 / movq 72(%edx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1306 / movq 88(%edx), %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1307 movlps 72(%edx), %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1308 movhps 88(%edx), %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1309
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1310 / pswapd %mm1, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1311 / pswapd %mm5, %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1312 shufps $177, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1313
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1314 / pfadd %mm1, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1315 / pfadd %mm5, %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1316 addps %xmm1, %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1317
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1318 / movq %mm0, 64(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1319 / movq %mm4, 80(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1320 movlps %xmm0, 64(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1321 movhps %xmm0, 80(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1322
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1323 / pfsub %mm1, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1324 / pfsubr %mm5, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1325 movaps %xmm1, %xmm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1326 subps %xmm2, %xmm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1327 subps %xmm1, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1328 /// shufpd $2, %xmm3, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1329 // (or $1?)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1330 // optimize
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1331 movq %xmm2, %xmm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1332 movaps %xmm3, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1333
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1334 / pfmul %mm2, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1335 / pfmul %mm2, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1336 mulps %xmm4, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1337
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1338 / pswapd %mm3, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1339 / pswapd %mm7, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1340 shufps $177, %xmm2, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1341
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1342 / movq %mm3, 72(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1343 / movq %mm7, 88(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1344 movlps %xmm2, 72(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1345 movhps %xmm2, 88(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1346
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1347 / movq 96(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1348 / movq 112(%edx), %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1349 movups 96(%edx), %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1350
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1351 / movq %mm0, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1352 / movq %mm4, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1353 movaps %xmm0, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1354
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1355 / movq 104(%edx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1356 / movq 120(%edx), %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1357 movlps 104(%edx), %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1358 movhps 120(%edx), %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1359
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1360 / pswapd %mm1, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1361 / pswapd %mm5, %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1362 shufps $177, %xmm1, %xmm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1363
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1364 / pfadd %mm1, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1365 / pfadd %mm5, %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1366 addps %xmm1, %xmm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1367
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1368 / movq %mm0, 96(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1369 / movq %mm4, 112(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1370 movups %xmm0, 96(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1371
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1372 / pfsub %mm1, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1373 / pfsubr %mm5, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1374 movaps %xmm1, %xmm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1375 subps %xmm2, %xmm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1376 subps %xmm1, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1377 /// shufpd $2, %xmm3, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1378 // (or $1?)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1379 // optimize
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1380 movq %xmm2, %xmm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1381 movaps %xmm3, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1382
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1383 / pfmul %mm2, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1384 / pfmul %mm2, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1385 mulps %xmm4, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1386
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1387 / pswapd %mm3, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1388 / pswapd %mm7, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1389 shufps $177, %xmm2, %xmm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1390
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1391 / movq %mm3, 104(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1392 / movq %mm7, 120(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1393 movlps %xmm2, 104(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1394 movhps %xmm2, 120(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1395 */
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1396
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1397
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1398 /* Phase 6. This is the end of easy road. */
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1399 /* Code below is coded in scalar mode. Should be optimized */
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1400 //
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1401 // movd plus_1f, %mm6
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1402 // punpckldq 120(%ebx), %mm6 /* mm6 = 1.0 | 120(%ebx)*/
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1403 // movq x_plus_minus_3dnow, %mm7 /* mm7 = +1 | -1 */
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1404 /*
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1405 movq 32(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1406 movq 64(%ecx), %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1407 movq %mm0, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1408 movq %mm2, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1409 pxor %mm7, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1410 pxor %mm7, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1411 pfacc %mm1, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1412 pfacc %mm3, %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1413 pfmul %mm6, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1414 pfmul %mm6, %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1415 movq %mm0, 32(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1416 movq %mm2, 64(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1417
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1418 movd 44(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1419 movd 40(%ecx), %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1420 movd 120(%ebx), %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1421 punpckldq 76(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1422 punpckldq 72(%ecx), %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1423 punpckldq %mm3, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1424 movq %mm0, %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1425 movq %mm2, %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1426 pfsub %mm2, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1427 pfmul %mm3, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1428 movq %mm0, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1429 pfadd %mm5, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1430 pfadd %mm4, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1431 movq %mm0, %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1432 punpckldq %mm1, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1433 punpckhdq %mm1, %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1434 movq %mm0, 40(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1435 movq %mm2, 72(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1436
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1437 movd 48(%ecx), %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1438 movd 60(%ecx), %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1439 pfsub 52(%ecx), %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1440 pfsub 56(%ecx), %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1441 pfmul 120(%ebx), %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1442 pfmul 120(%ebx), %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1443 movq %mm2, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1444
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1445 pfadd 56(%ecx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1446 pfadd 60(%ecx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1447 movq %mm1, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1448
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1449 pfadd 48(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1450 pfadd 52(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1451 pfadd %mm3, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1452 punpckldq %mm2, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1453 pfadd %mm3, %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1454 punpckldq %mm2, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1455 movq %mm1, 56(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1456 movq %mm0, 48(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1457 */
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1458 /*---*/
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1459 /*
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1460 movd 92(%ecx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1461 pfsub 88(%ecx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1462 pfmul 120(%ebx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1463 movd %mm1, 92(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1464 pfadd 92(%ecx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1465 pfadd 88(%ecx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1466 movq %mm1, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1467
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1468 pfadd 80(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1469 pfadd 84(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1470 movd %mm0, 80(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1471
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1472 movd 80(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1473 pfsub 84(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1474 pfmul 120(%ebx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1475 pfadd %mm0, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1476 pfadd 92(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1477 punpckldq %mm1, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1478 movq %mm0, 84(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1479
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1480 movq 96(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1481 movq %mm0, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1482 pxor %mm7, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1483 pfacc %mm1, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1484 pfmul %mm6, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1485 movq %mm0, 96(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1486
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1487 movd 108(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1488 pfsub 104(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1489 pfmul 120(%ebx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1490 movd %mm0, 108(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1491 pfadd 104(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1492 pfadd 108(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1493 movd %mm0, 104(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1494
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1495 movd 124(%ecx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1496 pfsub 120(%ecx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1497 pfmul 120(%ebx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1498 movd %mm1, 124(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1499 pfadd 120(%ecx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1500 pfadd 124(%ecx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1501 movq %mm1, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1502
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1503 pfadd 112(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1504 pfadd 116(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1505 movd %mm0, 112(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1506
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1507 movd 112(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1508 pfsub 116(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1509 pfmul 120(%ebx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1510 pfadd %mm0,%mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1511 pfadd 124(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1512 punpckldq %mm1, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1513 movq %mm0, 116(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1514
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1515 jnz .L01
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1516 */
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1517
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1518
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1519 /* Phase 7*/
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1520 /* The code below is written in scalar mode and should be optimized. */
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1521 /*
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1522 movd (%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1523 pfadd 4(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1524 movd %mm0, 1024(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1525
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1526 movd (%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1527 pfsub 4(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1528 pfmul 120(%ebx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1529 movd %mm0, (%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1530 movd %mm0, (%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1531
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1532 movd 12(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1533 pfsub 8(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1534 pfmul 120(%ebx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1535 movd %mm0, 512(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1536 pfadd 12(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1537 pfadd 8(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1538 movd %mm0, 512(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1539
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1540 movd 16(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1541 pfsub 20(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1542 pfmul 120(%ebx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1543 movq %mm0, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1544
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1545 movd 28(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1546 pfsub 24(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1547 pfmul 120(%ebx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1548 movd %mm0, 768(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1549 movq %mm0, %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1550
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1551 pfadd 24(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1552 pfadd 28(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1553 movq %mm0, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1554
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1555 pfadd 16(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1556 pfadd 20(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1557 movd %mm0, 768(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1558 pfadd %mm3, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1559 movd %mm1, 256(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1560 pfadd %mm3, %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1561 movd %mm2, 256(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1562 */
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1563
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1564
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1565 /* Phase 8*/
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1566 /*
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1567 movq 32(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1568 movq 48(%edx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1569 pfadd 48(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1570 pfadd 40(%edx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1571 movd %mm0, 896(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1572 movd %mm1, 640(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1573 psrlq $32, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1574 psrlq $32, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1575 movd %mm0, 128(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1576 movd %mm1, 384(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1577
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1578 movd 40(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1579 pfadd 56(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1580 movd %mm0, 384(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1581
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1582 movd 56(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1583 pfadd 36(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1584 movd %mm0, 128(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1585
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1586 movd 60(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1587 movd %mm0, 896(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1588 pfadd 44(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1589 movd %mm0, 640(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1590
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1591 movq 96(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1592 movq 112(%edx), %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1593 movq 104(%edx), %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1594 pfadd 112(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1595 pfadd 104(%edx), %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1596 pfadd 120(%edx), %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1597 movq %mm0, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1598 movq %mm2, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1599 movq %mm4, %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1600 pfadd 64(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1601 pfadd 80(%edx), %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1602 pfadd 72(%edx), %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1603 movd %mm0, 960(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1604 movd %mm2, 704(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1605 movd %mm4, 448(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1606 psrlq $32, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1607 psrlq $32, %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1608 psrlq $32, %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1609 movd %mm0, 64(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1610 movd %mm2, 320(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1611 movd %mm4, 576(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1612 pfadd 80(%edx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1613 pfadd 72(%edx), %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1614 pfadd 88(%edx), %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1615 movd %mm1, 832(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1616 movd %mm3, 576(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1617 movd %mm5, 320(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1618 psrlq $32, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1619 psrlq $32, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1620 psrlq $32, %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1621 movd %mm1, 192(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1622 movd %mm3, 448(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1623 movd %mm5, 704(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1624
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1625 movd 120(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1626 pfadd 100(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1627 movq %mm0, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1628 pfadd 88(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1629 movd %mm0, 192(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1630 pfadd 68(%edx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1631 movd %mm1, 64(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1632
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1633 movd 124(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1634 movd %mm0, 960(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1635 pfadd 92(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1636 movd %mm0, 832(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1637
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1638 jmp .L_bye
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1639 .L01:
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1640 */
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1641
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1642
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1643 /* Phase 9*/
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1644 /*
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1645 movq (%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1646 movq %mm0, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1647 pxor %mm7, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1648 pfacc %mm1, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1649 pfmul %mm6, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1650 pf2id %mm0, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1651 movd %mm0, %eax
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1652 movw %ax, 512(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1653 psrlq $32, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1654 movd %mm0, %eax
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1655 movw %ax, (%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1656
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1657 movd 12(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1658 pfsub 8(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1659 pfmul 120(%ebx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1660 pf2id %mm0, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1661 movd %mm7, %eax
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1662 movw %ax, 256(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1663 pfadd 12(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1664 pfadd 8(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1665 pf2id %mm0, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1666 movd %mm0, %eax
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1667 movw %ax, 256(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1668
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1669 movd 16(%ecx), %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1670 pfsub 20(%ecx), %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1671 pfmul 120(%ebx), %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1672 movq %mm3, %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1673
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1674 movd 28(%ecx), %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1675 pfsub 24(%ecx), %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1676 pfmul 120(%ebx), %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1677 movq %mm2, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1678
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1679 pf2id %mm2, %mm7
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1680 movd %mm7, %eax
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1681 movw %ax, 384(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1682
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1683 pfadd 24(%ecx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1684 pfadd 28(%ecx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1685 movq %mm1, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1686
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1687 pfadd 16(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1688 pfadd 20(%ecx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1689 pf2id %mm0, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1690 movd %mm0, %eax
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1691 movw %ax, 384(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1692 pfadd %mm3, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1693 pf2id %mm1, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1694 movd %mm1, %eax
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1695 movw %ax, 128(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1696 pfadd %mm3, %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1697 pf2id %mm2, %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1698 movd %mm2, %eax
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1699 movw %ax, 128(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1700 */
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1701
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1702
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1703 /* Phase 10*/
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1704 /*
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1705 movq 32(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1706 movq 48(%edx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1707 pfadd 48(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1708 pfadd 40(%edx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1709 pf2id %mm0, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1710 pf2id %mm1, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1711 movd %mm0, %eax
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1712 movd %mm1, %ecx
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1713 movw %ax, 448(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1714 movw %cx, 320(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1715 psrlq $32, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1716 psrlq $32, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1717 movd %mm0, %eax
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1718 movd %mm1, %ecx
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1719 movw %ax, 64(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1720 movw %cx, 192(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1721
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1722 movd 40(%edx), %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1723 movd 56(%edx), %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1724 movd 60(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1725 movd 44(%edx), %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1726 movd 120(%edx), %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1727 punpckldq %mm4, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1728 punpckldq 124(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1729 pfadd 100(%edx), %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1730 punpckldq 36(%edx), %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1731 punpckldq 92(%edx), %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1732 movq %mm5, %mm6
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1733 pfadd %mm4, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1734 pf2id %mm0, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1735 pf2id %mm3, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1736 pfadd 88(%edx), %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1737 movd %mm1, %eax
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1738 movd %mm3, %ecx
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1739 movw %ax, 448(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1740 movw %cx, 192(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1741 pf2id %mm5, %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1742 psrlq $32, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1743 psrlq $32, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1744 movd %mm5, %ebx
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1745 movd %mm1, %eax
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1746 movd %mm3, %ecx
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1747 movw %bx, 96(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1748 movw %ax, 480(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1749 movw %cx, 64(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1750 pfadd %mm2, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1751 pf2id %mm0, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1752 movd %mm0, %eax
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1753 pfadd 68(%edx), %mm6
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1754 movw %ax, 320(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1755 psrlq $32, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1756 pf2id %mm6, %mm6
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1757 movd %mm0, %eax
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1758 movd %mm6, %ebx
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1759 movw %ax, 416(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1760 movw %bx, 32(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1761
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1762 movq 96(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1763 movq 112(%edx), %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1764 movq 104(%edx), %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1765 pfadd %mm2, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1766 pfadd %mm4, %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1767 pfadd 120(%edx), %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1768 movq %mm0, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1769 movq %mm2, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1770 movq %mm4, %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1771 pfadd 64(%edx), %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1772 pfadd 80(%edx), %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1773 pfadd 72(%edx), %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1774 pf2id %mm0, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1775 pf2id %mm2, %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1776 pf2id %mm4, %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1777 movd %mm0, %eax
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1778 movd %mm2, %ecx
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1779 movd %mm4, %ebx
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1780 movw %ax, 480(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1781 movw %cx, 352(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1782 movw %bx, 224(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1783 psrlq $32, %mm0
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1784 psrlq $32, %mm2
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1785 psrlq $32, %mm4
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1786 movd %mm0, %eax
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1787 movd %mm2, %ecx
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1788 movd %mm4, %ebx
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1789 movw %ax, 32(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1790 movw %cx, 160(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1791 movw %bx, 288(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1792 pfadd 80(%edx), %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1793 pfadd 72(%edx), %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1794 pfadd 88(%edx), %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1795 pf2id %mm1, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1796 pf2id %mm3, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1797 pf2id %mm5, %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1798 movd %mm1, %eax
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1799 movd %mm3, %ecx
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1800 movd %mm5, %ebx
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1801 movw %ax, 416(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1802 movw %cx, 288(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1803 movw %bx, 160(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1804 psrlq $32, %mm1
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1805 psrlq $32, %mm3
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1806 psrlq $32, %mm5
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1807 movd %mm1, %eax
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1808 movd %mm3, %ecx
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1809 movd %mm5, %ebx
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1810 movw %ax, 96(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1811 movw %cx, 224(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1812 movw %bx, 352(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1813
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1814 movsw
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1815
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1816 .L_bye:
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1817 addl $256,%esp
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1818 / femms
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1819 emms
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1820 popl %edi
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1821 popl %esi
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1822 popl %ebx
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1823 ret $12
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1824 */
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1825
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1826 // here comes old fashioned FPU code for the tough parts
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1827
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1828 /* Phase 5*/
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1829
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1830 flds 32(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1831 fadds 36(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1832 fstps 32(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1833
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1834 flds 32(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1835 fsubs 36(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1836 fmuls 120(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1837 fstps 36(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1838
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1839 flds 44(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1840 fsubs 40(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1841 fmuls 120(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1842 fsts 44(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1843 fadds 40(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1844 fadds 44(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1845 fstps 40(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1846
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1847 flds 48(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1848 fsubs 52(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1849 fmuls 120(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1850
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1851 flds 60(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1852 fsubs 56(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1853 fmuls 120(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1854 fld %st(0)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1855 fadds 56(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1856 fadds 60(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1857 fld %st(0)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1858 fadds 48(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1859 fadds 52(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1860 fstps 48(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1861 fadd %st(2)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1862 fstps 56(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1863 fsts 60(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1864 faddp %st(1)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1865 fstps 52(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1866
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1867 flds 64(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1868 fadds 68(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1869 fstps 64(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1870
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1871 flds 64(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1872 fsubs 68(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1873 fmuls 120(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1874 fstps 68(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1875
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1876 flds 76(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1877 fsubs 72(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1878 fmuls 120(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1879 fsts 76(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1880 fadds 72(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1881 fadds 76(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1882 fstps 72(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1883
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1884 flds 92(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1885 fsubs 88(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1886 fmuls 120(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1887 fsts 92(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1888 fadds 92(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1889 fadds 88(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1890 fld %st(0)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1891 fadds 80(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1892 fadds 84(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1893 fstps 80(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1894
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1895 flds 80(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1896 fsubs 84(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1897 fmuls 120(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1898 fadd %st(0), %st(1)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1899 fadds 92(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1900 fstps 84(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1901 fstps 88(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1902
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1903 flds 96(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1904 fadds 100(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1905 fstps 96(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1906
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1907 flds 96(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1908 fsubs 100(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1909 fmuls 120(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1910 fstps 100(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1911
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1912 flds 108(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1913 fsubs 104(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1914 fmuls 120(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1915 fsts 108(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1916 fadds 104(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1917 fadds 108(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1918 fstps 104(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1919
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1920 flds 124(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1921 fsubs 120(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1922 fmuls 120(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1923 fsts 124(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1924 fadds 120(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1925 fadds 124(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1926 fld %st(0)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1927 fadds 112(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1928 fadds 116(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1929 fstps 112(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1930
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1931 flds 112(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1932 fsubs 116(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1933 fmuls 120(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1934 fadd %st(0),%st(1)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1935 fadds 124(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1936 fstps 116(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1937 fstps 120(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1938 jnz .L01
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1939
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1940
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
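1941 /* Phase 6: float output path (taken when the jnz above falls through) - combine the eight values at 0..28(%ecx), scaling the differences by the factor at 120(%ebx), and store the results as single-precision floats at offsets from %esi and %edi */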
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1942
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1943 flds (%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1944 fadds 4(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1945 fstps 1024(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1946
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1947 flds (%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1948 fsubs 4(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1949 fmuls 120(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1950 fsts (%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1951 fstps (%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1952
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1953 flds 12(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1954 fsubs 8(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1955 fmuls 120(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1956 fsts 512(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1957 fadds 12(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1958 fadds 8(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1959 fstps 512(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1960
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1961 flds 16(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1962 fsubs 20(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1963 fmuls 120(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1964
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1965 flds 28(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1966 fsubs 24(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1967 fmuls 120(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1968 fsts 768(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1969 fld %st(0)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1970 fadds 24(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1971 fadds 28(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1972 fld %st(0)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1973 fadds 16(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1974 fadds 20(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1975 fstps 768(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1976 fadd %st(2)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1977 fstps 256(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1978 faddp %st(1)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1979 fstps 256(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1980
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
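1981 /* Phase 7: float output path, continued - form sums of the values at 32..124(%edx) (60(%edx) and 124(%edx) are also stored unchanged) and write them as single-precision floats at offsets from %esi and %edi; then drop 256 bytes of stack, pop %edi/%esi/%ebx and return */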
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1982
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1983 flds 32(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1984 fadds 48(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1985 fstps 896(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1986
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1987 flds 48(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1988 fadds 40(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1989 fstps 640(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1990
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1991 flds 40(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1992 fadds 56(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1993 fstps 384(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1994
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1995 flds 56(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1996 fadds 36(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1997 fstps 128(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1998
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
1999 flds 36(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2000 fadds 52(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2001 fstps 128(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2002
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2003 flds 52(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2004 fadds 44(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2005 fstps 384(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2006
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2007 flds 60(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2008 fsts 896(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2009 fadds 44(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2010 fstps 640(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2011
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2012 flds 96(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2013 fadds 112(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2014 fld %st(0)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2015 fadds 64(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2016 fstps 960(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2017 fadds 80(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2018 fstps 832(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2019
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2020 flds 112(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2021 fadds 104(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2022 fld %st(0)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2023 fadds 80(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2024 fstps 704(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2025 fadds 72(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2026 fstps 576(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2027
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2028 flds 104(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2029 fadds 120(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2030 fld %st(0)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2031 fadds 72(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2032 fstps 448(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2033 fadds 88(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2034 fstps 320(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2035
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2036 flds 120(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2037 fadds 100(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2038 fld %st(0)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2039 fadds 88(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2040 fstps 192(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2041 fadds 68(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2042 fstps 64(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2043
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2044 flds 100(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2045 fadds 116(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2046 fld %st(0)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2047 fadds 68(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2048 fstps 64(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2049 fadds 84(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2050 fstps 192(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2051
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2052 flds 116(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2053 fadds 108(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2054 fld %st(0)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2055 fadds 84(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2056 fstps 320(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2057 fadds 76(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2058 fstps 448(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2059
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2060 flds 108(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2061 fadds 124(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2062 fld %st(0)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2063 fadds 76(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2064 fstps 576(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2065 fadds 92(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2066 fstps 704(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2067
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2068 flds 124(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2069 fsts 960(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2070 fadds 92(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2071 fstps 832(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2072 addl $256,%esp
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2073 popl %edi
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2074 popl %esi
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2075 popl %ebx
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2076 ret
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2077 .L01:
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
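2078 /* Phase 8: integer output path (entered via jnz .L01) - same combination of 0..28(%ecx) as Phase 6, but results are stored as integers with fist/fistp at half the Phase 6 offsets. NOTE(review): Phase 6 also writes the (%ecx)-4(%ecx) product to (%edi); only (%esi) is written here - confirm this is intentional */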
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2079
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2080 flds (%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2081 fadds 4(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2082 fistp 512(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2083
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2084 flds (%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2085 fsubs 4(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2086 fmuls 120(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2087
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2088 fistp (%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2089
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2090
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2091 flds 12(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2092 fsubs 8(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2093 fmuls 120(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2094 fist 256(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2095 fadds 12(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2096 fadds 8(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2097 fistp 256(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2098
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2099 flds 16(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2100 fsubs 20(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2101 fmuls 120(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2102
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2103 flds 28(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2104 fsubs 24(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2105 fmuls 120(%ebx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2106 fist 384(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2107 fld %st(0)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2108 fadds 24(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2109 fadds 28(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2110 fld %st(0)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2111 fadds 16(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2112 fadds 20(%ecx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2113 fistp 384(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2114 fadd %st(2)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2115 fistp 128(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2116 faddp %st(1)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2117 fistp 128(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2118
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2119 /* Phase 9*/
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2120
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2121 flds 32(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2122 fadds 48(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2123 fistp 448(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2124
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2125 flds 48(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2126 fadds 40(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2127 fistp 320(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2128
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2129 flds 40(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2130 fadds 56(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2131 fistp 192(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2132
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2133 flds 56(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2134 fadds 36(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2135 fistp 64(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2136
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2137 flds 36(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2138 fadds 52(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2139 fistp 64(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2140
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2141 flds 52(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2142 fadds 44(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2143 fistp 192(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2144
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2145 flds 60(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2146 fist 448(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2147 fadds 44(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2148 fistp 320(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2149
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2150 flds 96(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2151 fadds 112(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2152 fld %st(0)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2153 fadds 64(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2154 fistp 480(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2155 fadds 80(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2156 fistp 416(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2157
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2158 flds 112(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2159 fadds 104(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2160 fld %st(0)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2161 fadds 80(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2162 fistp 352(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2163 fadds 72(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2164 fistp 288(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2165
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2166 flds 104(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2167 fadds 120(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2168 fld %st(0)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2169 fadds 72(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2170 fistp 224(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2171 fadds 88(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2172 fistp 160(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2173
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2174 flds 120(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2175 fadds 100(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2176 fld %st(0)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2177 fadds 88(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2178 fistp 96(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2179 fadds 68(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2180 fistp 32(%esi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2181
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2182 flds 100(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2183 fadds 116(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2184 fld %st(0)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2185 fadds 68(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2186 fistp 32(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2187 fadds 84(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2188 fistp 96(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2189
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2190 flds 116(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2191 fadds 108(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2192 fld %st(0)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2193 fadds 84(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2194 fistp 160(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2195 fadds 76(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2196 fistp 224(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2197
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2198 flds 108(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2199 fadds 124(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2200 fld %st(0)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2201 fadds 76(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2202 fistp 288(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2203 fadds 92(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2204 fistp 352(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2205
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2206 flds 124(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2207 fist 480(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2208 fadds 92(%edx)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2209 fistp 416(%edi)
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2210 movsw
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2211 addl $256,%esp
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2212 popl %edi
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2213 popl %esi
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2214 popl %ebx
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2215 ret $12
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2216
d9e3f91d6da9 First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff changeset
2217 // end of FPU stuff