Mercurial > mplayer.hg
annotate mp3lib/dct64_sse.s @ 2316:bcb229557e9b
fixed alignment (static variables were sometimes not 8-byte aligned)
added half uv interpolation support
added prefetch
BGR15 support in MMX (untested) (so BGR15,16,24,32 are supported)
special unscaled height version (not much faster but it doesn't interpolate uv vertically)
author | michael |
---|---|
date | Sat, 20 Oct 2001 21:12:09 +0000 |
parents | d9e3f91d6da9 |
children | 8312f4bc8dab |
rev | line source |
---|---|
1394
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1 # This code is a translation of dct64_k7.s from MPlayer. |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2 # Coded by Felix Buenemann <atmosfear at users.sourceforge.net> |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
3 # |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
4 # TODO: - fix phases 4 and 5 (sse) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
5 # - optimize scalar FPU code? (interleave with sse code) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
6 # |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
8 //.data |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
9 // .align 8 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
10 //x_plus_minus_3dnow: .long 0x00000000, 0x80000000 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
11 //plus_1f: .float 1.0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
12 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
13 .text |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
14 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
15 .align 16 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
16 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
17 .global dct64_MMX_sse |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
18 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
19 dct64_MMX_sse: |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
20 pushl %ebx |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
21 pushl %esi |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
22 pushl %edi |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
23 subl $256,%esp |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
24 movl 280(%esp),%eax |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
25 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
26 leal 128(%esp),%edx |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
27 movl 272(%esp),%esi |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
28 movl 276(%esp),%edi |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
29 movl $costab_mmx,%ebx |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
30 orl %ecx,%ecx |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
31 movl %esp,%ecx |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
32 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
33 /* Phase 1 (complete, worx) */ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
34 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
35 // [1] Process Block A1 (16 Bytes) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
36 / movq (%eax), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
37 / movq 8(%eax), %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
38 movups (%eax), %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
39 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
40 // Copy A1 to another register A2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
41 / movq %mm0, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
42 / movq %mm4, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
43 movaps %xmm0, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
44 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
45 // Process Block B1 (last 16 bytes) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
46 / movq 120(%eax), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
47 / movq 112(%eax), %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
48 movups 112(%eax), %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
49 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
50 /* The PSWAPD instruction swaps or reverses the upper and lower |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
51 * doublewords of the source operand. PSWAPD mmreg1, mmreg2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
52 * performs the following operations: |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
53 * temp = mmreg2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
54 * mmreg1[63:32] = temp[31:0 ] |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
55 * mmreg1[31:0 ] = temp[63:32] |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
56 */ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
57 / pswapd %mm1, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
58 / pswapd %mm5, %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
59 // shufps here exchanges a,b,c,d to b,a,d,c in xmm1 (desc ia32-ref p.752) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
60 //// shufps $177, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
61 shufps $27, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
62 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
63 // Add B1 to A1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
64 / pfadd %mm1, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
65 / pfadd %mm5, %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
66 addps %xmm1, %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
67 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
68 // Save Block A1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
69 / movq %mm0, (%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
70 / movq %mm4, 8(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
71 movups %xmm0, (%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
72 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
73 // Sub B1 from A2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
74 / pfsub %mm1, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
75 / pfsub %mm5, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
76 subps %xmm1, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
77 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
78 // Mul mem with A2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
79 / pfmul (%ebx), %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
80 / pfmul 8(%ebx), %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
81 movups (%ebx), %xmm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
82 mulps %xmm7, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
83 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
84 // Shuffle A2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
85 / pswapd %mm3, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
86 / pswapd %mm7, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
87 // I do a,b,c,d -> d,c,b,a to suit order when writing to mem (saves one shufps) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
88 shufps $27, %xmm2, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
89 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
90 // Save A2 to mem (end) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
91 / movq %mm3, 120(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
92 / movq %mm7, 112(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
93 movups %xmm2, 112(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
94 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
95 // [2] Process next data block |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
96 / movq 16(%eax), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
97 / movq 24(%eax), %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
98 movups 16(%eax), %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
99 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
100 / movq %mm0, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
101 / movq %mm4, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
102 movaps %xmm0, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
103 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
104 / movq 104(%eax), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
105 / movq 96(%eax), %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
106 movups 96(%eax), %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
107 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
108 / pswapd %mm1, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
109 / pswapd %mm5, %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
110 //// shufps $177, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
111 shufps $27, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
112 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
113 / pfadd %mm1, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
114 / pfadd %mm5, %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
115 addps %xmm1, %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
116 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
117 / movq %mm0, 16(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
118 / movq %mm4, 24(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
119 movups %xmm0, 16(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
120 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
121 / pfsub %mm1, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
122 / pfsub %mm5, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
123 subps %xmm1, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
124 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
125 / pfmul 16(%ebx), %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
126 / pfmul 24(%ebx), %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
127 movups 16(%ebx), %xmm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
128 mulps %xmm7, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
129 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
130 / pswapd %mm3, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
131 / pswapd %mm7, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
132 shufps $27, %xmm2, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
133 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
134 / movq %mm3, 104(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
135 / movq %mm7, 96(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
136 movups %xmm2, 96(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
137 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
138 // [3] |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
139 / movq 32(%eax), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
140 / movq 40(%eax), %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
141 movups 32(%eax), %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
142 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
143 / movq %mm0, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
144 / movq %mm4, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
145 movaps %xmm0, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
146 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
147 / movq 88(%eax), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
148 / movq 80(%eax), %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
149 movups 80(%eax), %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
150 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
151 / pswapd %mm1, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
152 / pswapd %mm5, %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
153 //// shufps $177, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
154 shufps $27, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
155 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
156 / pfadd %mm1, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
157 / pfadd %mm5, %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
158 addps %xmm1, %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
159 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
160 / movq %mm0, 32(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
161 / movq %mm4, 40(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
162 movups %xmm0, 32(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
163 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
164 / pfsub %mm1, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
165 / pfsub %mm5, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
166 subps %xmm1, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
167 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
168 / pfmul 32(%ebx), %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
169 / pfmul 40(%ebx), %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
170 movups 32(%ebx), %xmm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
171 mulps %xmm7, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
172 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
173 / pswapd %mm3, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
174 / pswapd %mm7, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
175 shufps $27, %xmm2, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
176 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
177 / movq %mm3, 88(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
178 / movq %mm7, 80(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
179 movups %xmm2, 80(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
180 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
181 // [4] |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
182 / movq 48(%eax), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
183 / movq 56(%eax), %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
184 movups 48(%eax), %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
185 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
186 / movq %mm0, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
187 / movq %mm4, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
188 movaps %xmm0, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
189 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
190 / movq 72(%eax), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
191 / movq 64(%eax), %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
192 movups 64(%eax), %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
193 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
194 / pswapd %mm1, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
195 / pswapd %mm5, %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
196 //// shufps $177, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
197 shufps $27, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
198 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
199 / pfadd %mm1, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
200 / pfadd %mm5, %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
201 addps %xmm1, %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
202 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
203 / movq %mm0, 48(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
204 / movq %mm4, 56(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
205 movups %xmm0, 48(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
206 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
207 / pfsub %mm1, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
208 / pfsub %mm5, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
209 subps %xmm1, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
210 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
211 / pfmul 48(%ebx), %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
212 / pfmul 56(%ebx), %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
213 movups 48(%ebx), %xmm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
214 mulps %xmm7, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
215 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
216 / pswapd %mm3, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
217 / pswapd %mm7, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
218 shufps $27, %xmm2, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
219 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
220 / movq %mm3, 72(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
221 / movq %mm7, 64(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
222 movups %xmm2, 64(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
223 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
224 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
225 // phase 1 fpu code |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
226 /* Phase 1*/ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
227 /* |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
228 flds (%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
229 leal 128(%esp),%edx |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
230 fadds 124(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
231 movl 272(%esp),%esi |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
232 fstps (%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
233 movl 276(%esp),%edi |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
234 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
235 flds 4(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
236 movl $costab_mmx,%ebx |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
237 fadds 120(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
238 orl %ecx,%ecx |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
239 fstps 4(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
240 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
241 flds (%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
242 movl %esp,%ecx |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
243 fsubs 124(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
244 fmuls (%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
245 fstps 124(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
246 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
247 flds 4(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
248 fsubs 120(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
249 fmuls 4(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
250 fstps 120(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
251 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
252 flds 8(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
253 fadds 116(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
254 fstps 8(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
255 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
256 flds 12(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
257 fadds 112(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
258 fstps 12(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
259 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
260 flds 8(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
261 fsubs 116(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
262 fmuls 8(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
263 fstps 116(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
264 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
265 flds 12(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
266 fsubs 112(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
267 fmuls 12(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
268 fstps 112(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
269 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
270 flds 16(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
271 fadds 108(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
272 fstps 16(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
273 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
274 flds 20(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
275 fadds 104(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
276 fstps 20(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
277 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
278 flds 16(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
279 fsubs 108(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
280 fmuls 16(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
281 fstps 108(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
282 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
283 flds 20(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
284 fsubs 104(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
285 fmuls 20(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
286 fstps 104(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
287 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
288 flds 24(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
289 fadds 100(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
290 fstps 24(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
291 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
292 flds 28(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
293 fadds 96(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
294 fstps 28(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
295 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
296 flds 24(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
297 fsubs 100(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
298 fmuls 24(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
299 fstps 100(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
300 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
301 flds 28(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
302 fsubs 96(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
303 fmuls 28(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
304 fstps 96(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
305 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
306 flds 32(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
307 fadds 92(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
308 fstps 32(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
309 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
310 flds 36(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
311 fadds 88(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
312 fstps 36(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
313 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
314 flds 32(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
315 fsubs 92(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
316 fmuls 32(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
317 fstps 92(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
318 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
319 flds 36(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
320 fsubs 88(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
321 fmuls 36(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
322 fstps 88(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
323 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
324 flds 40(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
325 fadds 84(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
326 fstps 40(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
327 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
328 flds 44(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
329 fadds 80(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
330 fstps 44(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
331 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
332 flds 40(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
333 fsubs 84(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
334 fmuls 40(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
335 fstps 84(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
336 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
337 flds 44(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
338 fsubs 80(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
339 fmuls 44(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
340 fstps 80(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
341 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
342 flds 48(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
343 fadds 76(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
344 fstps 48(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
345 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
346 flds 52(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
347 fadds 72(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
348 fstps 52(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
349 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
350 flds 48(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
351 fsubs 76(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
352 fmuls 48(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
353 fstps 76(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
354 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
355 flds 52(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
356 fsubs 72(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
357 fmuls 52(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
358 fstps 72(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
359 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
360 flds 56(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
361 fadds 68(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
362 fstps 56(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
363 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
364 flds 60(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
365 fadds 64(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
366 fstps 60(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
367 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
368 flds 56(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
369 fsubs 68(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
370 fmuls 56(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
371 fstps 68(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
372 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
373 flds 60(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
374 fsubs 64(%eax) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
375 fmuls 60(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
376 fstps 64(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
377 */ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
378 // end phase 1 fpu code |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
379 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
380 /* Phase 2 (completed, works) */ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
381 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
382 / movq (%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
383 / movq 8(%edx), %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
384 movups (%edx), %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
385 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
386 / movq %mm0, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
387 / movq %mm4, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
388 movaps %xmm0, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
389 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
390 / movq 56(%edx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
391 / movq 48(%edx), %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
392 movups 48(%edx), %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
393 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
394 / pswapd %mm1, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
395 / pswapd %mm5, %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
396 //// shufps $177, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
397 shufps $27, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
398 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
399 / pfadd %mm1, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
400 / pfadd %mm5, %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
401 addps %xmm1, %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
402 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
403 / movq %mm0, (%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
404 / movq %mm4, 8(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
405 movups %xmm0, (%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
406 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
407 / pfsub %mm1, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
408 / pfsub %mm5, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
409 subps %xmm1, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
410 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
411 / pfmul 64(%ebx), %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
412 / pfmul 72(%ebx), %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
413 movups 64(%ebx), %xmm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
414 mulps %xmm7, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
415 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
416 / pswapd %mm3, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
417 / pswapd %mm7, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
418 shufps $27, %xmm2, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
419 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
420 / movq %mm3, 56(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
421 / movq %mm7, 48(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
422 movups %xmm2, 48(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
423 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
424 / movq 16(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
425 / movq 24(%edx), %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
426 movups 16(%edx), %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
427 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
428 / movq %mm0, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
429 / movq %mm4, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
430 movaps %xmm0, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
431 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
432 / movq 40(%edx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
433 / movq 32(%edx), %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
434 movups 32(%edx), %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
435 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
436 / pswapd %mm1, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
437 / pswapd %mm5, %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
438 //// shufps $177, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
439 shufps $27, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
440 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
441 / pfadd %mm1, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
442 / pfadd %mm5, %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
443 addps %xmm1, %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
444 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
445 / movq %mm0, 16(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
446 / movq %mm4, 24(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
447 movups %xmm0, 16(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
448 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
449 / pfsub %mm1, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
450 / pfsub %mm5, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
451 subps %xmm1, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
452 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
453 / pfmul 80(%ebx), %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
454 / pfmul 88(%ebx), %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
455 movups 80(%ebx), %xmm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
456 mulps %xmm7, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
457 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
458 / pswapd %mm3, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
459 / pswapd %mm7, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
460 shufps $27, %xmm2, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
461 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
462 / movq %mm3, 40(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
463 / movq %mm7, 32(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
464 movups %xmm2, 32(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
465 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
466 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
467 // phase 2 fpu |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
468 /* Phase 2*/ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
469 /* |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
470 flds (%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
471 fadds 60(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
472 fstps (%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
473 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
474 flds 4(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
475 fadds 56(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
476 fstps 4(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
477 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
478 flds (%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
479 fsubs 60(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
480 fmuls 64(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
481 fstps 60(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
482 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
483 flds 4(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
484 fsubs 56(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
485 fmuls 68(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
486 fstps 56(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
487 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
488 flds 8(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
489 fadds 52(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
490 fstps 8(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
491 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
492 flds 12(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
493 fadds 48(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
494 fstps 12(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
495 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
496 flds 8(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
497 fsubs 52(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
498 fmuls 72(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
499 fstps 52(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
500 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
501 flds 12(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
502 fsubs 48(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
503 fmuls 76(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
504 fstps 48(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
505 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
506 flds 16(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
507 fadds 44(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
508 fstps 16(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
509 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
510 flds 20(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
511 fadds 40(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
512 fstps 20(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
513 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
514 flds 16(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
515 fsubs 44(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
516 fmuls 80(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
517 fstps 44(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
518 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
519 flds 20(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
520 fsubs 40(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
521 fmuls 84(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
522 fstps 40(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
523 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
524 flds 24(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
525 fadds 36(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
526 fstps 24(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
527 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
528 flds 28(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
529 fadds 32(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
530 fstps 28(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
531 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
532 flds 24(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
533 fsubs 36(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
534 fmuls 88(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
535 fstps 36(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
536 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
537 flds 28(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
538 fsubs 32(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
539 fmuls 92(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
540 fstps 32(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
541 */ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
542 // end phase 2 fpu |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
543 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
544 /* Phase 3 (completed, working) */ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
545 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
546 / movq 64(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
547 / movq 72(%edx), %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
548 movups 64(%edx), %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
549 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
550 / movq %mm0, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
551 / movq %mm4, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
552 movaps %xmm0, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
553 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
554 / movq 120(%edx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
555 / movq 112(%edx), %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
556 movups 112(%edx), %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
557 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
558 / pswapd %mm1, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
559 / pswapd %mm5, %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
560 //// shufps $177, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
561 shufps $27, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
562 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
563 / pfadd %mm1, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
564 / pfadd %mm5, %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
565 addps %xmm1, %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
566 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
567 / movq %mm0, 64(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
568 / movq %mm4, 72(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
569 movups %xmm0, 64(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
570 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
571 / pfsubr %mm1, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
572 / pfsubr %mm5, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
573 // pfsubr (reverse subtract) emulated by swapping operand roles: xmm1 = xmm1 - xmm2, so the result stays in xmm1 (not xmm2) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
574 subps %xmm2, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
575 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
576 / pfmul 64(%ebx), %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
577 / pfmul 72(%ebx), %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
578 movups 64(%ebx), %xmm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
579 mulps %xmm7, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
580 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
581 / pswapd %mm3, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
582 / pswapd %mm7, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
583 shufps $27, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
584 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
585 / movq %mm3, 120(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
586 / movq %mm7, 112(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
587 movups %xmm1, 112(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
588 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
589 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
590 / movq 80(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
591 / movq 88(%edx), %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
592 movups 80(%edx), %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
593 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
594 / movq %mm0, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
595 / movq %mm4, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
596 movaps %xmm0, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
597 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
598 / movq 104(%edx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
599 / movq 96(%edx), %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
600 movups 96(%edx), %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
601 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
602 / pswapd %mm1, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
603 / pswapd %mm5, %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
604 //// shufps $177, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
605 shufps $27, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
606 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
607 / pfadd %mm1, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
608 / pfadd %mm5, %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
609 addps %xmm1, %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
610 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
611 / movq %mm0, 80(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
612 / movq %mm4, 88(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
613 movups %xmm0, 80(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
614 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
615 / pfsubr %mm1, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
616 / pfsubr %mm5, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
617 // pfsubr (reverse subtract) emulated by swapping operand roles: xmm1 = xmm1 - xmm2, so the result stays in xmm1 (not xmm2) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
618 subps %xmm2, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
619 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
620 / pfmul 80(%ebx), %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
621 / pfmul 88(%ebx), %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
622 movups 80(%ebx), %xmm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
623 mulps %xmm7, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
624 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
625 / pswapd %mm3, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
626 / pswapd %mm7, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
627 shufps $27, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
628 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
629 / movq %mm3, 104(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
630 / movq %mm7, 96(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
631 movups %xmm1, 96(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
632 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
633 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
634 // phase 3 fpu |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
635 /* Phase 3*/ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
636 /* |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
637 flds 64(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
638 fadds 124(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
639 fstps 64(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
640 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
641 flds 68(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
642 fadds 120(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
643 fstps 68(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
644 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
645 flds 124(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
646 fsubs 64(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
647 fmuls 64(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
648 fstps 124(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
649 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
650 flds 120(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
651 fsubs 68(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
652 fmuls 68(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
653 fstps 120(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
654 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
655 flds 72(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
656 fadds 116(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
657 fstps 72(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
658 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
659 flds 76(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
660 fadds 112(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
661 fstps 76(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
662 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
663 flds 116(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
664 fsubs 72(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
665 fmuls 72(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
666 fstps 116(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
667 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
668 flds 112(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
669 fsubs 76(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
670 fmuls 76(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
671 fstps 112(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
672 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
673 flds 80(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
674 fadds 108(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
675 fstps 80(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
676 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
677 flds 84(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
678 fadds 104(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
679 fstps 84(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
680 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
681 flds 108(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
682 fsubs 80(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
683 fmuls 80(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
684 fstps 108(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
685 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
686 flds 104(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
687 fsubs 84(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
688 fmuls 84(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
689 fstps 104(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
690 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
691 flds 88(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
692 fadds 100(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
693 fstps 88(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
694 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
695 flds 92(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
696 fadds 96(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
697 fstps 92(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
698 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
699 flds 100(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
700 fsubs 88(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
701 fmuls 88(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
702 fstps 100(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
703 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
704 flds 96(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
705 fsubs 92(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
706 fmuls 92(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
707 fstps 96(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
708 */ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
709 // end phase 3 fpu |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
710 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
711 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
712 /* Phase 4 (completed, buggy) */ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
713 /* |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
714 / movq 96(%ebx), %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
715 / movq 104(%ebx), %mm6 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
716 movups 96(%ebx), %xmm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
717 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
718 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
719 / movq (%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
720 / movq 8(%ecx), %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
721 movups (%ecx), %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
722 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
723 / movq %mm0, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
724 / movq %mm4, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
725 movaps %xmm0, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
726 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
727 / movq 24(%ecx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
728 / movq 16(%ecx), %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
729 movups 16(%ecx), %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
730 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
731 / pswapd %mm1, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
732 / pswapd %mm5, %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
733 //// shufps $177, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
734 shufps $27, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
735 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
736 / pfadd %mm1, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
737 / pfadd %mm5, %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
738 addps %xmm1, %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
739 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
740 / movq %mm0, (%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
741 / movq %mm4, 8(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
742 movups %xmm0, (%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
743 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
744 / pfsub %mm1, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
745 / pfsub %mm5, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
746 subps %xmm1, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
747 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
748 / pfmul %mm2, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
749 / pfmul %mm6, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
750 mulps %xmm4, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
751 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
752 / pswapd %mm3, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
753 / pswapd %mm7, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
754 shufps $27, %xmm2, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
755 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
756 / movq %mm3, 24(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
757 / movq %mm7, 16(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
758 movups %xmm2, 16(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
759 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
760 / movq 32(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
761 / movq 40(%ecx), %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
762 movups 32(%ecx), %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
763 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
764 / movq %mm0, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
765 / movq %mm4, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
766 movaps %xmm0, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
767 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
768 / movq 56(%ecx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
769 / movq 48(%ecx), %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
770 movups 48(%ecx), %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
771 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
772 / pswapd %mm1, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
773 / pswapd %mm5, %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
774 //// shufps $177, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
775 shufps $27, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
776 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
777 / pfadd %mm1, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
778 / pfadd %mm5, %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
779 addps %xmm1, %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
780 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
781 / movq %mm0, 32(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
782 / movq %mm4, 40(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
783 movups %xmm0, 32(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
784 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
785 / pfsubr %mm1, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
786 / pfsubr %mm5, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
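787 // pfsubr is a reversed subtract (dst = src - dst); emulate it by swapping operand roles: xmm1 = xmm1 - xmm2, so the result is in xmm1 instead of xmm2 |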
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
788 subps %xmm2, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
789 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
790 / pfmul %mm2, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
791 / pfmul %mm6, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
792 mulps %xmm4, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
793 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
794 / pswapd %mm3, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
795 / pswapd %mm7, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
796 shufps $27, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
797 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
798 / movq %mm3, 56(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
799 / movq %mm7, 48(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
800 movups %xmm1, 48(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
801 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
802 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
803 / movq 64(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
804 / movq 72(%ecx), %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
805 movups 64(%ecx), %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
806 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
807 / movq %mm0, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
808 / movq %mm4, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
809 movaps %xmm0, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
810 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
811 / movq 88(%ecx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
812 / movq 80(%ecx), %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
813 movups 80(%ecx), %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
814 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
815 / pswapd %mm1, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
816 / pswapd %mm5, %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
817 //// shufps $177, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
818 shufps $27, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
819 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
820 / pfadd %mm1, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
821 / pfadd %mm5, %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
822 addps %xmm1, %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
823 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
824 / movq %mm0, 64(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
825 / movq %mm4, 72(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
826 movups %xmm0, 64(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
827 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
828 / pfsub %mm1, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
829 / pfsub %mm5, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
830 subps %xmm1, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
831 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
832 / pfmul %mm2, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
833 / pfmul %mm6, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
834 mulps %xmm4, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
835 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
836 / pswapd %mm3, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
837 / pswapd %mm7, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
838 shufps $27, %xmm2, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
839 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
840 / movq %mm3, 88(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
841 / movq %mm7, 80(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
842 movups %xmm2, 80(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
843 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
844 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
845 / movq 96(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
846 / movq 104(%ecx), %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
847 movups 96(%ecx), %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
848 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
849 / movq %mm0, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
850 / movq %mm4, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
851 movaps %xmm0, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
852 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
853 / movq 120(%ecx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
854 / movq 112(%ecx), %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
855 movups 112(%ecx), %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
856 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
857 / pswapd %mm1, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
858 / pswapd %mm5, %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
859 //// shufps $177, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
860 shufps $27, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
861 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
862 / pfadd %mm1, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
863 / pfadd %mm5, %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
864 addps %xmm1, %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
865 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
866 / movq %mm0, 96(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
867 / movq %mm4, 104(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
868 movups %xmm0, 96(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
869 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
870 / pfsubr %mm1, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
871 / pfsubr %mm5, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
872 // Reversed subtract (pfsubr) done as xmm1 = xmm1 - xmm2: the result is in xmm1, so xmm1 takes the place of xmm2 in the mulps/shufps/store that follow |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
873 subps %xmm2, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
874 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
875 / pfmul %mm2, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
876 / pfmul %mm6, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
877 mulps %xmm4, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
878 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
879 / pswapd %mm3, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
880 / pswapd %mm7, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
881 shufps $27, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
882 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
883 / movq %mm3, 120(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
884 / movq %mm7, 112(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
885 movups %xmm1, 112(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
886 */ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
887 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
888 // phase 4 fpu code |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
889 /* Phase 4*/ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
890 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
891 flds (%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
892 fadds 28(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
893 fstps (%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
894 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
895 flds (%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
896 fsubs 28(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
897 fmuls 96(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
898 fstps 28(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
899 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
900 flds 4(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
901 fadds 24(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
902 fstps 4(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
903 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
904 flds 4(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
905 fsubs 24(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
906 fmuls 100(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
907 fstps 24(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
908 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
909 flds 8(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
910 fadds 20(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
911 fstps 8(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
912 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
913 flds 8(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
914 fsubs 20(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
915 fmuls 104(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
916 fstps 20(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
917 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
918 flds 12(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
919 fadds 16(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
920 fstps 12(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
921 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
922 flds 12(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
923 fsubs 16(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
924 fmuls 108(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
925 fstps 16(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
926 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
927 flds 32(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
928 fadds 60(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
929 fstps 32(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
930 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
931 flds 60(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
932 fsubs 32(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
933 fmuls 96(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
934 fstps 60(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
935 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
936 flds 36(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
937 fadds 56(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
938 fstps 36(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
939 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
940 flds 56(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
941 fsubs 36(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
942 fmuls 100(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
943 fstps 56(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
944 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
945 flds 40(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
946 fadds 52(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
947 fstps 40(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
948 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
949 flds 52(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
950 fsubs 40(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
951 fmuls 104(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
952 fstps 52(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
953 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
954 flds 44(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
955 fadds 48(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
956 fstps 44(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
957 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
958 flds 48(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
959 fsubs 44(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
960 fmuls 108(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
961 fstps 48(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
962 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
963 flds 64(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
964 fadds 92(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
965 fstps 64(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
966 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
967 flds 64(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
968 fsubs 92(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
969 fmuls 96(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
970 fstps 92(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
971 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
972 flds 68(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
973 fadds 88(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
974 fstps 68(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
975 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
976 flds 68(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
977 fsubs 88(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
978 fmuls 100(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
979 fstps 88(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
980 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
981 flds 72(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
982 fadds 84(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
983 fstps 72(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
984 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
985 flds 72(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
986 fsubs 84(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
987 fmuls 104(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
988 fstps 84(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
989 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
990 flds 76(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
991 fadds 80(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
992 fstps 76(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
993 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
994 flds 76(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
995 fsubs 80(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
996 fmuls 108(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
997 fstps 80(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
998 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
999 flds 96(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1000 fadds 124(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1001 fstps 96(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1002 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1003 flds 124(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1004 fsubs 96(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1005 fmuls 96(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1006 fstps 124(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1007 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1008 flds 100(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1009 fadds 120(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1010 fstps 100(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1011 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1012 flds 120(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1013 fsubs 100(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1014 fmuls 100(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1015 fstps 120(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1016 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1017 flds 104(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1018 fadds 116(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1019 fstps 104(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1020 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1021 flds 116(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1022 fsubs 104(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1023 fmuls 104(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1024 fstps 116(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1025 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1026 flds 108(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1027 fadds 112(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1028 fstps 108(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1029 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1030 flds 112(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1031 fsubs 108(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1032 fmuls 108(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1033 fstps 112(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1034 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1035 flds (%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1036 fadds 12(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1037 fstps (%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1038 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1039 flds (%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1040 fsubs 12(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1041 fmuls 112(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1042 fstps 12(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1043 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1044 flds 4(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1045 fadds 8(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1046 fstps 4(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1047 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1048 flds 4(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1049 fsubs 8(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1050 fmuls 116(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1051 fstps 8(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1052 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1053 flds 16(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1054 fadds 28(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1055 fstps 16(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1056 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1057 flds 28(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1058 fsubs 16(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1059 fmuls 112(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1060 fstps 28(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1061 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1062 flds 20(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1063 fadds 24(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1064 fstps 20(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1065 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1066 flds 24(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1067 fsubs 20(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1068 fmuls 116(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1069 fstps 24(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1070 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1071 flds 32(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1072 fadds 44(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1073 fstps 32(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1074 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1075 flds 32(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1076 fsubs 44(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1077 fmuls 112(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1078 fstps 44(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1079 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1080 flds 36(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1081 fadds 40(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1082 fstps 36(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1083 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1084 flds 36(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1085 fsubs 40(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1086 fmuls 116(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1087 fstps 40(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1088 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1089 flds 48(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1090 fadds 60(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1091 fstps 48(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1092 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1093 flds 60(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1094 fsubs 48(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1095 fmuls 112(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1096 fstps 60(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1097 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1098 flds 52(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1099 fadds 56(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1100 fstps 52(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1101 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1102 flds 56(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1103 fsubs 52(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1104 fmuls 116(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1105 fstps 56(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1106 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1107 flds 64(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1108 fadds 76(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1109 fstps 64(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1110 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1111 flds 64(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1112 fsubs 76(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1113 fmuls 112(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1114 fstps 76(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1115 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1116 flds 68(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1117 fadds 72(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1118 fstps 68(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1119 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1120 flds 68(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1121 fsubs 72(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1122 fmuls 116(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1123 fstps 72(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1124 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1125 flds 80(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1126 fadds 92(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1127 fstps 80(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1128 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1129 flds 92(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1130 fsubs 80(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1131 fmuls 112(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1132 fstps 92(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1133 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1134 flds 84(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1135 fadds 88(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1136 fstps 84(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1137 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1138 flds 88(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1139 fsubs 84(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1140 fmuls 116(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1141 fstps 88(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1142 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1143 flds 96(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1144 fadds 108(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1145 fstps 96(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1146 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1147 flds 96(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1148 fsubs 108(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1149 fmuls 112(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1150 fstps 108(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1151 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1152 flds 100(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1153 fadds 104(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1154 fstps 100(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1155 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1156 flds 100(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1157 fsubs 104(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1158 fmuls 116(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1159 fstps 104(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1160 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1161 flds 112(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1162 fadds 124(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1163 fstps 112(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1164 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1165 flds 124(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1166 fsubs 112(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1167 fmuls 112(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1168 fstps 124(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1169 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1170 flds 116(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1171 fadds 120(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1172 fstps 116(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1173 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1174 flds 120(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1175 fsubs 116(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1176 fmuls 116(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1177 fstps 120(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1178 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1179 // end of phase 4 fpu |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1180 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1181 // the stuff below still needs to be finished; I use FPU code for now |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1182 /* Phase 5 (completed, crashing) */ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1183 /* |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1184 / movq 112(%ebx), %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1185 // move 8 byte data to (low)high quadword - check this! atmos |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1186 movlps 112(%ebx), %xmm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1187 // maybe I need movhlps too to get data into correct quadword |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1188 movlhps %xmm4, %xmm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1189 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1190 / movq (%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1191 / movq 16(%edx), %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1192 movups (%edx), %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1193 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1194 / movq %mm0, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1195 / movq %mm4, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1196 movaps %xmm0, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1197 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1198 // hmm? this is strange |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1199 / movq 8(%edx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1200 / movq 24(%edx), %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1201 movlps 8(%edx), %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1202 movhps 24(%edx), %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1203 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1204 / pswapd %mm1, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1205 / pswapd %mm5, %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1206 pshufd $177, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1207 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1208 / pfadd %mm1, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1209 / pfadd %mm5, %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1210 addps %xmm1, %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1211 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1212 / movq %mm0, (%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1213 / movq %mm4, 16(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1214 movlps %xmm0, (%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1215 movhps %xmm0, 16(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1216 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1217 / pfsub %mm1, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1218 / pfsubr %mm5, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1219 // I need to emulate pfsubr here |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1220 movaps %xmm1, %xmm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1221 subps %xmm2, %xmm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1222 subps %xmm1, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1223 // now move correct quadword from reverse subtraction in xmm3 to correct |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1224 // quadword in xmm2 and leave other quadword with non-reversed subtraction untouched |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1225 /// shufpd $2, %xmm3, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1226 // (or $1?) (see ia32-ref p.749) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1227 // optimize |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1228 movq %xmm2, %xmm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1229 movaps %xmm3, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1230 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1231 / pfmul %mm2, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1232 / pfmul %mm2, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1233 mulps %xmm4, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1234 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1235 / pswapd %mm3, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1236 / pswapd %mm7, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1237 shufps $177, %xmm2, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1238 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1239 / movq %mm3, 8(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1240 / movq %mm7, 24(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1241 movlps %xmm2, 8(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1242 movhps %xmm2, 24(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1243 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1244 / movq 32(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1245 / movq 48(%edx), %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1246 movlps 32(%edx), %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1247 movhps 48(%edx), %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1248 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1249 / movq %mm0, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1250 / movq %mm4, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1251 movaps %xmm0, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1252 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1253 / movq 40(%edx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1254 / movq 56(%edx), %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1255 movlps 40(%edx), %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1256 movhps 56(%edx), %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1257 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1258 / pswapd %mm1, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1259 / pswapd %mm5, %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1260 shufps $177, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1261 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1262 / pfadd %mm1, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1263 / pfadd %mm5, %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1264 addps %xmm1, %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1265 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1266 / movq %mm0, 32(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1267 / movq %mm4, 48(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1268 movlps %xmm0, 32(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1269 movhps %xmm0, 48(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1270 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1271 / pfsub %mm1, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1272 / pfsubr %mm5, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1273 movaps %xmm1, %xmm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1274 subps %xmm2, %xmm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1275 subps %xmm1, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1276 /// shufpd $2, %xmm3, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1277 // (or $1?) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1278 // optimize |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1279 movq %xmm2, %xmm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1280 movaps %xmm3, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1281 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1282 / pfmul %mm2, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1283 / pfmul %mm2, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1284 mulps %xmm4, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1285 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1286 / pswapd %mm3, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1287 / pswapd %mm7, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1288 shufps $177, %xmm2, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1289 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1290 / movq %mm3, 40(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1291 / movq %mm7, 56(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1292 movlps %xmm2, 40(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1293 movhps %xmm2, 56(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1294 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1295 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1296 / movq 64(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1297 / movq 80(%edx), %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1298 movlps 64(%edx), %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1299 movhps 80(%edx), %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1300 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1301 / movq %mm0, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1302 / movq %mm4, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1303 movaps %xmm0, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1304 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1305 / movq 72(%edx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1306 / movq 88(%edx), %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1307 movlps 72(%edx), %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1308 movhps 88(%edx), %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1309 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1310 / pswapd %mm1, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1311 / pswapd %mm5, %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1312 shufps $177, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1313 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1314 / pfadd %mm1, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1315 / pfadd %mm5, %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1316 addps %xmm1, %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1317 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1318 / movq %mm0, 64(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1319 / movq %mm4, 80(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1320 movlps %xmm0, 64(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1321 movhps %xmm0, 80(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1322 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1323 / pfsub %mm1, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1324 / pfsubr %mm5, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1325 movaps %xmm1, %xmm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1326 subps %xmm2, %xmm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1327 subps %xmm1, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1328 /// shufpd $2, %xmm3, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1329 // (or $1?) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1330 // optimize |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1331 movq %xmm2, %xmm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1332 movaps %xmm3, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1333 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1334 / pfmul %mm2, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1335 / pfmul %mm2, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1336 mulps %xmm4, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1337 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1338 / pswapd %mm3, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1339 / pswapd %mm7, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1340 shufps $177, %xmm2, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1341 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1342 / movq %mm3, 72(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1343 / movq %mm7, 88(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1344 movlps %xmm2, 72(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1345 movhps %xmm2, 88(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1346 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1347 / movq 96(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1348 / movq 112(%edx), %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1349 movups 96(%edx), %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1350 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1351 / movq %mm0, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1352 / movq %mm4, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1353 movaps %xmm0, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1354 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1355 / movq 104(%edx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1356 / movq 120(%edx), %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1357 movlps 104(%edx), %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1358 movhps 120(%edx), %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1359 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1360 / pswapd %mm1, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1361 / pswapd %mm5, %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1362 shufps $177, %xmm1, %xmm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1363 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1364 / pfadd %mm1, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1365 / pfadd %mm5, %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1366 addps %xmm1, %xmm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1367 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1368 / movq %mm0, 96(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1369 / movq %mm4, 112(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1370 movups %xmm0, 96(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1371 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1372 / pfsub %mm1, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1373 / pfsubr %mm5, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1374 movaps %xmm1, %xmm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1375 subps %xmm2, %xmm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1376 subps %xmm1, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1377 /// shufpd $2, %xmm3, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1378 // (or $1?) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1379 // optimize |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1380 movq %xmm2, %xmm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1381 movaps %xmm3, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1382 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1383 / pfmul %mm2, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1384 / pfmul %mm2, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1385 mulps %xmm4, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1386 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1387 / pswapd %mm3, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1388 / pswapd %mm7, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1389 shufps $177, %xmm2, %xmm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1390 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1391 / movq %mm3, 104(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1392 / movq %mm7, 120(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1393 movlps %xmm2, 104(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1394 movhps %xmm2, 120(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1395 */ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1396 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1397 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1398 /* Phase 6. This is the end of easy road. */ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1399 /* Code below is coded in scalar mode. Should be optimized */ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1400 // |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1401 // movd plus_1f, %mm6 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1402 // punpckldq 120(%ebx), %mm6 /* mm6 = 1.0 | 120(%ebx)*/ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1403 // movq x_plus_minus_3dnow, %mm7 /* mm7 = +1 | -1 */ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1404 /* |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1405 movq 32(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1406 movq 64(%ecx), %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1407 movq %mm0, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1408 movq %mm2, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1409 pxor %mm7, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1410 pxor %mm7, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1411 pfacc %mm1, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1412 pfacc %mm3, %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1413 pfmul %mm6, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1414 pfmul %mm6, %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1415 movq %mm0, 32(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1416 movq %mm2, 64(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1417 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1418 movd 44(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1419 movd 40(%ecx), %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1420 movd 120(%ebx), %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1421 punpckldq 76(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1422 punpckldq 72(%ecx), %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1423 punpckldq %mm3, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1424 movq %mm0, %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1425 movq %mm2, %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1426 pfsub %mm2, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1427 pfmul %mm3, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1428 movq %mm0, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1429 pfadd %mm5, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1430 pfadd %mm4, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1431 movq %mm0, %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1432 punpckldq %mm1, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1433 punpckhdq %mm1, %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1434 movq %mm0, 40(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1435 movq %mm2, 72(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1436 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1437 movd 48(%ecx), %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1438 movd 60(%ecx), %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1439 pfsub 52(%ecx), %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1440 pfsub 56(%ecx), %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1441 pfmul 120(%ebx), %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1442 pfmul 120(%ebx), %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1443 movq %mm2, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1444 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1445 pfadd 56(%ecx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1446 pfadd 60(%ecx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1447 movq %mm1, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1448 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1449 pfadd 48(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1450 pfadd 52(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1451 pfadd %mm3, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1452 punpckldq %mm2, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1453 pfadd %mm3, %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1454 punpckldq %mm2, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1455 movq %mm1, 56(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1456 movq %mm0, 48(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1457 */ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1458 /*---*/ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1459 /* |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1460 movd 92(%ecx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1461 pfsub 88(%ecx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1462 pfmul 120(%ebx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1463 movd %mm1, 92(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1464 pfadd 92(%ecx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1465 pfadd 88(%ecx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1466 movq %mm1, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1467 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1468 pfadd 80(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1469 pfadd 84(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1470 movd %mm0, 80(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1471 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1472 movd 80(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1473 pfsub 84(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1474 pfmul 120(%ebx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1475 pfadd %mm0, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1476 pfadd 92(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1477 punpckldq %mm1, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1478 movq %mm0, 84(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1479 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1480 movq 96(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1481 movq %mm0, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1482 pxor %mm7, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1483 pfacc %mm1, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1484 pfmul %mm6, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1485 movq %mm0, 96(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1486 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1487 movd 108(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1488 pfsub 104(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1489 pfmul 120(%ebx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1490 movd %mm0, 108(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1491 pfadd 104(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1492 pfadd 108(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1493 movd %mm0, 104(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1494 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1495 movd 124(%ecx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1496 pfsub 120(%ecx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1497 pfmul 120(%ebx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1498 movd %mm1, 124(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1499 pfadd 120(%ecx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1500 pfadd 124(%ecx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1501 movq %mm1, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1502 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1503 pfadd 112(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1504 pfadd 116(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1505 movd %mm0, 112(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1506 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1507 movd 112(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1508 pfsub 116(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1509 pfmul 120(%ebx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1510 pfadd %mm0,%mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1511 pfadd 124(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1512 punpckldq %mm1, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1513 movq %mm0, 116(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1514 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1515 jnz .L01 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1516 */ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1517 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1518 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1519 /* Phase 7*/ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1520 /* The code below is written in scalar mode and should be optimized. */ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1521 /* |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1522 movd (%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1523 pfadd 4(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1524 movd %mm0, 1024(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1525 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1526 movd (%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1527 pfsub 4(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1528 pfmul 120(%ebx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1529 movd %mm0, (%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1530 movd %mm0, (%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1531 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1532 movd 12(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1533 pfsub 8(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1534 pfmul 120(%ebx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1535 movd %mm0, 512(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1536 pfadd 12(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1537 pfadd 8(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1538 movd %mm0, 512(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1539 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1540 movd 16(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1541 pfsub 20(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1542 pfmul 120(%ebx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1543 movq %mm0, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1544 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1545 movd 28(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1546 pfsub 24(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1547 pfmul 120(%ebx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1548 movd %mm0, 768(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1549 movq %mm0, %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1550 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1551 pfadd 24(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1552 pfadd 28(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1553 movq %mm0, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1554 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1555 pfadd 16(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1556 pfadd 20(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1557 movd %mm0, 768(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1558 pfadd %mm3, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1559 movd %mm1, 256(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1560 pfadd %mm3, %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1561 movd %mm2, 256(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1562 */ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1563 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1564 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1565 /* Phase 8*/ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1566 /* |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1567 movq 32(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1568 movq 48(%edx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1569 pfadd 48(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1570 pfadd 40(%edx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1571 movd %mm0, 896(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1572 movd %mm1, 640(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1573 psrlq $32, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1574 psrlq $32, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1575 movd %mm0, 128(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1576 movd %mm1, 384(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1577 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1578 movd 40(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1579 pfadd 56(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1580 movd %mm0, 384(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1581 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1582 movd 56(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1583 pfadd 36(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1584 movd %mm0, 128(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1585 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1586 movd 60(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1587 movd %mm0, 896(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1588 pfadd 44(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1589 movd %mm0, 640(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1590 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1591 movq 96(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1592 movq 112(%edx), %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1593 movq 104(%edx), %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1594 pfadd 112(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1595 pfadd 104(%edx), %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1596 pfadd 120(%edx), %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1597 movq %mm0, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1598 movq %mm2, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1599 movq %mm4, %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1600 pfadd 64(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1601 pfadd 80(%edx), %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1602 pfadd 72(%edx), %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1603 movd %mm0, 960(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1604 movd %mm2, 704(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1605 movd %mm4, 448(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1606 psrlq $32, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1607 psrlq $32, %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1608 psrlq $32, %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1609 movd %mm0, 64(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1610 movd %mm2, 320(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1611 movd %mm4, 576(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1612 pfadd 80(%edx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1613 pfadd 72(%edx), %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1614 pfadd 88(%edx), %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1615 movd %mm1, 832(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1616 movd %mm3, 576(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1617 movd %mm5, 320(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1618 psrlq $32, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1619 psrlq $32, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1620 psrlq $32, %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1621 movd %mm1, 192(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1622 movd %mm3, 448(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1623 movd %mm5, 704(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1624 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1625 movd 120(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1626 pfadd 100(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1627 movq %mm0, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1628 pfadd 88(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1629 movd %mm0, 192(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1630 pfadd 68(%edx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1631 movd %mm1, 64(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1632 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1633 movd 124(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1634 movd %mm0, 960(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1635 pfadd 92(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1636 movd %mm0, 832(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1637 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1638 jmp .L_bye |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1639 .L01: |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1640 */ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1641 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1642 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1643 /* Phase 9*/ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1644 /* |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1645 movq (%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1646 movq %mm0, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1647 pxor %mm7, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1648 pfacc %mm1, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1649 pfmul %mm6, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1650 pf2id %mm0, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1651 movd %mm0, %eax |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1652 movw %ax, 512(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1653 psrlq $32, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1654 movd %mm0, %eax |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1655 movw %ax, (%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1656 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1657 movd 12(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1658 pfsub 8(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1659 pfmul 120(%ebx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1660 pf2id %mm0, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1661 movd %mm7, %eax |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1662 movw %ax, 256(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1663 pfadd 12(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1664 pfadd 8(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1665 pf2id %mm0, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1666 movd %mm0, %eax |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1667 movw %ax, 256(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1668 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1669 movd 16(%ecx), %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1670 pfsub 20(%ecx), %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1671 pfmul 120(%ebx), %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1672 movq %mm3, %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1673 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1674 movd 28(%ecx), %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1675 pfsub 24(%ecx), %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1676 pfmul 120(%ebx), %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1677 movq %mm2, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1678 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1679 pf2id %mm2, %mm7 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1680 movd %mm7, %eax |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1681 movw %ax, 384(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1682 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1683 pfadd 24(%ecx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1684 pfadd 28(%ecx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1685 movq %mm1, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1686 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1687 pfadd 16(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1688 pfadd 20(%ecx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1689 pf2id %mm0, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1690 movd %mm0, %eax |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1691 movw %ax, 384(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1692 pfadd %mm3, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1693 pf2id %mm1, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1694 movd %mm1, %eax |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1695 movw %ax, 128(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1696 pfadd %mm3, %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1697 pf2id %mm2, %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1698 movd %mm2, %eax |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1699 movw %ax, 128(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1700 */ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1701 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1702 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1703 /* Phase 10*/ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1704 /* |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1705 movq 32(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1706 movq 48(%edx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1707 pfadd 48(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1708 pfadd 40(%edx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1709 pf2id %mm0, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1710 pf2id %mm1, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1711 movd %mm0, %eax |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1712 movd %mm1, %ecx |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1713 movw %ax, 448(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1714 movw %cx, 320(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1715 psrlq $32, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1716 psrlq $32, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1717 movd %mm0, %eax |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1718 movd %mm1, %ecx |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1719 movw %ax, 64(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1720 movw %cx, 192(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1721 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1722 movd 40(%edx), %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1723 movd 56(%edx), %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1724 movd 60(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1725 movd 44(%edx), %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1726 movd 120(%edx), %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1727 punpckldq %mm4, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1728 punpckldq 124(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1729 pfadd 100(%edx), %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1730 punpckldq 36(%edx), %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1731 punpckldq 92(%edx), %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1732 movq %mm5, %mm6 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1733 pfadd %mm4, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1734 pf2id %mm0, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1735 pf2id %mm3, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1736 pfadd 88(%edx), %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1737 movd %mm1, %eax |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1738 movd %mm3, %ecx |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1739 movw %ax, 448(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1740 movw %cx, 192(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1741 pf2id %mm5, %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1742 psrlq $32, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1743 psrlq $32, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1744 movd %mm5, %ebx |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1745 movd %mm1, %eax |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1746 movd %mm3, %ecx |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1747 movw %bx, 96(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1748 movw %ax, 480(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1749 movw %cx, 64(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1750 pfadd %mm2, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1751 pf2id %mm0, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1752 movd %mm0, %eax |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1753 pfadd 68(%edx), %mm6 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1754 movw %ax, 320(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1755 psrlq $32, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1756 pf2id %mm6, %mm6 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1757 movd %mm0, %eax |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1758 movd %mm6, %ebx |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1759 movw %ax, 416(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1760 movw %bx, 32(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1761 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1762 movq 96(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1763 movq 112(%edx), %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1764 movq 104(%edx), %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1765 pfadd %mm2, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1766 pfadd %mm4, %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1767 pfadd 120(%edx), %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1768 movq %mm0, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1769 movq %mm2, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1770 movq %mm4, %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1771 pfadd 64(%edx), %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1772 pfadd 80(%edx), %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1773 pfadd 72(%edx), %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1774 pf2id %mm0, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1775 pf2id %mm2, %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1776 pf2id %mm4, %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1777 movd %mm0, %eax |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1778 movd %mm2, %ecx |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1779 movd %mm4, %ebx |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1780 movw %ax, 480(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1781 movw %cx, 352(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1782 movw %bx, 224(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1783 psrlq $32, %mm0 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1784 psrlq $32, %mm2 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1785 psrlq $32, %mm4 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1786 movd %mm0, %eax |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1787 movd %mm2, %ecx |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1788 movd %mm4, %ebx |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1789 movw %ax, 32(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1790 movw %cx, 160(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1791 movw %bx, 288(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1792 pfadd 80(%edx), %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1793 pfadd 72(%edx), %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1794 pfadd 88(%edx), %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1795 pf2id %mm1, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1796 pf2id %mm3, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1797 pf2id %mm5, %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1798 movd %mm1, %eax |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1799 movd %mm3, %ecx |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1800 movd %mm5, %ebx |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1801 movw %ax, 416(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1802 movw %cx, 288(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1803 movw %bx, 160(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1804 psrlq $32, %mm1 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1805 psrlq $32, %mm3 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1806 psrlq $32, %mm5 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1807 movd %mm1, %eax |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1808 movd %mm3, %ecx |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1809 movd %mm5, %ebx |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1810 movw %ax, 96(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1811 movw %cx, 224(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1812 movw %bx, 352(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1813 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1814 movsw |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1815 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1816 .L_bye: |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1817 addl $256,%esp |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1818 / femms |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1819 emms |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1820 popl %edi |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1821 popl %esi |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1822 popl %ebx |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1823 ret $12 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1824 */ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1825 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1826 // Here comes old-fashioned FPU code for the tough parts |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1827 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1828 /* Phase 5*/ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1829 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1830 flds 32(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1831 fadds 36(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1832 fstps 32(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1833 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1834 flds 32(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1835 fsubs 36(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1836 fmuls 120(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1837 fstps 36(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1838 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1839 flds 44(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1840 fsubs 40(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1841 fmuls 120(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1842 fsts 44(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1843 fadds 40(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1844 fadds 44(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1845 fstps 40(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1846 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1847 flds 48(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1848 fsubs 52(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1849 fmuls 120(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1850 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1851 flds 60(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1852 fsubs 56(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1853 fmuls 120(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1854 fld %st(0) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1855 fadds 56(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1856 fadds 60(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1857 fld %st(0) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1858 fadds 48(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1859 fadds 52(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1860 fstps 48(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1861 fadd %st(2) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1862 fstps 56(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1863 fsts 60(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1864 faddp %st(1) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1865 fstps 52(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1866 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1867 flds 64(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1868 fadds 68(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1869 fstps 64(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1870 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1871 flds 64(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1872 fsubs 68(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1873 fmuls 120(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1874 fstps 68(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1875 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1876 flds 76(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1877 fsubs 72(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1878 fmuls 120(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1879 fsts 76(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1880 fadds 72(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1881 fadds 76(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1882 fstps 72(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1883 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1884 flds 92(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1885 fsubs 88(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1886 fmuls 120(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1887 fsts 92(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1888 fadds 92(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1889 fadds 88(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1890 fld %st(0) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1891 fadds 80(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1892 fadds 84(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1893 fstps 80(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1894 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1895 flds 80(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1896 fsubs 84(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1897 fmuls 120(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1898 fadd %st(0), %st(1) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1899 fadds 92(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1900 fstps 84(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1901 fstps 88(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1902 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1903 flds 96(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1904 fadds 100(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1905 fstps 96(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1906 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1907 flds 96(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1908 fsubs 100(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1909 fmuls 120(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1910 fstps 100(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1911 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1912 flds 108(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1913 fsubs 104(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1914 fmuls 120(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1915 fsts 108(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1916 fadds 104(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1917 fadds 108(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1918 fstps 104(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1919 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1920 flds 124(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1921 fsubs 120(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1922 fmuls 120(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1923 fsts 124(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1924 fadds 120(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1925 fadds 124(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1926 fld %st(0) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1927 fadds 112(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1928 fadds 116(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1929 fstps 112(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1930 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1931 flds 112(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1932 fsubs 116(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1933 fmuls 120(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1934 fadd %st(0),%st(1) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1935 fadds 124(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1936 fstps 116(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1937 fstps 120(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1938 jnz .L01 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1939 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1940 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1941 /* Phase 6*/ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1942 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1943 flds (%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1944 fadds 4(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1945 fstps 1024(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1946 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1947 flds (%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1948 fsubs 4(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1949 fmuls 120(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1950 fsts (%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1951 fstps (%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1952 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1953 flds 12(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1954 fsubs 8(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1955 fmuls 120(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1956 fsts 512(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1957 fadds 12(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1958 fadds 8(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1959 fstps 512(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1960 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1961 flds 16(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1962 fsubs 20(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1963 fmuls 120(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1964 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1965 flds 28(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1966 fsubs 24(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1967 fmuls 120(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1968 fsts 768(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1969 fld %st(0) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1970 fadds 24(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1971 fadds 28(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1972 fld %st(0) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1973 fadds 16(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1974 fadds 20(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1975 fstps 768(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1976 fadd %st(2) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1977 fstps 256(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1978 faddp %st(1) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1979 fstps 256(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1980 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1981 /* Phase 7*/ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1982 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1983 flds 32(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1984 fadds 48(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1985 fstps 896(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1986 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1987 flds 48(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1988 fadds 40(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1989 fstps 640(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1990 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1991 flds 40(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1992 fadds 56(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1993 fstps 384(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1994 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1995 flds 56(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1996 fadds 36(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1997 fstps 128(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1998 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
1999 flds 36(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2000 fadds 52(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2001 fstps 128(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2002 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2003 flds 52(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2004 fadds 44(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2005 fstps 384(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2006 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2007 flds 60(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2008 fsts 896(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2009 fadds 44(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2010 fstps 640(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2011 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2012 flds 96(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2013 fadds 112(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2014 fld %st(0) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2015 fadds 64(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2016 fstps 960(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2017 fadds 80(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2018 fstps 832(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2019 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2020 flds 112(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2021 fadds 104(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2022 fld %st(0) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2023 fadds 80(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2024 fstps 704(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2025 fadds 72(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2026 fstps 576(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2027 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2028 flds 104(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2029 fadds 120(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2030 fld %st(0) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2031 fadds 72(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2032 fstps 448(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2033 fadds 88(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2034 fstps 320(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2035 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2036 flds 120(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2037 fadds 100(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2038 fld %st(0) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2039 fadds 88(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2040 fstps 192(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2041 fadds 68(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2042 fstps 64(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2043 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2044 flds 100(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2045 fadds 116(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2046 fld %st(0) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2047 fadds 68(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2048 fstps 64(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2049 fadds 84(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2050 fstps 192(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2051 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2052 flds 116(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2053 fadds 108(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2054 fld %st(0) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2055 fadds 84(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2056 fstps 320(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2057 fadds 76(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2058 fstps 448(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2059 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2060 flds 108(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2061 fadds 124(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2062 fld %st(0) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2063 fadds 76(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2064 fstps 576(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2065 fadds 92(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2066 fstps 704(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2067 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2068 flds 124(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2069 fsts 960(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2070 fadds 92(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2071 fstps 832(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2072 addl $256,%esp |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2073 popl %edi |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2074 popl %esi |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2075 popl %ebx |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2076 ret |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2077 .L01: |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2078 /* Phase 8*/ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2079 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2080 flds (%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2081 fadds 4(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2082 fistp 512(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2083 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2084 flds (%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2085 fsubs 4(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2086 fmuls 120(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2087 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2088 fistp (%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2089 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2090 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2091 flds 12(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2092 fsubs 8(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2093 fmuls 120(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2094 fist 256(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2095 fadds 12(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2096 fadds 8(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2097 fistp 256(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2098 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2099 flds 16(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2100 fsubs 20(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2101 fmuls 120(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2102 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2103 flds 28(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2104 fsubs 24(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2105 fmuls 120(%ebx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2106 fist 384(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2107 fld %st(0) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2108 fadds 24(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2109 fadds 28(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2110 fld %st(0) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2111 fadds 16(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2112 fadds 20(%ecx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2113 fistp 384(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2114 fadd %st(2) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2115 fistp 128(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2116 faddp %st(1) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2117 fistp 128(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2118 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2119 /* Phase 9*/ |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2120 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2121 flds 32(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2122 fadds 48(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2123 fistp 448(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2124 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2125 flds 48(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2126 fadds 40(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2127 fistp 320(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2128 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2129 flds 40(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2130 fadds 56(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2131 fistp 192(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2132 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2133 flds 56(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2134 fadds 36(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2135 fistp 64(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2136 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2137 flds 36(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2138 fadds 52(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2139 fistp 64(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2140 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2141 flds 52(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2142 fadds 44(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2143 fistp 192(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2144 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2145 flds 60(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2146 fist 448(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2147 fadds 44(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2148 fistp 320(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2149 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2150 flds 96(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2151 fadds 112(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2152 fld %st(0) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2153 fadds 64(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2154 fistp 480(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2155 fadds 80(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2156 fistp 416(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2157 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2158 flds 112(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2159 fadds 104(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2160 fld %st(0) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2161 fadds 80(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2162 fistp 352(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2163 fadds 72(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2164 fistp 288(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2165 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2166 flds 104(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2167 fadds 120(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2168 fld %st(0) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2169 fadds 72(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2170 fistp 224(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2171 fadds 88(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2172 fistp 160(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2173 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2174 flds 120(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2175 fadds 100(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2176 fld %st(0) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2177 fadds 88(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2178 fistp 96(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2179 fadds 68(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2180 fistp 32(%esi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2181 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2182 flds 100(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2183 fadds 116(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2184 fld %st(0) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2185 fadds 68(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2186 fistp 32(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2187 fadds 84(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2188 fistp 96(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2189 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2190 flds 116(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2191 fadds 108(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2192 fld %st(0) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2193 fadds 84(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2194 fistp 160(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2195 fadds 76(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2196 fistp 224(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2197 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2198 flds 108(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2199 fadds 124(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2200 fld %st(0) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2201 fadds 76(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2202 fistp 288(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2203 fadds 92(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2204 fistp 352(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2205 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2206 flds 124(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2207 fist 480(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2208 fadds 92(%edx) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2209 fistp 416(%edi) |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2210 movsw |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2211 addl $256,%esp |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2212 popl %edi |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2213 popl %esi |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2214 popl %ebx |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2215 ret $12 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2216 |
d9e3f91d6da9
First development version of dct64, mixed with 3dnow/k7 and fpu code.
atmos4
parents:
diff
changeset
|
2217 // end of FPU stuff |