about | summary | refs | log | tree | commit | diff | homepage
path: root/mp3lib
diff options
context:
space:
mode:
author: diego <diego@b3059339-0415-0410-9bf9-f77b7e298cf2> 2010-04-12 10:56:17 +0000
committer: diego <diego@b3059339-0415-0410-9bf9-f77b7e298cf2> 2010-04-12 10:56:17 +0000
commit: 7573c29480850d715e2f06cae70f252573098123 (patch)
tree: a5a2f498ad3a19806957e1d7e01f913c1650b33d /mp3lib
parent: 86ea8d4f4abf23672516fa0ca3378aa19c44bf2c (diff)
the great MPlayer tab removal: part I
git-svn-id: svn://svn.mplayerhq.hu/mplayer/trunk@31032 b3059339-0415-0410-9bf9-f77b7e298cf2
Diffstat (limited to 'mp3lib')
-rw-r--r-- mp3lib/dct36.c 28
-rw-r--r-- mp3lib/dct36_3dnow.c 902
-rw-r--r-- mp3lib/dct64_3dnow.c 1666
-rw-r--r-- mp3lib/dct64_k7.c 1404
-rw-r--r-- mp3lib/dct64_mmx.c 1892
-rw-r--r-- mp3lib/decod386.c 10
-rw-r--r-- mp3lib/decode_i586.c 6
-rw-r--r-- mp3lib/decode_mmx.c 382
-rw-r--r-- mp3lib/equalizer.c 119
-rw-r--r-- mp3lib/l2tables.h 258
-rw-r--r-- mp3lib/layer1.c 2
-rw-r--r-- mp3lib/layer2.c 6
-rw-r--r-- mp3lib/layer3.c 28
-rw-r--r-- mp3lib/mpg123.h 4
-rw-r--r-- mp3lib/sr1.c 36
15 files changed, 3371 insertions, 3372 deletions
diff --git a/mp3lib/dct36.c b/mp3lib/dct36.c
index b884bb949d..22ec273277 100644
--- a/mp3lib/dct36.c
+++ b/mp3lib/dct36.c
@@ -189,21 +189,21 @@ static void dct36(real *inbuf,real *o1,real *o2,real *wintab,real *tsbuf)
ts[SBLIMIT*(8-(v))] = out1[8-(v)] + sum0 * w[8-(v)]; \
ts[SBLIMIT*(9+(v))] = out1[9+(v)] + sum0 * w[9+(v)];
#define MACRO1(v) { \
- real sum0,sum1; \
+ real sum0, sum1; \
sum0 = tmp1a + tmp2a; \
- sum1 = (tmp1b + tmp2b) * tfcos36[(v)]; \
- MACRO0(v); }
+ sum1 = (tmp1b + tmp2b) * tfcos36[(v)]; \
+ MACRO0(v); }
#define MACRO2(v) { \
- real sum0,sum1; \
+ real sum0, sum1; \
sum0 = tmp2a - tmp1a; \
sum1 = (tmp2b - tmp1b) * tfcos36[(v)]; \
- MACRO0(v); }
+ MACRO0(v); }
register const real *c = COS9;
register real *out2 = o2;
- register real *w = wintab;
- register real *out1 = o1;
- register real *ts = tsbuf;
+ register real *w = wintab;
+ register real *out1 = o1;
+ register real *ts = tsbuf;
real ta33,ta66,tb33,tb66;
@@ -256,12 +256,12 @@ static void dct36(real *inbuf,real *o1,real *o2,real *wintab,real *tsbuf)
MACRO2(5);
}
- {
- real sum0,sum1;
- sum0 = in[2*0+0] - in[2*2+0] + in[2*4+0] - in[2*6+0] + in[2*8+0];
- sum1 = (in[2*0+1] - in[2*2+1] + in[2*4+1] - in[2*6+1] + in[2*8+1] ) * tfcos36[4];
- MACRO0(4);
- }
+ {
+ real sum0,sum1;
+ sum0 = in[2*0+0] - in[2*2+0] + in[2*4+0] - in[2*6+0] + in[2*8+0];
+ sum1 = (in[2*0+1] - in[2*2+1] + in[2*4+1] - in[2*6+1] + in[2*8+1] ) * tfcos36[4];
+ MACRO0(4);
+ }
}
#endif
diff --git a/mp3lib/dct36_3dnow.c b/mp3lib/dct36_3dnow.c
index 8263639149..68cc33014b 100644
--- a/mp3lib/dct36_3dnow.c
+++ b/mp3lib/dct36_3dnow.c
@@ -40,462 +40,462 @@ void dct36_3dnow(real *inbuf, real *o1,
#endif
{
__asm__ volatile(
- "movq (%%eax),%%mm0\n\t"
- "movq 4(%%eax),%%mm1\n\t"
- "pfadd %%mm1,%%mm0\n\t"
- "movq %%mm0,4(%%eax)\n\t"
- "psrlq $32,%%mm1\n\t"
- "movq 12(%%eax),%%mm2\n\t"
- "punpckldq %%mm2,%%mm1\n\t"
- "pfadd %%mm2,%%mm1\n\t"
- "movq %%mm1,12(%%eax)\n\t"
- "psrlq $32,%%mm2\n\t"
- "movq 20(%%eax),%%mm3\n\t"
- "punpckldq %%mm3,%%mm2\n\t"
- "pfadd %%mm3,%%mm2\n\t"
- "movq %%mm2,20(%%eax)\n\t"
- "psrlq $32,%%mm3\n\t"
- "movq 28(%%eax),%%mm4\n\t"
- "punpckldq %%mm4,%%mm3\n\t"
- "pfadd %%mm4,%%mm3\n\t"
- "movq %%mm3,28(%%eax)\n\t"
- "psrlq $32,%%mm4\n\t"
- "movq 36(%%eax),%%mm5\n\t"
- "punpckldq %%mm5,%%mm4\n\t"
- "pfadd %%mm5,%%mm4\n\t"
- "movq %%mm4,36(%%eax)\n\t"
- "psrlq $32,%%mm5\n\t"
- "movq 44(%%eax),%%mm6\n\t"
- "punpckldq %%mm6,%%mm5\n\t"
- "pfadd %%mm6,%%mm5\n\t"
- "movq %%mm5,44(%%eax)\n\t"
- "psrlq $32,%%mm6\n\t"
- "movq 52(%%eax),%%mm7\n\t"
- "punpckldq %%mm7,%%mm6\n\t"
- "pfadd %%mm7,%%mm6\n\t"
- "movq %%mm6,52(%%eax)\n\t"
- "psrlq $32,%%mm7\n\t"
- "movq 60(%%eax),%%mm0\n\t"
- "punpckldq %%mm0,%%mm7\n\t"
- "pfadd %%mm0,%%mm7\n\t"
- "movq %%mm7,60(%%eax)\n\t"
- "psrlq $32,%%mm0\n\t"
- "movd 68(%%eax),%%mm1\n\t"
- "pfadd %%mm1,%%mm0\n\t"
- "movd %%mm0,68(%%eax)\n\t"
- "movd 4(%%eax),%%mm0\n\t"
- "movd 12(%%eax),%%mm1\n\t"
- "punpckldq %%mm1,%%mm0\n\t"
- "punpckldq 20(%%eax),%%mm1\n\t"
- "pfadd %%mm1,%%mm0\n\t"
- "movd %%mm0,12(%%eax)\n\t"
- "psrlq $32,%%mm0\n\t"
- "movd %%mm0,20(%%eax)\n\t"
- "psrlq $32,%%mm1\n\t"
- "movd 28(%%eax),%%mm2\n\t"
- "punpckldq %%mm2,%%mm1\n\t"
- "punpckldq 36(%%eax),%%mm2\n\t"
- "pfadd %%mm2,%%mm1\n\t"
- "movd %%mm1,28(%%eax)\n\t"
- "psrlq $32,%%mm1\n\t"
- "movd %%mm1,36(%%eax)\n\t"
- "psrlq $32,%%mm2\n\t"
- "movd 44(%%eax),%%mm3\n\t"
- "punpckldq %%mm3,%%mm2\n\t"
- "punpckldq 52(%%eax),%%mm3\n\t"
- "pfadd %%mm3,%%mm2\n\t"
- "movd %%mm2,44(%%eax)\n\t"
- "psrlq $32,%%mm2\n\t"
- "movd %%mm2,52(%%eax)\n\t"
- "psrlq $32,%%mm3\n\t"
- "movd 60(%%eax),%%mm4\n\t"
- "punpckldq %%mm4,%%mm3\n\t"
- "punpckldq 68(%%eax),%%mm4\n\t"
- "pfadd %%mm4,%%mm3\n\t"
- "movd %%mm3,60(%%eax)\n\t"
- "psrlq $32,%%mm3\n\t"
- "movd %%mm3,68(%%eax)\n\t"
+ "movq (%%eax),%%mm0\n\t"
+ "movq 4(%%eax),%%mm1\n\t"
+ "pfadd %%mm1,%%mm0\n\t"
+ "movq %%mm0,4(%%eax)\n\t"
+ "psrlq $32,%%mm1\n\t"
+ "movq 12(%%eax),%%mm2\n\t"
+ "punpckldq %%mm2,%%mm1\n\t"
+ "pfadd %%mm2,%%mm1\n\t"
+ "movq %%mm1,12(%%eax)\n\t"
+ "psrlq $32,%%mm2\n\t"
+ "movq 20(%%eax),%%mm3\n\t"
+ "punpckldq %%mm3,%%mm2\n\t"
+ "pfadd %%mm3,%%mm2\n\t"
+ "movq %%mm2,20(%%eax)\n\t"
+ "psrlq $32,%%mm3\n\t"
+ "movq 28(%%eax),%%mm4\n\t"
+ "punpckldq %%mm4,%%mm3\n\t"
+ "pfadd %%mm4,%%mm3\n\t"
+ "movq %%mm3,28(%%eax)\n\t"
+ "psrlq $32,%%mm4\n\t"
+ "movq 36(%%eax),%%mm5\n\t"
+ "punpckldq %%mm5,%%mm4\n\t"
+ "pfadd %%mm5,%%mm4\n\t"
+ "movq %%mm4,36(%%eax)\n\t"
+ "psrlq $32,%%mm5\n\t"
+ "movq 44(%%eax),%%mm6\n\t"
+ "punpckldq %%mm6,%%mm5\n\t"
+ "pfadd %%mm6,%%mm5\n\t"
+ "movq %%mm5,44(%%eax)\n\t"
+ "psrlq $32,%%mm6\n\t"
+ "movq 52(%%eax),%%mm7\n\t"
+ "punpckldq %%mm7,%%mm6\n\t"
+ "pfadd %%mm7,%%mm6\n\t"
+ "movq %%mm6,52(%%eax)\n\t"
+ "psrlq $32,%%mm7\n\t"
+ "movq 60(%%eax),%%mm0\n\t"
+ "punpckldq %%mm0,%%mm7\n\t"
+ "pfadd %%mm0,%%mm7\n\t"
+ "movq %%mm7,60(%%eax)\n\t"
+ "psrlq $32,%%mm0\n\t"
+ "movd 68(%%eax),%%mm1\n\t"
+ "pfadd %%mm1,%%mm0\n\t"
+ "movd %%mm0,68(%%eax)\n\t"
+ "movd 4(%%eax),%%mm0\n\t"
+ "movd 12(%%eax),%%mm1\n\t"
+ "punpckldq %%mm1,%%mm0\n\t"
+ "punpckldq 20(%%eax),%%mm1\n\t"
+ "pfadd %%mm1,%%mm0\n\t"
+ "movd %%mm0,12(%%eax)\n\t"
+ "psrlq $32,%%mm0\n\t"
+ "movd %%mm0,20(%%eax)\n\t"
+ "psrlq $32,%%mm1\n\t"
+ "movd 28(%%eax),%%mm2\n\t"
+ "punpckldq %%mm2,%%mm1\n\t"
+ "punpckldq 36(%%eax),%%mm2\n\t"
+ "pfadd %%mm2,%%mm1\n\t"
+ "movd %%mm1,28(%%eax)\n\t"
+ "psrlq $32,%%mm1\n\t"
+ "movd %%mm1,36(%%eax)\n\t"
+ "psrlq $32,%%mm2\n\t"
+ "movd 44(%%eax),%%mm3\n\t"
+ "punpckldq %%mm3,%%mm2\n\t"
+ "punpckldq 52(%%eax),%%mm3\n\t"
+ "pfadd %%mm3,%%mm2\n\t"
+ "movd %%mm2,44(%%eax)\n\t"
+ "psrlq $32,%%mm2\n\t"
+ "movd %%mm2,52(%%eax)\n\t"
+ "psrlq $32,%%mm3\n\t"
+ "movd 60(%%eax),%%mm4\n\t"
+ "punpckldq %%mm4,%%mm3\n\t"
+ "punpckldq 68(%%eax),%%mm4\n\t"
+ "pfadd %%mm4,%%mm3\n\t"
+ "movd %%mm3,60(%%eax)\n\t"
+ "psrlq $32,%%mm3\n\t"
+ "movd %%mm3,68(%%eax)\n\t"
- "movq 24(%%eax),%%mm0\n\t"
- "movq 48(%%eax),%%mm1\n\t"
- "movd "MANGLE(COS9)"+12,%%mm2\n\t"
- "punpckldq %%mm2,%%mm2\n\t"
- "movd "MANGLE(COS9)"+24,%%mm3\n\t"
- "punpckldq %%mm3,%%mm3\n\t"
- "pfmul %%mm2,%%mm0\n\t"
- "pfmul %%mm3,%%mm1\n\t"
- "pushl %%eax\n\t"
- "movl $1,%%eax\n\t"
- "movd %%eax,%%mm7\n\t"
- "pi2fd %%mm7,%%mm7\n\t"
- "popl %%eax\n\t"
- "movq 8(%%eax),%%mm2\n\t"
- "movd "MANGLE(COS9)"+4,%%mm3\n\t"
- "punpckldq %%mm3,%%mm3\n\t"
- "pfmul %%mm3,%%mm2\n\t"
- "pfadd %%mm0,%%mm2\n\t"
- "movq 40(%%eax),%%mm3\n\t"
- "movd "MANGLE(COS9)"+20,%%mm4\n\t"
- "punpckldq %%mm4,%%mm4\n\t"
- "pfmul %%mm4,%%mm3\n\t"
- "pfadd %%mm3,%%mm2\n\t"
- "movq 56(%%eax),%%mm3\n\t"
- "movd "MANGLE(COS9)"+28,%%mm4\n\t"
- "punpckldq %%mm4,%%mm4\n\t"
- "pfmul %%mm4,%%mm3\n\t"
- "pfadd %%mm3,%%mm2\n\t"
- "movq (%%eax),%%mm3\n\t"
- "movq 16(%%eax),%%mm4\n\t"
- "movd "MANGLE(COS9)"+8,%%mm5\n\t"
- "punpckldq %%mm5,%%mm5\n\t"
- "pfmul %%mm5,%%mm4\n\t"
- "pfadd %%mm4,%%mm3\n\t"
- "movq 32(%%eax),%%mm4\n\t"
- "movd "MANGLE(COS9)"+16,%%mm5\n\t"
- "punpckldq %%mm5,%%mm5\n\t"
- "pfmul %%mm5,%%mm4\n\t"
- "pfadd %%mm4,%%mm3\n\t"
- "pfadd %%mm1,%%mm3\n\t"
- "movq 64(%%eax),%%mm4\n\t"
- "movd "MANGLE(COS9)"+32,%%mm5\n\t"
- "punpckldq %%mm5,%%mm5\n\t"
- "pfmul %%mm5,%%mm4\n\t"
- "pfadd %%mm4,%%mm3\n\t"
- "movq %%mm2,%%mm4\n\t"
- "pfadd %%mm3,%%mm4\n\t"
- "movq %%mm7,%%mm5\n\t"
- "punpckldq "MANGLE(tfcos36)"+0,%%mm5\n\t"
- "pfmul %%mm5,%%mm4\n\t"
- "movq %%mm4,%%mm5\n\t"
- "pfacc %%mm5,%%mm5\n\t"
- "movd 108(%%edx),%%mm6\n\t"
- "punpckldq 104(%%edx),%%mm6\n\t"
- "pfmul %%mm6,%%mm5\n\t"
+ "movq 24(%%eax),%%mm0\n\t"
+ "movq 48(%%eax),%%mm1\n\t"
+ "movd "MANGLE(COS9)"+12,%%mm2\n\t"
+ "punpckldq %%mm2,%%mm2\n\t"
+ "movd "MANGLE(COS9)"+24,%%mm3\n\t"
+ "punpckldq %%mm3,%%mm3\n\t"
+ "pfmul %%mm2,%%mm0\n\t"
+ "pfmul %%mm3,%%mm1\n\t"
+ "pushl %%eax\n\t"
+ "movl $1,%%eax\n\t"
+ "movd %%eax,%%mm7\n\t"
+ "pi2fd %%mm7,%%mm7\n\t"
+ "popl %%eax\n\t"
+ "movq 8(%%eax),%%mm2\n\t"
+ "movd "MANGLE(COS9)"+4,%%mm3\n\t"
+ "punpckldq %%mm3,%%mm3\n\t"
+ "pfmul %%mm3,%%mm2\n\t"
+ "pfadd %%mm0,%%mm2\n\t"
+ "movq 40(%%eax),%%mm3\n\t"
+ "movd "MANGLE(COS9)"+20,%%mm4\n\t"
+ "punpckldq %%mm4,%%mm4\n\t"
+ "pfmul %%mm4,%%mm3\n\t"
+ "pfadd %%mm3,%%mm2\n\t"
+ "movq 56(%%eax),%%mm3\n\t"
+ "movd "MANGLE(COS9)"+28,%%mm4\n\t"
+ "punpckldq %%mm4,%%mm4\n\t"
+ "pfmul %%mm4,%%mm3\n\t"
+ "pfadd %%mm3,%%mm2\n\t"
+ "movq (%%eax),%%mm3\n\t"
+ "movq 16(%%eax),%%mm4\n\t"
+ "movd "MANGLE(COS9)"+8,%%mm5\n\t"
+ "punpckldq %%mm5,%%mm5\n\t"
+ "pfmul %%mm5,%%mm4\n\t"
+ "pfadd %%mm4,%%mm3\n\t"
+ "movq 32(%%eax),%%mm4\n\t"
+ "movd "MANGLE(COS9)"+16,%%mm5\n\t"
+ "punpckldq %%mm5,%%mm5\n\t"
+ "pfmul %%mm5,%%mm4\n\t"
+ "pfadd %%mm4,%%mm3\n\t"
+ "pfadd %%mm1,%%mm3\n\t"
+ "movq 64(%%eax),%%mm4\n\t"
+ "movd "MANGLE(COS9)"+32,%%mm5\n\t"
+ "punpckldq %%mm5,%%mm5\n\t"
+ "pfmul %%mm5,%%mm4\n\t"
+ "pfadd %%mm4,%%mm3\n\t"
+ "movq %%mm2,%%mm4\n\t"
+ "pfadd %%mm3,%%mm4\n\t"
+ "movq %%mm7,%%mm5\n\t"
+ "punpckldq "MANGLE(tfcos36)"+0,%%mm5\n\t"
+ "pfmul %%mm5,%%mm4\n\t"
+ "movq %%mm4,%%mm5\n\t"
+ "pfacc %%mm5,%%mm5\n\t"
+ "movd 108(%%edx),%%mm6\n\t"
+ "punpckldq 104(%%edx),%%mm6\n\t"
+ "pfmul %%mm6,%%mm5\n\t"
#ifdef DCT36_OPTIMIZE_FOR_K7
- "pswapd %%mm5,%%mm5\n\t"
- "movq %%mm5,32(%%ecx)\n\t"
+ "pswapd %%mm5,%%mm5\n\t"
+ "movq %%mm5,32(%%ecx)\n\t"
#else
- "movd %%mm5,36(%%ecx)\n\t"
- "psrlq $32,%%mm5\n\t"
- "movd %%mm5,32(%%ecx)\n\t"
+ "movd %%mm5,36(%%ecx)\n\t"
+ "psrlq $32,%%mm5\n\t"
+ "movd %%mm5,32(%%ecx)\n\t"
#endif
- "movq %%mm4,%%mm6\n\t"
- "punpckldq %%mm6,%%mm5\n\t"
- "pfsub %%mm6,%%mm5\n\t"
- "punpckhdq %%mm5,%%mm5\n\t"
- "movd 32(%%edx),%%mm6\n\t"
- "punpckldq 36(%%edx),%%mm6\n\t"
- "pfmul %%mm6,%%mm5\n\t"
- "movd 32(%%esi),%%mm6\n\t"
- "punpckldq 36(%%esi),%%mm6\n\t"
- "pfadd %%mm6,%%mm5\n\t"
- "movd %%mm5,1024(%%ebx)\n\t"
- "psrlq $32,%%mm5\n\t"
- "movd %%mm5,1152(%%ebx)\n\t"
- "movq %%mm3,%%mm4\n\t"
- "pfsub %%mm2,%%mm4\n\t"
- "movq %%mm7,%%mm5\n\t"
- "punpckldq "MANGLE(tfcos36)"+32,%%mm5\n\t"
- "pfmul %%mm5,%%mm4\n\t"
- "movq %%mm4,%%mm5\n\t"
- "pfacc %%mm5,%%mm5\n\t"
- "movd 140(%%edx),%%mm6\n\t"
- "punpckldq 72(%%edx),%%mm6\n\t"
- "pfmul %%mm6,%%mm5\n\t"
- "movd %%mm5,68(%%ecx)\n\t"
- "psrlq $32,%%mm5\n\t"
- "movd %%mm5,0(%%ecx)\n\t"
- "movq %%mm4,%%mm6\n\t"
- "punpckldq %%mm6,%%mm5\n\t"
- "pfsub %%mm6,%%mm5\n\t"
- "punpckhdq %%mm5,%%mm5\n\t"
- "movd 0(%%edx),%%mm6\n\t"
- "punpckldq 68(%%edx),%%mm6\n\t"
- "pfmul %%mm6,%%mm5\n\t"
- "movd 0(%%esi),%%mm6\n\t"
- "punpckldq 68(%%esi),%%mm6\n\t"
- "pfadd %%mm6,%%mm5\n\t"
- "movd %%mm5,0(%%ebx)\n\t"
- "psrlq $32,%%mm5\n\t"
- "movd %%mm5,2176(%%ebx)\n\t"
- "movq 8(%%eax),%%mm2\n\t"
- "movq 40(%%eax),%%mm3\n\t"
- "pfsub %%mm3,%%mm2\n\t"
- "movq 56(%%eax),%%mm3\n\t"
- "pfsub %%mm3,%%mm2\n\t"
- "movd "MANGLE(COS9)"+12,%%mm3\n\t"
- "punpckldq %%mm3,%%mm3\n\t"
- "pfmul %%mm3,%%mm2\n\t"
- "movq 16(%%eax),%%mm3\n\t"
- "movq 32(%%eax),%%mm4\n\t"
- "pfsub %%mm4,%%mm3\n\t"
- "movq 64(%%eax),%%mm4\n\t"
- "pfsub %%mm4,%%mm3\n\t"
- "movd "MANGLE(COS9)"+24,%%mm4\n\t"
- "punpckldq %%mm4,%%mm4\n\t"
- "pfmul %%mm4,%%mm3\n\t"
- "movq 48(%%eax),%%mm4\n\t"
- "pfsub %%mm4,%%mm3\n\t"
- "movq (%%eax),%%mm4\n\t"
- "pfadd %%mm4,%%mm3\n\t"
- "movq %%mm2,%%mm4\n\t"
- "pfadd %%mm3,%%mm4\n\t"
- "movq %%mm7,%%mm5\n\t"
- "punpckldq "MANGLE(tfcos36)"+4,%%mm5\n\t"
- "pfmul %%mm5,%%mm4\n\t"
- "movq %%mm4,%%mm5\n\t"
- "pfacc %%mm5,%%mm5\n\t"
- "movd 112(%%edx),%%mm6\n\t"
- "punpckldq 100(%%edx),%%mm6\n\t"
- "pfmul %%mm6,%%mm5\n\t"
- "movd %%mm5,40(%%ecx)\n\t"
- "psrlq $32,%%mm5\n\t"
- "movd %%mm5,28(%%ecx)\n\t"
- "movq %%mm4,%%mm6\n\t"
- "punpckldq %%mm6,%%mm5\n\t"
- "pfsub %%mm6,%%mm5\n\t"
- "punpckhdq %%mm5,%%mm5\n\t"
- "movd 28(%%edx),%%mm6\n\t"
- "punpckldq 40(%%edx),%%mm6\n\t"
- "pfmul %%mm6,%%mm5\n\t"
- "movd 28(%%esi),%%mm6\n\t"
- "punpckldq 40(%%esi),%%mm6\n\t"
- "pfadd %%mm6,%%mm5\n\t"
- "movd %%mm5,896(%%ebx)\n\t"
- "psrlq $32,%%mm5\n\t"
- "movd %%mm5,1280(%%ebx)\n\t"
- "movq %%mm3,%%mm4\n\t"
- "pfsub %%mm2,%%mm4\n\t"
- "movq %%mm7,%%mm5\n\t"
- "punpckldq "MANGLE(tfcos36)"+28,%%mm5\n\t"
- "pfmul %%mm5,%%mm4\n\t"
- "movq %%mm4,%%mm5\n\t"
- "pfacc %%mm5,%%mm5\n\t"
- "movd 136(%%edx),%%mm6\n\t"
- "punpckldq 76(%%edx),%%mm6\n\t"
- "pfmul %%mm6,%%mm5\n\t"
- "movd %%mm5,64(%%ecx)\n\t"
- "psrlq $32,%%mm5\n\t"
- "movd %%mm5,4(%%ecx)\n\t"
- "movq %%mm4,%%mm6\n\t"
- "punpckldq %%mm6,%%mm5\n\t"
- "pfsub %%mm6,%%mm5\n\t"
- "punpckhdq %%mm5,%%mm5\n\t"
- "movd 4(%%edx),%%mm6\n\t"
- "punpckldq 64(%%edx),%%mm6\n\t"
- "pfmul %%mm6,%%mm5\n\t"
- "movd 4(%%esi),%%mm6\n\t"
- "punpckldq 64(%%esi),%%mm6\n\t"
- "pfadd %%mm6,%%mm5\n\t"
- "movd %%mm5,128(%%ebx)\n\t"
- "psrlq $32,%%mm5\n\t"
- "movd %%mm5,2048(%%ebx)\n\t"
+ "movq %%mm4,%%mm6\n\t"
+ "punpckldq %%mm6,%%mm5\n\t"
+ "pfsub %%mm6,%%mm5\n\t"
+ "punpckhdq %%mm5,%%mm5\n\t"
+ "movd 32(%%edx),%%mm6\n\t"
+ "punpckldq 36(%%edx),%%mm6\n\t"
+ "pfmul %%mm6,%%mm5\n\t"
+ "movd 32(%%esi),%%mm6\n\t"
+ "punpckldq 36(%%esi),%%mm6\n\t"
+ "pfadd %%mm6,%%mm5\n\t"
+ "movd %%mm5,1024(%%ebx)\n\t"
+ "psrlq $32,%%mm5\n\t"
+ "movd %%mm5,1152(%%ebx)\n\t"
+ "movq %%mm3,%%mm4\n\t"
+ "pfsub %%mm2,%%mm4\n\t"
+ "movq %%mm7,%%mm5\n\t"
+ "punpckldq "MANGLE(tfcos36)"+32,%%mm5\n\t"
+ "pfmul %%mm5,%%mm4\n\t"
+ "movq %%mm4,%%mm5\n\t"
+ "pfacc %%mm5,%%mm5\n\t"
+ "movd 140(%%edx),%%mm6\n\t"
+ "punpckldq 72(%%edx),%%mm6\n\t"
+ "pfmul %%mm6,%%mm5\n\t"
+ "movd %%mm5,68(%%ecx)\n\t"
+ "psrlq $32,%%mm5\n\t"
+ "movd %%mm5,0(%%ecx)\n\t"
+ "movq %%mm4,%%mm6\n\t"
+ "punpckldq %%mm6,%%mm5\n\t"
+ "pfsub %%mm6,%%mm5\n\t"
+ "punpckhdq %%mm5,%%mm5\n\t"
+ "movd 0(%%edx),%%mm6\n\t"
+ "punpckldq 68(%%edx),%%mm6\n\t"
+ "pfmul %%mm6,%%mm5\n\t"
+ "movd 0(%%esi),%%mm6\n\t"
+ "punpckldq 68(%%esi),%%mm6\n\t"
+ "pfadd %%mm6,%%mm5\n\t"
+ "movd %%mm5,0(%%ebx)\n\t"
+ "psrlq $32,%%mm5\n\t"
+ "movd %%mm5,2176(%%ebx)\n\t"
+ "movq 8(%%eax),%%mm2\n\t"
+ "movq 40(%%eax),%%mm3\n\t"
+ "pfsub %%mm3,%%mm2\n\t"
+ "movq 56(%%eax),%%mm3\n\t"
+ "pfsub %%mm3,%%mm2\n\t"
+ "movd "MANGLE(COS9)"+12,%%mm3\n\t"
+ "punpckldq %%mm3,%%mm3\n\t"
+ "pfmul %%mm3,%%mm2\n\t"
+ "movq 16(%%eax),%%mm3\n\t"
+ "movq 32(%%eax),%%mm4\n\t"
+ "pfsub %%mm4,%%mm3\n\t"
+ "movq 64(%%eax),%%mm4\n\t"
+ "pfsub %%mm4,%%mm3\n\t"
+ "movd "MANGLE(COS9)"+24,%%mm4\n\t"
+ "punpckldq %%mm4,%%mm4\n\t"
+ "pfmul %%mm4,%%mm3\n\t"
+ "movq 48(%%eax),%%mm4\n\t"
+ "pfsub %%mm4,%%mm3\n\t"
+ "movq (%%eax),%%mm4\n\t"
+ "pfadd %%mm4,%%mm3\n\t"
+ "movq %%mm2,%%mm4\n\t"
+ "pfadd %%mm3,%%mm4\n\t"
+ "movq %%mm7,%%mm5\n\t"
+ "punpckldq "MANGLE(tfcos36)"+4,%%mm5\n\t"
+ "pfmul %%mm5,%%mm4\n\t"
+ "movq %%mm4,%%mm5\n\t"
+ "pfacc %%mm5,%%mm5\n\t"
+ "movd 112(%%edx),%%mm6\n\t"
+ "punpckldq 100(%%edx),%%mm6\n\t"
+ "pfmul %%mm6,%%mm5\n\t"
+ "movd %%mm5,40(%%ecx)\n\t"
+ "psrlq $32,%%mm5\n\t"
+ "movd %%mm5,28(%%ecx)\n\t"
+ "movq %%mm4,%%mm6\n\t"
+ "punpckldq %%mm6,%%mm5\n\t"
+ "pfsub %%mm6,%%mm5\n\t"
+ "punpckhdq %%mm5,%%mm5\n\t"
+ "movd 28(%%edx),%%mm6\n\t"
+ "punpckldq 40(%%edx),%%mm6\n\t"
+ "pfmul %%mm6,%%mm5\n\t"
+ "movd 28(%%esi),%%mm6\n\t"
+ "punpckldq 40(%%esi),%%mm6\n\t"
+ "pfadd %%mm6,%%mm5\n\t"
+ "movd %%mm5,896(%%ebx)\n\t"
+ "psrlq $32,%%mm5\n\t"
+ "movd %%mm5,1280(%%ebx)\n\t"
+ "movq %%mm3,%%mm4\n\t"
+ "pfsub %%mm2,%%mm4\n\t"
+ "movq %%mm7,%%mm5\n\t"
+ "punpckldq "MANGLE(tfcos36)"+28,%%mm5\n\t"
+ "pfmul %%mm5,%%mm4\n\t"
+ "movq %%mm4,%%mm5\n\t"
+ "pfacc %%mm5,%%mm5\n\t"
+ "movd 136(%%edx),%%mm6\n\t"
+ "punpckldq 76(%%edx),%%mm6\n\t"
+ "pfmul %%mm6,%%mm5\n\t"
+ "movd %%mm5,64(%%ecx)\n\t"
+ "psrlq $32,%%mm5\n\t"
+ "movd %%mm5,4(%%ecx)\n\t"
+ "movq %%mm4,%%mm6\n\t"
+ "punpckldq %%mm6,%%mm5\n\t"
+ "pfsub %%mm6,%%mm5\n\t"
+ "punpckhdq %%mm5,%%mm5\n\t"
+ "movd 4(%%edx),%%mm6\n\t"
+ "punpckldq 64(%%edx),%%mm6\n\t"
+ "pfmul %%mm6,%%mm5\n\t"
+ "movd 4(%%esi),%%mm6\n\t"
+ "punpckldq 64(%%esi),%%mm6\n\t"
+ "pfadd %%mm6,%%mm5\n\t"
+ "movd %%mm5,128(%%ebx)\n\t"
+ "psrlq $32,%%mm5\n\t"
+ "movd %%mm5,2048(%%ebx)\n\t"
- "movq 8(%%eax),%%mm2\n\t"
- "movd "MANGLE(COS9)"+20,%%mm3\n\t"
- "punpckldq %%mm3,%%mm3\n\t"
- "pfmul %%mm3,%%mm2\n\t"
- "pfsub %%mm0,%%mm2\n\t"
- "movq 40(%%eax),%%mm3\n\t"
- "movd "MANGLE(COS9)"+28,%%mm4\n\t"
- "punpckldq %%mm4,%%mm4\n\t"
- "pfmul %%mm4,%%mm3\n\t"
- "pfsub %%mm3,%%mm2\n\t"
- "movq 56(%%eax),%%mm3\n\t"
- "movd "MANGLE(COS9)"+4,%%mm4\n\t"
- "punpckldq %%mm4,%%mm4\n\t"
- "pfmul %%mm4,%%mm3\n\t"
- "pfadd %%mm3,%%mm2\n\t"
- "movq (%%eax),%%mm3\n\t"
- "movq 16(%%eax),%%mm4\n\t"
- "movd "MANGLE(COS9)"+32,%%mm5\n\t"
- "punpckldq %%mm5,%%mm5\n\t"
- "pfmul %%mm5,%%mm4\n\t"
- "pfsub %%mm4,%%mm3\n\t"
- "movq 32(%%eax),%%mm4\n\t"
- "movd "MANGLE(COS9)"+8,%%mm5\n\t"
- "punpckldq %%mm5,%%mm5\n\t"
- "pfmul %%mm5,%%mm4\n\t"
- "pfsub %%mm4,%%mm3\n\t"
- "pfadd %%mm1,%%mm3\n\t"
- "movq 64(%%eax),%%mm4\n\t"
- "movd "MANGLE(COS9)"+16,%%mm5\n\t"
- "punpckldq %%mm5,%%mm5\n\t"
- "pfmul %%mm5,%%mm4\n\t"
- "pfadd %%mm4,%%mm3\n\t"
- "movq %%mm2,%%mm4\n\t"
- "pfadd %%mm3,%%mm4\n\t"
- "movq %%mm7,%%mm5\n\t"
- "punpckldq "MANGLE(tfcos36)"+8,%%mm5\n\t"
- "pfmul %%mm5,%%mm4\n\t"
- "movq %%mm4,%%mm5\n\t"
- "pfacc %%mm5,%%mm5\n\t"
- "movd 116(%%edx),%%mm6\n\t"
- "punpckldq 96(%%edx),%%mm6\n\t"
- "pfmul %%mm6,%%mm5\n\t"
- "movd %%mm5,44(%%ecx)\n\t"
- "psrlq $32,%%mm5\n\t"
- "movd %%mm5,24(%%ecx)\n\t"
- "movq %%mm4,%%mm6\n\t"
- "punpckldq %%mm6,%%mm5\n\t"
- "pfsub %%mm6,%%mm5\n\t"
- "punpckhdq %%mm5,%%mm5\n\t"
- "movd 24(%%edx),%%mm6\n\t"
- "punpckldq 44(%%edx),%%mm6\n\t"
- "pfmul %%mm6,%%mm5\n\t"
- "movd 24(%%esi),%%mm6\n\t"
- "punpckldq 44(%%esi),%%mm6\n\t"
- "pfadd %%mm6,%%mm5\n\t"
- "movd %%mm5,768(%%ebx)\n\t"
- "psrlq $32,%%mm5\n\t"
- "movd %%mm5,1408(%%ebx)\n\t"
- "movq %%mm3,%%mm4\n\t"
- "pfsub %%mm2,%%mm4\n\t"
- "movq %%mm7,%%mm5\n\t"
- "punpckldq "MANGLE(tfcos36)"+24,%%mm5\n\t"
- "pfmul %%mm5,%%mm4\n\t"
- "movq %%mm4,%%mm5\n\t"
- "pfacc %%mm5,%%mm5\n\t"
- "movd 132(%%edx),%%mm6\n\t"
- "punpckldq 80(%%edx),%%mm6\n\t"
- "pfmul %%mm6,%%mm5\n\t"
- "movd %%mm5,60(%%ecx)\n\t"
- "psrlq $32,%%mm5\n\t"
- "movd %%mm5,8(%%ecx)\n\t"
- "movq %%mm4,%%mm6\n\t"
- "punpckldq %%mm6,%%mm5\n\t"
- "pfsub %%mm6,%%mm5\n\t"
- "punpckhdq %%mm5,%%mm5\n\t"
- "movd 8(%%edx),%%mm6\n\t"
- "punpckldq 60(%%edx),%%mm6\n\t"
- "pfmul %%mm6,%%mm5\n\t"
- "movd 8(%%esi),%%mm6\n\t"
- "punpckldq 60(%%esi),%%mm6\n\t"
- "pfadd %%mm6,%%mm5\n\t"
- "movd %%mm5,256(%%ebx)\n\t"
- "psrlq $32,%%mm5\n\t"
- "movd %%mm5,1920(%%ebx)\n\t"
- "movq 8(%%eax),%%mm2\n\t"
- "movd "MANGLE(COS9)"+28,%%mm3\n\t"
- "punpckldq %%mm3,%%mm3\n\t"
- "pfmul %%mm3,%%mm2\n\t"
- "pfsub %%mm0,%%mm2\n\t"
- "movq 40(%%eax),%%mm3\n\t"
- "movd "MANGLE(COS9)"+4,%%mm4\n\t"
- "punpckldq %%mm4,%%mm4\n\t"
- "pfmul %%mm4,%%mm3\n\t"
- "pfadd %%mm3,%%mm2\n\t"
- "movq 56(%%eax),%%mm3\n\t"
- "movd "MANGLE(COS9)"+20,%%mm4\n\t"
- "punpckldq %%mm4,%%mm4\n\t"
- "pfmul %%mm4,%%mm3\n\t"
- "pfsub %%mm3,%%mm2\n\t"
- "movq (%%eax),%%mm3\n\t"
- "movq 16(%%eax),%%mm4\n\t"
- "movd "MANGLE(COS9)"+16,%%mm5\n\t"
- "punpckldq %%mm5,%%mm5\n\t"
- "pfmul %%mm5,%%mm4\n\t"
- "pfsub %%mm4,%%mm3\n\t"
- "movq 32(%%eax),%%mm4\n\t"
- "movd "MANGLE(COS9)"+32,%%mm5\n\t"
- "punpckldq %%mm5,%%mm5\n\t"
- "pfmul %%mm5,%%mm4\n\t"
- "pfadd %%mm4,%%mm3\n\t"
- "pfadd %%mm1,%%mm3\n\t"
- "movq 64(%%eax),%%mm4\n\t"
- "movd "MANGLE(COS9)"+8,%%mm5\n\t"
- "punpckldq %%mm5,%%mm5\n\t"
- "pfmul %%mm5,%%mm4\n\t"
- "pfsub %%mm4,%%mm3\n\t"
- "movq %%mm2,%%mm4\n\t"
- "pfadd %%mm3,%%mm4\n\t"
- "movq %%mm7,%%mm5\n\t"
- "punpckldq "MANGLE(tfcos36)"+12,%%mm5\n\t"
- "pfmul %%mm5,%%mm4\n\t"
- "movq %%mm4,%%mm5\n\t"
- "pfacc %%mm5,%%mm5\n\t"
- "movd 120(%%edx),%%mm6\n\t"
- "punpckldq 92(%%edx),%%mm6\n\t"
- "pfmul %%mm6,%%mm5\n\t"
- "movd %%mm5,48(%%ecx)\n\t"
- "psrlq $32,%%mm5\n\t"
- "movd %%mm5,20(%%ecx)\n\t"
- "movq %%mm4,%%mm6\n\t"
- "punpckldq %%mm6,%%mm5\n\t"
- "pfsub %%mm6,%%mm5\n\t"
- "punpckhdq %%mm5,%%mm5\n\t"
- "movd 20(%%edx),%%mm6\n\t"
- "punpckldq 48(%%edx),%%mm6\n\t"
- "pfmul %%mm6,%%mm5\n\t"
- "movd 20(%%esi),%%mm6\n\t"
- "punpckldq 48(%%esi),%%mm6\n\t"
- "pfadd %%mm6,%%mm5\n\t"
- "movd %%mm5,640(%%ebx)\n\t"
- "psrlq $32,%%mm5\n\t"
- "movd %%mm5,1536(%%ebx)\n\t"
- "movq %%mm3,%%mm4\n\t"
- "pfsub %%mm2,%%mm4\n\t"
- "movq %%mm7,%%mm5\n\t"
- "punpckldq "MANGLE(tfcos36)"+20,%%mm5\n\t"
- "pfmul %%mm5,%%mm4\n\t"
- "movq %%mm4,%%mm5\n\t"
- "pfacc %%mm5,%%mm5\n\t"
- "movd 128(%%edx),%%mm6\n\t"
- "punpckldq 84(%%edx),%%mm6\n\t"
- "pfmul %%mm6,%%mm5\n\t"
- "movd %%mm5,56(%%ecx)\n\t"
- "psrlq $32,%%mm5\n\t"
- "movd %%mm5,12(%%ecx)\n\t"
- "movq %%mm4,%%mm6\n\t"
- "punpckldq %%mm6,%%mm5\n\t"
- "pfsub %%mm6,%%mm5\n\t"
- "punpckhdq %%mm5,%%mm5\n\t"
- "movd 12(%%edx),%%mm6\n\t"
- "punpckldq 56(%%edx),%%mm6\n\t"
- "pfmul %%mm6,%%mm5\n\t"
- "movd 12(%%esi),%%mm6\n\t"
- "punpckldq 56(%%esi),%%mm6\n\t"
- "pfadd %%mm6,%%mm5\n\t"
- "movd %%mm5,384(%%ebx)\n\t"
- "psrlq $32,%%mm5\n\t"
- "movd %%mm5,1792(%%ebx)\n\t"
+ "movq 8(%%eax),%%mm2\n\t"
+ "movd "MANGLE(COS9)"+20,%%mm3\n\t"
+ "punpckldq %%mm3,%%mm3\n\t"
+ "pfmul %%mm3,%%mm2\n\t"
+ "pfsub %%mm0,%%mm2\n\t"
+ "movq 40(%%eax),%%mm3\n\t"
+ "movd "MANGLE(COS9)"+28,%%mm4\n\t"
+ "punpckldq %%mm4,%%mm4\n\t"
+ "pfmul %%mm4,%%mm3\n\t"
+ "pfsub %%mm3,%%mm2\n\t"
+ "movq 56(%%eax),%%mm3\n\t"
+ "movd "MANGLE(COS9)"+4,%%mm4\n\t"
+ "punpckldq %%mm4,%%mm4\n\t"
+ "pfmul %%mm4,%%mm3\n\t"
+ "pfadd %%mm3,%%mm2\n\t"
+ "movq (%%eax),%%mm3\n\t"
+ "movq 16(%%eax),%%mm4\n\t"
+ "movd "MANGLE(COS9)"+32,%%mm5\n\t"
+ "punpckldq %%mm5,%%mm5\n\t"
+ "pfmul %%mm5,%%mm4\n\t"
+ "pfsub %%mm4,%%mm3\n\t"
+ "movq 32(%%eax),%%mm4\n\t"
+ "movd "MANGLE(COS9)"+8,%%mm5\n\t"
+ "punpckldq %%mm5,%%mm5\n\t"
+ "pfmul %%mm5,%%mm4\n\t"
+ "pfsub %%mm4,%%mm3\n\t"
+ "pfadd %%mm1,%%mm3\n\t"
+ "movq 64(%%eax),%%mm4\n\t"
+ "movd "MANGLE(COS9)"+16,%%mm5\n\t"
+ "punpckldq %%mm5,%%mm5\n\t"
+ "pfmul %%mm5,%%mm4\n\t"
+ "pfadd %%mm4,%%mm3\n\t"
+ "movq %%mm2,%%mm4\n\t"
+ "pfadd %%mm3,%%mm4\n\t"
+ "movq %%mm7,%%mm5\n\t"
+ "punpckldq "MANGLE(tfcos36)"+8,%%mm5\n\t"
+ "pfmul %%mm5,%%mm4\n\t"
+ "movq %%mm4,%%mm5\n\t"
+ "pfacc %%mm5,%%mm5\n\t"
+ "movd 116(%%edx),%%mm6\n\t"
+ "punpckldq 96(%%edx),%%mm6\n\t"
+ "pfmul %%mm6,%%mm5\n\t"
+ "movd %%mm5,44(%%ecx)\n\t"
+ "psrlq $32,%%mm5\n\t"
+ "movd %%mm5,24(%%ecx)\n\t"
+ "movq %%mm4,%%mm6\n\t"
+ "punpckldq %%mm6,%%mm5\n\t"
+ "pfsub %%mm6,%%mm5\n\t"
+ "punpckhdq %%mm5,%%mm5\n\t"
+ "movd 24(%%edx),%%mm6\n\t"
+ "punpckldq 44(%%edx),%%mm6\n\t"
+ "pfmul %%mm6,%%mm5\n\t"
+ "movd 24(%%esi),%%mm6\n\t"
+ "punpckldq 44(%%esi),%%mm6\n\t"
+ "pfadd %%mm6,%%mm5\n\t"
+ "movd %%mm5,768(%%ebx)\n\t"
+ "psrlq $32,%%mm5\n\t"
+ "movd %%mm5,1408(%%ebx)\n\t"
+ "movq %%mm3,%%mm4\n\t"
+ "pfsub %%mm2,%%mm4\n\t"
+ "movq %%mm7,%%mm5\n\t"
+ "punpckldq "MANGLE(tfcos36)"+24,%%mm5\n\t"
+ "pfmul %%mm5,%%mm4\n\t"
+ "movq %%mm4,%%mm5\n\t"
+ "pfacc %%mm5,%%mm5\n\t"
+ "movd 132(%%edx),%%mm6\n\t"
+ "punpckldq 80(%%edx),%%mm6\n\t"
+ "pfmul %%mm6,%%mm5\n\t"
+ "movd %%mm5,60(%%ecx)\n\t"
+ "psrlq $32,%%mm5\n\t"
+ "movd %%mm5,8(%%ecx)\n\t"
+ "movq %%mm4,%%mm6\n\t"
+ "punpckldq %%mm6,%%mm5\n\t"
+ "pfsub %%mm6,%%mm5\n\t"
+ "punpckhdq %%mm5,%%mm5\n\t"
+ "movd 8(%%edx),%%mm6\n\t"
+ "punpckldq 60(%%edx),%%mm6\n\t"
+ "pfmul %%mm6,%%mm5\n\t"
+ "movd 8(%%esi),%%mm6\n\t"
+ "punpckldq 60(%%esi),%%mm6\n\t"
+ "pfadd %%mm6,%%mm5\n\t"
+ "movd %%mm5,256(%%ebx)\n\t"
+ "psrlq $32,%%mm5\n\t"
+ "movd %%mm5,1920(%%ebx)\n\t"
+ "movq 8(%%eax),%%mm2\n\t"
+ "movd "MANGLE(COS9)"+28,%%mm3\n\t"
+ "punpckldq %%mm3,%%mm3\n\t"
+ "pfmul %%mm3,%%mm2\n\t"
+ "pfsub %%mm0,%%mm2\n\t"
+ "movq 40(%%eax),%%mm3\n\t"
+ "movd "MANGLE(COS9)"+4,%%mm4\n\t"
+ "punpckldq %%mm4,%%mm4\n\t"
+ "pfmul %%mm4,%%mm3\n\t"
+ "pfadd %%mm3,%%mm2\n\t"
+ "movq 56(%%eax),%%mm3\n\t"
+ "movd "MANGLE(COS9)"+20,%%mm4\n\t"
+ "punpckldq %%mm4,%%mm4\n\t"
+ "pfmul %%mm4,%%mm3\n\t"
+ "pfsub %%mm3,%%mm2\n\t"
+ "movq (%%eax),%%mm3\n\t"
+ "movq 16(%%eax),%%mm4\n\t"
+ "movd "MANGLE(COS9)"+16,%%mm5\n\t"
+ "punpckldq %%mm5,%%mm5\n\t"
+ "pfmul %%mm5,%%mm4\n\t"
+ "pfsub %%mm4,%%mm3\n\t"
+ "movq 32(%%eax),%%mm4\n\t"
+ "movd "MANGLE(COS9)"+32,%%mm5\n\t"
+ "punpckldq %%mm5,%%mm5\n\t"
+ "pfmul %%mm5,%%mm4\n\t"
+ "pfadd %%mm4,%%mm3\n\t"
+ "pfadd %%mm1,%%mm3\n\t"
+ "movq 64(%%eax),%%mm4\n\t"
+ "movd "MANGLE(COS9)"+8,%%mm5\n\t"
+ "punpckldq %%mm5,%%mm5\n\t"
+ "pfmul %%mm5,%%mm4\n\t"
+ "pfsub %%mm4,%%mm3\n\t"
+ "movq %%mm2,%%mm4\n\t"
+ "pfadd %%mm3,%%mm4\n\t"
+ "movq %%mm7,%%mm5\n\t"
+ "punpckldq "MANGLE(tfcos36)"+12,%%mm5\n\t"
+ "pfmul %%mm5,%%mm4\n\t"
+ "movq %%mm4,%%mm5\n\t"
+ "pfacc %%mm5,%%mm5\n\t"
+ "movd 120(%%edx),%%mm6\n\t"
+ "punpckldq 92(%%edx),%%mm6\n\t"
+ "pfmul %%mm6,%%mm5\n\t"
+ "movd %%mm5,48(%%ecx)\n\t"
+ "psrlq $32,%%mm5\n\t"
+ "movd %%mm5,20(%%ecx)\n\t"
+ "movq %%mm4,%%mm6\n\t"
+ "punpckldq %%mm6,%%mm5\n\t"
+ "pfsub %%mm6,%%mm5\n\t"
+ "punpckhdq %%mm5,%%mm5\n\t"
+ "movd 20(%%edx),%%mm6\n\t"
+ "punpckldq 48(%%edx),%%mm6\n\t"
+ "pfmul %%mm6,%%mm5\n\t"
+ "movd 20(%%esi),%%mm6\n\t"
+ "punpckldq 48(%%esi),%%mm6\n\t"
+ "pfadd %%mm6,%%mm5\n\t"
+ "movd %%mm5,640(%%ebx)\n\t"
+ "psrlq $32,%%mm5\n\t"
+ "movd %%mm5,1536(%%ebx)\n\t"
+ "movq %%mm3,%%mm4\n\t"
+ "pfsub %%mm2,%%mm4\n\t"
+ "movq %%mm7,%%mm5\n\t"
+ "punpckldq "MANGLE(tfcos36)"+20,%%mm5\n\t"
+ "pfmul %%mm5,%%mm4\n\t"
+ "movq %%mm4,%%mm5\n\t"
+ "pfacc %%mm5,%%mm5\n\t"
+ "movd 128(%%edx),%%mm6\n\t"
+ "punpckldq 84(%%edx),%%mm6\n\t"
+ "pfmul %%mm6,%%mm5\n\t"
+ "movd %%mm5,56(%%ecx)\n\t"
+ "psrlq $32,%%mm5\n\t"
+ "movd %%mm5,12(%%ecx)\n\t"
+ "movq %%mm4,%%mm6\n\t"
+ "punpckldq %%mm6,%%mm5\n\t"
+ "pfsub %%mm6,%%mm5\n\t"
+ "punpckhdq %%mm5,%%mm5\n\t"
+ "movd 12(%%edx),%%mm6\n\t"
+ "punpckldq 56(%%edx),%%mm6\n\t"
+ "pfmul %%mm6,%%mm5\n\t"
+ "movd 12(%%esi),%%mm6\n\t"
+ "punpckldq 56(%%esi),%%mm6\n\t"
+ "pfadd %%mm6,%%mm5\n\t"
+ "movd %%mm5,384(%%ebx)\n\t"
+ "psrlq $32,%%mm5\n\t"
+ "movd %%mm5,1792(%%ebx)\n\t"
- "movq (%%eax),%%mm4\n\t"
- "movq 16(%%eax),%%mm3\n\t"
- "pfsub %%mm3,%%mm4\n\t"
- "movq 32(%%eax),%%mm3\n\t"
- "pfadd %%mm3,%%mm4\n\t"
- "movq 48(%%eax),%%mm3\n\t"
- "pfsub %%mm3,%%mm4\n\t"
- "movq 64(%%eax),%%mm3\n\t"
- "pfadd %%mm3,%%mm4\n\t"
- "movq %%mm7,%%mm5\n\t"
- "punpckldq "MANGLE(tfcos36)"+16,%%mm5\n\t"
- "pfmul %%mm5,%%mm4\n\t"
- "movq %%mm4,%%mm5\n\t"
- "pfacc %%mm5,%%mm5\n\t"
- "movd 124(%%edx),%%mm6\n\t"
- "punpckldq 88(%%edx),%%mm6\n\t"
- "pfmul %%mm6,%%mm5\n\t"
- "movd %%mm5,52(%%ecx)\n\t"
- "psrlq $32,%%mm5\n\t"
- "movd %%mm5,16(%%ecx)\n\t"
- "movq %%mm4,%%mm6\n\t"
- "punpckldq %%mm6,%%mm5\n\t"
- "pfsub %%mm6,%%mm5\n\t"
- "punpckhdq %%mm5,%%mm5\n\t"
- "movd 16(%%edx),%%mm6\n\t"
- "punpckldq 52(%%edx),%%mm6\n\t"
- "pfmul %%mm6,%%mm5\n\t"
- "movd 16(%%esi),%%mm6\n\t"
- "punpckldq 52(%%esi),%%mm6\n\t"
- "pfadd %%mm6,%%mm5\n\t"
- "movd %%mm5,512(%%ebx)\n\t"
- "psrlq $32,%%mm5\n\t"
- "movd %%mm5,1664(%%ebx)\n\t"
+ "movq (%%eax),%%mm4\n\t"
+ "movq 16(%%eax),%%mm3\n\t"
+ "pfsub %%mm3,%%mm4\n\t"
+ "movq 32(%%eax),%%mm3\n\t"
+ "pfadd %%mm3,%%mm4\n\t"
+ "movq 48(%%eax),%%mm3\n\t"
+ "pfsub %%mm3,%%mm4\n\t"
+ "movq 64(%%eax),%%mm3\n\t"
+ "pfadd %%mm3,%%mm4\n\t"
+ "movq %%mm7,%%mm5\n\t"
+ "punpckldq "MANGLE(tfcos36)"+16,%%mm5\n\t"
+ "pfmul %%mm5,%%mm4\n\t"
+ "movq %%mm4,%%mm5\n\t"
+ "pfacc %%mm5,%%mm5\n\t"
+ "movd 124(%%edx),%%mm6\n\t"
+ "punpckldq 88(%%edx),%%mm6\n\t"
+ "pfmul %%mm6,%%mm5\n\t"
+ "movd %%mm5,52(%%ecx)\n\t"
+ "psrlq $32,%%mm5\n\t"
+ "movd %%mm5,16(%%ecx)\n\t"
+ "movq %%mm4,%%mm6\n\t"
+ "punpckldq %%mm6,%%mm5\n\t"
+ "pfsub %%mm6,%%mm5\n\t"
+ "punpckhdq %%mm5,%%mm5\n\t"
+ "movd 16(%%edx),%%mm6\n\t"
+ "punpckldq 52(%%edx),%%mm6\n\t"
+ "pfmul %%mm6,%%mm5\n\t"
+ "movd 16(%%esi),%%mm6\n\t"
+ "punpckldq 52(%%esi),%%mm6\n\t"
+ "pfadd %%mm6,%%mm5\n\t"
+ "movd %%mm5,512(%%ebx)\n\t"
+ "psrlq $32,%%mm5\n\t"
+ "movd %%mm5,1664(%%ebx)\n\t"
- "femms\n\t"
- :
- : "a" (inbuf), "S" (o1), "c" (o2), "d" (wintab), "b" (tsbuf)
- : "memory");
+ "femms\n\t"
+ :
+ : "a" (inbuf), "S" (o1), "c" (o2), "d" (wintab), "b" (tsbuf)
+ : "memory");
}
diff --git a/mp3lib/dct64_3dnow.c b/mp3lib/dct64_3dnow.c
index 55340b0512..d528654207 100644
--- a/mp3lib/dct64_3dnow.c
+++ b/mp3lib/dct64_3dnow.c
@@ -19,910 +19,910 @@ void dct64_MMX_3dnow(short *a,short *b,real *c)
{
char tmp[256];
__asm__ volatile(
-" movl %2,%%eax\n\t"
+" movl %2,%%eax\n\t"
-" leal 128+%3,%%edx\n\t"
-" movl %0,%%esi\n\t"
-" movl %1,%%edi\n\t"
-" movl $"MANGLE(costab_mmx)",%%ebx\n\t"
-" leal %3,%%ecx\n\t"
+" leal 128+%3,%%edx\n\t"
+" movl %0,%%esi\n\t"
+" movl %1,%%edi\n\t"
+" movl $"MANGLE(costab_mmx)",%%ebx\n\t"
+" leal %3,%%ecx\n\t"
/* Phase 1*/
-" movq (%%eax), %%mm0\n\t"
-" movq 8(%%eax), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" movq 120(%%eax), %%mm1\n\t"
-" movq 112(%%eax), %%mm5\n\t"
+" movq (%%eax), %%mm0\n\t"
+" movq 8(%%eax), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" movq 120(%%eax), %%mm1\n\t"
+" movq 112(%%eax), %%mm5\n\t"
/* n.b.: pswapd*/
-" movq %%mm1, %%mm2\n\t"
-" movq %%mm5, %%mm6\n\t"
-" psrlq $32, %%mm1\n\t"
-" psrlq $32, %%mm5\n\t"
-" punpckldq %%mm2, %%mm1\n\t"
-" punpckldq %%mm6, %%mm5\n\t"
+" movq %%mm1, %%mm2\n\t"
+" movq %%mm5, %%mm6\n\t"
+" psrlq $32, %%mm1\n\t"
+" psrlq $32, %%mm5\n\t"
+" punpckldq %%mm2, %%mm1\n\t"
+" punpckldq %%mm6, %%mm5\n\t"
/**/
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, (%%edx)\n\t"
-" movq %%mm4, 8(%%edx)\n\t"
-" pfsub %%mm1, %%mm3\n\t"
-" pfsub %%mm5, %%mm7\n\t"
-" pfmul (%%ebx), %%mm3\n\t"
-" pfmul 8(%%ebx), %%mm7\n\t"
-" movd %%mm3, 124(%%edx)\n\t"
-" movd %%mm7, 116(%%edx)\n\t"
-" psrlq $32, %%mm3\n\t"
-" psrlq $32, %%mm7\n\t"
-" movd %%mm3, 120(%%edx)\n\t"
-" movd %%mm7, 112(%%edx)\n\t"
-
-" movq 16(%%eax), %%mm0\n\t"
-" movq 24(%%eax), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" movq 104(%%eax), %%mm1\n\t"
-" movq 96(%%eax), %%mm5\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, (%%edx)\n\t"
+" movq %%mm4, 8(%%edx)\n\t"
+" pfsub %%mm1, %%mm3\n\t"
+" pfsub %%mm5, %%mm7\n\t"
+" pfmul (%%ebx), %%mm3\n\t"
+" pfmul 8(%%ebx), %%mm7\n\t"
+" movd %%mm3, 124(%%edx)\n\t"
+" movd %%mm7, 116(%%edx)\n\t"
+" psrlq $32, %%mm3\n\t"
+" psrlq $32, %%mm7\n\t"
+" movd %%mm3, 120(%%edx)\n\t"
+" movd %%mm7, 112(%%edx)\n\t"
+
+" movq 16(%%eax), %%mm0\n\t"
+" movq 24(%%eax), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" movq 104(%%eax), %%mm1\n\t"
+" movq 96(%%eax), %%mm5\n\t"
/* n.b.: pswapd*/
-" movq %%mm1, %%mm2\n\t"
-" movq %%mm5, %%mm6\n\t"
-" psrlq $32, %%mm1\n\t"
-" psrlq $32, %%mm5\n\t"
-" punpckldq %%mm2, %%mm1\n\t"
-" punpckldq %%mm6, %%mm5\n\t"
+" movq %%mm1, %%mm2\n\t"
+" movq %%mm5, %%mm6\n\t"
+" psrlq $32, %%mm1\n\t"
+" psrlq $32, %%mm5\n\t"
+" punpckldq %%mm2, %%mm1\n\t"
+" punpckldq %%mm6, %%mm5\n\t"
/**/
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, 16(%%edx)\n\t"
-" movq %%mm4, 24(%%edx)\n\t"
-" pfsub %%mm1, %%mm3\n\t"
-" pfsub %%mm5, %%mm7\n\t"
-" pfmul 16(%%ebx), %%mm3\n\t"
-" pfmul 24(%%ebx), %%mm7\n\t"
-" movd %%mm3, 108(%%edx)\n\t"
-" movd %%mm7, 100(%%edx)\n\t"
-" psrlq $32, %%mm3\n\t"
-" psrlq $32, %%mm7\n\t"
-" movd %%mm3, 104(%%edx)\n\t"
-" movd %%mm7, 96(%%edx)\n\t"
-
-" movq 32(%%eax), %%mm0\n\t"
-" movq 40(%%eax), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" movq 88(%%eax), %%mm1\n\t"
-" movq 80(%%eax), %%mm5\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, 16(%%edx)\n\t"
+" movq %%mm4, 24(%%edx)\n\t"
+" pfsub %%mm1, %%mm3\n\t"
+" pfsub %%mm5, %%mm7\n\t"
+" pfmul 16(%%ebx), %%mm3\n\t"
+" pfmul 24(%%ebx), %%mm7\n\t"
+" movd %%mm3, 108(%%edx)\n\t"
+" movd %%mm7, 100(%%edx)\n\t"
+" psrlq $32, %%mm3\n\t"
+" psrlq $32, %%mm7\n\t"
+" movd %%mm3, 104(%%edx)\n\t"
+" movd %%mm7, 96(%%edx)\n\t"
+
+" movq 32(%%eax), %%mm0\n\t"
+" movq 40(%%eax), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" movq 88(%%eax), %%mm1\n\t"
+" movq 80(%%eax), %%mm5\n\t"
/* n.b.: pswapd*/
-" movq %%mm1, %%mm2\n\t"
-" movq %%mm5, %%mm6\n\t"
-" psrlq $32, %%mm1\n\t"
-" psrlq $32, %%mm5\n\t"
-" punpckldq %%mm2, %%mm1\n\t"
-" punpckldq %%mm6, %%mm5\n\t"
+" movq %%mm1, %%mm2\n\t"
+" movq %%mm5, %%mm6\n\t"
+" psrlq $32, %%mm1\n\t"
+" psrlq $32, %%mm5\n\t"
+" punpckldq %%mm2, %%mm1\n\t"
+" punpckldq %%mm6, %%mm5\n\t"
/**/
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, 32(%%edx)\n\t"
-" movq %%mm4, 40(%%edx)\n\t"
-" pfsub %%mm1, %%mm3\n\t"
-" pfsub %%mm5, %%mm7\n\t"
-" pfmul 32(%%ebx), %%mm3\n\t"
-" pfmul 40(%%ebx), %%mm7\n\t"
-" movd %%mm3, 92(%%edx)\n\t"
-" movd %%mm7, 84(%%edx)\n\t"
-" psrlq $32, %%mm3\n\t"
-" psrlq $32, %%mm7\n\t"
-" movd %%mm3, 88(%%edx)\n\t"
-" movd %%mm7, 80(%%edx)\n\t"
-
-" movq 48(%%eax), %%mm0\n\t"
-" movq 56(%%eax), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" movq 72(%%eax), %%mm1\n\t"
-" movq 64(%%eax), %%mm5\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, 32(%%edx)\n\t"
+" movq %%mm4, 40(%%edx)\n\t"
+" pfsub %%mm1, %%mm3\n\t"
+" pfsub %%mm5, %%mm7\n\t"
+" pfmul 32(%%ebx), %%mm3\n\t"
+" pfmul 40(%%ebx), %%mm7\n\t"
+" movd %%mm3, 92(%%edx)\n\t"
+" movd %%mm7, 84(%%edx)\n\t"
+" psrlq $32, %%mm3\n\t"
+" psrlq $32, %%mm7\n\t"
+" movd %%mm3, 88(%%edx)\n\t"
+" movd %%mm7, 80(%%edx)\n\t"
+
+" movq 48(%%eax), %%mm0\n\t"
+" movq 56(%%eax), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" movq 72(%%eax), %%mm1\n\t"
+" movq 64(%%eax), %%mm5\n\t"
/* n.b.: pswapd*/
-" movq %%mm1, %%mm2\n\t"
-" movq %%mm5, %%mm6\n\t"
-" psrlq $32, %%mm1\n\t"
-" psrlq $32, %%mm5\n\t"
-" punpckldq %%mm2, %%mm1\n\t"
-" punpckldq %%mm6, %%mm5\n\t"
+" movq %%mm1, %%mm2\n\t"
+" movq %%mm5, %%mm6\n\t"
+" psrlq $32, %%mm1\n\t"
+" psrlq $32, %%mm5\n\t"
+" punpckldq %%mm2, %%mm1\n\t"
+" punpckldq %%mm6, %%mm5\n\t"
/**/
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, 48(%%edx)\n\t"
-" movq %%mm4, 56(%%edx)\n\t"
-" pfsub %%mm1, %%mm3\n\t"
-" pfsub %%mm5, %%mm7\n\t"
-" pfmul 48(%%ebx), %%mm3\n\t"
-" pfmul 56(%%ebx), %%mm7\n\t"
-" movd %%mm3, 76(%%edx)\n\t"
-" movd %%mm7, 68(%%edx)\n\t"
-" psrlq $32, %%mm3\n\t"
-" psrlq $32, %%mm7\n\t"
-" movd %%mm3, 72(%%edx)\n\t"
-" movd %%mm7, 64(%%edx)\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, 48(%%edx)\n\t"
+" movq %%mm4, 56(%%edx)\n\t"
+" pfsub %%mm1, %%mm3\n\t"
+" pfsub %%mm5, %%mm7\n\t"
+" pfmul 48(%%ebx), %%mm3\n\t"
+" pfmul 56(%%ebx), %%mm7\n\t"
+" movd %%mm3, 76(%%edx)\n\t"
+" movd %%mm7, 68(%%edx)\n\t"
+" psrlq $32, %%mm3\n\t"
+" psrlq $32, %%mm7\n\t"
+" movd %%mm3, 72(%%edx)\n\t"
+" movd %%mm7, 64(%%edx)\n\t"
/* Phase 2*/
-" movq (%%edx), %%mm0\n\t"
-" movq 8(%%edx), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" movq 56(%%edx), %%mm1\n\t"
-" movq 48(%%edx), %%mm5\n\t"
+" movq (%%edx), %%mm0\n\t"
+" movq 8(%%edx), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" movq 56(%%edx), %%mm1\n\t"
+" movq 48(%%edx), %%mm5\n\t"
/* n.b.: pswapd*/
-" movq %%mm1, %%mm2\n\t"
-" movq %%mm5, %%mm6\n\t"
-" psrlq $32, %%mm1\n\t"
-" psrlq $32, %%mm5\n\t"
-" punpckldq %%mm2, %%mm1\n\t"
-" punpckldq %%mm6, %%mm5\n\t"
+" movq %%mm1, %%mm2\n\t"
+" movq %%mm5, %%mm6\n\t"
+" psrlq $32, %%mm1\n\t"
+" psrlq $32, %%mm5\n\t"
+" punpckldq %%mm2, %%mm1\n\t"
+" punpckldq %%mm6, %%mm5\n\t"
/**/
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, (%%ecx)\n\t"
-" movq %%mm4, 8(%%ecx)\n\t"
-" pfsub %%mm1, %%mm3\n\t"
-" pfsub %%mm5, %%mm7\n\t"
-" pfmul 64(%%ebx), %%mm3\n\t"
-" pfmul 72(%%ebx), %%mm7\n\t"
-" movd %%mm3, 60(%%ecx)\n\t"
-" movd %%mm7, 52(%%ecx)\n\t"
-" psrlq $32, %%mm3\n\t"
-" psrlq $32, %%mm7\n\t"
-" movd %%mm3, 56(%%ecx)\n\t"
-" movd %%mm7, 48(%%ecx)\n\t"
-
-" movq 16(%%edx), %%mm0\n\t"
-" movq 24(%%edx), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" movq 40(%%edx), %%mm1\n\t"
-" movq 32(%%edx), %%mm5\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, (%%ecx)\n\t"
+" movq %%mm4, 8(%%ecx)\n\t"
+" pfsub %%mm1, %%mm3\n\t"
+" pfsub %%mm5, %%mm7\n\t"
+" pfmul 64(%%ebx), %%mm3\n\t"
+" pfmul 72(%%ebx), %%mm7\n\t"
+" movd %%mm3, 60(%%ecx)\n\t"
+" movd %%mm7, 52(%%ecx)\n\t"
+" psrlq $32, %%mm3\n\t"
+" psrlq $32, %%mm7\n\t"
+" movd %%mm3, 56(%%ecx)\n\t"
+" movd %%mm7, 48(%%ecx)\n\t"
+
+" movq 16(%%edx), %%mm0\n\t"
+" movq 24(%%edx), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" movq 40(%%edx), %%mm1\n\t"
+" movq 32(%%edx), %%mm5\n\t"
/* n.b.: pswapd*/
-" movq %%mm1, %%mm2\n\t"
-" movq %%mm5, %%mm6\n\t"
-" psrlq $32, %%mm1\n\t"
-" psrlq $32, %%mm5\n\t"
-" punpckldq %%mm2, %%mm1\n\t"
-" punpckldq %%mm6, %%mm5\n\t"
+" movq %%mm1, %%mm2\n\t"
+" movq %%mm5, %%mm6\n\t"
+" psrlq $32, %%mm1\n\t"
+" psrlq $32, %%mm5\n\t"
+" punpckldq %%mm2, %%mm1\n\t"
+" punpckldq %%mm6, %%mm5\n\t"
/**/
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, 16(%%ecx)\n\t"
-" movq %%mm4, 24(%%ecx)\n\t"
-" pfsub %%mm1, %%mm3\n\t"
-" pfsub %%mm5, %%mm7\n\t"
-" pfmul 80(%%ebx), %%mm3\n\t"
-" pfmul 88(%%ebx), %%mm7\n\t"
-" movd %%mm3, 44(%%ecx)\n\t"
-" movd %%mm7, 36(%%ecx)\n\t"
-" psrlq $32, %%mm3\n\t"
-" psrlq $32, %%mm7\n\t"
-" movd %%mm3, 40(%%ecx)\n\t"
-" movd %%mm7, 32(%%ecx)\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, 16(%%ecx)\n\t"
+" movq %%mm4, 24(%%ecx)\n\t"
+" pfsub %%mm1, %%mm3\n\t"
+" pfsub %%mm5, %%mm7\n\t"
+" pfmul 80(%%ebx), %%mm3\n\t"
+" pfmul 88(%%ebx), %%mm7\n\t"
+" movd %%mm3, 44(%%ecx)\n\t"
+" movd %%mm7, 36(%%ecx)\n\t"
+" psrlq $32, %%mm3\n\t"
+" psrlq $32, %%mm7\n\t"
+" movd %%mm3, 40(%%ecx)\n\t"
+" movd %%mm7, 32(%%ecx)\n\t"
/* Phase 3*/
-" movq 64(%%edx), %%mm0\n\t"
-" movq 72(%%edx), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" movq 120(%%edx), %%mm1\n\t"
-" movq 112(%%edx), %%mm5\n\t"
+" movq 64(%%edx), %%mm0\n\t"
+" movq 72(%%edx), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" movq 120(%%edx), %%mm1\n\t"
+" movq 112(%%edx), %%mm5\n\t"
/* n.b.: pswapd*/
-" movq %%mm1, %%mm2\n\t"
-" movq %%mm5, %%mm6\n\t"
-" psrlq $32, %%mm1\n\t"
-" psrlq $32, %%mm5\n\t"
-" punpckldq %%mm2, %%mm1\n\t"
-" punpckldq %%mm6, %%mm5\n\t"
+" movq %%mm1, %%mm2\n\t"
+" movq %%mm5, %%mm6\n\t"
+" psrlq $32, %%mm1\n\t"
+" psrlq $32, %%mm5\n\t"
+" punpckldq %%mm2, %%mm1\n\t"
+" punpckldq %%mm6, %%mm5\n\t"
/**/
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, 64(%%ecx)\n\t"
-" movq %%mm4, 72(%%ecx)\n\t"
-" pfsubr %%mm1, %%mm3\n\t"
-" pfsubr %%mm5, %%mm7\n\t"
-" pfmul 64(%%ebx), %%mm3\n\t"
-" pfmul 72(%%ebx), %%mm7\n\t"
-" movd %%mm3, 124(%%ecx)\n\t"
-" movd %%mm7, 116(%%ecx)\n\t"
-" psrlq $32, %%mm3\n\t"
-" psrlq $32, %%mm7\n\t"
-" movd %%mm3, 120(%%ecx)\n\t"
-" movd %%mm7, 112(%%ecx)\n\t"
-
-" movq 80(%%edx), %%mm0\n\t"
-" movq 88(%%edx), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" movq 104(%%edx), %%mm1\n\t"
-" movq 96(%%edx), %%mm5\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, 64(%%ecx)\n\t"
+" movq %%mm4, 72(%%ecx)\n\t"
+" pfsubr %%mm1, %%mm3\n\t"
+" pfsubr %%mm5, %%mm7\n\t"
+" pfmul 64(%%ebx), %%mm3\n\t"
+" pfmul 72(%%ebx), %%mm7\n\t"
+" movd %%mm3, 124(%%ecx)\n\t"
+" movd %%mm7, 116(%%ecx)\n\t"
+" psrlq $32, %%mm3\n\t"
+" psrlq $32, %%mm7\n\t"
+" movd %%mm3, 120(%%ecx)\n\t"
+" movd %%mm7, 112(%%ecx)\n\t"
+
+" movq 80(%%edx), %%mm0\n\t"
+" movq 88(%%edx), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" movq 104(%%edx), %%mm1\n\t"
+" movq 96(%%edx), %%mm5\n\t"
/* n.b.: pswapd*/
-" movq %%mm1, %%mm2\n\t"
-" movq %%mm5, %%mm6\n\t"
-" psrlq $32, %%mm1\n\t"
-" psrlq $32, %%mm5\n\t"
-" punpckldq %%mm2, %%mm1\n\t"
-" punpckldq %%mm6, %%mm5\n\t"
+" movq %%mm1, %%mm2\n\t"
+" movq %%mm5, %%mm6\n\t"
+" psrlq $32, %%mm1\n\t"
+" psrlq $32, %%mm5\n\t"
+" punpckldq %%mm2, %%mm1\n\t"
+" punpckldq %%mm6, %%mm5\n\t"
/**/
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, 80(%%ecx)\n\t"
-" movq %%mm4, 88(%%ecx)\n\t"
-" pfsubr %%mm1, %%mm3\n\t"
-" pfsubr %%mm5, %%mm7\n\t"
-" pfmul 80(%%ebx), %%mm3\n\t"
-" pfmul 88(%%ebx), %%mm7\n\t"
-" movd %%mm3, 108(%%ecx)\n\t"
-" movd %%mm7, 100(%%ecx)\n\t"
-" psrlq $32, %%mm3\n\t"
-" psrlq $32, %%mm7\n\t"
-" movd %%mm3, 104(%%ecx)\n\t"
-" movd %%mm7, 96(%%ecx)\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, 80(%%ecx)\n\t"
+" movq %%mm4, 88(%%ecx)\n\t"
+" pfsubr %%mm1, %%mm3\n\t"
+" pfsubr %%mm5, %%mm7\n\t"
+" pfmul 80(%%ebx), %%mm3\n\t"
+" pfmul 88(%%ebx), %%mm7\n\t"
+" movd %%mm3, 108(%%ecx)\n\t"
+" movd %%mm7, 100(%%ecx)\n\t"
+" psrlq $32, %%mm3\n\t"
+" psrlq $32, %%mm7\n\t"
+" movd %%mm3, 104(%%ecx)\n\t"
+" movd %%mm7, 96(%%ecx)\n\t"
/* Phase 4*/
-" movq (%%ecx), %%mm0\n\t"
-" movq 8(%%ecx), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" movq 24(%%ecx), %%mm1\n\t"
-" movq 16(%%ecx), %%mm5\n\t"
+" movq (%%ecx), %%mm0\n\t"
+" movq 8(%%ecx), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" movq 24(%%ecx), %%mm1\n\t"
+" movq 16(%%ecx), %%mm5\n\t"
/* n.b.: pswapd*/
-" movq %%mm1, %%mm2\n\t"
-" movq %%mm5, %%mm6\n\t"
-" psrlq $32, %%mm1\n\t"
-" psrlq $32, %%mm5\n\t"
-" punpckldq %%mm2, %%mm1\n\t"
-" punpckldq %%mm6, %%mm5\n\t"
+" movq %%mm1, %%mm2\n\t"
+" movq %%mm5, %%mm6\n\t"
+" psrlq $32, %%mm1\n\t"
+" psrlq $32, %%mm5\n\t"
+" punpckldq %%mm2, %%mm1\n\t"
+" punpckldq %%mm6, %%mm5\n\t"
/**/
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, (%%edx)\n\t"
-" movq %%mm4, 8(%%edx)\n\t"
-" pfsub %%mm1, %%mm3\n\t"
-" pfsub %%mm5, %%mm7\n\t"
-" pfmul 96(%%ebx), %%mm3\n\t"
-" pfmul 104(%%ebx), %%mm7\n\t"
-" movd %%mm3, 28(%%edx)\n\t"
-" movd %%mm7, 20(%%edx)\n\t"
-" psrlq $32, %%mm3\n\t"
-" psrlq $32, %%mm7\n\t"
-" movd %%mm3, 24(%%edx)\n\t"
-" movd %%mm7, 16(%%edx)\n\t"
-
-" movq 32(%%ecx), %%mm0\n\t"
-" movq 40(%%ecx), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" movq 56(%%ecx), %%mm1\n\t"
-" movq 48(%%ecx), %%mm5\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, (%%edx)\n\t"
+" movq %%mm4, 8(%%edx)\n\t"
+" pfsub %%mm1, %%mm3\n\t"
+" pfsub %%mm5, %%mm7\n\t"
+" pfmul 96(%%ebx), %%mm3\n\t"
+" pfmul 104(%%ebx), %%mm7\n\t"
+" movd %%mm3, 28(%%edx)\n\t"
+" movd %%mm7, 20(%%edx)\n\t"
+" psrlq $32, %%mm3\n\t"
+" psrlq $32, %%mm7\n\t"
+" movd %%mm3, 24(%%edx)\n\t"
+" movd %%mm7, 16(%%edx)\n\t"
+
+" movq 32(%%ecx), %%mm0\n\t"
+" movq 40(%%ecx), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" movq 56(%%ecx), %%mm1\n\t"
+" movq 48(%%ecx), %%mm5\n\t"
/* n.b.: pswapd*/
-" movq %%mm1, %%mm2\n\t"
-" movq %%mm5, %%mm6\n\t"
-" psrlq $32, %%mm1\n\t"
-" psrlq $32, %%mm5\n\t"
-" punpckldq %%mm2, %%mm1\n\t"
-" punpckldq %%mm6, %%mm5\n\t"
+" movq %%mm1, %%mm2\n\t"
+" movq %%mm5, %%mm6\n\t"
+" psrlq $32, %%mm1\n\t"
+" psrlq $32, %%mm5\n\t"
+" punpckldq %%mm2, %%mm1\n\t"
+" punpckldq %%mm6, %%mm5\n\t"
/**/
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, 32(%%edx)\n\t"
-" movq %%mm4, 40(%%edx)\n\t"
-" pfsubr %%mm1, %%mm3\n\t"
-" pfsubr %%mm5, %%mm7\n\t"
-" pfmul 96(%%ebx), %%mm3\n\t"
-" pfmul 104(%%ebx), %%mm7\n\t"
-" movd %%mm3, 60(%%edx)\n\t"
-" movd %%mm7, 52(%%edx)\n\t"
-" psrlq $32, %%mm3\n\t"
-" psrlq $32, %%mm7\n\t"
-" movd %%mm3, 56(%%edx)\n\t"
-" movd %%mm7, 48(%%edx)\n\t"
-
-" movq 64(%%ecx), %%mm0\n\t"
-" movq 72(%%ecx), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" movq 88(%%ecx), %%mm1\n\t"
-" movq 80(%%ecx), %%mm5\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, 32(%%edx)\n\t"
+" movq %%mm4, 40(%%edx)\n\t"
+" pfsubr %%mm1, %%mm3\n\t"
+" pfsubr %%mm5, %%mm7\n\t"
+" pfmul 96(%%ebx), %%mm3\n\t"
+" pfmul 104(%%ebx), %%mm7\n\t"
+" movd %%mm3, 60(%%edx)\n\t"
+" movd %%mm7, 52(%%edx)\n\t"
+" psrlq $32, %%mm3\n\t"
+" psrlq $32, %%mm7\n\t"
+" movd %%mm3, 56(%%edx)\n\t"
+" movd %%mm7, 48(%%edx)\n\t"
+
+" movq 64(%%ecx), %%mm0\n\t"
+" movq 72(%%ecx), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" movq 88(%%ecx), %%mm1\n\t"
+" movq 80(%%ecx), %%mm5\n\t"
/* n.b.: pswapd*/
-" movq %%mm1, %%mm2\n\t"
-" movq %%mm5, %%mm6\n\t"
-" psrlq $32, %%mm1\n\t"
-" psrlq $32, %%mm5\n\t"
-" punpckldq %%mm2, %%mm1\n\t"
-" punpckldq %%mm6, %%mm5\n\t"
+" movq %%mm1, %%mm2\n\t"
+" movq %%mm5, %%mm6\n\t"
+" psrlq $32, %%mm1\n\t"
+" psrlq $32, %%mm5\n\t"
+" punpckldq %%mm2, %%mm1\n\t"
+" punpckldq %%mm6, %%mm5\n\t"
/**/
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, 64(%%edx)\n\t"
-" movq %%mm4, 72(%%edx)\n\t"
-" pfsub %%mm1, %%mm3\n\t"
-" pfsub %%mm5, %%mm7\n\t"
-" pfmul 96(%%ebx), %%mm3\n\t"
-" pfmul 104(%%ebx), %%mm7\n\t"
-" movd %%mm3, 92(%%edx)\n\t"
-" movd %%mm7, 84(%%edx)\n\t"
-" psrlq $32, %%mm3\n\t"
-" psrlq $32, %%mm7\n\t"
-" movd %%mm3, 88(%%edx)\n\t"
-" movd %%mm7, 80(%%edx)\n\t"
-
-" movq 96(%%ecx), %%mm0\n\t"
-" movq 104(%%ecx), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" movq 120(%%ecx), %%mm1\n\t"
-" movq 112(%%ecx), %%mm5\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, 64(%%edx)\n\t"
+" movq %%mm4, 72(%%edx)\n\t"
+" pfsub %%mm1, %%mm3\n\t"
+" pfsub %%mm5, %%mm7\n\t"
+" pfmul 96(%%ebx), %%mm3\n\t"
+" pfmul 104(%%ebx), %%mm7\n\t"
+" movd %%mm3, 92(%%edx)\n\t"
+" movd %%mm7, 84(%%edx)\n\t"
+" psrlq $32, %%mm3\n\t"
+" psrlq $32, %%mm7\n\t"
+" movd %%mm3, 88(%%edx)\n\t"
+" movd %%mm7, 80(%%edx)\n\t"
+
+" movq 96(%%ecx), %%mm0\n\t"
+" movq 104(%%ecx), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" movq 120(%%ecx), %%mm1\n\t"
+" movq 112(%%ecx), %%mm5\n\t"
/* n.b.: pswapd*/
-" movq %%mm1, %%mm2\n\t"
-" movq %%mm5, %%mm6\n\t"
-" psrlq $32, %%mm1\n\t"
-" psrlq $32, %%mm5\n\t"
-" punpckldq %%mm2, %%mm1\n\t"
-" punpckldq %%mm6, %%mm5\n\t"
+" movq %%mm1, %%mm2\n\t"
+" movq %%mm5, %%mm6\n\t"
+" psrlq $32, %%mm1\n\t"
+" psrlq $32, %%mm5\n\t"
+" punpckldq %%mm2, %%mm1\n\t"
+" punpckldq %%mm6, %%mm5\n\t"
/**/
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, 96(%%edx)\n\t"
-" movq %%mm4, 104(%%edx)\n\t"
-" pfsubr %%mm1, %%mm3\n\t"
-" pfsubr %%mm5, %%mm7\n\t"
-" pfmul 96(%%ebx), %%mm3\n\t"
-" pfmul 104(%%ebx), %%mm7\n\t"
-" movd %%mm3, 124(%%edx)\n\t"
-" movd %%mm7, 116(%%edx)\n\t"
-" psrlq $32, %%mm3\n\t"
-" psrlq $32, %%mm7\n\t"
-" movd %%mm3, 120(%%edx)\n\t"
-" movd %%mm7, 112(%%edx)\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, 96(%%edx)\n\t"
+" movq %%mm4, 104(%%edx)\n\t"
+" pfsubr %%mm1, %%mm3\n\t"
+" pfsubr %%mm5, %%mm7\n\t"
+" pfmul 96(%%ebx), %%mm3\n\t"
+" pfmul 104(%%ebx), %%mm7\n\t"
+" movd %%mm3, 124(%%edx)\n\t"
+" movd %%mm7, 116(%%edx)\n\t"
+" psrlq $32, %%mm3\n\t"
+" psrlq $32, %%mm7\n\t"
+" movd %%mm3, 120(%%edx)\n\t"
+" movd %%mm7, 112(%%edx)\n\t"
/* Phase 5 */
-" movq (%%edx), %%mm0\n\t"
-" movq 16(%%edx), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" movq 8(%%edx), %%mm1\n\t"
-" movq 24(%%edx), %%mm5\n\t"
+" movq (%%edx), %%mm0\n\t"
+" movq 16(%%edx), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" movq 8(%%edx), %%mm1\n\t"
+" movq 24(%%edx), %%mm5\n\t"
/* n.b.: pswapd*/
-" movq %%mm1, %%mm2\n\t"
-" movq %%mm5, %%mm6\n\t"
-" psrlq $32, %%mm1\n\t"
-" psrlq $32, %%mm5\n\t"
-" punpckldq %%mm2, %%mm1\n\t"
-" punpckldq %%mm6, %%mm5\n\t"
+" movq %%mm1, %%mm2\n\t"
+" movq %%mm5, %%mm6\n\t"
+" psrlq $32, %%mm1\n\t"
+" psrlq $32, %%mm5\n\t"
+" punpckldq %%mm2, %%mm1\n\t"
+" punpckldq %%mm6, %%mm5\n\t"
/**/
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, (%%ecx)\n\t"
-" movq %%mm4, 16(%%ecx)\n\t"
-" pfsub %%mm1, %%mm3\n\t"
-" pfsubr %%mm5, %%mm7\n\t"
-" pfmul 112(%%ebx), %%mm3\n\t"
-" pfmul 112(%%ebx), %%mm7\n\t"
-" movd %%mm3, 12(%%ecx)\n\t"
-" movd %%mm7, 28(%%ecx)\n\t"
-" psrlq $32, %%mm3\n\t"
-" psrlq $32, %%mm7\n\t"
-" movd %%mm3, 8(%%ecx)\n\t"
-" movd %%mm7, 24(%%ecx)\n\t"
-
-" movq 32(%%edx), %%mm0\n\t"
-" movq 48(%%edx), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" movq 40(%%edx), %%mm1\n\t"
-" movq 56(%%edx), %%mm5\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, (%%ecx)\n\t"
+" movq %%mm4, 16(%%ecx)\n\t"
+" pfsub %%mm1, %%mm3\n\t"
+" pfsubr %%mm5, %%mm7\n\t"
+" pfmul 112(%%ebx), %%mm3\n\t"
+" pfmul 112(%%ebx), %%mm7\n\t"
+" movd %%mm3, 12(%%ecx)\n\t"
+" movd %%mm7, 28(%%ecx)\n\t"
+" psrlq $32, %%mm3\n\t"
+" psrlq $32, %%mm7\n\t"
+" movd %%mm3, 8(%%ecx)\n\t"
+" movd %%mm7, 24(%%ecx)\n\t"
+
+" movq 32(%%edx), %%mm0\n\t"
+" movq 48(%%edx), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" movq 40(%%edx), %%mm1\n\t"
+" movq 56(%%edx), %%mm5\n\t"
/* n.b.: pswapd*/
-" movq %%mm1, %%mm2\n\t"
-" movq %%mm5, %%mm6\n\t"
-" psrlq $32, %%mm1\n\t"
-" psrlq $32, %%mm5\n\t"
-" punpckldq %%mm2, %%mm1\n\t"
-" punpckldq %%mm6, %%mm5\n\t"
+" movq %%mm1, %%mm2\n\t"
+" movq %%mm5, %%mm6\n\t"
+" psrlq $32, %%mm1\n\t"
+" psrlq $32, %%mm5\n\t"
+" punpckldq %%mm2, %%mm1\n\t"
+" punpckldq %%mm6, %%mm5\n\t"
/**/
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, 32(%%ecx)\n\t"
-" movq %%mm4, 48(%%ecx)\n\t"
-" pfsub %%mm1, %%mm3\n\t"
-" pfsubr %%mm5, %%mm7\n\t"
-" pfmul 112(%%ebx), %%mm3\n\t"
-" pfmul 112(%%ebx), %%mm7\n\t"
-" movd %%mm3, 44(%%ecx)\n\t"
-" movd %%mm7, 60(%%ecx)\n\t"
-" psrlq $32, %%mm3\n\t"
-" psrlq $32, %%mm7\n\t"
-" movd %%mm3, 40(%%ecx)\n\t"
-" movd %%mm7, 56(%%ecx)\n\t"
-
-" movq 64(%%edx), %%mm0\n\t"
-" movq 80(%%edx), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" movq 72(%%edx), %%mm1\n\t"
-" movq 88(%%edx), %%mm5\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, 32(%%ecx)\n\t"
+" movq %%mm4, 48(%%ecx)\n\t"
+" pfsub %%mm1, %%mm3\n\t"
+" pfsubr %%mm5, %%mm7\n\t"
+" pfmul 112(%%ebx), %%mm3\n\t"
+" pfmul 112(%%ebx), %%mm7\n\t"
+" movd %%mm3, 44(%%ecx)\n\t"
+" movd %%mm7, 60(%%ecx)\n\t"
+" psrlq $32, %%mm3\n\t"
+" psrlq $32, %%mm7\n\t"
+" movd %%mm3, 40(%%ecx)\n\t"
+" movd %%mm7, 56(%%ecx)\n\t"
+
+" movq 64(%%edx), %%mm0\n\t"
+" movq 80(%%edx), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" movq 72(%%edx), %%mm1\n\t"
+" movq 88(%%edx), %%mm5\n\t"
/* n.b.: pswapd*/
-" movq %%mm1, %%mm2\n\t"
-" movq %%mm5, %%mm6\n\t"
-" psrlq $32, %%mm1\n\t"
-" psrlq $32, %%mm5\n\t"
-" punpckldq %%mm2, %%mm1\n\t"
-" punpckldq %%mm6, %%mm5\n\t"
+" movq %%mm1, %%mm2\n\t"
+" movq %%mm5, %%mm6\n\t"
+" psrlq $32, %%mm1\n\t"
+" psrlq $32, %%mm5\n\t"
+" punpckldq %%mm2, %%mm1\n\t"
+" punpckldq %%mm6, %%mm5\n\t"
/**/
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, 64(%%ecx)\n\t"
-" movq %%mm4, 80(%%ecx)\n\t"
-" pfsub %%mm1, %%mm3\n\t"
-" pfsubr %%mm5, %%mm7\n\t"
-" pfmul 112(%%ebx), %%mm3\n\t"
-" pfmul 112(%%ebx), %%mm7\n\t"
-" movd %%mm3, 76(%%ecx)\n\t"
-" movd %%mm7, 92(%%ecx)\n\t"
-" psrlq $32, %%mm3\n\t"
-" psrlq $32, %%mm7\n\t"
-" movd %%mm3, 72(%%ecx)\n\t"
-" movd %%mm7, 88(%%ecx)\n\t"
-
-" movq 96(%%edx), %%mm0\n\t"
-" movq 112(%%edx), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" movq 104(%%edx), %%mm1\n\t"
-" movq 120(%%edx), %%mm5\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, 64(%%ecx)\n\t"
+" movq %%mm4, 80(%%ecx)\n\t"
+" pfsub %%mm1, %%mm3\n\t"
+" pfsubr %%mm5, %%mm7\n\t"
+" pfmul 112(%%ebx), %%mm3\n\t"
+" pfmul 112(%%ebx), %%mm7\n\t"
+" movd %%mm3, 76(%%ecx)\n\t"
+" movd %%mm7, 92(%%ecx)\n\t"
+" psrlq $32, %%mm3\n\t"
+" psrlq $32, %%mm7\n\t"
+" movd %%mm3, 72(%%ecx)\n\t"
+" movd %%mm7, 88(%%ecx)\n\t"
+
+" movq 96(%%edx), %%mm0\n\t"
+" movq 112(%%edx), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" movq 104(%%edx), %%mm1\n\t"
+" movq 120(%%edx), %%mm5\n\t"
/* n.b.: pswapd*/
-" movq %%mm1, %%mm2\n\t"
-" movq %%mm5, %%mm6\n\t"
-" psrlq $32, %%mm1\n\t"
-" psrlq $32, %%mm5\n\t"
-" punpckldq %%mm2, %%mm1\n\t"
-" punpckldq %%mm6, %%mm5\n\t"
+" movq %%mm1, %%mm2\n\t"
+" movq %%mm5, %%mm6\n\t"
+" psrlq $32, %%mm1\n\t"
+" psrlq $32, %%mm5\n\t"
+" punpckldq %%mm2, %%mm1\n\t"
+" punpckldq %%mm6, %%mm5\n\t"
/**/
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, 96(%%ecx)\n\t"
-" movq %%mm4, 112(%%ecx)\n\t"
-" pfsub %%mm1, %%mm3\n\t"
-" pfsubr %%mm5, %%mm7\n\t"
-" pfmul 112(%%ebx), %%mm3\n\t"
-" pfmul 112(%%ebx), %%mm7\n\t"
-" movd %%mm3, 108(%%ecx)\n\t"
-" movd %%mm7, 124(%%ecx)\n\t"
-" psrlq $32, %%mm3\n\t"
-" psrlq $32, %%mm7\n\t"
-" movd %%mm3, 104(%%ecx)\n\t"
-" movd %%mm7, 120(%%ecx)\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, 96(%%ecx)\n\t"
+" movq %%mm4, 112(%%ecx)\n\t"
+" pfsub %%mm1, %%mm3\n\t"
+" pfsubr %%mm5, %%mm7\n\t"
+" pfmul 112(%%ebx), %%mm3\n\t"
+" pfmul 112(%%ebx), %%mm7\n\t"
+" movd %%mm3, 108(%%ecx)\n\t"
+" movd %%mm7, 124(%%ecx)\n\t"
+" psrlq $32, %%mm3\n\t"
+" psrlq $32, %%mm7\n\t"
+" movd %%mm3, 104(%%ecx)\n\t"
+" movd %%mm7, 120(%%ecx)\n\t"
/* Phase 6. This is the end of easy road. */
/* Code below is coded in scalar mode. Should be optimized */
-" movd "MANGLE(plus_1f)", %%mm6\n\t"
-" punpckldq 120(%%ebx), %%mm6\n\t" /* mm6 = 1.0 | 120(%%ebx)*/
-" movq "MANGLE(x_plus_minus_3dnow)", %%mm7\n\t" /* mm7 = +1 | -1 */
-
-" movq 32(%%ecx), %%mm0\n\t"
-" movq 64(%%ecx), %%mm2\n\t"
-" movq %%mm0, %%mm1\n\t"
-" movq %%mm2, %%mm3\n\t"
-" pxor %%mm7, %%mm1\n\t"
-" pxor %%mm7, %%mm3\n\t"
-" pfacc %%mm1, %%mm0\n\t"
-" pfacc %%mm3, %%mm2\n\t"
-" pfmul %%mm6, %%mm0\n\t"
-" pfmul %%mm6, %%mm2\n\t"
-" movq %%mm0, 32(%%edx)\n\t"
-" movq %%mm2, 64(%%edx)\n\t"
-
-" movd 44(%%ecx), %%mm0\n\t"
-" movd 40(%%ecx), %%mm2\n\t"
-" movd 120(%%ebx), %%mm3\n\t"
-" punpckldq 76(%%ecx), %%mm0\n\t"
-" punpckldq 72(%%ecx), %%mm2\n\t"
-" punpckldq %%mm3, %%mm3\n\t"
-" movq %%mm0, %%mm4\n\t"
-" movq %%mm2, %%mm5\n\t"
-" pfsub %%mm2, %%mm0\n\t"
-" pfmul %%mm3, %%mm0\n\t"
-" movq %%mm0, %%mm1\n\t"
-" pfadd %%mm5, %%mm0\n\t"
-" pfadd %%mm4, %%mm0\n\t"
-" movq %%mm0, %%mm2\n\t"
-" punpckldq %%mm1, %%mm0\n\t"
-" punpckhdq %%mm1, %%mm2\n\t"
-" movq %%mm0, 40(%%edx)\n\t"
-" movq %%mm2, 72(%%edx)\n\t"
-
-" movd 48(%%ecx), %%mm3\n\t"
-" movd 60(%%ecx), %%mm2\n\t"
-" pfsub 52(%%ecx), %%mm3\n\t"
-" pfsub 56(%%ecx), %%mm2\n\t"
-" pfmul 120(%%ebx), %%mm3\n\t"
-" pfmul 120(%%ebx), %%mm2\n\t"
-" movq %%mm2, %%mm1\n\t"
-
-" pfadd 56(%%ecx), %%mm1\n\t"
-" pfadd 60(%%ecx), %%mm1\n\t"
-" movq %%mm1, %%mm0\n\t"
-
-" pfadd 48(%%ecx), %%mm0\n\t"
-" pfadd 52(%%ecx), %%mm0\n\t"
-" pfadd %%mm3, %%mm1\n\t"
-" punpckldq %%mm2, %%mm1\n\t"
-" pfadd %%mm3, %%mm2\n\t"
-" punpckldq %%mm2, %%mm0\n\t"
-" movq %%mm1, 56(%%edx)\n\t"
-" movq %%mm0, 48(%%edx)\n\t"
+" movd "MANGLE(plus_1f)", %%mm6\n\t"
+" punpckldq 120(%%ebx), %%mm6\n\t" /* mm6 = 1.0 | 120(%%ebx)*/
+" movq "MANGLE(x_plus_minus_3dnow)", %%mm7\n\t" /* mm7 = +1 | -1 */
+
+" movq 32(%%ecx), %%mm0\n\t"
+" movq 64(%%ecx), %%mm2\n\t"
+" movq %%mm0, %%mm1\n\t"
+" movq %%mm2, %%mm3\n\t"
+" pxor %%mm7, %%mm1\n\t"
+" pxor %%mm7, %%mm3\n\t"
+" pfacc %%mm1, %%mm0\n\t"
+" pfacc %%mm3, %%mm2\n\t"
+" pfmul %%mm6, %%mm0\n\t"
+" pfmul %%mm6, %%mm2\n\t"
+" movq %%mm0, 32(%%edx)\n\t"
+" movq %%mm2, 64(%%edx)\n\t"
+
+" movd 44(%%ecx), %%mm0\n\t"
+" movd 40(%%ecx), %%mm2\n\t"
+" movd 120(%%ebx), %%mm3\n\t"
+" punpckldq 76(%%ecx), %%mm0\n\t"
+" punpckldq 72(%%ecx), %%mm2\n\t"
+" punpckldq %%mm3, %%mm3\n\t"
+" movq %%mm0, %%mm4\n\t"
+" movq %%mm2, %%mm5\n\t"
+" pfsub %%mm2, %%mm0\n\t"
+" pfmul %%mm3, %%mm0\n\t"
+" movq %%mm0, %%mm1\n\t"
+" pfadd %%mm5, %%mm0\n\t"
+" pfadd %%mm4, %%mm0\n\t"
+" movq %%mm0, %%mm2\n\t"
+" punpckldq %%mm1, %%mm0\n\t"
+" punpckhdq %%mm1, %%mm2\n\t"
+" movq %%mm0, 40(%%edx)\n\t"
+" movq %%mm2, 72(%%edx)\n\t"
+
+" movd 48(%%ecx), %%mm3\n\t"
+" movd 60(%%ecx), %%mm2\n\t"
+" pfsub 52(%%ecx), %%mm3\n\t"
+" pfsub 56(%%ecx), %%mm2\n\t"
+" pfmul 120(%%ebx), %%mm3\n\t"
+" pfmul 120(%%ebx), %%mm2\n\t"
+" movq %%mm2, %%mm1\n\t"
+
+" pfadd 56(%%ecx), %%mm1\n\t"
+" pfadd 60(%%ecx), %%mm1\n\t"
+" movq %%mm1, %%mm0\n\t"
+
+" pfadd 48(%%ecx), %%mm0\n\t"
+" pfadd 52(%%ecx), %%mm0\n\t"
+" pfadd %%mm3, %%mm1\n\t"
+" punpckldq %%mm2, %%mm1\n\t"
+" pfadd %%mm3, %%mm2\n\t"
+" punpckldq %%mm2, %%mm0\n\t"
+" movq %%mm1, 56(%%edx)\n\t"
+" movq %%mm0, 48(%%edx)\n\t"
/*---*/
-" movd 92(%%ecx), %%mm1\n\t"
-" pfsub 88(%%ecx), %%mm1\n\t"
-" pfmul 120(%%ebx), %%mm1\n\t"
-" movd %%mm1, 92(%%edx)\n\t"
-" pfadd 92(%%ecx), %%mm1\n\t"
-" pfadd 88(%%ecx), %%mm1\n\t"
-" movq %%mm1, %%mm0\n\t"
-
-" pfadd 80(%%ecx), %%mm0\n\t"
-" pfadd 84(%%ecx), %%mm0\n\t"
-" movd %%mm0, 80(%%edx)\n\t"
-
-" movd 80(%%ecx), %%mm0\n\t"
-" pfsub 84(%%ecx), %%mm0\n\t"
-" pfmul 120(%%ebx), %%mm0\n\t"
-" pfadd %%mm0, %%mm1\n\t"
-" pfadd 92(%%edx), %%mm0\n\t"
-" punpckldq %%mm1, %%mm0\n\t"
-" movq %%mm0, 84(%%edx)\n\t"
-
-" movq 96(%%ecx), %%mm0\n\t"
-" movq %%mm0, %%mm1\n\t"
-" pxor %%mm7, %%mm1\n\t"
-" pfacc %%mm1, %%mm0\n\t"
-" pfmul %%mm6, %%mm0\n\t"
-" movq %%mm0, 96(%%edx)\n\t"
-
-" movd 108(%%ecx), %%mm0\n\t"
-" pfsub 104(%%ecx), %%mm0\n\t"
-" pfmul 120(%%ebx), %%mm0\n\t"
-" movd %%mm0, 108(%%edx)\n\t"
-" pfadd 104(%%ecx), %%mm0\n\t"
-" pfadd 108(%%ecx), %%mm0\n\t"
-" movd %%mm0, 104(%%edx)\n\t"
-
-" movd 124(%%ecx), %%mm1\n\t"
-" pfsub 120(%%ecx), %%mm1\n\t"
-" pfmul 120(%%ebx), %%mm1\n\t"
-" movd %%mm1, 124(%%edx)\n\t"
-" pfadd 120(%%ecx), %%mm1\n\t"
-" pfadd 124(%%ecx), %%mm1\n\t"
-" movq %%mm1, %%mm0\n\t"
-
-" pfadd 112(%%ecx), %%mm0\n\t"
-" pfadd 116(%%ecx), %%mm0\n\t"
-" movd %%mm0, 112(%%edx)\n\t"
-
-" movd 112(%%ecx), %%mm0\n\t"
-" pfsub 116(%%ecx), %%mm0\n\t"
-" pfmul 120(%%ebx), %%mm0\n\t"
-" pfadd %%mm0,%%mm1\n\t"
-" pfadd 124(%%edx), %%mm0\n\t"
-" punpckldq %%mm1, %%mm0\n\t"
-" movq %%mm0, 116(%%edx)\n\t"
+" movd 92(%%ecx), %%mm1\n\t"
+" pfsub 88(%%ecx), %%mm1\n\t"
+" pfmul 120(%%ebx), %%mm1\n\t"
+" movd %%mm1, 92(%%edx)\n\t"
+" pfadd 92(%%ecx), %%mm1\n\t"
+" pfadd 88(%%ecx), %%mm1\n\t"
+" movq %%mm1, %%mm0\n\t"
+
+" pfadd 80(%%ecx), %%mm0\n\t"
+" pfadd 84(%%ecx), %%mm0\n\t"
+" movd %%mm0, 80(%%edx)\n\t"
+
+" movd 80(%%ecx), %%mm0\n\t"
+" pfsub 84(%%ecx), %%mm0\n\t"
+" pfmul 120(%%ebx), %%mm0\n\t"
+" pfadd %%mm0, %%mm1\n\t"
+" pfadd 92(%%edx), %%mm0\n\t"
+" punpckldq %%mm1, %%mm0\n\t"
+" movq %%mm0, 84(%%edx)\n\t"
+
+" movq 96(%%ecx), %%mm0\n\t"
+" movq %%mm0, %%mm1\n\t"
+" pxor %%mm7, %%mm1\n\t"
+" pfacc %%mm1, %%mm0\n\t"
+" pfmul %%mm6, %%mm0\n\t"
+" movq %%mm0, 96(%%edx)\n\t"
+
+" movd 108(%%ecx), %%mm0\n\t"
+" pfsub 104(%%ecx), %%mm0\n\t"
+" pfmul 120(%%ebx), %%mm0\n\t"
+" movd %%mm0, 108(%%edx)\n\t"
+" pfadd 104(%%ecx), %%mm0\n\t"
+" pfadd 108(%%ecx), %%mm0\n\t"
+" movd %%mm0, 104(%%edx)\n\t"
+
+" movd 124(%%ecx), %%mm1\n\t"
+" pfsub 120(%%ecx), %%mm1\n\t"
+" pfmul 120(%%ebx), %%mm1\n\t"
+" movd %%mm1, 124(%%edx)\n\t"
+" pfadd 120(%%ecx), %%mm1\n\t"
+" pfadd 124(%%ecx), %%mm1\n\t"
+" movq %%mm1, %%mm0\n\t"
+
+" pfadd 112(%%ecx), %%mm0\n\t"
+" pfadd 116(%%ecx), %%mm0\n\t"
+" movd %%mm0, 112(%%edx)\n\t"
+
+" movd 112(%%ecx), %%mm0\n\t"
+" pfsub 116(%%ecx), %%mm0\n\t"
+" pfmul 120(%%ebx), %%mm0\n\t"
+" pfadd %%mm0,%%mm1\n\t"
+" pfadd 124(%%edx), %%mm0\n\t"
+" punpckldq %%mm1, %%mm0\n\t"
+" movq %%mm0, 116(%%edx)\n\t"
// this code is broken, there is nothing modifying the z flag above.
#if 0
-" jnz .L01\n\t"
+" jnz .L01\n\t"
/* Phase 7*/
/* Code below is coded in scalar mode. Should be optimized */
-" movd (%%ecx), %%mm0\n\t"
-" pfadd 4(%%ecx), %%mm0\n\t"
-" movd %%mm0, 1024(%%esi)\n\t"
-
-" movd (%%ecx), %%mm0\n\t"
-" pfsub 4(%%ecx), %%mm0\n\t"
-" pfmul 120(%%ebx), %%mm0\n\t"
-" movd %%mm0, (%%esi)\n\t"
-" movd %%mm0, (%%edi)\n\t"
-
-" movd 12(%%ecx), %%mm0\n\t"
-" pfsub 8(%%ecx), %%mm0\n\t"
-" pfmul 120(%%ebx), %%mm0\n\t"
-" movd %%mm0, 512(%%edi)\n\t"
-" pfadd 12(%%ecx), %%mm0\n\t"
-" pfadd 8(%%ecx), %%mm0\n\t"
-" movd %%mm0, 512(%%esi)\n\t"
-
-" movd 16(%%ecx), %%mm0\n\t"
-" pfsub 20(%%ecx), %%mm0\n\t"
-" pfmul 120(%%ebx), %%mm0\n\t"
-" movq %%mm0, %%mm3\n\t"
-
-" movd 28(%%ecx), %%mm0\n\t"
-" pfsub 24(%%ecx), %%mm0\n\t"
-" pfmul 120(%%ebx), %%mm0\n\t"
-" movd %%mm0, 768(%%edi)\n\t"
-" movq %%mm0, %%mm2\n\t"
-
-" pfadd 24(%%ecx), %%mm0\n\t"
-" pfadd 28(%%ecx), %%mm0\n\t"
-" movq %%mm0, %%mm1\n\t"
-
-" pfadd 16(%%ecx), %%mm0\n\t"
-" pfadd 20(%%ecx), %%mm0\n\t"
-" movd %%mm0, 768(%%esi)\n\t"
-" pfadd %%mm3, %%mm1\n\t"
-" movd %%mm1, 256(%%esi)\n\t"
-" pfadd %%mm3, %%mm2\n\t"
-" movd %%mm2, 256(%%edi)\n\t"
+" movd (%%ecx), %%mm0\n\t"
+" pfadd 4(%%ecx), %%mm0\n\t"
+" movd %%mm0, 1024(%%esi)\n\t"
+
+" movd (%%ecx), %%mm0\n\t"
+" pfsub 4(%%ecx), %%mm0\n\t"
+" pfmul 120(%%ebx), %%mm0\n\t"
+" movd %%mm0, (%%esi)\n\t"
+" movd %%mm0, (%%edi)\n\t"
+
+" movd 12(%%ecx), %%mm0\n\t"
+" pfsub 8(%%ecx), %%mm0\n\t"
+" pfmul 120(%%ebx), %%mm0\n\t"
+" movd %%mm0, 512(%%edi)\n\t"
+" pfadd 12(%%ecx), %%mm0\n\t"
+" pfadd 8(%%ecx), %%mm0\n\t"
+" movd %%mm0, 512(%%esi)\n\t"
+
+" movd 16(%%ecx), %%mm0\n\t"
+" pfsub 20(%%ecx), %%mm0\n\t"
+" pfmul 120(%%ebx), %%mm0\n\t"
+" movq %%mm0, %%mm3\n\t"
+
+" movd 28(%%ecx), %%mm0\n\t"
+" pfsub 24(%%ecx), %%mm0\n\t"
+" pfmul 120(%%ebx), %%mm0\n\t"
+" movd %%mm0, 768(%%edi)\n\t"
+" movq %%mm0, %%mm2\n\t"
+
+" pfadd 24(%%ecx), %%mm0\n\t"
+" pfadd 28(%%ecx), %%mm0\n\t"
+" movq %%mm0, %%mm1\n\t"
+
+" pfadd 16(%%ecx), %%mm0\n\t"
+" pfadd 20(%%ecx), %%mm0\n\t"
+" movd %%mm0, 768(%%esi)\n\t"
+" pfadd %%mm3, %%mm1\n\t"
+" movd %%mm1, 256(%%esi)\n\t"
+" pfadd %%mm3, %%mm2\n\t"
+" movd %%mm2, 256(%%edi)\n\t"
/* Phase 8*/
-" movq 32(%%edx), %%mm0\n\t"
-" movq 48(%%edx), %%mm1\n\t"
-" pfadd 48(%%edx), %%mm0\n\t"
-" pfadd 40(%%edx), %%mm1\n\t"
-" movd %%mm0, 896(%%esi)\n\t"
-" movd %%mm1, 640(%%esi)\n\t"
-" psrlq $32, %%mm0\n\t"
-" psrlq $32, %%mm1\n\t"
-" movd %%mm0, 128(%%edi)\n\t"
-" movd %%mm1, 384(%%edi)\n\t"
-
-" movd 40(%%edx), %%mm0\n\t"
-" pfadd 56(%%edx), %%mm0\n\t"
-" movd %%mm0, 384(%%esi)\n\t"
-
-" movd 56(%%edx), %%mm0\n\t"
-" pfadd 36(%%edx), %%mm0\n\t"
-" movd %%mm0, 128(%%esi)\n\t"
-
-" movd 60(%%edx), %%mm0\n\t"
-" movd %%mm0, 896(%%edi)\n\t"
-" pfadd 44(%%edx), %%mm0\n\t"
-" movd %%mm0, 640(%%edi)\n\t"
-
-" movq 96(%%edx), %%mm0\n\t"
-" movq 112(%%edx), %%mm2\n\t"
-" movq 104(%%edx), %%mm4\n\t"
-" pfadd 112(%%edx), %%mm0\n\t"
-" pfadd 104(%%edx), %%mm2\n\t"
-" pfadd 120(%%edx), %%mm4\n\t"
-" movq %%mm0, %%mm1\n\t"
-" movq %%mm2, %%mm3\n\t"
-" movq %%mm4, %%mm5\n\t"
-" pfadd 64(%%edx), %%mm0\n\t"
-" pfadd 80(%%edx), %%mm2\n\t"
-" pfadd 72(%%edx), %%mm4\n\t"
-" movd %%mm0, 960(%%esi)\n\t"
-" movd %%mm2, 704(%%esi)\n\t"
-" movd %%mm4, 448(%%esi)\n\t"
-" psrlq $32, %%mm0\n\t"
-" psrlq $32, %%mm2\n\t"
-" psrlq $32, %%mm4\n\t"
-" movd %%mm0, 64(%%edi)\n\t"
-" movd %%mm2, 320(%%edi)\n\t"
-" movd %%mm4, 576(%%edi)\n\t"
-" pfadd 80(%%edx), %%mm1\n\t"
-" pfadd 72(%%edx), %%mm3\n\t"
-" pfadd 88(%%edx), %%mm5\n\t"
-" movd %%mm1, 832(%%esi)\n\t"
-" movd %%mm3, 576(%%esi)\n\t"
-" movd %%mm5, 320(%%esi)\n\t"
-" psrlq $32, %%mm1\n\t"
-" psrlq $32, %%mm3\n\t"
-" psrlq $32, %%mm5\n\t"
-" movd %%mm1, 192(%%edi)\n\t"
-" movd %%mm3, 448(%%edi)\n\t"
-" movd %%mm5, 704(%%edi)\n\t"
-
-" movd 120(%%edx), %%mm0\n\t"
-" pfadd 100(%%edx), %%mm0\n\t"
-" movq %%mm0, %%mm1\n\t"
-" pfadd 88(%%edx), %%mm0\n\t"
-" movd %%mm0, 192(%%esi)\n\t"
-" pfadd 68(%%edx), %%mm1\n\t"
-" movd %%mm1, 64(%%esi)\n\t"
-
-" movd 124(%%edx), %%mm0\n\t"
-" movd %%mm0, 960(%%edi)\n\t"
-" pfadd 92(%%edx), %%mm0\n\t"
-" movd %%mm0, 832(%%edi)\n\t"
-
-" jmp .L_bye\n\t"
+" movq 32(%%edx), %%mm0\n\t"
+" movq 48(%%edx), %%mm1\n\t"
+" pfadd 48(%%edx), %%mm0\n\t"
+" pfadd 40(%%edx), %%mm1\n\t"
+" movd %%mm0, 896(%%esi)\n\t"
+" movd %%mm1, 640(%%esi)\n\t"
+" psrlq $32, %%mm0\n\t"
+" psrlq $32, %%mm1\n\t"
+" movd %%mm0, 128(%%edi)\n\t"
+" movd %%mm1, 384(%%edi)\n\t"
+
+" movd 40(%%edx), %%mm0\n\t"
+" pfadd 56(%%edx), %%mm0\n\t"
+" movd %%mm0, 384(%%esi)\n\t"
+
+" movd 56(%%edx), %%mm0\n\t"
+" pfadd 36(%%edx), %%mm0\n\t"
+" movd %%mm0, 128(%%esi)\n\t"
+
+" movd 60(%%edx), %%mm0\n\t"
+" movd %%mm0, 896(%%edi)\n\t"
+" pfadd 44(%%edx), %%mm0\n\t"
+" movd %%mm0, 640(%%edi)\n\t"
+
+" movq 96(%%edx), %%mm0\n\t"
+" movq 112(%%edx), %%mm2\n\t"
+" movq 104(%%edx), %%mm4\n\t"
+" pfadd 112(%%edx), %%mm0\n\t"
+" pfadd 104(%%edx), %%mm2\n\t"
+" pfadd 120(%%edx), %%mm4\n\t"
+" movq %%mm0, %%mm1\n\t"
+" movq %%mm2, %%mm3\n\t"
+" movq %%mm4, %%mm5\n\t"
+" pfadd 64(%%edx), %%mm0\n\t"
+" pfadd 80(%%edx), %%mm2\n\t"
+" pfadd 72(%%edx), %%mm4\n\t"
+" movd %%mm0, 960(%%esi)\n\t"
+" movd %%mm2, 704(%%esi)\n\t"
+" movd %%mm4, 448(%%esi)\n\t"
+" psrlq $32, %%mm0\n\t"
+" psrlq $32, %%mm2\n\t"
+" psrlq $32, %%mm4\n\t"
+" movd %%mm0, 64(%%edi)\n\t"
+" movd %%mm2, 320(%%edi)\n\t"
+" movd %%mm4, 576(%%edi)\n\t"
+" pfadd 80(%%edx), %%mm1\n\t"
+" pfadd 72(%%edx), %%mm3\n\t"
+" pfadd 88(%%edx), %%mm5\n\t"
+" movd %%mm1, 832(%%esi)\n\t"
+" movd %%mm3, 576(%%esi)\n\t"
+" movd %%mm5, 320(%%esi)\n\t"
+" psrlq $32, %%mm1\n\t"
+" psrlq $32, %%mm3\n\t"
+" psrlq $32, %%mm5\n\t"
+" movd %%mm1, 192(%%edi)\n\t"
+" movd %%mm3, 448(%%edi)\n\t"
+" movd %%mm5, 704(%%edi)\n\t"
+
+" movd 120(%%edx), %%mm0\n\t"
+" pfadd 100(%%edx), %%mm0\n\t"
+" movq %%mm0, %%mm1\n\t"
+" pfadd 88(%%edx), %%mm0\n\t"
+" movd %%mm0, 192(%%esi)\n\t"
+" pfadd 68(%%edx), %%mm1\n\t"
+" movd %%mm1, 64(%%esi)\n\t"
+
+" movd 124(%%edx), %%mm0\n\t"
+" movd %%mm0, 960(%%edi)\n\t"
+" pfadd 92(%%edx), %%mm0\n\t"
+" movd %%mm0, 832(%%edi)\n\t"
+
+" jmp .L_bye\n\t"
".L01:\n\t"
#endif
/* Phase 9*/
-" movq (%%ecx), %%mm0\n\t"
-" movq %%mm0, %%mm1\n\t"
-" pxor %%mm7, %%mm1\n\t"
-" pfacc %%mm1, %%mm0\n\t"
-" pfmul %%mm6, %%mm0\n\t"
-" pf2id %%mm0, %%mm0\n\t"
-" packssdw %%mm0, %%mm0\n\t"
-" movd %%mm0, %%eax\n\t"
-" movw %%ax, 512(%%esi)\n\t"
-" shrl $16, %%eax\n\t"
-" movw %%ax, (%%esi)\n\t"
-
-" movd 12(%%ecx), %%mm0\n\t"
-" pfsub 8(%%ecx), %%mm0\n\t"
-" pfmul 120(%%ebx), %%mm0\n\t"
-" pf2id %%mm0, %%mm7\n\t"
-" packssdw %%mm7, %%mm7\n\t"
-" movd %%mm7, %%eax\n\t"
-" movw %%ax, 256(%%edi)\n\t"
-" pfadd 12(%%ecx), %%mm0\n\t"
-" pfadd 8(%%ecx), %%mm0\n\t"
-" pf2id %%mm0, %%mm0\n\t"
-" packssdw %%mm0, %%mm0\n\t"
-" movd %%mm0, %%eax\n\t"
-" movw %%ax, 256(%%esi)\n\t"
-
-" movd 16(%%ecx), %%mm3\n\t"
-" pfsub 20(%%ecx), %%mm3\n\t"
-" pfmul 120(%%ebx), %%mm3\n\t"
-" movq %%mm3, %%mm2\n\t"
-
-" movd 28(%%ecx), %%mm2\n\t"
-" pfsub 24(%%ecx), %%mm2\n\t"
-" pfmul 120(%%ebx), %%mm2\n\t"
-" movq %%mm2, %%mm1\n\t"
-
-" pf2id %%mm2, %%mm7\n\t"
-" packssdw %%mm7, %%mm7\n\t"
-" movd %%mm7, %%eax\n\t"
-" movw %%ax, 384(%%edi)\n\t"
-
-" pfadd 24(%%ecx), %%mm1\n\t"
-" pfadd 28(%%ecx), %%mm1\n\t"
-" movq %%mm1, %%mm0\n\t"
-
-" pfadd 16(%%ecx), %%mm0\n\t"
-" pfadd 20(%%ecx), %%mm0\n\t"
-" pf2id %%mm0, %%mm0\n\t"
-" packssdw %%mm0, %%mm0\n\t"
-" movd %%mm0, %%eax\n\t"
-" movw %%ax, 384(%%esi)\n\t"
-" pfadd %%mm3, %%mm1\n\t"
-" pf2id %%mm1, %%mm1\n\t"
-" packssdw %%mm1, %%mm1\n\t"
-" movd %%mm1, %%eax\n\t"
-" movw %%ax, 128(%%esi)\n\t"
-" pfadd %%mm3, %%mm2\n\t"
-" pf2id %%mm2, %%mm2\n\t"
-" packssdw %%mm2, %%mm2\n\t"
-" movd %%mm2, %%eax\n\t"
-" movw %%ax, 128(%%edi)\n\t"
+" movq (%%ecx), %%mm0\n\t"
+" movq %%mm0, %%mm1\n\t"
+" pxor %%mm7, %%mm1\n\t"
+" pfacc %%mm1, %%mm0\n\t"
+" pfmul %%mm6, %%mm0\n\t"
+" pf2id %%mm0, %%mm0\n\t"
+" packssdw %%mm0, %%mm0\n\t"
+" movd %%mm0, %%eax\n\t"
+" movw %%ax, 512(%%esi)\n\t"
+" shrl $16, %%eax\n\t"
+" movw %%ax, (%%esi)\n\t"
+
+" movd 12(%%ecx), %%mm0\n\t"
+" pfsub 8(%%ecx), %%mm0\n\t"
+" pfmul 120(%%ebx), %%mm0\n\t"
+" pf2id %%mm0, %%mm7\n\t"
+" packssdw %%mm7, %%mm7\n\t"
+" movd %%mm7, %%eax\n\t"
+" movw %%ax, 256(%%edi)\n\t"
+" pfadd 12(%%ecx), %%mm0\n\t"
+" pfadd 8(%%ecx), %%mm0\n\t"
+" pf2id %%mm0, %%mm0\n\t"
+" packssdw %%mm0, %%mm0\n\t"
+" movd %%mm0, %%eax\n\t"
+" movw %%ax, 256(%%esi)\n\t"
+
+" movd 16(%%ecx), %%mm3\n\t"
+" pfsub 20(%%ecx), %%mm3\n\t"
+" pfmul 120(%%ebx), %%mm3\n\t"
+" movq %%mm3, %%mm2\n\t"
+
+" movd 28(%%ecx), %%mm2\n\t"
+" pfsub 24(%%ecx), %%mm2\n\t"
+" pfmul 120(%%ebx), %%mm2\n\t"
+" movq %%mm2, %%mm1\n\t"
+
+" pf2id %%mm2, %%mm7\n\t"
+" packssdw %%mm7, %%mm7\n\t"
+" movd %%mm7, %%eax\n\t"
+" movw %%ax, 384(%%edi)\n\t"
+
+" pfadd 24(%%ecx), %%mm1\n\t"
+" pfadd 28(%%ecx), %%mm1\n\t"
+" movq %%mm1, %%mm0\n\t"
+
+" pfadd 16(%%ecx), %%mm0\n\t"
+" pfadd 20(%%ecx), %%mm0\n\t"
+" pf2id %%mm0, %%mm0\n\t"
+" packssdw %%mm0, %%mm0\n\t"
+" movd %%mm0, %%eax\n\t"
+" movw %%ax, 384(%%esi)\n\t"
+" pfadd %%mm3, %%mm1\n\t"
+" pf2id %%mm1, %%mm1\n\t"
+" packssdw %%mm1, %%mm1\n\t"
+" movd %%mm1, %%eax\n\t"
+" movw %%ax, 128(%%esi)\n\t"
+" pfadd %%mm3, %%mm2\n\t"
+" pf2id %%mm2, %%mm2\n\t"
+" packssdw %%mm2, %%mm2\n\t"
+" movd %%mm2, %%eax\n\t"
+" movw %%ax, 128(%%edi)\n\t"
/* Phase 10*/
-" movq 32(%%edx), %%mm0\n\t"
-" movq 48(%%edx), %%mm1\n\t"
-" pfadd 48(%%edx), %%mm0\n\t"
-" pfadd 40(%%edx), %%mm1\n\t"
-" pf2id %%mm0, %%mm0\n\t"
-" pf2id %%mm1, %%mm1\n\t"
-" packssdw %%mm0, %%mm0\n\t"
-" packssdw %%mm1, %%mm1\n\t"
-" movd %%mm0, %%eax\n\t"
-" movd %%mm1, %%ecx\n\t"
-" movw %%ax, 448(%%esi)\n\t"
-" movw %%cx, 320(%%esi)\n\t"
-" shrl $16, %%eax\n\t"
-" shrl $16, %%ecx\n\t"
-" movw %%ax, 64(%%edi)\n\t"
-" movw %%cx, 192(%%edi)\n\t"
-
-" movd 40(%%edx), %%mm3\n\t"
-" movd 56(%%edx), %%mm4\n\t"
-" movd 60(%%edx), %%mm0\n\t"
-" movd 44(%%edx), %%mm2\n\t"
-" movd 120(%%edx), %%mm5\n\t"
-" punpckldq %%mm4, %%mm3\n\t"
-" punpckldq 124(%%edx), %%mm0\n\t"
-" pfadd 100(%%edx), %%mm5\n\t"
-" punpckldq 36(%%edx), %%mm4\n\t"
-" punpckldq 92(%%edx), %%mm2\n\t"
-" movq %%mm5, %%mm6\n\t"
-" pfadd %%mm4, %%mm3\n\t"
-" pf2id %%mm0, %%mm1\n\t"
-" pf2id %%mm3, %%mm3\n\t"
-" packssdw %%mm1, %%mm1\n\t"
-" packssdw %%mm3, %%mm3\n\t"
-" pfadd 88(%%edx), %%mm5\n\t"
-" movd %%mm1, %%eax\n\t"
-" movd %%mm3, %%ecx\n\t"
-" movw %%ax, 448(%%edi)\n\t"
-" movw %%cx, 192(%%esi)\n\t"
-" pf2id %%mm5, %%mm5\n\t"
-" packssdw %%mm5, %%mm5\n\t"
-" shrl $16, %%eax\n\t"
-" shrl $16, %%ecx\n\t"
-" movd %%mm5, %%ebx\n\t"
-" movw %%bx, 96(%%esi)\n\t"
-" movw %%ax, 480(%%edi)\n\t"
-" movw %%cx, 64(%%esi)\n\t"
-" pfadd %%mm2, %%mm0\n\t"
-" pf2id %%mm0, %%mm0\n\t"
-" packssdw %%mm0, %%mm0\n\t"
-" movd %%mm0, %%eax\n\t"
-" pfadd 68(%%edx), %%mm6\n\t"
-" movw %%ax, 320(%%edi)\n\t"
-" shr $16, %%eax\n\t"
-" pf2id %%mm6, %%mm6\n\t"
-" packssdw %%mm6, %%mm6\n\t"
-" movd %%mm6, %%ebx\n\t"
-" movw %%ax, 416(%%edi)\n\t"
-" movw %%bx, 32(%%esi)\n\t"
-
-" movq 96(%%edx), %%mm0\n\t"
-" movq 112(%%edx), %%mm2\n\t"
-" movq 104(%%edx), %%mm4\n\t"
-" pfadd %%mm2, %%mm0\n\t"
-" pfadd %%mm4, %%mm2\n\t"
-" pfadd 120(%%edx), %%mm4\n\t"
-" movq %%mm0, %%mm1\n\t"
-" movq %%mm2, %%mm3\n\t"
-" movq %%mm4, %%mm5\n\t"
-" pfadd 64(%%edx), %%mm0\n\t"
-" pfadd 80(%%edx), %%mm2\n\t"
-" pfadd 72(%%edx), %%mm4\n\t"
-" pf2id %%mm0, %%mm0\n\t"
-" pf2id %%mm2, %%mm2\n\t"
-" pf2id %%mm4, %%mm4\n\t"
-" packssdw %%mm0, %%mm0\n\t"
-" packssdw %%mm2, %%mm2\n\t"
-" packssdw %%mm4, %%mm4\n\t"
-" movd %%mm0, %%eax\n\t"
-" movd %%mm2, %%ecx\n\t"
-" movd %%mm4, %%ebx\n\t"
-" movw %%ax, 480(%%esi)\n\t"
-" movw %%cx, 352(%%esi)\n\t"
-" movw %%bx, 224(%%esi)\n\t"
-" shrl $16, %%eax\n\t"
-" shrl $16, %%ecx\n\t"
-" shrl $16, %%ebx\n\t"
-" movw %%ax, 32(%%edi)\n\t"
-" movw %%cx, 160(%%edi)\n\t"
-" movw %%bx, 288(%%edi)\n\t"
-" pfadd 80(%%edx), %%mm1\n\t"
-" pfadd 72(%%edx), %%mm3\n\t"
-" pfadd 88(%%edx), %%mm5\n\t"
-" pf2id %%mm1, %%mm1\n\t"
-" pf2id %%mm3, %%mm3\n\t"
-" pf2id %%mm5, %%mm5\n\t"
-" packssdw %%mm1, %%mm1\n\t"
-" packssdw %%mm3, %%mm3\n\t"
-" packssdw %%mm5, %%mm5\n\t"
-" movd %%mm1, %%eax\n\t"
-" movd %%mm3, %%ecx\n\t"
-" movd %%mm5, %%ebx\n\t"
-" movw %%ax, 416(%%esi)\n\t"
-" movw %%cx, 288(%%esi)\n\t"
-" movw %%bx, 160(%%esi)\n\t"
-" shrl $16, %%eax\n\t"
-" shrl $16, %%ecx\n\t"
-" shrl $16, %%ebx\n\t"
-" movw %%ax, 96(%%edi)\n\t"
-" movw %%cx, 224(%%edi)\n\t"
-" movw %%bx, 352(%%edi)\n\t"
-
-" movsw\n\t"
+" movq 32(%%edx), %%mm0\n\t"
+" movq 48(%%edx), %%mm1\n\t"
+" pfadd 48(%%edx), %%mm0\n\t"
+" pfadd 40(%%edx), %%mm1\n\t"
+" pf2id %%mm0, %%mm0\n\t"
+" pf2id %%mm1, %%mm1\n\t"
+" packssdw %%mm0, %%mm0\n\t"
+" packssdw %%mm1, %%mm1\n\t"
+" movd %%mm0, %%eax\n\t"
+" movd %%mm1, %%ecx\n\t"
+" movw %%ax, 448(%%esi)\n\t"
+" movw %%cx, 320(%%esi)\n\t"
+" shrl $16, %%eax\n\t"
+" shrl $16, %%ecx\n\t"
+" movw %%ax, 64(%%edi)\n\t"
+" movw %%cx, 192(%%edi)\n\t"
+
+" movd 40(%%edx), %%mm3\n\t"
+" movd 56(%%edx), %%mm4\n\t"
+" movd 60(%%edx), %%mm0\n\t"
+" movd 44(%%edx), %%mm2\n\t"
+" movd 120(%%edx), %%mm5\n\t"
+" punpckldq %%mm4, %%mm3\n\t"
+" punpckldq 124(%%edx), %%mm0\n\t"
+" pfadd 100(%%edx), %%mm5\n\t"
+" punpckldq 36(%%edx), %%mm4\n\t"
+" punpckldq 92(%%edx), %%mm2\n\t"
+" movq %%mm5, %%mm6\n\t"
+" pfadd %%mm4, %%mm3\n\t"
+" pf2id %%mm0, %%mm1\n\t"
+" pf2id %%mm3, %%mm3\n\t"
+" packssdw %%mm1, %%mm1\n\t"
+" packssdw %%mm3, %%mm3\n\t"
+" pfadd 88(%%edx), %%mm5\n\t"
+" movd %%mm1, %%eax\n\t"
+" movd %%mm3, %%ecx\n\t"
+" movw %%ax, 448(%%edi)\n\t"
+" movw %%cx, 192(%%esi)\n\t"
+" pf2id %%mm5, %%mm5\n\t"
+" packssdw %%mm5, %%mm5\n\t"
+" shrl $16, %%eax\n\t"
+" shrl $16, %%ecx\n\t"
+" movd %%mm5, %%ebx\n\t"
+" movw %%bx, 96(%%esi)\n\t"
+" movw %%ax, 480(%%edi)\n\t"
+" movw %%cx, 64(%%esi)\n\t"
+" pfadd %%mm2, %%mm0\n\t"
+" pf2id %%mm0, %%mm0\n\t"
+" packssdw %%mm0, %%mm0\n\t"
+" movd %%mm0, %%eax\n\t"
+" pfadd 68(%%edx), %%mm6\n\t"
+" movw %%ax, 320(%%edi)\n\t"
+" shr $16, %%eax\n\t"
+" pf2id %%mm6, %%mm6\n\t"
+" packssdw %%mm6, %%mm6\n\t"
+" movd %%mm6, %%ebx\n\t"
+" movw %%ax, 416(%%edi)\n\t"
+" movw %%bx, 32(%%esi)\n\t"
+
+" movq 96(%%edx), %%mm0\n\t"
+" movq 112(%%edx), %%mm2\n\t"
+" movq 104(%%edx), %%mm4\n\t"
+" pfadd %%mm2, %%mm0\n\t"
+" pfadd %%mm4, %%mm2\n\t"
+" pfadd 120(%%edx), %%mm4\n\t"
+" movq %%mm0, %%mm1\n\t"
+" movq %%mm2, %%mm3\n\t"
+" movq %%mm4, %%mm5\n\t"
+" pfadd 64(%%edx), %%mm0\n\t"
+" pfadd 80(%%edx), %%mm2\n\t"
+" pfadd 72(%%edx), %%mm4\n\t"
+" pf2id %%mm0, %%mm0\n\t"
+" pf2id %%mm2, %%mm2\n\t"
+" pf2id %%mm4, %%mm4\n\t"
+" packssdw %%mm0, %%mm0\n\t"
+" packssdw %%mm2, %%mm2\n\t"
+" packssdw %%mm4, %%mm4\n\t"
+" movd %%mm0, %%eax\n\t"
+" movd %%mm2, %%ecx\n\t"
+" movd %%mm4, %%ebx\n\t"
+" movw %%ax, 480(%%esi)\n\t"
+" movw %%cx, 352(%%esi)\n\t"
+" movw %%bx, 224(%%esi)\n\t"
+" shrl $16, %%eax\n\t"
+" shrl $16, %%ecx\n\t"
+" shrl $16, %%ebx\n\t"
+" movw %%ax, 32(%%edi)\n\t"
+" movw %%cx, 160(%%edi)\n\t"
+" movw %%bx, 288(%%edi)\n\t"
+" pfadd 80(%%edx), %%mm1\n\t"
+" pfadd 72(%%edx), %%mm3\n\t"
+" pfadd 88(%%edx), %%mm5\n\t"
+" pf2id %%mm1, %%mm1\n\t"
+" pf2id %%mm3, %%mm3\n\t"
+" pf2id %%mm5, %%mm5\n\t"
+" packssdw %%mm1, %%mm1\n\t"
+" packssdw %%mm3, %%mm3\n\t"
+" packssdw %%mm5, %%mm5\n\t"
+" movd %%mm1, %%eax\n\t"
+" movd %%mm3, %%ecx\n\t"
+" movd %%mm5, %%ebx\n\t"
+" movw %%ax, 416(%%esi)\n\t"
+" movw %%cx, 288(%%esi)\n\t"
+" movw %%bx, 160(%%esi)\n\t"
+" shrl $16, %%eax\n\t"
+" shrl $16, %%ecx\n\t"
+" shrl $16, %%ebx\n\t"
+" movw %%ax, 96(%%edi)\n\t"
+" movw %%cx, 224(%%edi)\n\t"
+" movw %%bx, 352(%%edi)\n\t"
+
+" movsw\n\t"
".L_bye:\n\t"
-" femms\n\t"
- :
- :"m"(a),"m"(b),"m"(c),"m"(tmp[0])
- :"memory","%eax","%ebx","%ecx","%edx","%esi","%edi");
+" femms\n\t"
+ :
+ :"m"(a),"m"(b),"m"(c),"m"(tmp[0])
+ :"memory","%eax","%ebx","%ecx","%edx","%esi","%edi");
}
diff --git a/mp3lib/dct64_k7.c b/mp3lib/dct64_k7.c
index edd41bd7a2..8204877cad 100644
--- a/mp3lib/dct64_k7.c
+++ b/mp3lib/dct64_k7.c
@@ -19,748 +19,748 @@ void dct64_MMX_3dnowex(short *a,short *b,real *c)
{
char tmp[256];
__asm__ volatile(
-" movl %2,%%eax\n\t"
+" movl %2,%%eax\n\t"
-" leal 128+%3,%%edx\n\t"
-" movl %0,%%esi\n\t"
-" movl %1,%%edi\n\t"
-" movl $"MANGLE(costab_mmx)",%%ebx\n\t"
-" leal %3,%%ecx\n\t"
+" leal 128+%3,%%edx\n\t"
+" movl %0,%%esi\n\t"
+" movl %1,%%edi\n\t"
+" movl $"MANGLE(costab_mmx)",%%ebx\n\t"
+" leal %3,%%ecx\n\t"
/* Phase 1*/
-" movq (%%eax), %%mm0\n\t"
-" movq 8(%%eax), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" pswapd 120(%%eax), %%mm1\n\t"
-" pswapd 112(%%eax), %%mm5\n\t"
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, (%%edx)\n\t"
-" movq %%mm4, 8(%%edx)\n\t"
-" pfsub %%mm1, %%mm3\n\t"
-" pfsub %%mm5, %%mm7\n\t"
-" pfmul (%%ebx), %%mm3\n\t"
-" pfmul 8(%%ebx), %%mm7\n\t"
-" pswapd %%mm3, %%mm3\n\t"
-" pswapd %%mm7, %%mm7\n\t"
-" movq %%mm3, 120(%%edx)\n\t"
-" movq %%mm7, 112(%%edx)\n\t"
-
-" movq 16(%%eax), %%mm0\n\t"
-" movq 24(%%eax), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" pswapd 104(%%eax), %%mm1\n\t"
-" pswapd 96(%%eax), %%mm5\n\t"
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, 16(%%edx)\n\t"
-" movq %%mm4, 24(%%edx)\n\t"
-" pfsub %%mm1, %%mm3\n\t"
-" pfsub %%mm5, %%mm7\n\t"
-" pfmul 16(%%ebx), %%mm3\n\t"
-" pfmul 24(%%ebx), %%mm7\n\t"
-" pswapd %%mm3, %%mm3\n\t"
-" pswapd %%mm7, %%mm7\n\t"
-" movq %%mm3, 104(%%edx)\n\t"
-" movq %%mm7, 96(%%edx)\n\t"
-
-" movq 32(%%eax), %%mm0\n\t"
-" movq 40(%%eax), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" pswapd 88(%%eax), %%mm1\n\t"
-" pswapd 80(%%eax), %%mm5\n\t"
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, 32(%%edx)\n\t"
-" movq %%mm4, 40(%%edx)\n\t"
-" pfsub %%mm1, %%mm3\n\t"
-" pfsub %%mm5, %%mm7\n\t"
-" pfmul 32(%%ebx), %%mm3\n\t"
-" pfmul 40(%%ebx), %%mm7\n\t"
-" pswapd %%mm3, %%mm3\n\t"
-" pswapd %%mm7, %%mm7\n\t"
-" movq %%mm3, 88(%%edx)\n\t"
-" movq %%mm7, 80(%%edx)\n\t"
-
-" movq 48(%%eax), %%mm0\n\t"
-" movq 56(%%eax), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" pswapd 72(%%eax), %%mm1\n\t"
-" pswapd 64(%%eax), %%mm5\n\t"
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, 48(%%edx)\n\t"
-" movq %%mm4, 56(%%edx)\n\t"
-" pfsub %%mm1, %%mm3\n\t"
-" pfsub %%mm5, %%mm7\n\t"
-" pfmul 48(%%ebx), %%mm3\n\t"
-" pfmul 56(%%ebx), %%mm7\n\t"
-" pswapd %%mm3, %%mm3\n\t"
-" pswapd %%mm7, %%mm7\n\t"
-" movq %%mm3, 72(%%edx)\n\t"
-" movq %%mm7, 64(%%edx)\n\t"
+" movq (%%eax), %%mm0\n\t"
+" movq 8(%%eax), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" pswapd 120(%%eax), %%mm1\n\t"
+" pswapd 112(%%eax), %%mm5\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, (%%edx)\n\t"
+" movq %%mm4, 8(%%edx)\n\t"
+" pfsub %%mm1, %%mm3\n\t"
+" pfsub %%mm5, %%mm7\n\t"
+" pfmul (%%ebx), %%mm3\n\t"
+" pfmul 8(%%ebx), %%mm7\n\t"
+" pswapd %%mm3, %%mm3\n\t"
+" pswapd %%mm7, %%mm7\n\t"
+" movq %%mm3, 120(%%edx)\n\t"
+" movq %%mm7, 112(%%edx)\n\t"
+
+" movq 16(%%eax), %%mm0\n\t"
+" movq 24(%%eax), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" pswapd 104(%%eax), %%mm1\n\t"
+" pswapd 96(%%eax), %%mm5\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, 16(%%edx)\n\t"
+" movq %%mm4, 24(%%edx)\n\t"
+" pfsub %%mm1, %%mm3\n\t"
+" pfsub %%mm5, %%mm7\n\t"
+" pfmul 16(%%ebx), %%mm3\n\t"
+" pfmul 24(%%ebx), %%mm7\n\t"
+" pswapd %%mm3, %%mm3\n\t"
+" pswapd %%mm7, %%mm7\n\t"
+" movq %%mm3, 104(%%edx)\n\t"
+" movq %%mm7, 96(%%edx)\n\t"
+
+" movq 32(%%eax), %%mm0\n\t"
+" movq 40(%%eax), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" pswapd 88(%%eax), %%mm1\n\t"
+" pswapd 80(%%eax), %%mm5\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, 32(%%edx)\n\t"
+" movq %%mm4, 40(%%edx)\n\t"
+" pfsub %%mm1, %%mm3\n\t"
+" pfsub %%mm5, %%mm7\n\t"
+" pfmul 32(%%ebx), %%mm3\n\t"
+" pfmul 40(%%ebx), %%mm7\n\t"
+" pswapd %%mm3, %%mm3\n\t"
+" pswapd %%mm7, %%mm7\n\t"
+" movq %%mm3, 88(%%edx)\n\t"
+" movq %%mm7, 80(%%edx)\n\t"
+
+" movq 48(%%eax), %%mm0\n\t"
+" movq 56(%%eax), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" pswapd 72(%%eax), %%mm1\n\t"
+" pswapd 64(%%eax), %%mm5\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, 48(%%edx)\n\t"
+" movq %%mm4, 56(%%edx)\n\t"
+" pfsub %%mm1, %%mm3\n\t"
+" pfsub %%mm5, %%mm7\n\t"
+" pfmul 48(%%ebx), %%mm3\n\t"
+" pfmul 56(%%ebx), %%mm7\n\t"
+" pswapd %%mm3, %%mm3\n\t"
+" pswapd %%mm7, %%mm7\n\t"
+" movq %%mm3, 72(%%edx)\n\t"
+" movq %%mm7, 64(%%edx)\n\t"
/* Phase 2*/
-" movq (%%edx), %%mm0\n\t"
-" movq 8(%%edx), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" pswapd 56(%%edx), %%mm1\n\t"
-" pswapd 48(%%edx), %%mm5\n\t"
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, (%%ecx)\n\t"
-" movq %%mm4, 8(%%ecx)\n\t"
-" pfsub %%mm1, %%mm3\n\t"
-" pfsub %%mm5, %%mm7\n\t"
-" pfmul 64(%%ebx), %%mm3\n\t"
-" pfmul 72(%%ebx), %%mm7\n\t"
-" pswapd %%mm3, %%mm3\n\t"
-" pswapd %%mm7, %%mm7\n\t"
-" movq %%mm3, 56(%%ecx)\n\t"
-" movq %%mm7, 48(%%ecx)\n\t"
-
-" movq 16(%%edx), %%mm0\n\t"
-" movq 24(%%edx), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" pswapd 40(%%edx), %%mm1\n\t"
-" pswapd 32(%%edx), %%mm5\n\t"
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, 16(%%ecx)\n\t"
-" movq %%mm4, 24(%%ecx)\n\t"
-" pfsub %%mm1, %%mm3\n\t"
-" pfsub %%mm5, %%mm7\n\t"
-" pfmul 80(%%ebx), %%mm3\n\t"
-" pfmul 88(%%ebx), %%mm7\n\t"
-" pswapd %%mm3, %%mm3\n\t"
-" pswapd %%mm7, %%mm7\n\t"
-" movq %%mm3, 40(%%ecx)\n\t"
-" movq %%mm7, 32(%%ecx)\n\t"
+" movq (%%edx), %%mm0\n\t"
+" movq 8(%%edx), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" pswapd 56(%%edx), %%mm1\n\t"
+" pswapd 48(%%edx), %%mm5\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, (%%ecx)\n\t"
+" movq %%mm4, 8(%%ecx)\n\t"
+" pfsub %%mm1, %%mm3\n\t"
+" pfsub %%mm5, %%mm7\n\t"
+" pfmul 64(%%ebx), %%mm3\n\t"
+" pfmul 72(%%ebx), %%mm7\n\t"
+" pswapd %%mm3, %%mm3\n\t"
+" pswapd %%mm7, %%mm7\n\t"
+" movq %%mm3, 56(%%ecx)\n\t"
+" movq %%mm7, 48(%%ecx)\n\t"
+
+" movq 16(%%edx), %%mm0\n\t"
+" movq 24(%%edx), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" pswapd 40(%%edx), %%mm1\n\t"
+" pswapd 32(%%edx), %%mm5\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, 16(%%ecx)\n\t"
+" movq %%mm4, 24(%%ecx)\n\t"
+" pfsub %%mm1, %%mm3\n\t"
+" pfsub %%mm5, %%mm7\n\t"
+" pfmul 80(%%ebx), %%mm3\n\t"
+" pfmul 88(%%ebx), %%mm7\n\t"
+" pswapd %%mm3, %%mm3\n\t"
+" pswapd %%mm7, %%mm7\n\t"
+" movq %%mm3, 40(%%ecx)\n\t"
+" movq %%mm7, 32(%%ecx)\n\t"
/* Phase 3*/
-" movq 64(%%edx), %%mm0\n\t"
-" movq 72(%%edx), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" pswapd 120(%%edx), %%mm1\n\t"
-" pswapd 112(%%edx), %%mm5\n\t"
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, 64(%%ecx)\n\t"
-" movq %%mm4, 72(%%ecx)\n\t"
-" pfsubr %%mm1, %%mm3\n\t"
-" pfsubr %%mm5, %%mm7\n\t"
-" pfmul 64(%%ebx), %%mm3\n\t"
-" pfmul 72(%%ebx), %%mm7\n\t"
-" pswapd %%mm3, %%mm3\n\t"
-" pswapd %%mm7, %%mm7\n\t"
-" movq %%mm3, 120(%%ecx)\n\t"
-" movq %%mm7, 112(%%ecx)\n\t"
-
-" movq 80(%%edx), %%mm0\n\t"
-" movq 88(%%edx), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" pswapd 104(%%edx), %%mm1\n\t"
-" pswapd 96(%%edx), %%mm5\n\t"
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, 80(%%ecx)\n\t"
-" movq %%mm4, 88(%%ecx)\n\t"
-" pfsubr %%mm1, %%mm3\n\t"
-" pfsubr %%mm5, %%mm7\n\t"
-" pfmul 80(%%ebx), %%mm3\n\t"
-" pfmul 88(%%ebx), %%mm7\n\t"
-" pswapd %%mm3, %%mm3\n\t"
-" pswapd %%mm7, %%mm7\n\t"
-" movq %%mm3, 104(%%ecx)\n\t"
-" movq %%mm7, 96(%%ecx)\n\t"
+" movq 64(%%edx), %%mm0\n\t"
+" movq 72(%%edx), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" pswapd 120(%%edx), %%mm1\n\t"
+" pswapd 112(%%edx), %%mm5\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, 64(%%ecx)\n\t"
+" movq %%mm4, 72(%%ecx)\n\t"
+" pfsubr %%mm1, %%mm3\n\t"
+" pfsubr %%mm5, %%mm7\n\t"
+" pfmul 64(%%ebx), %%mm3\n\t"
+" pfmul 72(%%ebx), %%mm7\n\t"
+" pswapd %%mm3, %%mm3\n\t"
+" pswapd %%mm7, %%mm7\n\t"
+" movq %%mm3, 120(%%ecx)\n\t"
+" movq %%mm7, 112(%%ecx)\n\t"
+
+" movq 80(%%edx), %%mm0\n\t"
+" movq 88(%%edx), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" pswapd 104(%%edx), %%mm1\n\t"
+" pswapd 96(%%edx), %%mm5\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, 80(%%ecx)\n\t"
+" movq %%mm4, 88(%%ecx)\n\t"
+" pfsubr %%mm1, %%mm3\n\t"
+" pfsubr %%mm5, %%mm7\n\t"
+" pfmul 80(%%ebx), %%mm3\n\t"
+" pfmul 88(%%ebx), %%mm7\n\t"
+" pswapd %%mm3, %%mm3\n\t"
+" pswapd %%mm7, %%mm7\n\t"
+" movq %%mm3, 104(%%ecx)\n\t"
+" movq %%mm7, 96(%%ecx)\n\t"
/* Phase 4*/
-" movq 96(%%ebx), %%mm2\n\t"
-" movq 104(%%ebx), %%mm6\n\t"
-
-" movq (%%ecx), %%mm0\n\t"
-" movq 8(%%ecx), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" pswapd 24(%%ecx), %%mm1\n\t"
-" pswapd 16(%%ecx), %%mm5\n\t"
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, (%%edx)\n\t"
-" movq %%mm4, 8(%%edx)\n\t"
-" pfsub %%mm1, %%mm3\n\t"
-" pfsub %%mm5, %%mm7\n\t"
-" pfmul %%mm2, %%mm3\n\t"
-" pfmul %%mm6, %%mm7\n\t"
-" pswapd %%mm3, %%mm3\n\t"
-" pswapd %%mm7, %%mm7\n\t"
-" movq %%mm3, 24(%%edx)\n\t"
-" movq %%mm7, 16(%%edx)\n\t"
-
-" movq 32(%%ecx), %%mm0\n\t"
-" movq 40(%%ecx), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" pswapd 56(%%ecx), %%mm1\n\t"
-" pswapd 48(%%ecx), %%mm5\n\t"
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, 32(%%edx)\n\t"
-" movq %%mm4, 40(%%edx)\n\t"
-" pfsubr %%mm1, %%mm3\n\t"
-" pfsubr %%mm5, %%mm7\n\t"
-" pfmul %%mm2, %%mm3\n\t"
-" pfmul %%mm6, %%mm7\n\t"
-" pswapd %%mm3, %%mm3\n\t"
-" pswapd %%mm7, %%mm7\n\t"
-" movq %%mm3, 56(%%edx)\n\t"
-" movq %%mm7, 48(%%edx)\n\t"
-
-" movq 64(%%ecx), %%mm0\n\t"
-" movq 72(%%ecx), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" pswapd 88(%%ecx), %%mm1\n\t"
-" pswapd 80(%%ecx), %%mm5\n\t"
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, 64(%%edx)\n\t"
-" movq %%mm4, 72(%%edx)\n\t"
-" pfsub %%mm1, %%mm3\n\t"
-" pfsub %%mm5, %%mm7\n\t"
-" pfmul %%mm2, %%mm3\n\t"
-" pfmul %%mm6, %%mm7\n\t"
-" pswapd %%mm3, %%mm3\n\t"
-" pswapd %%mm7, %%mm7\n\t"
-" movq %%mm3, 88(%%edx)\n\t"
-" movq %%mm7, 80(%%edx)\n\t"
-
-" movq 96(%%ecx), %%mm0\n\t"
-" movq 104(%%ecx), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" pswapd 120(%%ecx), %%mm1\n\t"
-" pswapd 112(%%ecx), %%mm5\n\t"
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, 96(%%edx)\n\t"
-" movq %%mm4, 104(%%edx)\n\t"
-" pfsubr %%mm1, %%mm3\n\t"
-" pfsubr %%mm5, %%mm7\n\t"
-" pfmul %%mm2, %%mm3\n\t"
-" pfmul %%mm6, %%mm7\n\t"
-" pswapd %%mm3, %%mm3\n\t"
-" pswapd %%mm7, %%mm7\n\t"
-" movq %%mm3, 120(%%edx)\n\t"
-" movq %%mm7, 112(%%edx)\n\t"
+" movq 96(%%ebx), %%mm2\n\t"
+" movq 104(%%ebx), %%mm6\n\t"
+
+" movq (%%ecx), %%mm0\n\t"
+" movq 8(%%ecx), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" pswapd 24(%%ecx), %%mm1\n\t"
+" pswapd 16(%%ecx), %%mm5\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, (%%edx)\n\t"
+" movq %%mm4, 8(%%edx)\n\t"
+" pfsub %%mm1, %%mm3\n\t"
+" pfsub %%mm5, %%mm7\n\t"
+" pfmul %%mm2, %%mm3\n\t"
+" pfmul %%mm6, %%mm7\n\t"
+" pswapd %%mm3, %%mm3\n\t"
+" pswapd %%mm7, %%mm7\n\t"
+" movq %%mm3, 24(%%edx)\n\t"
+" movq %%mm7, 16(%%edx)\n\t"
+
+" movq 32(%%ecx), %%mm0\n\t"
+" movq 40(%%ecx), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" pswapd 56(%%ecx), %%mm1\n\t"
+" pswapd 48(%%ecx), %%mm5\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, 32(%%edx)\n\t"
+" movq %%mm4, 40(%%edx)\n\t"
+" pfsubr %%mm1, %%mm3\n\t"
+" pfsubr %%mm5, %%mm7\n\t"
+" pfmul %%mm2, %%mm3\n\t"
+" pfmul %%mm6, %%mm7\n\t"
+" pswapd %%mm3, %%mm3\n\t"
+" pswapd %%mm7, %%mm7\n\t"
+" movq %%mm3, 56(%%edx)\n\t"
+" movq %%mm7, 48(%%edx)\n\t"
+
+" movq 64(%%ecx), %%mm0\n\t"
+" movq 72(%%ecx), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" pswapd 88(%%ecx), %%mm1\n\t"
+" pswapd 80(%%ecx), %%mm5\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, 64(%%edx)\n\t"
+" movq %%mm4, 72(%%edx)\n\t"
+" pfsub %%mm1, %%mm3\n\t"
+" pfsub %%mm5, %%mm7\n\t"
+" pfmul %%mm2, %%mm3\n\t"
+" pfmul %%mm6, %%mm7\n\t"
+" pswapd %%mm3, %%mm3\n\t"
+" pswapd %%mm7, %%mm7\n\t"
+" movq %%mm3, 88(%%edx)\n\t"
+" movq %%mm7, 80(%%edx)\n\t"
+
+" movq 96(%%ecx), %%mm0\n\t"
+" movq 104(%%ecx), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" pswapd 120(%%ecx), %%mm1\n\t"
+" pswapd 112(%%ecx), %%mm5\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, 96(%%edx)\n\t"
+" movq %%mm4, 104(%%edx)\n\t"
+" pfsubr %%mm1, %%mm3\n\t"
+" pfsubr %%mm5, %%mm7\n\t"
+" pfmul %%mm2, %%mm3\n\t"
+" pfmul %%mm6, %%mm7\n\t"
+" pswapd %%mm3, %%mm3\n\t"
+" pswapd %%mm7, %%mm7\n\t"
+" movq %%mm3, 120(%%edx)\n\t"
+" movq %%mm7, 112(%%edx)\n\t"
/* Phase 5 */
-" movq 112(%%ebx), %%mm2\n\t"
-
-" movq (%%edx), %%mm0\n\t"
-" movq 16(%%edx), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" pswapd 8(%%edx), %%mm1\n\t"
-" pswapd 24(%%edx), %%mm5\n\t"
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, (%%ecx)\n\t"
-" movq %%mm4, 16(%%ecx)\n\t"
-" pfsub %%mm1, %%mm3\n\t"
-" pfsubr %%mm5, %%mm7\n\t"
-" pfmul %%mm2, %%mm3\n\t"
-" pfmul %%mm2, %%mm7\n\t"
-" pswapd %%mm3, %%mm3\n\t"
-" pswapd %%mm7, %%mm7\n\t"
-" movq %%mm3, 8(%%ecx)\n\t"
-" movq %%mm7, 24(%%ecx)\n\t"
-
-" movq 32(%%edx), %%mm0\n\t"
-" movq 48(%%edx), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" pswapd 40(%%edx), %%mm1\n\t"
-" pswapd 56(%%edx), %%mm5\n\t"
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, 32(%%ecx)\n\t"
-" movq %%mm4, 48(%%ecx)\n\t"
-" pfsub %%mm1, %%mm3\n\t"
-" pfsubr %%mm5, %%mm7\n\t"
-" pfmul %%mm2, %%mm3\n\t"
-" pfmul %%mm2, %%mm7\n\t"
-" pswapd %%mm3, %%mm3\n\t"
-" pswapd %%mm7, %%mm7\n\t"
-" movq %%mm3, 40(%%ecx)\n\t"
-" movq %%mm7, 56(%%ecx)\n\t"
-
-" movq 64(%%edx), %%mm0\n\t"
-" movq 80(%%edx), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" pswapd 72(%%edx), %%mm1\n\t"
-" pswapd 88(%%edx), %%mm5\n\t"
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, 64(%%ecx)\n\t"
-" movq %%mm4, 80(%%ecx)\n\t"
-" pfsub %%mm1, %%mm3\n\t"
-" pfsubr %%mm5, %%mm7\n\t"
-" pfmul %%mm2, %%mm3\n\t"
-" pfmul %%mm2, %%mm7\n\t"
-" pswapd %%mm3, %%mm3\n\t"
-" pswapd %%mm7, %%mm7\n\t"
-" movq %%mm3, 72(%%ecx)\n\t"
-" movq %%mm7, 88(%%ecx)\n\t"
-
-" movq 96(%%edx), %%mm0\n\t"
-" movq 112(%%edx), %%mm4\n\t"
-" movq %%mm0, %%mm3\n\t"
-" movq %%mm4, %%mm7\n\t"
-" pswapd 104(%%edx), %%mm1\n\t"
-" pswapd 120(%%edx), %%mm5\n\t"
-" pfadd %%mm1, %%mm0\n\t"
-" pfadd %%mm5, %%mm4\n\t"
-" movq %%mm0, 96(%%ecx)\n\t"
-" movq %%mm4, 112(%%ecx)\n\t"
-" pfsub %%mm1, %%mm3\n\t"
-" pfsubr %%mm5, %%mm7\n\t"
-" pfmul %%mm2, %%mm3\n\t"
-" pfmul %%mm2, %%mm7\n\t"
-" pswapd %%mm3, %%mm3\n\t"
-" pswapd %%mm7, %%mm7\n\t"
-" movq %%mm3, 104(%%ecx)\n\t"
-" movq %%mm7, 120(%%ecx)\n\t"
+" movq 112(%%ebx), %%mm2\n\t"
+
+" movq (%%edx), %%mm0\n\t"
+" movq 16(%%edx), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" pswapd 8(%%edx), %%mm1\n\t"
+" pswapd 24(%%edx), %%mm5\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, (%%ecx)\n\t"
+" movq %%mm4, 16(%%ecx)\n\t"
+" pfsub %%mm1, %%mm3\n\t"
+" pfsubr %%mm5, %%mm7\n\t"
+" pfmul %%mm2, %%mm3\n\t"
+" pfmul %%mm2, %%mm7\n\t"
+" pswapd %%mm3, %%mm3\n\t"
+" pswapd %%mm7, %%mm7\n\t"
+" movq %%mm3, 8(%%ecx)\n\t"
+" movq %%mm7, 24(%%ecx)\n\t"
+
+" movq 32(%%edx), %%mm0\n\t"
+" movq 48(%%edx), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" pswapd 40(%%edx), %%mm1\n\t"
+" pswapd 56(%%edx), %%mm5\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, 32(%%ecx)\n\t"
+" movq %%mm4, 48(%%ecx)\n\t"
+" pfsub %%mm1, %%mm3\n\t"
+" pfsubr %%mm5, %%mm7\n\t"
+" pfmul %%mm2, %%mm3\n\t"
+" pfmul %%mm2, %%mm7\n\t"
+" pswapd %%mm3, %%mm3\n\t"
+" pswapd %%mm7, %%mm7\n\t"
+" movq %%mm3, 40(%%ecx)\n\t"
+" movq %%mm7, 56(%%ecx)\n\t"
+
+" movq 64(%%edx), %%mm0\n\t"
+" movq 80(%%edx), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" pswapd 72(%%edx), %%mm1\n\t"
+" pswapd 88(%%edx), %%mm5\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, 64(%%ecx)\n\t"
+" movq %%mm4, 80(%%ecx)\n\t"
+" pfsub %%mm1, %%mm3\n\t"
+" pfsubr %%mm5, %%mm7\n\t"
+" pfmul %%mm2, %%mm3\n\t"
+" pfmul %%mm2, %%mm7\n\t"
+" pswapd %%mm3, %%mm3\n\t"
+" pswapd %%mm7, %%mm7\n\t"
+" movq %%mm3, 72(%%ecx)\n\t"
+" movq %%mm7, 88(%%ecx)\n\t"
+
+" movq 96(%%edx), %%mm0\n\t"
+" movq 112(%%edx), %%mm4\n\t"
+" movq %%mm0, %%mm3\n\t"
+" movq %%mm4, %%mm7\n\t"
+" pswapd 104(%%edx), %%mm1\n\t"
+" pswapd 120(%%edx), %%mm5\n\t"
+" pfadd %%mm1, %%mm0\n\t"
+" pfadd %%mm5, %%mm4\n\t"
+" movq %%mm0, 96(%%ecx)\n\t"
+" movq %%mm4, 112(%%ecx)\n\t"
+" pfsub %%mm1, %%mm3\n\t"
+" pfsubr %%mm5, %%mm7\n\t"
+" pfmul %%mm2, %%mm3\n\t"
+" pfmul %%mm2, %%mm7\n\t"
+" pswapd %%mm3, %%mm3\n\t"
+" pswapd %%mm7, %%mm7\n\t"
+" movq %%mm3, 104(%%ecx)\n\t"
+" movq %%mm7, 120(%%ecx)\n\t"
/* Phase 6. This is the end of easy road. */
/* Code below is coded in scalar mode. Should be optimized */
-" movd "MANGLE(plus_1f)", %%mm6\n\t"
-" punpckldq 120(%%ebx), %%mm6\n\t" /* mm6 = 1.0 | 120(%%ebx)*/
-" movq "MANGLE(x_plus_minus_3dnow)", %%mm7\n\t" /* mm7 = +1 | -1 */
-
-" movq 32(%%ecx), %%mm0\n\t"
-" movq 64(%%ecx), %%mm2\n\t"
-" movq %%mm0, %%mm1\n\t"
-" movq %%mm2, %%mm3\n\t"
-" pxor %%mm7, %%mm1\n\t"
-" pxor %%mm7, %%mm3\n\t"
-" pfacc %%mm1, %%mm0\n\t"
-" pfacc %%mm3, %%mm2\n\t"
-" pfmul %%mm6, %%mm0\n\t"
-" pfmul %%mm6, %%mm2\n\t"
-" movq %%mm0, 32(%%edx)\n\t"
-" movq %%mm2, 64(%%edx)\n\t"
-
-" movd 44(%%ecx), %%mm0\n\t"
-" movd 40(%%ecx), %%mm2\n\t"
-" movd 120(%%ebx), %%mm3\n\t"
-" punpckldq 76(%%ecx), %%mm0\n\t"
-" punpckldq 72(%%ecx), %%mm2\n\t"
-" punpckldq %%mm3, %%mm3\n\t"
-" movq %%mm0, %%mm4\n\t"
-" movq %%mm2, %%mm5\n\t"
-" pfsub %%mm2, %%mm0\n\t"
-" pfmul %%mm3, %%mm0\n\t"
-" movq %%mm0, %%mm1\n\t"
-" pfadd %%mm5, %%mm0\n\t"
-" pfadd %%mm4, %%mm0\n\t"
-" movq %%mm0, %%mm2\n\t"
-" punpckldq %%mm1, %%mm0\n\t"
-" punpckhdq %%mm1, %%mm2\n\t"
-" movq %%mm0, 40(%%edx)\n\t"
-" movq %%mm2, 72(%%edx)\n\t"
-
-" movd 48(%%ecx), %%mm3\n\t"
-" movd 60(%%ecx), %%mm2\n\t"
-" pfsub 52(%%ecx), %%mm3\n\t"
-" pfsub 56(%%ecx), %%mm2\n\t"
-" pfmul 120(%%ebx), %%mm3\n\t"
-" pfmul 120(%%ebx), %%mm2\n\t"
-" movq %%mm2, %%mm1\n\t"
-
-" pfadd 56(%%ecx), %%mm1\n\t"
-" pfadd 60(%%ecx), %%mm1\n\t"
-" movq %%mm1, %%mm0\n\t"
-
-" pfadd 48(%%ecx), %%mm0\n\t"
-" pfadd 52(%%ecx), %%mm0\n\t"
-" pfadd %%mm3, %%mm1\n\t"
-" punpckldq %%mm2, %%mm1\n\t"
-" pfadd %%mm3, %%mm2\n\t"
-" punpckldq %%mm2, %%mm0\n\t"
-" movq %%mm1, 56(%%edx)\n\t"
-" movq %%mm0, 48(%%edx)\n\t"
+" movd "MANGLE(plus_1f)", %%mm6\n\t"
+" punpckldq 120(%%ebx), %%mm6\n\t" /* mm6 = 1.0 | 120(%%ebx)*/
+" movq "MANGLE(x_plus_minus_3dnow)", %%mm7\n\t" /* mm7 = +1 | -1 */
+
+" movq 32(%%ecx), %%mm0\n\t"
+" movq 64(%%ecx), %%mm2\n\t"
+" movq %%mm0, %%mm1\n\t"
+" movq %%mm2, %%mm3\n\t"
+" pxor %%mm7, %%mm1\n\t"
+" pxor %%mm7, %%mm3\n\t"
+" pfacc %%mm1, %%mm0\n\t"
+" pfacc %%mm3, %%mm2\n\t"
+" pfmul %%mm6, %%mm0\n\t"
+" pfmul %%mm6, %%mm2\n\t"
+" movq %%mm0, 32(%%edx)\n\t"
+" movq %%mm2, 64(%%edx)\n\t"
+
+" movd 44(%%ecx), %%mm0\n\t"
+" movd 40(%%ecx), %%mm2\n\t"
+" movd 120(%%ebx), %%mm3\n\t"
+" punpckldq 76(%%ecx), %%mm0\n\t"
+" punpckldq 72(%%ecx), %%mm2\n\t"
+" punpckldq %%mm3, %%mm3\n\t"
+" movq %%mm0, %%mm4\n\t"
+" movq %%mm2, %%mm5\n\t"
+" pfsub %%mm2, %%mm0\n\t"
+" pfmul %%mm3, %%mm0\n\t"
+" movq %%mm0, %%mm1\n\t"
+" pfadd %%mm5, %%mm0\n\t"
+" pfadd %%mm4, %%mm0\n\t"
+" movq %%mm0, %%mm2\n\t"
+" punpckldq %%mm1, %%mm0\n\t"
+" punpckhdq %%mm1, %%mm2\n\t"
+" movq %%mm0, 40(%%edx)\n\t"
+" movq %%mm2, 72(%%edx)\n\t"
+
+" movd 48(%%ecx), %%mm3\n\t"
+" movd 60(%%ecx), %%mm2\n\t"
+" pfsub 52(%%ecx), %%mm3\n\t"
+" pfsub 56(%%ecx), %%mm2\n\t"
+" pfmul 120(%%ebx), %%mm3\n\t"
+" pfmul 120(%%ebx), %%mm2\n\t"
+" movq %%mm2, %%mm1\n\t"
+
+" pfadd 56(%%ecx), %%mm1\n\t"
+" pfadd 60(%%ecx), %%mm1\n\t"
+" movq %%mm1, %%mm0\n\t"
+
+" pfadd 48(%%ecx), %%mm0\n\t"
+" pfadd 52(%%ecx), %%mm0\n\t"
+" pfadd %%mm3, %%mm1\n\t"
+" punpckldq %%mm2, %%mm1\n\t"
+" pfadd %%mm3, %%mm2\n\t"
+" punpckldq %%mm2, %%mm0\n\t"
+" movq %%mm1, 56(%%edx)\n\t"
+" movq %%mm0, 48(%%edx)\n\t"
/*---*/
-" movd 92(%%ecx), %%mm1\n\t"
-" pfsub 88(%%ecx), %%mm1\n\t"
-" pfmul 120(%%ebx), %%mm1\n\t"
-" movd %%mm1, 92(%%edx)\n\t"
-" pfadd 92(%%ecx), %%mm1\n\t"
-" pfadd 88(%%ecx), %%mm1\n\t"
-" movq %%mm1, %%mm0\n\t"
-
-" pfadd 80(%%ecx), %%mm0\n\t"
-" pfadd 84(%%ecx), %%mm0\n\t"
-" movd %%mm0, 80(%%edx)\n\t"
-
-" movd 80(%%ecx), %%mm0\n\t"
-" pfsub 84(%%ecx), %%mm0\n\t"
-" pfmul 120(%%ebx), %%mm0\n\t"
-" pfadd %%mm0, %%mm1\n\t"
-" pfadd 92(%%edx), %%mm0\n\t"
-" punpckldq %%mm1, %%mm0\n\t"
-" movq %%mm0, 84(%%edx)\n\t"
-
-" movq 96(%%ecx), %%mm0\n\t"
-" movq %%mm0, %%mm1\n\t"
-" pxor %%mm7, %%mm1\n\t"
-" pfacc %%mm1, %%mm0\n\t"
-" pfmul %%mm6, %%mm0\n\t"
-" movq %%mm0, 96(%%edx)\n\t"
-
-" movd 108(%%ecx), %%mm0\n\t"
-" pfsub 104(%%ecx), %%mm0\n\t"
-" pfmul 120(%%ebx), %%mm0\n\t"
-" movd %%mm0, 108(%%edx)\n\t"
-" pfadd 104(%%ecx), %%mm0\n\t"
-" pfadd 108(%%ecx), %%mm0\n\t"
-" movd %%mm0, 104(%%edx)\n\t"
-
-" movd 124(%%ecx), %%mm1\n\t"
-" pfsub 120(%%ecx), %%mm1\n\t"
-" pfmul 120(%%ebx), %%mm1\n\t"
-" movd %%mm1, 124(%%edx)\n\t"
-" pfadd 120(%%ecx), %%mm1\n\t"
-" pfadd 124(%%ecx), %%mm1\n\t"
-" movq %%mm1, %%mm0\n\t"
-
-" pfadd 112(%%ecx), %%mm0\n\t"
-" pfadd 116(%%ecx), %%mm0\n\t"
-" movd %%mm0, 112(%%edx)\n\t"
-
-" movd 112(%%ecx), %%mm0\n\t"
-" pfsub 116(%%ecx), %%mm0\n\t"
-" pfmul 120(%%ebx), %%mm0\n\t"
-" pfadd %%mm0,%%mm1\n\t"
-" pfadd 124(%%edx), %%mm0\n\t"
-" punpckldq %%mm1, %%mm0\n\t"
-" movq %%mm0, 116(%%edx)\n\t"
+" movd 92(%%ecx), %%mm1\n\t"
+" pfsub 88(%%ecx), %%mm1\n\t"
+" pfmul 120(%%ebx), %%mm1\n\t"
+" movd %%mm1, 92(%%edx)\n\t"
+" pfadd 92(%%ecx), %%mm1\n\t"
+" pfadd 88(%%ecx), %%mm1\n\t"
+" movq %%mm1, %%mm0\n\t"
+
+" pfadd 80(%%ecx), %%mm0\n\t"
+" pfadd 84(%%ecx), %%mm0\n\t"
+" movd %%mm0, 80(%%edx)\n\t"
+
+" movd 80(%%ecx), %%mm0\n\t"
+" pfsub 84(%%ecx), %%mm0\n\t"
+" pfmul 120(%%ebx), %%mm0\n\t"
+" pfadd %%mm0, %%mm1\n\t"
+" pfadd 92(%%edx), %%mm0\n\t"
+" punpckldq %%mm1, %%mm0\n\t"
+" movq %%mm0, 84(%%edx)\n\t"
+
+" movq 96(%%ecx), %%mm0\n\t"
+" movq %%mm0, %%mm1\n\t"
+" pxor %%mm7, %%mm1\n\t"
+" pfacc %%mm1, %%mm0\n\t"
+" pfmul %%mm6, %%mm0\n\t"
+" movq %%mm0, 96(%%edx)\n\t"
+
+" movd 108(%%ecx), %%mm0\n\t"
+" pfsub 104(%%ecx), %%mm0\n\t"
+" pfmul 120(%%ebx), %%mm0\n\t"
+" movd %%mm0, 108(%%edx)\n\t"
+" pfadd 104(%%ecx), %%mm0\n\t"
+" pfadd 108(%%ecx), %%mm0\n\t"
+" movd %%mm0, 104(%%edx)\n\t"
+
+" movd 124(%%ecx), %%mm1\n\t"
+" pfsub 120(%%ecx), %%mm1\n\t"
+" pfmul 120(%%ebx), %%mm1\n\t"
+" movd %%mm1, 124(%%edx)\n\t"
+" pfadd 120(%%ecx), %%mm1\n\t"
+" pfadd 124(%%ecx), %%mm1\n\t"
+" movq %%mm1, %%mm0\n\t"
+
+" pfadd 112(%%ecx), %%mm0\n\t"
+" pfadd 116(%%ecx), %%mm0\n\t"
+" movd %%mm0, 112(%%edx)\n\t"
+
+" movd 112(%%ecx), %%mm0\n\t"
+" pfsub 116(%%ecx), %%mm0\n\t"
+" pfmul 120(%%ebx), %%mm0\n\t"
+" pfadd %%mm0,%%mm1\n\t"
+" pfadd 124(%%edx), %%mm0\n\t"
+" punpckldq %%mm1, %%mm0\n\t"
+" movq %%mm0, 116(%%edx)\n\t"
// this code is broken, there is nothing modifying the z flag above.
#if 0
-" jnz .L01\n\t"
+" jnz .L01\n\t"
/* Phase 7*/
/* Code below is coded in scalar mode. Should be optimized */
-" movd (%%ecx), %%mm0\n\t"
-" pfadd 4(%%ecx), %%mm0\n\t"
-" movd %%mm0, 1024(%%esi)\n\t"
-
-" movd (%%ecx), %%mm0\n\t"
-" pfsub 4(%%ecx), %%mm0\n\t"
-" pfmul 120(%%ebx), %%mm0\n\t"
-" movd %%mm0, (%%esi)\n\t"
-" movd %%mm0, (%%edi)\n\t"
-
-" movd 12(%%ecx), %%mm0\n\t"
-" pfsub 8(%%ecx), %%mm0\n\t"
-" pfmul 120(%%ebx), %%mm0\n\t"
-" movd %%mm0, 512(%%edi)\n\t"
-" pfadd 12(%%ecx), %%mm0\n\t"
-" pfadd 8(%%ecx), %%mm0\n\t"
-" movd %%mm0, 512(%%esi)\n\t"
-
-" movd 16(%%ecx), %%mm0\n\t"
-" pfsub 20(%%ecx), %%mm0\n\t"
-" pfmul 120(%%ebx), %%mm0\n\t"
-" movq %%mm0, %%mm3\n\t"
-
-" movd 28(%%ecx), %%mm0\n\t"
-" pfsub 24(%%ecx), %%mm0\n\t"
-" pfmul 120(%%ebx), %%mm0\n\t"
-" movd %%mm0, 768(%%edi)\n\t"
-" movq %%mm0, %%mm2\n\t"
-
-" pfadd 24(%%ecx), %%mm0\n\t"
-" pfadd 28(%%ecx), %%mm0\n\t"
-" movq %%mm0, %%mm1\n\t"
-
-" pfadd 16(%%ecx), %%mm0\n\t"
-" pfadd 20(%%ecx), %%mm0\n\t"
-" movd %%mm0, 768(%%esi)\n\t"
-" pfadd %%mm3, %%mm1\n\t"
-" movd %%mm1, 256(%%esi)\n\t"
-" pfadd %%mm3, %%mm2\n\t"
-" movd %%mm2, 256(%%edi)\n\t"
+" movd (%%ecx), %%mm0\n\t"
+" pfadd 4(%%ecx), %%mm0\n\t"
+" movd %%mm0, 1024(%%esi)\n\t"
+
+" movd (%%ecx), %%mm0\n\t"
+" pfsub 4(%%ecx), %%mm0\n\t"
+" pfmul 120(%%ebx), %%mm0\n\t"
+" movd %%mm0, (%%esi)\n\t"
+" movd %%mm0, (%%edi)\n\t"
+
+" movd 12(%%ecx), %%mm0\n\t"
+" pfsub 8(%%ecx), %%mm0\n\t"
+" pfmul 120(%%ebx), %%mm0\n\t"
+" movd %%mm0, 512(%%edi)\n\t"
+" pfadd 12(%%ecx), %%mm0\n\t"
+" pfadd 8(%%ecx), %%mm0\n\t"
+" movd %%mm0, 512(%%esi)\n\t"
+
+" movd 16(%%ecx), %%mm0\n\t"
+" pfsub 20(%%ecx), %%mm0\n\t"
+" pfmul 120(%%ebx), %%mm0\n\t"
+" movq %%mm0, %%mm3\n\t"
+
+" movd 28(%%ecx), %%mm0\n\t"
+" pfsub 24(%%ecx), %%mm0\n\t"
+" pfmul 120(%%ebx), %%mm0\n\t"
+" movd %%mm0, 768(%%edi)\n\t"
+" movq %%mm0, %%mm2\n\t"
+
+" pfadd 24(%%ecx), %%mm0\n\t"
+" pfadd 28(%%ecx), %%mm0\n\t"
+" movq %%mm0, %%mm1\n\t"
+
+" pfadd 16(%%ecx), %%mm0\n\t"
+" pfadd 20(%%ecx), %%mm0\n\t"
+" movd %%mm0, 768(%%esi)\n\t"
+" pfadd %%mm3, %%mm1\n\t"
+" movd %%mm1, 256(%%esi)\n\t"
+" pfadd %%mm3, %%mm2\n\t"
+" movd %%mm2, 256(%%edi)\n\t"
/* Phase 8*/
-" movq 32(%%edx), %%mm0\n\t"
-" movq 48(%%edx), %%mm1\n\t"
-" pfadd 48(%%edx), %%mm0\n\t"
-" pfadd 40(%%edx), %%mm1\n\t"
-" movd %%mm0, 896(%%esi)\n\t"
-" movd %%mm1, 640(%%esi)\n\t"
-" psrlq $32, %%mm0\n\t"
-" psrlq $32, %%mm1\n\t"
-" movd %%mm0, 128(%%edi)\n\t"
-" movd %%mm1, 384(%%edi)\n\t"
-
-" movd 40(%%edx), %%mm0\n\t"
-" pfadd 56(%%edx), %%mm0\n\t"
-" movd %%mm0, 384(%%esi)\n\t"
-
-" movd 56(%%edx), %%mm0\n\t"
-" pfadd 36(%%edx), %%mm0\n\t"
-" movd %%mm0, 128(%%esi)\n\t"
-
-" movd 60(%%edx), %%mm0\n\t"
-" movd %%mm0, 896(%%edi)\n\t"
-" pfadd 44(%%edx), %%mm0\n\t"
-" movd %%mm0, 640(%%edi)\n\t"
-
-" movq 96(%%edx), %%mm0\n\t"
-" movq 112(%%edx), %%mm2\n\t"
-" movq 104(%%edx), %%mm4\n\t"
-" pfadd 112(%%edx), %%mm0\n\t"
-" pfadd 104(%%edx), %%mm2\n\t"
-" pfadd 120(%%edx), %%mm4\n\t"
-" movq %%mm0, %%mm1\n\t"
-" movq %%mm2, %%mm3\n\t"
-" movq %%mm4, %%mm5\n\t"
-" pfadd 64(%%edx), %%mm0\n\t"
-" pfadd 80(%%edx), %%mm2\n\t"
-" pfadd 72(%%edx), %%mm4\n\t"
-" movd %%mm0, 960(%%esi)\n\t"
-" movd %%mm2, 704(%%esi)\n\t"
-" movd %%mm4, 448(%%esi)\n\t"
-" psrlq $32, %%mm0\n\t"
-" psrlq $32, %%mm2\n\t"
-" psrlq $32, %%mm4\n\t"
-" movd %%mm0, 64(%%edi)\n\t"
-" movd %%mm2, 320(%%edi)\n\t"
-" movd %%mm4, 576(%%edi)\n\t"
-" pfadd 80(%%edx), %%mm1\n\t"
-" pfadd 72(%%edx), %%mm3\n\t"
-" pfadd 88(%%edx), %%mm5\n\t"
-" movd %%mm1, 832(%%esi)\n\t"
-" movd %%mm3, 576(%%esi)\n\t"
-" movd %%mm5, 320(%%esi)\n\t"
-" psrlq $32, %%mm1\n\t"
-" psrlq $32, %%mm3\n\t"
-" psrlq $32, %%mm5\n\t"
-" movd %%mm1, 192(%%edi)\n\t"
-" movd %%mm3, 448(%%edi)\n\t"
-" movd %%mm5, 704(%%edi)\n\t"
-
-" movd 120(%%edx), %%mm0\n\t"
-" pfadd 100(%%edx), %%mm0\n\t"
-" movq %%mm0, %%mm1\n\t"
-" pfadd 88(%%edx), %%mm0\n\t"
-" movd %%mm0, 192(%%esi)\n\t"
-" pfadd 68(%%edx), %%mm1\n\t"
-" movd %%mm1, 64(%%esi)\n\t"
-
-" movd 124(%%edx), %%mm0\n\t"
-" movd %%mm0, 960(%%edi)\n\t"
-" pfadd 92(%%edx), %%mm0\n\t"
-" movd %%mm0, 832(%%edi)\n\t"
-
-" jmp .L_bye\n\t"
-".L01: \n\t"
+" movq 32(%%edx), %%mm0\n\t"
+" movq 48(%%edx), %%mm1\n\t"
+" pfadd 48(%%edx), %%mm0\n\t"
+" pfadd 40(%%edx), %%mm1\n\t"
+" movd %%mm0, 896(%%esi)\n\t"
+" movd %%mm1, 640(%%esi)\n\t"
+" psrlq $32, %%mm0\n\t"
+" psrlq $32, %%mm1\n\t"
+" movd %%mm0, 128(%%edi)\n\t"
+" movd %%mm1, 384(%%edi)\n\t"
+
+" movd 40(%%edx), %%mm0\n\t"
+" pfadd 56(%%edx), %%mm0\n\t"
+" movd %%mm0, 384(%%esi)\n\t"
+
+" movd 56(%%edx), %%mm0\n\t"
+" pfadd 36(%%edx), %%mm0\n\t"
+" movd %%mm0, 128(%%esi)\n\t"
+
+" movd 60(%%edx), %%mm0\n\t"
+" movd %%mm0, 896(%%edi)\n\t"
+" pfadd 44(%%edx), %%mm0\n\t"
+" movd %%mm0, 640(%%edi)\n\t"
+
+" movq 96(%%edx), %%mm0\n\t"
+" movq 112(%%edx), %%mm2\n\t"
+" movq 104(%%edx), %%mm4\n\t"
+" pfadd 112(%%edx), %%mm0\n\t"
+" pfadd 104(%%edx), %%mm2\n\t"
+" pfadd 120(%%edx), %%mm4\n\t"
+" movq %%mm0, %%mm1\n\t"
+" movq %%mm2, %%mm3\n\t"
+" movq %%mm4, %%mm5\n\t"
+" pfadd 64(%%edx), %%mm0\n\t"
+" pfadd 80(%%edx), %%mm2\n\t"
+" pfadd 72(%%edx), %%mm4\n\t"
+" movd %%mm0, 960(%%esi)\n\t"
+" movd %%mm2, 704(%%esi)\n\t"
+" movd %%mm4, 448(%%esi)\n\t"
+" psrlq $32, %%mm0\n\t"
+" psrlq $32, %%mm2\n\t"
+" psrlq $32, %%mm4\n\t"
+" movd %%mm0, 64(%%edi)\n\t"
+" movd %%mm2, 320(%%edi)\n\t"
+" movd %%mm4, 576(%%edi)\n\t"
+" pfadd 80(%%edx), %%mm1\n\t"
+" pfadd 72(%%edx), %%mm3\n\t"
+" pfadd 88(%%edx), %%mm5\n\t"
+" movd %%mm1, 832(%%esi)\n\t"
+" movd %%mm3, 576(%%esi)\n\t"
+" movd %%mm5, 320(%%esi)\n\t"
+" psrlq $32, %%mm1\n\t"
+" psrlq $32, %%mm3\n\t"
+" psrlq $32, %%mm5\n\t"
+" movd %%mm1, 192(%%edi)\n\t"
+" movd %%mm3, 448(%%edi)\n\t"
+" movd %%mm5, 704(%%edi)\n\t"
+
+" movd 120(%%edx), %%mm0\n\t"
+" pfadd 100(%%edx), %%mm0\n\t"
+" movq %%mm0, %%mm1\n\t"
+" pfadd 88(%%edx), %%mm0\n\t"
+" movd %%mm0, 192(%%esi)\n\t"
+" pfadd 68(%%edx), %%mm1\n\t"
+" movd %%mm1, 64(%%esi)\n\t"
+
+" movd 124(%%edx), %%mm0\n\t"
+" movd %%mm0, 960(%%edi)\n\t"
+" pfadd 92(%%edx), %%mm0\n\t"
+" movd %%mm0, 832(%%edi)\n\t"
+
+" jmp .L_bye\n\t"
+".L01: \n\t"
#endif
/* Phase 9*/
-" movq (%%ecx), %%mm0\n\t"
-" movq %%mm0, %%mm1\n\t"
-" pxor %%mm7, %%mm1\n\t"
-" pfacc %%mm1, %%mm0\n\t"
-" pfmul %%mm6, %%mm0\n\t"
-" pf2iw %%mm0, %%mm0\n\t"
-" movd %%mm0, %%eax\n\t"
-" movw %%ax, 512(%%esi)\n\t"
-" psrlq $32, %%mm0\n\t"
-" movd %%mm0, %%eax\n\t"
-" movw %%ax, (%%esi)\n\t"
-
-" movd 12(%%ecx), %%mm0\n\t"
-" pfsub 8(%%ecx), %%mm0\n\t"
-" pfmul 120(%%ebx), %%mm0\n\t"
-" pf2iw %%mm0, %%mm7\n\t"
-" movd %%mm7, %%eax\n\t"
-" movw %%ax, 256(%%edi)\n\t"
-" pfadd 12(%%ecx), %%mm0\n\t"
-" pfadd 8(%%ecx), %%mm0\n\t"
-" pf2iw %%mm0, %%mm0\n\t"
-" movd %%mm0, %%eax\n\t"
-" movw %%ax, 256(%%esi)\n\t"
-
-" movd 16(%%ecx), %%mm3\n\t"
-" pfsub 20(%%ecx), %%mm3\n\t"
-" pfmul 120(%%ebx), %%mm3\n\t"
-" movq %%mm3, %%mm2\n\t"
-
-" movd 28(%%ecx), %%mm2\n\t"
-" pfsub 24(%%ecx), %%mm2\n\t"
-" pfmul 120(%%ebx), %%mm2\n\t"
-" movq %%mm2, %%mm1\n\t"
-
-" pf2iw %%mm2, %%mm7\n\t"
-" movd %%mm7, %%eax\n\t"
-" movw %%ax, 384(%%edi)\n\t"
-
-" pfadd 24(%%ecx), %%mm1\n\t"
-" pfadd 28(%%ecx), %%mm1\n\t"
-" movq %%mm1, %%mm0\n\t"
-
-" pfadd 16(%%ecx), %%mm0\n\t"
-" pfadd 20(%%ecx), %%mm0\n\t"
-" pf2iw %%mm0, %%mm0\n\t"
-" movd %%mm0, %%eax\n\t"
-" movw %%ax, 384(%%esi)\n\t"
-" pfadd %%mm3, %%mm1\n\t"
-" pf2iw %%mm1, %%mm1\n\t"
-" movd %%mm1, %%eax\n\t"
-" movw %%ax, 128(%%esi)\n\t"
-" pfadd %%mm3, %%mm2\n\t"
-" pf2iw %%mm2, %%mm2\n\t"
-" movd %%mm2, %%eax\n\t"
-" movw %%ax, 128(%%edi)\n\t"
+" movq (%%ecx), %%mm0\n\t"
+" movq %%mm0, %%mm1\n\t"
+" pxor %%mm7, %%mm1\n\t"
+" pfacc %%mm1, %%mm0\n\t"
+" pfmul %%mm6, %%mm0\n\t"
+" pf2iw %%mm0, %%mm0\n\t"
+" movd %%mm0, %%eax\n\t"
+" movw %%ax, 512(%%esi)\n\t"
+" psrlq $32, %%mm0\n\t"
+" movd %%mm0, %%eax\n\t"
+" movw %%ax, (%%esi)\n\t"
+
+" movd 12(%%ecx), %%mm0\n\t"
+" pfsub 8(%%ecx), %%mm0\n\t"
+" pfmul 120(%%ebx), %%mm0\n\t"
+" pf2iw %%mm0, %%mm7\n\t"
+" movd %%mm7, %%eax\n\t"
+" movw %%ax, 256(%%edi)\n\t"
+" pfadd 12(%%ecx), %%mm0\n\t"
+" pfadd 8(%%ecx), %%mm0\n\t"
+" pf2iw %%mm0, %%mm0\n\t"
+" movd %%mm0, %%eax\n\t"
+" movw %%ax, 256(%%esi)\n\t"
+
+" movd 16(%%ecx), %%mm3\n\t"
+" pfsub 20(%%ecx), %%mm3\n\t"
+" pfmul 120(%%ebx), %%mm3\n\t"
+" movq %%mm3, %%mm2\n\t"
+
+" movd 28(%%ecx), %%mm2\n\t"
+" pfsub 24(%%ecx), %%mm2\n\t"
+" pfmul 120(%%ebx), %%mm2\n\t"
+" movq %%mm2, %%mm1\n\t"
+
+" pf2iw %%mm2, %%mm7\n\t"
+" movd %%mm7, %%eax\n\t"
+" movw %%ax, 384(%%edi)\n\t"
+
+" pfadd 24(%%ecx), %%mm1\n\t"
+" pfadd 28(%%ecx), %%mm1\n\t"
+" movq %%mm1, %%mm0\n\t"
+
+" pfadd 16(%%ecx), %%mm0\n\t"
+" pfadd 20(%%ecx), %%mm0\n\t"
+" pf2iw %%mm0, %%mm0\n\t"
+" movd %%mm0, %%eax\n\t"
+" movw %%ax, 384(%%esi)\n\t"
+" pfadd %%mm3, %%mm1\n\t"
+" pf2iw %%mm1, %%mm1\n\t"
+" movd %%mm1, %%eax\n\t"
+" movw %%ax, 128(%%esi)\n\t"
+" pfadd %%mm3, %%mm2\n\t"
+" pf2iw %%mm2, %%mm2\n\t"
+" movd %%mm2, %%eax\n\t"
+" movw %%ax, 128(%%edi)\n\t"
/* Phase 10*/
-" movq 32(%%edx), %%mm0\n\t"
-" movq 48(%%edx), %%mm1\n\t"
-" pfadd 48(%%edx), %%mm0\n\t"
-" pfadd 40(%%edx), %%mm1\n\t"
-" pf2iw %%mm0, %%mm0\n\t"
-" pf2iw %%mm1, %%mm1\n\t"
-" movd %%mm0, %%eax\n\t"
-" movd %%mm1, %%ecx\n\t"
-" movw %%ax, 448(%%esi)\n\t"
-" movw %%cx, 320(%%esi)\n\t"
-" psrlq $32, %%mm0\n\t"
-" psrlq $32, %%mm1\n\t"
-" movd %%mm0, %%eax\n\t"
-" movd %%mm1, %%ecx\n\t"
-" movw %%ax, 64(%%edi)\n\t"
-" movw %%cx, 192(%%edi)\n\t"
-
-" movd 40(%%edx), %%mm3\n\t"
-" movd 56(%%edx), %%mm4\n\t"
-" movd 60(%%edx), %%mm0\n\t"
-" movd 44(%%edx), %%mm2\n\t"
-" movd 120(%%edx), %%mm5\n\t"
-" punpckldq %%mm4, %%mm3\n\t"
-" punpckldq 124(%%edx), %%mm0\n\t"
-" pfadd 100(%%edx), %%mm5\n\t"
-" punpckldq 36(%%edx), %%mm4\n\t"
-" punpckldq 92(%%edx), %%mm2\n\t"
-" movq %%mm5, %%mm6\n\t"
-" pfadd %%mm4, %%mm3\n\t"
-" pf2iw %%mm0, %%mm1\n\t"
-" pf2iw %%mm3, %%mm3\n\t"
-" pfadd 88(%%edx), %%mm5\n\t"
-" movd %%mm1, %%eax\n\t"
-" movd %%mm3, %%ecx\n\t"
-" movw %%ax, 448(%%edi)\n\t"
-" movw %%cx, 192(%%esi)\n\t"
-" pf2iw %%mm5, %%mm5\n\t"
-" psrlq $32, %%mm1\n\t"
+" movq 32(%%edx), %%mm0\n\t"
+" movq 48(%%edx), %%mm1\n\t"
+" pfadd 48(%%edx), %%mm0\n\t"
+" pfadd 40(%%edx), %%mm1\n\t"
+" pf2iw %%mm0, %%mm0\n\t"
+" pf2iw %%mm1, %%mm1\n\t"
+" movd %%mm0, %%eax\n\t"
+" movd %%mm1, %%ecx\n\t"
+" movw %%ax, 448(%%esi)\n\t"
+" movw %%cx, 320(%%esi)\n\t"
+" psrlq $32, %%mm0\n\t"
+" psrlq $32, %%mm1\n\t"
+" movd %%mm0, %%eax\n\t"
+" movd %%mm1, %%ecx\n\t"
+" movw %%ax, 64(%%edi)\n\t"
+" movw %%cx, 192(%%edi)\n\t"
+
+" movd 40(%%edx), %%mm3\n\t"
+" movd 56(%%edx), %%mm4\n\t"
+" movd 60(%%edx), %%mm0\n\t"
+" movd 44(%%edx), %%mm2\n\t"
+" movd 120(%%edx), %%mm5\n\t"
+" punpckldq %%mm4, %%mm3\n\t"
+" punpckldq 124(%%edx), %%mm0\n\t"
+" pfadd 100(%%edx), %%mm5\n\t"
+" punpckldq 36(%%edx), %%mm4\n\t"
+" punpckldq 92(%%edx), %%mm2\n\t"
+" movq %%mm5, %%mm6\n\t"
+" pfadd %%mm4, %%mm3\n\t"
+" pf2iw %%mm0, %%mm1\n\t"
+" pf2iw %%mm3, %%mm3\n\t"
+" pfadd 88(%%edx), %%mm5\n\t"
+" movd %%mm1, %%eax\n\t"
+" movd %%mm3, %%ecx\n\t"
+" movw %%ax, 448(%%edi)\n\t"
+" movw %%cx, 192(%%esi)\n\t"
+" pf2iw %%mm5, %%mm5\n\t"
+" psrlq $32, %%mm1\n\t"
+" psrlq $32, %%mm3\n\t"
+" movd %%mm5, %%ebx\n\t"
+" movd %%mm1, %%eax\n\t"
+" movd %%mm3, %%ecx\n\t"
+" movw %%bx, 96(%%esi)\n\t"
+" movw %%ax, 480(%%edi)\n\t"
+" movw %%cx, 64(%%esi)\n\t"
+" pfadd %%mm2, %%mm0\n\t"
+" pf2iw %%mm0, %%mm0\n\t"
+" movd %%mm0, %%eax\n\t"
+" pfadd 68(%%edx), %%mm6\n\t"
+" movw %%ax, 320(%%edi)\n\t"
+" psrlq $32, %%mm0\n\t"
+" pf2iw %%mm6, %%mm6\n\t"
+" movd %%mm0, %%eax\n\t"
+" movd %%mm6, %%ebx\n\t"
+" movw %%ax, 416(%%edi)\n\t"
+" movw %%bx, 32(%%esi)\n\t"
+
+" movq 96(%%edx), %%mm0\n\t"
+" movq 112(%%edx), %%mm2\n\t"
+" movq 104(%%edx), %%mm4\n\t"
+" pfadd %%mm2, %%mm0\n\t"
+" pfadd %%mm4, %%mm2\n\t"
+" pfadd 120(%%edx), %%mm4\n\t"
+" movq %%mm0, %%mm1\n\t"
+" movq %%mm2, %%mm3\n\t"
+" movq %%mm4, %%mm5\n\t"
+" pfadd 64(%%edx), %%mm0\n\t"
+" pfadd 80(%%edx), %%mm2\n\t"
+" pfadd 72(%%edx), %%mm4\n\t"
+" pf2iw %%mm0, %%mm0\n\t"
+" pf2iw %%mm2, %%mm2\n\t"
+" pf2iw %%mm4, %%mm4\n\t"
+" movd %%mm0, %%eax\n\t"
+" movd %%mm2, %%ecx\n\t"
+" movd %%mm4, %%ebx\n\t"
+" movw %%ax, 480(%%esi)\n\t"
+" movw %%cx, 352(%%esi)\n\t"
+" movw %%bx, 224(%%esi)\n\t"
+" psrlq $32, %%mm0\n\t"
+" psrlq $32, %%mm2\n\t"
+" psrlq $32, %%mm4\n\t"
+" movd %%mm0, %%eax\n\t"
+" movd %%mm2, %%ecx\n\t"
+" movd %%mm4, %%ebx\n\t"
+" movw %%ax, 32(%%edi)\n\t"
+" movw %%cx, 160(%%edi)\n\t"
+" movw %%bx, 288(%%edi)\n\t"
+" pfadd 80(%%edx), %%mm1\n\t"
+" pfadd 72(%%edx), %%mm3\n\t"
+" pfadd 88(%%edx), %%mm5\n\t"
+" pf2iw %%mm1, %%mm1\n\t"
+" pf2iw %%mm3, %%mm3\n\t"
+" pf2iw %%mm5, %%mm5\n\t"
+" movd %%mm1, %%eax\n\t"
+" movd %%mm3, %%ecx\n\t"
+" movd %%mm5, %%ebx\n\t"
+" movw %%ax, 416(%%esi)\n\t"
+" movw %%cx, 288(%%esi)\n\t"
+" movw %%bx, 160(%%esi)\n\t"
+" psrlq $32, %%mm1\n\t"
" psrlq $32, %%mm3\n\t"
-" movd %%mm5, %%ebx\n\t"
-" movd %%mm1, %%eax\n\t"
-" movd %%mm3, %%ecx\n\t"
-" movw %%bx, 96(%%esi)\n\t"
-" movw %%ax, 480(%%edi)\n\t"
-" movw %%cx, 64(%%esi)\n\t"
-" pfadd %%mm2, %%mm0\n\t"
-" pf2iw %%mm0, %%mm0\n\t"
-" movd %%mm0, %%eax\n\t"
-" pfadd 68(%%edx), %%mm6\n\t"
-" movw %%ax, 320(%%edi)\n\t"
-" psrlq $32, %%mm0\n\t"
-" pf2iw %%mm6, %%mm6\n\t"
-" movd %%mm0, %%eax\n\t"
-" movd %%mm6, %%ebx\n\t"
-" movw %%ax, 416(%%edi)\n\t"
-" movw %%bx, 32(%%esi)\n\t"
-
-" movq 96(%%edx), %%mm0\n\t"
-" movq 112(%%edx), %%mm2\n\t"
-" movq 104(%%edx), %%mm4\n\t"
-" pfadd %%mm2, %%mm0\n\t"
-" pfadd %%mm4, %%mm2\n\t"
-" pfadd 120(%%edx), %%mm4\n\t"
-" movq %%mm0, %%mm1\n\t"
-" movq %%mm2, %%mm3\n\t"
-" movq %%mm4, %%mm5\n\t"
-" pfadd 64(%%edx), %%mm0\n\t"
-" pfadd 80(%%edx), %%mm2\n\t"
-" pfadd 72(%%edx), %%mm4\n\t"
-" pf2iw %%mm0, %%mm0\n\t"
-" pf2iw %%mm2, %%mm2\n\t"
-" pf2iw %%mm4, %%mm4\n\t"
-" movd %%mm0, %%eax\n\t"
-" movd %%mm2, %%ecx\n\t"
-" movd %%mm4, %%ebx\n\t"
-" movw %%ax, 480(%%esi)\n\t"
-" movw %%cx, 352(%%esi)\n\t"
-" movw %%bx, 224(%%esi)\n\t"
-" psrlq $32, %%mm0\n\t"
-" psrlq $32, %%mm2\n\t"
-" psrlq $32, %%mm4\n\t"
-" movd %%mm0, %%eax\n\t"
-" movd %%mm2, %%ecx\n\t"
-" movd %%mm4, %%ebx\n\t"
-" movw %%ax, 32(%%edi)\n\t"
-" movw %%cx, 160(%%edi)\n\t"
-" movw %%bx, 288(%%edi)\n\t"
-" pfadd 80(%%edx), %%mm1\n\t"
-" pfadd 72(%%edx), %%mm3\n\t"
-" pfadd 88(%%edx), %%mm5\n\t"
-" pf2iw %%mm1, %%mm1\n\t"
-" pf2iw %%mm3, %%mm3\n\t"
-" pf2iw %%mm5, %%mm5\n\t"
-" movd %%mm1, %%eax\n\t"
-" movd %%mm3, %%ecx\n\t"
-" movd %%mm5, %%ebx\n\t"
-" movw %%ax, 416(%%esi)\n\t"
-" movw %%cx, 288(%%esi)\n\t"
-" movw %%bx, 160(%%esi)\n\t"
-" psrlq $32, %%mm1\n\t"
-" psrlq $32, %%mm3\n\t"
-" psrlq $32, %%mm5\n\t"
-" movd %%mm1, %%eax\n\t"
-" movd %%mm3, %%ecx\n\t"
-" movd %%mm5, %%ebx\n\t"
-" movw %%ax, 96(%%edi)\n\t"
-" movw %%cx, 224(%%edi)\n\t"
-" movw %%bx, 352(%%edi)\n\t"
-
-" movsw\n\t"
+" psrlq $32, %%mm5\n\t"
+" movd %%mm1, %%eax\n\t"
+" movd %%mm3, %%ecx\n\t"
+" movd %%mm5, %%ebx\n\t"
+" movw %%ax, 96(%%edi)\n\t"
+" movw %%cx, 224(%%edi)\n\t"
+" movw %%bx, 352(%%edi)\n\t"
+
+" movsw\n\t"
".L_bye:\n\t"
-" femms\n\t"
- :
- :"m"(a),"m"(b),"m"(c),"m"(tmp[0])
- :"memory","%eax","%ebx","%ecx","%edx","%esi","%edi");
+" femms\n\t"
+ :
+ :"m"(a),"m"(b),"m"(c),"m"(tmp[0])
+ :"memory","%eax","%ebx","%ecx","%edx","%esi","%edi");
}
diff --git a/mp3lib/dct64_mmx.c b/mp3lib/dct64_mmx.c
index 817913a016..6231ebf723 100644
--- a/mp3lib/dct64_mmx.c
+++ b/mp3lib/dct64_mmx.c
@@ -11,976 +11,976 @@ void dct64_MMX(short *a,short *b,real *c)
{
char tmp[256];
__asm__ volatile(
-" movl %2,%%eax\n\t"
+" movl %2,%%eax\n\t"
/* Phase 1*/
-" flds (%%eax)\n\t"
-" leal 128+%3,%%edx\n\t"
-" fadds 124(%%eax)\n\t"
-" movl %0,%%esi\n\t"
-" fstps (%%edx)\n\t"
-" movl %1,%%edi\n\t"
-
-" flds 4(%%eax)\n\t"
-" movl $"MANGLE(costab_mmx)",%%ebx\n\t"
-" fadds 120(%%eax)\n\t"
-" orl %%ecx,%%ecx\n\t"
-" fstps 4(%%edx)\n\t"
-
-" flds (%%eax)\n\t"
-" leal %3,%%ecx\n\t"
-" fsubs 124(%%eax)\n\t"
-" fmuls (%%ebx)\n\t"
-" fstps 124(%%edx)\n\t"
-
-" flds 4(%%eax)\n\t"
-" fsubs 120(%%eax)\n\t"
-" fmuls 4(%%ebx)\n\t"
-" fstps 120(%%edx)\n\t"
-
-" flds 8(%%eax)\n\t"
-" fadds 116(%%eax)\n\t"
-" fstps 8(%%edx)\n\t"
-
-" flds 12(%%eax)\n\t"
-" fadds 112(%%eax)\n\t"
-" fstps 12(%%edx)\n\t"
-
-" flds 8(%%eax)\n\t"
-" fsubs 116(%%eax)\n\t"
-" fmuls 8(%%ebx)\n\t"
-" fstps 116(%%edx)\n\t"
-
-" flds 12(%%eax)\n\t"
-" fsubs 112(%%eax)\n\t"
-" fmuls 12(%%ebx)\n\t"
-" fstps 112(%%edx)\n\t"
-
-" flds 16(%%eax)\n\t"
-" fadds 108(%%eax)\n\t"
-" fstps 16(%%edx)\n\t"
-
-" flds 20(%%eax)\n\t"
-" fadds 104(%%eax)\n\t"
-" fstps 20(%%edx)\n\t"
-
-" flds 16(%%eax)\n\t"
-" fsubs 108(%%eax)\n\t"
-" fmuls 16(%%ebx)\n\t"
-" fstps 108(%%edx)\n\t"
-
-" flds 20(%%eax)\n\t"
-" fsubs 104(%%eax)\n\t"
-" fmuls 20(%%ebx)\n\t"
-" fstps 104(%%edx)\n\t"
-
-" flds 24(%%eax)\n\t"
-" fadds 100(%%eax)\n\t"
-" fstps 24(%%edx)\n\t"
-
-" flds 28(%%eax)\n\t"
-" fadds 96(%%eax)\n\t"
-" fstps 28(%%edx)\n\t"
-
-" flds 24(%%eax)\n\t"
-" fsubs 100(%%eax)\n\t"
-" fmuls 24(%%ebx)\n\t"
-" fstps 100(%%edx)\n\t"
-
-" flds 28(%%eax)\n\t"
-" fsubs 96(%%eax)\n\t"
-" fmuls 28(%%ebx)\n\t"
-" fstps 96(%%edx)\n\t"
-
-" flds 32(%%eax)\n\t"
-" fadds 92(%%eax)\n\t"
-" fstps 32(%%edx)\n\t"
-
-" flds 36(%%eax)\n\t"
-" fadds 88(%%eax)\n\t"
-" fstps 36(%%edx)\n\t"
-
-" flds 32(%%eax)\n\t"
-" fsubs 92(%%eax)\n\t"
-" fmuls 32(%%ebx)\n\t"
-" fstps 92(%%edx)\n\t"
-
-" flds 36(%%eax)\n\t"
-" fsubs 88(%%eax)\n\t"
-" fmuls 36(%%ebx)\n\t"
-" fstps 88(%%edx)\n\t"
-
-" flds 40(%%eax)\n\t"
-" fadds 84(%%eax)\n\t"
-" fstps 40(%%edx)\n\t"
-
-" flds 44(%%eax)\n\t"
-" fadds 80(%%eax)\n\t"
-" fstps 44(%%edx)\n\t"
-
-" flds 40(%%eax)\n\t"
-" fsubs 84(%%eax)\n\t"
-" fmuls 40(%%ebx)\n\t"
-" fstps 84(%%edx)\n\t"
-
-" flds 44(%%eax)\n\t"
-" fsubs 80(%%eax)\n\t"
-" fmuls 44(%%ebx)\n\t"
-" fstps 80(%%edx)\n\t"
-
-" flds 48(%%eax)\n\t"
-" fadds 76(%%eax)\n\t"
-" fstps 48(%%edx)\n\t"
-
-" flds 52(%%eax)\n\t"
-" fadds 72(%%eax)\n\t"
-" fstps 52(%%edx)\n\t"
-
-" flds 48(%%eax)\n\t"
-" fsubs 76(%%eax)\n\t"
-" fmuls 48(%%ebx)\n\t"
-" fstps 76(%%edx)\n\t"
-
-" flds 52(%%eax)\n\t"
-" fsubs 72(%%eax)\n\t"
-" fmuls 52(%%ebx)\n\t"
-" fstps 72(%%edx)\n\t"
-
-" flds 56(%%eax)\n\t"
-" fadds 68(%%eax)\n\t"
-" fstps 56(%%edx)\n\t"
-
-" flds 60(%%eax)\n\t"
-" fadds 64(%%eax)\n\t"
-" fstps 60(%%edx)\n\t"
-
-" flds 56(%%eax)\n\t"
-" fsubs 68(%%eax)\n\t"
-" fmuls 56(%%ebx)\n\t"
-" fstps 68(%%edx)\n\t"
-
-" flds 60(%%eax)\n\t"
-" fsubs 64(%%eax)\n\t"
-" fmuls 60(%%ebx)\n\t"
-" fstps 64(%%edx)\n\t"
+" flds (%%eax)\n\t"
+" leal 128+%3,%%edx\n\t"
+" fadds 124(%%eax)\n\t"
+" movl %0,%%esi\n\t"
+" fstps (%%edx)\n\t"
+" movl %1,%%edi\n\t"
+
+" flds 4(%%eax)\n\t"
+" movl $"MANGLE(costab_mmx)",%%ebx\n\t"
+" fadds 120(%%eax)\n\t"
+" orl %%ecx,%%ecx\n\t"
+" fstps 4(%%edx)\n\t"
+
+" flds (%%eax)\n\t"
+" leal %3,%%ecx\n\t"
+" fsubs 124(%%eax)\n\t"
+" fmuls (%%ebx)\n\t"
+" fstps 124(%%edx)\n\t"
+
+" flds 4(%%eax)\n\t"
+" fsubs 120(%%eax)\n\t"
+" fmuls 4(%%ebx)\n\t"
+" fstps 120(%%edx)\n\t"
+
+" flds 8(%%eax)\n\t"
+" fadds 116(%%eax)\n\t"
+" fstps 8(%%edx)\n\t"
+
+" flds 12(%%eax)\n\t"
+" fadds 112(%%eax)\n\t"
+" fstps 12(%%edx)\n\t"
+
+" flds 8(%%eax)\n\t"
+" fsubs 116(%%eax)\n\t"
+" fmuls 8(%%ebx)\n\t"
+" fstps 116(%%edx)\n\t"
+
+" flds 12(%%eax)\n\t"
+" fsubs 112(%%eax)\n\t"
+" fmuls 12(%%ebx)\n\t"
+" fstps 112(%%edx)\n\t"
+
+" flds 16(%%eax)\n\t"
+" fadds 108(%%eax)\n\t"
+" fstps 16(%%edx)\n\t"
+
+" flds 20(%%eax)\n\t"
+" fadds 104(%%eax)\n\t"
+" fstps 20(%%edx)\n\t"
+
+" flds 16(%%eax)\n\t"
+" fsubs 108(%%eax)\n\t"
+" fmuls 16(%%ebx)\n\t"
+" fstps 108(%%edx)\n\t"
+
+" flds 20(%%eax)\n\t"
+" fsubs 104(%%eax)\n\t"
+" fmuls 20(%%ebx)\n\t"
+" fstps 104(%%edx)\n\t"
+
+" flds 24(%%eax)\n\t"
+" fadds 100(%%eax)\n\t"
+" fstps 24(%%edx)\n\t"
+
+" flds 28(%%eax)\n\t"
+" fadds 96(%%eax)\n\t"
+" fstps 28(%%edx)\n\t"
+
+" flds 24(%%eax)\n\t"
+" fsubs 100(%%eax)\n\t"
+" fmuls 24(%%ebx)\n\t"
+" fstps 100(%%edx)\n\t"
+
+" flds 28(%%eax)\n\t"
+" fsubs 96(%%eax)\n\t"
+" fmuls 28(%%ebx)\n\t"
+" fstps 96(%%edx)\n\t"
+
+" flds 32(%%eax)\n\t"
+" fadds 92(%%eax)\n\t"
+" fstps 32(%%edx)\n\t"
+
+" flds 36(%%eax)\n\t"
+" fadds 88(%%eax)\n\t"
+" fstps 36(%%edx)\n\t"
+
+" flds 32(%%eax)\n\t"
+" fsubs 92(%%eax)\n\t"
+" fmuls 32(%%ebx)\n\t"
+" fstps 92(%%edx)\n\t"
+
+" flds 36(%%eax)\n\t"
+" fsubs 88(%%eax)\n\t"
+" fmuls 36(%%ebx)\n\t"
+" fstps 88(%%edx)\n\t"
+
+" flds 40(%%eax)\n\t"
+" fadds 84(%%eax)\n\t"
+" fstps 40(%%edx)\n\t"
+
+" flds 44(%%eax)\n\t"
+" fadds 80(%%eax)\n\t"
+" fstps 44(%%edx)\n\t"
+
+" flds 40(%%eax)\n\t"
+" fsubs 84(%%eax)\n\t"
+" fmuls 40(%%ebx)\n\t"
+" fstps 84(%%edx)\n\t"
+
+" flds 44(%%eax)\n\t"
+" fsubs 80(%%eax)\n\t"
+" fmuls 44(%%ebx)\n\t"
+" fstps 80(%%edx)\n\t"
+
+" flds 48(%%eax)\n\t"
+" fadds 76(%%eax)\n\t"
+" fstps 48(%%edx)\n\t"
+
+" flds 52(%%eax)\n\t"
+" fadds 72(%%eax)\n\t"
+" fstps 52(%%edx)\n\t"
+
+" flds 48(%%eax)\n\t"
+" fsubs 76(%%eax)\n\t"
+" fmuls 48(%%ebx)\n\t"
+" fstps 76(%%edx)\n\t"
+
+" flds 52(%%eax)\n\t"
+" fsubs 72(%%eax)\n\t"
+" fmuls 52(%%ebx)\n\t"
+" fstps 72(%%edx)\n\t"
+
+" flds 56(%%eax)\n\t"
+" fadds 68(%%eax)\n\t"
+" fstps 56(%%edx)\n\t"
+
+" flds 60(%%eax)\n\t"
+" fadds 64(%%eax)\n\t"
+" fstps 60(%%edx)\n\t"
+
+" flds 56(%%eax)\n\t"
+" fsubs 68(%%eax)\n\t"
+" fmuls 56(%%ebx)\n\t"
+" fstps 68(%%edx)\n\t"
+
+" flds 60(%%eax)\n\t"
+" fsubs 64(%%eax)\n\t"
+" fmuls 60(%%ebx)\n\t"
+" fstps 64(%%edx)\n\t"
/* Phase 2*/
-" flds (%%edx)\n\t"
-" fadds 60(%%edx)\n\t"
-" fstps (%%ecx)\n\t"
-
-" flds 4(%%edx)\n\t"
-" fadds 56(%%edx)\n\t"
-" fstps 4(%%ecx)\n\t"
-
-" flds (%%edx)\n\t"
-" fsubs 60(%%edx)\n\t"
-" fmuls 64(%%ebx)\n\t"
-" fstps 60(%%ecx)\n\t"
-
-" flds 4(%%edx)\n\t"
-" fsubs 56(%%edx)\n\t"
-" fmuls 68(%%ebx)\n\t"
-" fstps 56(%%ecx)\n\t"
-
-" flds 8(%%edx)\n\t"
-" fadds 52(%%edx)\n\t"
-" fstps 8(%%ecx)\n\t"
-
-" flds 12(%%edx)\n\t"
-" fadds 48(%%edx)\n\t"
-" fstps 12(%%ecx)\n\t"
-
-" flds 8(%%edx)\n\t"
-" fsubs 52(%%edx)\n\t"
-" fmuls 72(%%ebx)\n\t"
-" fstps 52(%%ecx)\n\t"
-
-" flds 12(%%edx)\n\t"
-" fsubs 48(%%edx)\n\t"
-" fmuls 76(%%ebx)\n\t"
-" fstps 48(%%ecx)\n\t"
-
-" flds 16(%%edx)\n\t"
-" fadds 44(%%edx)\n\t"
-" fstps 16(%%ecx)\n\t"
-
-" flds 20(%%edx)\n\t"
-" fadds 40(%%edx)\n\t"
-" fstps 20(%%ecx)\n\t"
-
-" flds 16(%%edx)\n\t"
-" fsubs 44(%%edx)\n\t"
-" fmuls 80(%%ebx)\n\t"
-" fstps 44(%%ecx)\n\t"
-
-" flds 20(%%edx)\n\t"
-" fsubs 40(%%edx)\n\t"
-" fmuls 84(%%ebx)\n\t"
-" fstps 40(%%ecx)\n\t"
-
-" flds 24(%%edx)\n\t"
-" fadds 36(%%edx)\n\t"
-" fstps 24(%%ecx)\n\t"
-
-" flds 28(%%edx)\n\t"
-" fadds 32(%%edx)\n\t"
-" fstps 28(%%ecx)\n\t"
-
-" flds 24(%%edx)\n\t"
-" fsubs 36(%%edx)\n\t"
-" fmuls 88(%%ebx)\n\t"
-" fstps 36(%%ecx)\n\t"
-
-" flds 28(%%edx)\n\t"
-" fsubs 32(%%edx)\n\t"
-" fmuls 92(%%ebx)\n\t"
-" fstps 32(%%ecx)\n\t"
+" flds (%%edx)\n\t"
+" fadds 60(%%edx)\n\t"
+" fstps (%%ecx)\n\t"
+
+" flds 4(%%edx)\n\t"
+" fadds 56(%%edx)\n\t"
+" fstps 4(%%ecx)\n\t"
+
+" flds (%%edx)\n\t"
+" fsubs 60(%%edx)\n\t"
+" fmuls 64(%%ebx)\n\t"
+" fstps 60(%%ecx)\n\t"
+
+" flds 4(%%edx)\n\t"
+" fsubs 56(%%edx)\n\t"
+" fmuls 68(%%ebx)\n\t"
+" fstps 56(%%ecx)\n\t"
+
+" flds 8(%%edx)\n\t"
+" fadds 52(%%edx)\n\t"
+" fstps 8(%%ecx)\n\t"
+
+" flds 12(%%edx)\n\t"
+" fadds 48(%%edx)\n\t"
+" fstps 12(%%ecx)\n\t"
+
+" flds 8(%%edx)\n\t"
+" fsubs 52(%%edx)\n\t"
+" fmuls 72(%%ebx)\n\t"
+" fstps 52(%%ecx)\n\t"
+
+" flds 12(%%edx)\n\t"
+" fsubs 48(%%edx)\n\t"
+" fmuls 76(%%ebx)\n\t"
+" fstps 48(%%ecx)\n\t"
+
+" flds 16(%%edx)\n\t"
+" fadds 44(%%edx)\n\t"
+" fstps 16(%%ecx)\n\t"
+
+" flds 20(%%edx)\n\t"
+" fadds 40(%%edx)\n\t"
+" fstps 20(%%ecx)\n\t"
+
+" flds 16(%%edx)\n\t"
+" fsubs 44(%%edx)\n\t"
+" fmuls 80(%%ebx)\n\t"
+" fstps 44(%%ecx)\n\t"
+
+" flds 20(%%edx)\n\t"
+" fsubs 40(%%edx)\n\t"
+" fmuls 84(%%ebx)\n\t"
+" fstps 40(%%ecx)\n\t"
+
+" flds 24(%%edx)\n\t"
+" fadds 36(%%edx)\n\t"
+" fstps 24(%%ecx)\n\t"
+
+" flds 28(%%edx)\n\t"
+" fadds 32(%%edx)\n\t"
+" fstps 28(%%ecx)\n\t"
+
+" flds 24(%%edx)\n\t"
+" fsubs 36(%%edx)\n\t"
+" fmuls 88(%%ebx)\n\t"
+" fstps 36(%%ecx)\n\t"
+
+" flds 28(%%edx)\n\t"
+" fsubs 32(%%edx)\n\t"
+" fmuls 92(%%ebx)\n\t"
+" fstps 32(%%ecx)\n\t"
/* Phase 3*/
-" flds 64(%%edx)\n\t"
-" fadds 124(%%edx)\n\t"
-" fstps 64(%%ecx)\n\t"
-
-" flds 68(%%edx)\n\t"
-" fadds 120(%%edx)\n\t"
-" fstps 68(%%ecx)\n\t"
-
-" flds 124(%%edx)\n\t"
-" fsubs 64(%%edx)\n\t"
-" fmuls 64(%%ebx)\n\t"
-" fstps 124(%%ecx)\n\t"
-
-" flds 120(%%edx)\n\t"
-" fsubs 68(%%edx)\n\t"
-" fmuls 68(%%ebx)\n\t"
-" fstps 120(%%ecx)\n\t"
-
-" flds 72(%%edx)\n\t"
-" fadds 116(%%edx)\n\t"
-" fstps 72(%%ecx)\n\t"
-
-" flds 76(%%edx)\n\t"
-" fadds 112(%%edx)\n\t"
-" fstps 76(%%ecx)\n\t"
-
-" flds 116(%%edx)\n\t"
-" fsubs 72(%%edx)\n\t"
-" fmuls 72(%%ebx)\n\t"
-" fstps 116(%%ecx)\n\t"
-
-" flds 112(%%edx)\n\t"
-" fsubs 76(%%edx)\n\t"
-" fmuls 76(%%ebx)\n\t"
-" fstps 112(%%ecx)\n\t"
-
-" flds 80(%%edx)\n\t"
-" fadds 108(%%edx)\n\t"
-" fstps 80(%%ecx)\n\t"
-
-" flds 84(%%edx)\n\t"
-" fadds 104(%%edx)\n\t"
-" fstps 84(%%ecx)\n\t"
-
-" flds 108(%%edx)\n\t"
-" fsubs 80(%%edx)\n\t"
-" fmuls 80(%%ebx)\n\t"
-" fstps 108(%%ecx)\n\t"
-
-" flds 104(%%edx)\n\t"
-" fsubs 84(%%edx)\n\t"
-" fmuls 84(%%ebx)\n\t"
-" fstps 104(%%ecx)\n\t"
-
-" flds 88(%%edx)\n\t"
-" fadds 100(%%edx)\n\t"
-" fstps 88(%%ecx)\n\t"
-
-" flds 92(%%edx)\n\t"
-" fadds 96(%%edx)\n\t"
-" fstps 92(%%ecx)\n\t"
-
-" flds 100(%%edx)\n\t"
-" fsubs 88(%%edx)\n\t"
-" fmuls 88(%%ebx)\n\t"
-" fstps 100(%%ecx)\n\t"
-
-" flds 96(%%edx)\n\t"
-" fsubs 92(%%edx)\n\t"
-" fmuls 92(%%ebx)\n\t"
-" fstps 96(%%ecx)\n\t"
+" flds 64(%%edx)\n\t"
+" fadds 124(%%edx)\n\t"
+" fstps 64(%%ecx)\n\t"
+
+" flds 68(%%edx)\n\t"
+" fadds 120(%%edx)\n\t"
+" fstps 68(%%ecx)\n\t"
+
+" flds 124(%%edx)\n\t"
+" fsubs 64(%%edx)\n\t"
+" fmuls 64(%%ebx)\n\t"
+" fstps 124(%%ecx)\n\t"
+
+" flds 120(%%edx)\n\t"
+" fsubs 68(%%edx)\n\t"
+" fmuls 68(%%ebx)\n\t"
+" fstps 120(%%ecx)\n\t"
+
+" flds 72(%%edx)\n\t"
+" fadds 116(%%edx)\n\t"
+" fstps 72(%%ecx)\n\t"
+
+" flds 76(%%edx)\n\t"
+" fadds 112(%%edx)\n\t"
+" fstps 76(%%ecx)\n\t"
+
+" flds 116(%%edx)\n\t"
+" fsubs 72(%%edx)\n\t"
+" fmuls 72(%%ebx)\n\t"
+" fstps 116(%%ecx)\n\t"
+
+" flds 112(%%edx)\n\t"
+" fsubs 76(%%edx)\n\t"
+" fmuls 76(%%ebx)\n\t"
+" fstps 112(%%ecx)\n\t"
+
+" flds 80(%%edx)\n\t"
+" fadds 108(%%edx)\n\t"
+" fstps 80(%%ecx)\n\t"
+
+" flds 84(%%edx)\n\t"
+" fadds 104(%%edx)\n\t"
+" fstps 84(%%ecx)\n\t"
+
+" flds 108(%%edx)\n\t"
+" fsubs 80(%%edx)\n\t"
+" fmuls 80(%%ebx)\n\t"
+" fstps 108(%%ecx)\n\t"
+
+" flds 104(%%edx)\n\t"
+" fsubs 84(%%edx)\n\t"
+" fmuls 84(%%ebx)\n\t"
+" fstps 104(%%ecx)\n\t"
+
+" flds 88(%%edx)\n\t"
+" fadds 100(%%edx)\n\t"
+" fstps 88(%%ecx)\n\t"
+
+" flds 92(%%edx)\n\t"
+" fadds 96(%%edx)\n\t"
+" fstps 92(%%ecx)\n\t"
+
+" flds 100(%%edx)\n\t"
+" fsubs 88(%%edx)\n\t"
+" fmuls 88(%%ebx)\n\t"
+" fstps 100(%%ecx)\n\t"
+
+" flds 96(%%edx)\n\t"
+" fsubs 92(%%edx)\n\t"
+" fmuls 92(%%ebx)\n\t"
+" fstps 96(%%ecx)\n\t"
/* Phase 4*/
-" flds (%%ecx)\n\t"
-" fadds 28(%%ecx)\n\t"
-" fstps (%%edx)\n\t"
-
-" flds (%%ecx)\n\t"
-" fsubs 28(%%ecx)\n\t"
-" fmuls 96(%%ebx)\n\t"
-" fstps 28(%%edx)\n\t"
-
-" flds 4(%%ecx)\n\t"
-" fadds 24(%%ecx)\n\t"
-" fstps 4(%%edx)\n\t"
-
-" flds 4(%%ecx)\n\t"
-" fsubs 24(%%ecx)\n\t"
-" fmuls 100(%%ebx)\n\t"
-" fstps 24(%%edx)\n\t"
-
-" flds 8(%%ecx)\n\t"
-" fadds 20(%%ecx)\n\t"
-" fstps 8(%%edx)\n\t"
-
-" flds 8(%%ecx)\n\t"
-" fsubs 20(%%ecx)\n\t"
-" fmuls 104(%%ebx)\n\t"
-" fstps 20(%%edx)\n\t"
-
-" flds 12(%%ecx)\n\t"
-" fadds 16(%%ecx)\n\t"
-" fstps 12(%%edx)\n\t"
-
-" flds 12(%%ecx)\n\t"
-" fsubs 16(%%ecx)\n\t"
-" fmuls 108(%%ebx)\n\t"
-" fstps 16(%%edx)\n\t"
-
-" flds 32(%%ecx)\n\t"
-" fadds 60(%%ecx)\n\t"
-" fstps 32(%%edx)\n\t"
-
-" flds 60(%%ecx)\n\t"
-" fsubs 32(%%ecx)\n\t"
-" fmuls 96(%%ebx)\n\t"
-" fstps 60(%%edx)\n\t"
-
-" flds 36(%%ecx)\n\t"
-" fadds 56(%%ecx)\n\t"
-" fstps 36(%%edx)\n\t"
-
-" flds 56(%%ecx)\n\t"
-" fsubs 36(%%ecx)\n\t"
-" fmuls 100(%%ebx)\n\t"
-" fstps 56(%%edx)\n\t"
-
-" flds 40(%%ecx)\n\t"
-" fadds 52(%%ecx)\n\t"
-" fstps 40(%%edx)\n\t"
-
-" flds 52(%%ecx)\n\t"
-" fsubs 40(%%ecx)\n\t"
-" fmuls 104(%%ebx)\n\t"
-" fstps 52(%%edx)\n\t"
-
-" flds 44(%%ecx)\n\t"
-" fadds 48(%%ecx)\n\t"
-" fstps 44(%%edx)\n\t"
-
-" flds 48(%%ecx)\n\t"
-" fsubs 44(%%ecx)\n\t"
-" fmuls 108(%%ebx)\n\t"
-" fstps 48(%%edx)\n\t"
-
-" flds 64(%%ecx)\n\t"
-" fadds 92(%%ecx)\n\t"
-" fstps 64(%%edx)\n\t"
-
-" flds 64(%%ecx)\n\t"
-" fsubs 92(%%ecx)\n\t"
-" fmuls 96(%%ebx)\n\t"
-" fstps 92(%%edx)\n\t"
-
-" flds 68(%%ecx)\n\t"
-" fadds 88(%%ecx)\n\t"
-" fstps 68(%%edx)\n\t"
-
-" flds 68(%%ecx)\n\t"
-" fsubs 88(%%ecx)\n\t"
-" fmuls 100(%%ebx)\n\t"
-" fstps 88(%%edx)\n\t"
-
-" flds 72(%%ecx)\n\t"
-" fadds 84(%%ecx)\n\t"
-" fstps 72(%%edx)\n\t"
-
-" flds 72(%%ecx)\n\t"
-" fsubs 84(%%ecx)\n\t"
-" fmuls 104(%%ebx)\n\t"
-" fstps 84(%%edx)\n\t"
-
-" flds 76(%%ecx)\n\t"
-" fadds 80(%%ecx)\n\t"
-" fstps 76(%%edx)\n\t"
-
-" flds 76(%%ecx)\n\t"
-" fsubs 80(%%ecx)\n\t"
-" fmuls 108(%%ebx)\n\t"
-" fstps 80(%%edx)\n\t"
-
-" flds 96(%%ecx)\n\t"
-" fadds 124(%%ecx)\n\t"
-" fstps 96(%%edx)\n\t"
-
-" flds 124(%%ecx)\n\t"
-" fsubs 96(%%ecx)\n\t"
-" fmuls 96(%%ebx)\n\t"
-" fstps 124(%%edx)\n\t"
-
-" flds 100(%%ecx)\n\t"
-" fadds 120(%%ecx)\n\t"
-" fstps 100(%%edx)\n\t"
-
-" flds 120(%%ecx)\n\t"
-" fsubs 100(%%ecx)\n\t"
-" fmuls 100(%%ebx)\n\t"
-" fstps 120(%%edx)\n\t"
-
-" flds 104(%%ecx)\n\t"
-" fadds 116(%%ecx)\n\t"
-" fstps 104(%%edx)\n\t"
-
-" flds 116(%%ecx)\n\t"
-" fsubs 104(%%ecx)\n\t"
-" fmuls 104(%%ebx)\n\t"
-" fstps 116(%%edx)\n\t"
-
-" flds 108(%%ecx)\n\t"
-" fadds 112(%%ecx)\n\t"
-" fstps 108(%%edx)\n\t"
-
-" flds 112(%%ecx)\n\t"
-" fsubs 108(%%ecx)\n\t"
-" fmuls 108(%%ebx)\n\t"
-" fstps 112(%%edx)\n\t"
-
-" flds (%%edx)\n\t"
-" fadds 12(%%edx)\n\t"
-" fstps (%%ecx)\n\t"
-
-" flds (%%edx)\n\t"
-" fsubs 12(%%edx)\n\t"
-" fmuls 112(%%ebx)\n\t"
-" fstps 12(%%ecx)\n\t"
-
-" flds 4(%%edx)\n\t"
-" fadds 8(%%edx)\n\t"
-" fstps 4(%%ecx)\n\t"
-
-" flds 4(%%edx)\n\t"
-" fsubs 8(%%edx)\n\t"
-" fmuls 116(%%ebx)\n\t"
-" fstps 8(%%ecx)\n\t"
-
-" flds 16(%%edx)\n\t"
-" fadds 28(%%edx)\n\t"
-" fstps 16(%%ecx)\n\t"
-
-" flds 28(%%edx)\n\t"
-" fsubs 16(%%edx)\n\t"
-" fmuls 112(%%ebx)\n\t"
-" fstps 28(%%ecx)\n\t"
-
-" flds 20(%%edx)\n\t"
-" fadds 24(%%edx)\n\t"
-" fstps 20(%%ecx)\n\t"
-
-" flds 24(%%edx)\n\t"
-" fsubs 20(%%edx)\n\t"
-" fmuls 116(%%ebx)\n\t"
-" fstps 24(%%ecx)\n\t"
-
-" flds 32(%%edx)\n\t"
-" fadds 44(%%edx)\n\t"
-" fstps 32(%%ecx)\n\t"
-
-" flds 32(%%edx)\n\t"
-" fsubs 44(%%edx)\n\t"
-" fmuls 112(%%ebx)\n\t"
-" fstps 44(%%ecx)\n\t"
-
-" flds 36(%%edx)\n\t"
-" fadds 40(%%edx)\n\t"
-" fstps 36(%%ecx)\n\t"
-
-" flds 36(%%edx)\n\t"
-" fsubs 40(%%edx)\n\t"
-" fmuls 116(%%ebx)\n\t"
-" fstps 40(%%ecx)\n\t"
-
-" flds 48(%%edx)\n\t"
-" fadds 60(%%edx)\n\t"
-" fstps 48(%%ecx)\n\t"
-
-" flds 60(%%edx)\n\t"
-" fsubs 48(%%edx)\n\t"
-" fmuls 112(%%ebx)\n\t"
-" fstps 60(%%ecx)\n\t"
-
-" flds 52(%%edx)\n\t"
-" fadds 56(%%edx)\n\t"
-" fstps 52(%%ecx)\n\t"
-
-" flds 56(%%edx)\n\t"
-" fsubs 52(%%edx)\n\t"
-" fmuls 116(%%ebx)\n\t"
-" fstps 56(%%ecx)\n\t"
-
-" flds 64(%%edx)\n\t"
-" fadds 76(%%edx)\n\t"
-" fstps 64(%%ecx)\n\t"
-
-" flds 64(%%edx)\n\t"
-" fsubs 76(%%edx)\n\t"
-" fmuls 112(%%ebx)\n\t"
-" fstps 76(%%ecx)\n\t"
-
-" flds 68(%%edx)\n\t"
-" fadds 72(%%edx)\n\t"
-" fstps 68(%%ecx)\n\t"
-
-" flds 68(%%edx)\n\t"
-" fsubs 72(%%edx)\n\t"
-" fmuls 116(%%ebx)\n\t"
-" fstps 72(%%ecx)\n\t"
-
-" flds 80(%%edx)\n\t"
-" fadds 92(%%edx)\n\t"
-" fstps 80(%%ecx)\n\t"
-
-" flds 92(%%edx)\n\t"
-" fsubs 80(%%edx)\n\t"
-" fmuls 112(%%ebx)\n\t"
-" fstps 92(%%ecx)\n\t"
-
-" flds 84(%%edx)\n\t"
-" fadds 88(%%edx)\n\t"
-" fstps 84(%%ecx)\n\t"
-
-" flds 88(%%edx)\n\t"
-" fsubs 84(%%edx)\n\t"
-" fmuls 116(%%ebx)\n\t"
-" fstps 88(%%ecx)\n\t"
-
-" flds 96(%%edx)\n\t"
-" fadds 108(%%edx)\n\t"
-" fstps 96(%%ecx)\n\t"
-
-" flds 96(%%edx)\n\t"
-" fsubs 108(%%edx)\n\t"
-" fmuls 112(%%ebx)\n\t"
-" fstps 108(%%ecx)\n\t"
-
-" flds 100(%%edx)\n\t"
-" fadds 104(%%edx)\n\t"
-" fstps 100(%%ecx)\n\t"
-
-" flds 100(%%edx)\n\t"
-" fsubs 104(%%edx)\n\t"
-" fmuls 116(%%ebx)\n\t"
-" fstps 104(%%ecx)\n\t"
-
-" flds 112(%%edx)\n\t"
-" fadds 124(%%edx)\n\t"
-" fstps 112(%%ecx)\n\t"
-
-" flds 124(%%edx)\n\t"
-" fsubs 112(%%edx)\n\t"
-" fmuls 112(%%ebx)\n\t"
-" fstps 124(%%ecx)\n\t"
-
-" flds 116(%%edx)\n\t"
-" fadds 120(%%edx)\n\t"
-" fstps 116(%%ecx)\n\t"
-
-" flds 120(%%edx)\n\t"
-" fsubs 116(%%edx)\n\t"
-" fmuls 116(%%ebx)\n\t"
-" fstps 120(%%ecx)\n\t"
+" flds (%%ecx)\n\t"
+" fadds 28(%%ecx)\n\t"
+" fstps (%%edx)\n\t"
+
+" flds (%%ecx)\n\t"
+" fsubs 28(%%ecx)\n\t"
+" fmuls 96(%%ebx)\n\t"
+" fstps 28(%%edx)\n\t"
+
+" flds 4(%%ecx)\n\t"
+" fadds 24(%%ecx)\n\t"
+" fstps 4(%%edx)\n\t"
+
+" flds 4(%%ecx)\n\t"
+" fsubs 24(%%ecx)\n\t"
+" fmuls 100(%%ebx)\n\t"
+" fstps 24(%%edx)\n\t"
+
+" flds 8(%%ecx)\n\t"
+" fadds 20(%%ecx)\n\t"
+" fstps 8(%%edx)\n\t"
+
+" flds 8(%%ecx)\n\t"
+" fsubs 20(%%ecx)\n\t"
+" fmuls 104(%%ebx)\n\t"
+" fstps 20(%%edx)\n\t"
+
+" flds 12(%%ecx)\n\t"
+" fadds 16(%%ecx)\n\t"
+" fstps 12(%%edx)\n\t"
+
+" flds 12(%%ecx)\n\t"
+" fsubs 16(%%ecx)\n\t"
+" fmuls 108(%%ebx)\n\t"
+" fstps 16(%%edx)\n\t"
+
+" flds 32(%%ecx)\n\t"
+" fadds 60(%%ecx)\n\t"
+" fstps 32(%%edx)\n\t"
+
+" flds 60(%%ecx)\n\t"
+" fsubs 32(%%ecx)\n\t"
+" fmuls 96(%%ebx)\n\t"
+" fstps 60(%%edx)\n\t"
+
+" flds 36(%%ecx)\n\t"
+" fadds 56(%%ecx)\n\t"
+" fstps 36(%%edx)\n\t"
+
+" flds 56(%%ecx)\n\t"
+" fsubs 36(%%ecx)\n\t"
+" fmuls 100(%%ebx)\n\t"
+" fstps 56(%%edx)\n\t"
+
+" flds 40(%%ecx)\n\t"
+" fadds 52(%%ecx)\n\t"
+" fstps 40(%%edx)\n\t"
+
+" flds 52(%%ecx)\n\t"
+" fsubs 40(%%ecx)\n\t"
+" fmuls 104(%%ebx)\n\t"
+" fstps 52(%%edx)\n\t"
+
+" flds 44(%%ecx)\n\t"
+" fadds 48(%%ecx)\n\t"
+" fstps 44(%%edx)\n\t"
+
+" flds 48(%%ecx)\n\t"
+" fsubs 44(%%ecx)\n\t"
+" fmuls 108(%%ebx)\n\t"
+" fstps 48(%%edx)\n\t"
+
+" flds 64(%%ecx)\n\t"
+" fadds 92(%%ecx)\n\t"
+" fstps 64(%%edx)\n\t"
+
+" flds 64(%%ecx)\n\t"
+" fsubs 92(%%ecx)\n\t"
+" fmuls 96(%%ebx)\n\t"
+" fstps 92(%%edx)\n\t"
+
+" flds 68(%%ecx)\n\t"
+" fadds 88(%%ecx)\n\t"
+" fstps 68(%%edx)\n\t"
+
+" flds 68(%%ecx)\n\t"
+" fsubs 88(%%ecx)\n\t"
+" fmuls 100(%%ebx)\n\t"
+" fstps 88(%%edx)\n\t"
+
+" flds 72(%%ecx)\n\t"
+" fadds 84(%%ecx)\n\t"
+" fstps 72(%%edx)\n\t"
+
+" flds 72(%%ecx)\n\t"
+" fsubs 84(%%ecx)\n\t"
+" fmuls 104(%%ebx)\n\t"
+" fstps 84(%%edx)\n\t"
+
+" flds 76(%%ecx)\n\t"
+" fadds 80(%%ecx)\n\t"
+" fstps 76(%%edx)\n\t"
+
+" flds 76(%%ecx)\n\t"
+" fsubs 80(%%ecx)\n\t"
+" fmuls 108(%%ebx)\n\t"
+" fstps 80(%%edx)\n\t"
+
+" flds 96(%%ecx)\n\t"
+" fadds 124(%%ecx)\n\t"
+" fstps 96(%%edx)\n\t"
+
+" flds 124(%%ecx)\n\t"
+" fsubs 96(%%ecx)\n\t"
+" fmuls 96(%%ebx)\n\t"
+" fstps 124(%%edx)\n\t"
+
+" flds 100(%%ecx)\n\t"
+" fadds 120(%%ecx)\n\t"
+" fstps 100(%%edx)\n\t"
+
+" flds 120(%%ecx)\n\t"
+" fsubs 100(%%ecx)\n\t"
+" fmuls 100(%%ebx)\n\t"
+" fstps 120(%%edx)\n\t"
+
+" flds 104(%%ecx)\n\t"
+" fadds 116(%%ecx)\n\t"
+" fstps 104(%%edx)\n\t"
+
+" flds 116(%%ecx)\n\t"
+" fsubs 104(%%ecx)\n\t"
+" fmuls 104(%%ebx)\n\t"
+" fstps 116(%%edx)\n\t"
+
+" flds 108(%%ecx)\n\t"
+" fadds 112(%%ecx)\n\t"
+" fstps 108(%%edx)\n\t"
+
+" flds 112(%%ecx)\n\t"
+" fsubs 108(%%ecx)\n\t"
+" fmuls 108(%%ebx)\n\t"
+" fstps 112(%%edx)\n\t"
+
+" flds (%%edx)\n\t"
+" fadds 12(%%edx)\n\t"
+" fstps (%%ecx)\n\t"
+
+" flds (%%edx)\n\t"
+" fsubs 12(%%edx)\n\t"
+" fmuls 112(%%ebx)\n\t"
+" fstps 12(%%ecx)\n\t"
+
+" flds 4(%%edx)\n\t"
+" fadds 8(%%edx)\n\t"
+" fstps 4(%%ecx)\n\t"
+
+" flds 4(%%edx)\n\t"
+" fsubs 8(%%edx)\n\t"
+" fmuls 116(%%ebx)\n\t"
+" fstps 8(%%ecx)\n\t"
+
+" flds 16(%%edx)\n\t"
+" fadds 28(%%edx)\n\t"
+" fstps 16(%%ecx)\n\t"
+
+" flds 28(%%edx)\n\t"
+" fsubs 16(%%edx)\n\t"
+" fmuls 112(%%ebx)\n\t"
+" fstps 28(%%ecx)\n\t"
+
+" flds 20(%%edx)\n\t"
+" fadds 24(%%edx)\n\t"
+" fstps 20(%%ecx)\n\t"
+
+" flds 24(%%edx)\n\t"
+" fsubs 20(%%edx)\n\t"
+" fmuls 116(%%ebx)\n\t"
+" fstps 24(%%ecx)\n\t"
+
+" flds 32(%%edx)\n\t"
+" fadds 44(%%edx)\n\t"
+" fstps 32(%%ecx)\n\t"
+
+" flds 32(%%edx)\n\t"
+" fsubs 44(%%edx)\n\t"
+" fmuls 112(%%ebx)\n\t"
+" fstps 44(%%ecx)\n\t"
+
+" flds 36(%%edx)\n\t"
+" fadds 40(%%edx)\n\t"
+" fstps 36(%%ecx)\n\t"
+
+" flds 36(%%edx)\n\t"
+" fsubs 40(%%edx)\n\t"
+" fmuls 116(%%ebx)\n\t"
+" fstps 40(%%ecx)\n\t"
+
+" flds 48(%%edx)\n\t"
+" fadds 60(%%edx)\n\t"
+" fstps 48(%%ecx)\n\t"
+
+" flds 60(%%edx)\n\t"
+" fsubs 48(%%edx)\n\t"
+" fmuls 112(%%ebx)\n\t"
+" fstps 60(%%ecx)\n\t"
+
+" flds 52(%%edx)\n\t"
+" fadds 56(%%edx)\n\t"
+" fstps 52(%%ecx)\n\t"
+
+" flds 56(%%edx)\n\t"
+" fsubs 52(%%edx)\n\t"
+" fmuls 116(%%ebx)\n\t"
+" fstps 56(%%ecx)\n\t"
+
+" flds 64(%%edx)\n\t"
+" fadds 76(%%edx)\n\t"
+" fstps 64(%%ecx)\n\t"
+
+" flds 64(%%edx)\n\t"
+" fsubs 76(%%edx)\n\t"
+" fmuls 112(%%ebx)\n\t"
+" fstps 76(%%ecx)\n\t"
+
+" flds 68(%%edx)\n\t"
+" fadds 72(%%edx)\n\t"
+" fstps 68(%%ecx)\n\t"
+
+" flds 68(%%edx)\n\t"
+" fsubs 72(%%edx)\n\t"
+" fmuls 116(%%ebx)\n\t"
+" fstps 72(%%ecx)\n\t"
+
+" flds 80(%%edx)\n\t"
+" fadds 92(%%edx)\n\t"
+" fstps 80(%%ecx)\n\t"
+
+" flds 92(%%edx)\n\t"
+" fsubs 80(%%edx)\n\t"
+" fmuls 112(%%ebx)\n\t"
+" fstps 92(%%ecx)\n\t"
+
+" flds 84(%%edx)\n\t"
+" fadds 88(%%edx)\n\t"
+" fstps 84(%%ecx)\n\t"
+
+" flds 88(%%edx)\n\t"
+" fsubs 84(%%edx)\n\t"
+" fmuls 116(%%ebx)\n\t"
+" fstps 88(%%ecx)\n\t"
+
+" flds 96(%%edx)\n\t"
+" fadds 108(%%edx)\n\t"
+" fstps 96(%%ecx)\n\t"
+
+" flds 96(%%edx)\n\t"
+" fsubs 108(%%edx)\n\t"
+" fmuls 112(%%ebx)\n\t"
+" fstps 108(%%ecx)\n\t"
+
+" flds 100(%%edx)\n\t"
+" fadds 104(%%edx)\n\t"
+" fstps 100(%%ecx)\n\t"
+
+" flds 100(%%edx)\n\t"
+" fsubs 104(%%edx)\n\t"
+" fmuls 116(%%ebx)\n\t"
+" fstps 104(%%ecx)\n\t"
+
+" flds 112(%%edx)\n\t"
+" fadds 124(%%edx)\n\t"
+" fstps 112(%%ecx)\n\t"
+
+" flds 124(%%edx)\n\t"
+" fsubs 112(%%edx)\n\t"
+" fmuls 112(%%ebx)\n\t"
+" fstps 124(%%ecx)\n\t"
+
+" flds 116(%%edx)\n\t"
+" fadds 120(%%edx)\n\t"
+" fstps 116(%%ecx)\n\t"
+
+" flds 120(%%edx)\n\t"
+" fsubs 116(%%edx)\n\t"
+" fmuls 116(%%ebx)\n\t"
+" fstps 120(%%ecx)\n\t"
/* Phase 5*/
-" flds 32(%%ecx)\n\t"
-" fadds 36(%%ecx)\n\t"
-" fstps 32(%%edx)\n\t"
-
-" flds 32(%%ecx)\n\t"
-" fsubs 36(%%ecx)\n\t"
-" fmuls 120(%%ebx)\n\t"
-" fstps 36(%%edx)\n\t"
-
-" flds 44(%%ecx)\n\t"
-" fsubs 40(%%ecx)\n\t"
-" fmuls 120(%%ebx)\n\t"
-" fsts 44(%%edx)\n\t"
-" fadds 40(%%ecx)\n\t"
-" fadds 44(%%ecx)\n\t"
-" fstps 40(%%edx)\n\t"
-
-" flds 48(%%ecx)\n\t"
-" fsubs 52(%%ecx)\n\t"
-" fmuls 120(%%ebx)\n\t"
-
-" flds 60(%%ecx)\n\t"
-" fsubs 56(%%ecx)\n\t"
-" fmuls 120(%%ebx)\n\t"
-" fld %%st(0)\n\t"
-" fadds 56(%%ecx)\n\t"
-" fadds 60(%%ecx)\n\t"
-" fld %%st(0)\n\t"
-" fadds 48(%%ecx)\n\t"
-" fadds 52(%%ecx)\n\t"
-" fstps 48(%%edx)\n\t"
-" fadd %%st(2)\n\t"
-" fstps 56(%%edx)\n\t"
-" fsts 60(%%edx)\n\t"
-" faddp %%st(1)\n\t"
-" fstps 52(%%edx)\n\t"
-
-" flds 64(%%ecx)\n\t"
-" fadds 68(%%ecx)\n\t"
-" fstps 64(%%edx)\n\t"
-
-" flds 64(%%ecx)\n\t"
-" fsubs 68(%%ecx)\n\t"
-" fmuls 120(%%ebx)\n\t"
-" fstps 68(%%edx)\n\t"
-
-" flds 76(%%ecx)\n\t"
-" fsubs 72(%%ecx)\n\t"
-" fmuls 120(%%ebx)\n\t"
-" fsts 76(%%edx)\n\t"
-" fadds 72(%%ecx)\n\t"
-" fadds 76(%%ecx)\n\t"
-" fstps 72(%%edx)\n\t"
-
-" flds 92(%%ecx)\n\t"
-" fsubs 88(%%ecx)\n\t"
-" fmuls 120(%%ebx)\n\t"
-" fsts 92(%%edx)\n\t"
-" fadds 92(%%ecx)\n\t"
-" fadds 88(%%ecx)\n\t"
-" fld %%st(0)\n\t"
-" fadds 80(%%ecx)\n\t"
-" fadds 84(%%ecx)\n\t"
-" fstps 80(%%edx)\n\t"
-
-" flds 80(%%ecx)\n\t"
-" fsubs 84(%%ecx)\n\t"
-" fmuls 120(%%ebx)\n\t"
-" fadd %%st(0), %%st(1)\n\t"
-" fadds 92(%%edx)\n\t"
-" fstps 84(%%edx)\n\t"
-" fstps 88(%%edx)\n\t"
-
-" flds 96(%%ecx)\n\t"
-" fadds 100(%%ecx)\n\t"
-" fstps 96(%%edx)\n\t"
-
-" flds 96(%%ecx)\n\t"
-" fsubs 100(%%ecx)\n\t"
-" fmuls 120(%%ebx)\n\t"
-" fstps 100(%%edx)\n\t"
-
-" flds 108(%%ecx)\n\t"
-" fsubs 104(%%ecx)\n\t"
-" fmuls 120(%%ebx)\n\t"
-" fsts 108(%%edx)\n\t"
-" fadds 104(%%ecx)\n\t"
-" fadds 108(%%ecx)\n\t"
-" fstps 104(%%edx)\n\t"
-
-" flds 124(%%ecx)\n\t"
-" fsubs 120(%%ecx)\n\t"
-" fmuls 120(%%ebx)\n\t"
-" fsts 124(%%edx)\n\t"
-" fadds 120(%%ecx)\n\t"
-" fadds 124(%%ecx)\n\t"
-" fld %%st(0)\n\t"
-" fadds 112(%%ecx)\n\t"
-" fadds 116(%%ecx)\n\t"
-" fstps 112(%%edx)\n\t"
-
-" flds 112(%%ecx)\n\t"
-" fsubs 116(%%ecx)\n\t"
-" fmuls 120(%%ebx)\n\t"
-" fadd %%st(0),%%st(1)\n\t"
-" fadds 124(%%edx)\n\t"
-" fstps 116(%%edx)\n\t"
-" fstps 120(%%edx)\n\t"
-" jnz .L01\n\t"
+" flds 32(%%ecx)\n\t"
+" fadds 36(%%ecx)\n\t"
+" fstps 32(%%edx)\n\t"
+
+" flds 32(%%ecx)\n\t"
+" fsubs 36(%%ecx)\n\t"
+" fmuls 120(%%ebx)\n\t"
+" fstps 36(%%edx)\n\t"
+
+" flds 44(%%ecx)\n\t"
+" fsubs 40(%%ecx)\n\t"
+" fmuls 120(%%ebx)\n\t"
+" fsts 44(%%edx)\n\t"
+" fadds 40(%%ecx)\n\t"
+" fadds 44(%%ecx)\n\t"
+" fstps 40(%%edx)\n\t"
+
+" flds 48(%%ecx)\n\t"
+" fsubs 52(%%ecx)\n\t"
+" fmuls 120(%%ebx)\n\t"
+
+" flds 60(%%ecx)\n\t"
+" fsubs 56(%%ecx)\n\t"
+" fmuls 120(%%ebx)\n\t"
+" fld %%st(0)\n\t"
+" fadds 56(%%ecx)\n\t"
+" fadds 60(%%ecx)\n\t"
+" fld %%st(0)\n\t"
+" fadds 48(%%ecx)\n\t"
+" fadds 52(%%ecx)\n\t"
+" fstps 48(%%edx)\n\t"
+" fadd %%st(2)\n\t"
+" fstps 56(%%edx)\n\t"
+" fsts 60(%%edx)\n\t"
+" faddp %%st(1)\n\t"
+" fstps 52(%%edx)\n\t"
+
+" flds 64(%%ecx)\n\t"
+" fadds 68(%%ecx)\n\t"
+" fstps 64(%%edx)\n\t"
+
+" flds 64(%%ecx)\n\t"
+" fsubs 68(%%ecx)\n\t"
+" fmuls 120(%%ebx)\n\t"
+" fstps 68(%%edx)\n\t"
+
+" flds 76(%%ecx)\n\t"
+" fsubs 72(%%ecx)\n\t"
+" fmuls 120(%%ebx)\n\t"
+" fsts 76(%%edx)\n\t"
+" fadds 72(%%ecx)\n\t"
+" fadds 76(%%ecx)\n\t"
+" fstps 72(%%edx)\n\t"
+
+" flds 92(%%ecx)\n\t"
+" fsubs 88(%%ecx)\n\t"
+" fmuls 120(%%ebx)\n\t"
+" fsts 92(%%edx)\n\t"
+" fadds 92(%%ecx)\n\t"
+" fadds 88(%%ecx)\n\t"
+" fld %%st(0)\n\t"
+" fadds 80(%%ecx)\n\t"
+" fadds 84(%%ecx)\n\t"
+" fstps 80(%%edx)\n\t"
+
+" flds 80(%%ecx)\n\t"
+" fsubs 84(%%ecx)\n\t"
+" fmuls 120(%%ebx)\n\t"
+" fadd %%st(0), %%st(1)\n\t"
+" fadds 92(%%edx)\n\t"
+" fstps 84(%%edx)\n\t"
+" fstps 88(%%edx)\n\t"
+
+" flds 96(%%ecx)\n\t"
+" fadds 100(%%ecx)\n\t"
+" fstps 96(%%edx)\n\t"
+
+" flds 96(%%ecx)\n\t"
+" fsubs 100(%%ecx)\n\t"
+" fmuls 120(%%ebx)\n\t"
+" fstps 100(%%edx)\n\t"
+
+" flds 108(%%ecx)\n\t"
+" fsubs 104(%%ecx)\n\t"
+" fmuls 120(%%ebx)\n\t"
+" fsts 108(%%edx)\n\t"
+" fadds 104(%%ecx)\n\t"
+" fadds 108(%%ecx)\n\t"
+" fstps 104(%%edx)\n\t"
+
+" flds 124(%%ecx)\n\t"
+" fsubs 120(%%ecx)\n\t"
+" fmuls 120(%%ebx)\n\t"
+" fsts 124(%%edx)\n\t"
+" fadds 120(%%ecx)\n\t"
+" fadds 124(%%ecx)\n\t"
+" fld %%st(0)\n\t"
+" fadds 112(%%ecx)\n\t"
+" fadds 116(%%ecx)\n\t"
+" fstps 112(%%edx)\n\t"
+
+" flds 112(%%ecx)\n\t"
+" fsubs 116(%%ecx)\n\t"
+" fmuls 120(%%ebx)\n\t"
+" fadd %%st(0),%%st(1)\n\t"
+" fadds 124(%%edx)\n\t"
+" fstps 116(%%edx)\n\t"
+" fstps 120(%%edx)\n\t"
+" jnz .L01\n\t"
/* Phase 6*/
-" flds (%%ecx)\n\t"
-" fadds 4(%%ecx)\n\t"
-" fstps 1024(%%esi)\n\t"
-
-" flds (%%ecx)\n\t"
-" fsubs 4(%%ecx)\n\t"
-" fmuls 120(%%ebx)\n\t"
-" fsts (%%esi)\n\t"
-" fstps (%%edi)\n\t"
-
-" flds 12(%%ecx)\n\t"
-" fsubs 8(%%ecx)\n\t"
-" fmuls 120(%%ebx)\n\t"
-" fsts 512(%%edi)\n\t"
-" fadds 12(%%ecx)\n\t"
-" fadds 8(%%ecx)\n\t"
-" fstps 512(%%esi)\n\t"
-
-" flds 16(%%ecx)\n\t"
-" fsubs 20(%%ecx)\n\t"
-" fmuls 120(%%ebx)\n\t"
-
-" flds 28(%%ecx)\n\t"
-" fsubs 24(%%ecx)\n\t"
-" fmuls 120(%%ebx)\n\t"
-" fsts 768(%%edi)\n\t"
-" fld %%st(0)\n\t"
-" fadds 24(%%ecx)\n\t"
-" fadds 28(%%ecx)\n\t"
-" fld %%st(0)\n\t"
-" fadds 16(%%ecx)\n\t"
-" fadds 20(%%ecx)\n\t"
-" fstps 768(%%esi)\n\t"
-" fadd %%st(2)\n\t"
-" fstps 256(%%esi)\n\t"
-" faddp %%st(1)\n\t"
-" fstps 256(%%edi)\n\t"
+" flds (%%ecx)\n\t"
+" fadds 4(%%ecx)\n\t"
+" fstps 1024(%%esi)\n\t"
+
+" flds (%%ecx)\n\t"
+" fsubs 4(%%ecx)\n\t"
+" fmuls 120(%%ebx)\n\t"
+" fsts (%%esi)\n\t"
+" fstps (%%edi)\n\t"
+
+" flds 12(%%ecx)\n\t"
+" fsubs 8(%%ecx)\n\t"
+" fmuls 120(%%ebx)\n\t"
+" fsts 512(%%edi)\n\t"
+" fadds 12(%%ecx)\n\t"
+" fadds 8(%%ecx)\n\t"
+" fstps 512(%%esi)\n\t"
+
+" flds 16(%%ecx)\n\t"
+" fsubs 20(%%ecx)\n\t"
+" fmuls 120(%%ebx)\n\t"
+
+" flds 28(%%ecx)\n\t"
+" fsubs 24(%%ecx)\n\t"
+" fmuls 120(%%ebx)\n\t"
+" fsts 768(%%edi)\n\t"
+" fld %%st(0)\n\t"
+" fadds 24(%%ecx)\n\t"
+" fadds 28(%%ecx)\n\t"
+" fld %%st(0)\n\t"
+" fadds 16(%%ecx)\n\t"
+" fadds 20(%%ecx)\n\t"
+" fstps 768(%%esi)\n\t"
+" fadd %%st(2)\n\t"
+" fstps 256(%%esi)\n\t"
+" faddp %%st(1)\n\t"
+" fstps 256(%%edi)\n\t"
/* Phase 7*/
-" flds 32(%%edx)\n\t"
-" fadds 48(%%edx)\n\t"
-" fstps 896(%%esi)\n\t"
-
-" flds 48(%%edx)\n\t"
-" fadds 40(%%edx)\n\t"
-" fstps 640(%%esi)\n\t"
-
-" flds 40(%%edx)\n\t"
-" fadds 56(%%edx)\n\t"
-" fstps 384(%%esi)\n\t"
-
-" flds 56(%%edx)\n\t"
-" fadds 36(%%edx)\n\t"
-" fstps 128(%%esi)\n\t"
-
-" flds 36(%%edx)\n\t"
-" fadds 52(%%edx)\n\t"
-" fstps 128(%%edi)\n\t"
-
-" flds 52(%%edx)\n\t"
-" fadds 44(%%edx)\n\t"
-" fstps 384(%%edi)\n\t"
-
-" flds 60(%%edx)\n\t"
-" fsts 896(%%edi)\n\t"
-" fadds 44(%%edx)\n\t"
-" fstps 640(%%edi)\n\t"
-
-" flds 96(%%edx)\n\t"
-" fadds 112(%%edx)\n\t"
-" fld %%st(0)\n\t"
-" fadds 64(%%edx)\n\t"
-" fstps 960(%%esi)\n\t"
-" fadds 80(%%edx)\n\t"
-" fstps 832(%%esi)\n\t"
-
-" flds 112(%%edx)\n\t"
-" fadds 104(%%edx)\n\t"
-" fld %%st(0)\n\t"
-" fadds 80(%%edx)\n\t"
-" fstps 704(%%esi)\n\t"
-" fadds 72(%%edx)\n\t"
-" fstps 576(%%esi)\n\t"
-
-" flds 104(%%edx)\n\t"
-" fadds 120(%%edx)\n\t"
-" fld %%st(0)\n\t"
-" fadds 72(%%edx)\n\t"
-" fstps 448(%%esi)\n\t"
-" fadds 88(%%edx)\n\t"
-" fstps 320(%%esi)\n\t"
-
-" flds 120(%%edx)\n\t"
-" fadds 100(%%edx)\n\t"
-" fld %%st(0)\n\t"
-" fadds 88(%%edx)\n\t"
-" fstps 192(%%esi)\n\t"
-" fadds 68(%%edx)\n\t"
-" fstps 64(%%esi)\n\t"
-
-" flds 100(%%edx)\n\t"
-" fadds 116(%%edx)\n\t"
-" fld %%st(0)\n\t"
-" fadds 68(%%edx)\n\t"
-" fstps 64(%%edi)\n\t"
-" fadds 84(%%edx)\n\t"
-" fstps 192(%%edi)\n\t"
-
-" flds 116(%%edx)\n\t"
-" fadds 108(%%edx)\n\t"
-" fld %%st(0)\n\t"
-" fadds 84(%%edx)\n\t"
-" fstps 320(%%edi)\n\t"
-" fadds 76(%%edx)\n\t"
-" fstps 448(%%edi)\n\t"
-
-" flds 108(%%edx)\n\t"
-" fadds 124(%%edx)\n\t"
-" fld %%st(0)\n\t"
-" fadds 76(%%edx)\n\t"
-" fstps 576(%%edi)\n\t"
-" fadds 92(%%edx)\n\t"
-" fstps 704(%%edi)\n\t"
-
-" flds 124(%%edx)\n\t"
-" fsts 960(%%edi)\n\t"
-" fadds 92(%%edx)\n\t"
-" fstps 832(%%edi)\n\t"
-" jmp .L_bye\n\t"
+" flds 32(%%edx)\n\t"
+" fadds 48(%%edx)\n\t"
+" fstps 896(%%esi)\n\t"
+
+" flds 48(%%edx)\n\t"
+" fadds 40(%%edx)\n\t"
+" fstps 640(%%esi)\n\t"
+
+" flds 40(%%edx)\n\t"
+" fadds 56(%%edx)\n\t"
+" fstps 384(%%esi)\n\t"
+
+" flds 56(%%edx)\n\t"
+" fadds 36(%%edx)\n\t"
+" fstps 128(%%esi)\n\t"
+
+" flds 36(%%edx)\n\t"
+" fadds 52(%%edx)\n\t"
+" fstps 128(%%edi)\n\t"
+
+" flds 52(%%edx)\n\t"
+" fadds 44(%%edx)\n\t"
+" fstps 384(%%edi)\n\t"
+
+" flds 60(%%edx)\n\t"
+" fsts 896(%%edi)\n\t"
+" fadds 44(%%edx)\n\t"
+" fstps 640(%%edi)\n\t"
+
+" flds 96(%%edx)\n\t"
+" fadds 112(%%edx)\n\t"
+" fld %%st(0)\n\t"
+" fadds 64(%%edx)\n\t"
+" fstps 960(%%esi)\n\t"
+" fadds 80(%%edx)\n\t"
+" fstps 832(%%esi)\n\t"
+
+" flds 112(%%edx)\n\t"
+" fadds 104(%%edx)\n\t"
+" fld %%st(0)\n\t"
+" fadds 80(%%edx)\n\t"
+" fstps 704(%%esi)\n\t"
+" fadds 72(%%edx)\n\t"
+" fstps 576(%%esi)\n\t"
+
+" flds 104(%%edx)\n\t"
+" fadds 120(%%edx)\n\t"
+" fld %%st(0)\n\t"
+" fadds 72(%%edx)\n\t"
+" fstps 448(%%esi)\n\t"
+" fadds 88(%%edx)\n\t"
+" fstps 320(%%esi)\n\t"
+
+" flds 120(%%edx)\n\t"
+" fadds 100(%%edx)\n\t"
+" fld %%st(0)\n\t"
+" fadds 88(%%edx)\n\t"
+" fstps 192(%%esi)\n\t"
+" fadds 68(%%edx)\n\t"
+" fstps 64(%%esi)\n\t"
+
+" flds 100(%%edx)\n\t"
+" fadds 116(%%edx)\n\t"
+" fld %%st(0)\n\t"
+" fadds 68(%%edx)\n\t"
+" fstps 64(%%edi)\n\t"
+" fadds 84(%%edx)\n\t"
+" fstps 192(%%edi)\n\t"
+
+" flds 116(%%edx)\n\t"
+" fadds 108(%%edx)\n\t"
+" fld %%st(0)\n\t"
+" fadds 84(%%edx)\n\t"
+" fstps 320(%%edi)\n\t"
+" fadds 76(%%edx)\n\t"
+" fstps 448(%%edi)\n\t"
+
+" flds 108(%%edx)\n\t"
+" fadds 124(%%edx)\n\t"
+" fld %%st(0)\n\t"
+" fadds 76(%%edx)\n\t"
+" fstps 576(%%edi)\n\t"
+" fadds 92(%%edx)\n\t"
+" fstps 704(%%edi)\n\t"
+
+" flds 124(%%edx)\n\t"
+" fsts 960(%%edi)\n\t"
+" fadds 92(%%edx)\n\t"
+" fstps 832(%%edi)\n\t"
+" jmp .L_bye\n\t"
".L01:\n\t"
/* Phase 8*/
-" flds (%%ecx)\n\t"
-" fadds 4(%%ecx)\n\t"
-" fistp 512(%%esi)\n\t"
-
-" flds (%%ecx)\n\t"
-" fsubs 4(%%ecx)\n\t"
-" fmuls 120(%%ebx)\n\t"
-
-" fistp (%%esi)\n\t"
-
-
-" flds 12(%%ecx)\n\t"
-" fsubs 8(%%ecx)\n\t"
-" fmuls 120(%%ebx)\n\t"
-" fist 256(%%edi)\n\t"
-" fadds 12(%%ecx)\n\t"
-" fadds 8(%%ecx)\n\t"
-" fistp 256(%%esi)\n\t"
-
-" flds 16(%%ecx)\n\t"
-" fsubs 20(%%ecx)\n\t"
-" fmuls 120(%%ebx)\n\t"
-
-" flds 28(%%ecx)\n\t"
-" fsubs 24(%%ecx)\n\t"
-" fmuls 120(%%ebx)\n\t"
-" fist 384(%%edi)\n\t"
-" fld %%st(0)\n\t"
-" fadds 24(%%ecx)\n\t"
-" fadds 28(%%ecx)\n\t"
-" fld %%st(0)\n\t"
-" fadds 16(%%ecx)\n\t"
-" fadds 20(%%ecx)\n\t"
-" fistp 384(%%esi)\n\t"
-" fadd %%st(2)\n\t"
-" fistp 128(%%esi)\n\t"
-" faddp %%st(1)\n\t"
-" fistp 128(%%edi)\n\t"
+" flds (%%ecx)\n\t"
+" fadds 4(%%ecx)\n\t"
+" fistp 512(%%esi)\n\t"
+
+" flds (%%ecx)\n\t"
+" fsubs 4(%%ecx)\n\t"
+" fmuls 120(%%ebx)\n\t"
+
+" fistp (%%esi)\n\t"
+
+
+" flds 12(%%ecx)\n\t"
+" fsubs 8(%%ecx)\n\t"
+" fmuls 120(%%ebx)\n\t"
+" fist 256(%%edi)\n\t"
+" fadds 12(%%ecx)\n\t"
+" fadds 8(%%ecx)\n\t"
+" fistp 256(%%esi)\n\t"
+
+" flds 16(%%ecx)\n\t"
+" fsubs 20(%%ecx)\n\t"
+" fmuls 120(%%ebx)\n\t"
+
+" flds 28(%%ecx)\n\t"
+" fsubs 24(%%ecx)\n\t"
+" fmuls 120(%%ebx)\n\t"
+" fist 384(%%edi)\n\t"
+" fld %%st(0)\n\t"
+" fadds 24(%%ecx)\n\t"
+" fadds 28(%%ecx)\n\t"
+" fld %%st(0)\n\t"
+" fadds 16(%%ecx)\n\t"
+" fadds 20(%%ecx)\n\t"
+" fistp 384(%%esi)\n\t"
+" fadd %%st(2)\n\t"
+" fistp 128(%%esi)\n\t"
+" faddp %%st(1)\n\t"
+" fistp 128(%%edi)\n\t"
/* Phase 9*/
-" flds 32(%%edx)\n\t"
-" fadds 48(%%edx)\n\t"
-" fistp 448(%%esi)\n\t"
-
-" flds 48(%%edx)\n\t"
-" fadds 40(%%edx)\n\t"
-" fistp 320(%%esi)\n\t"
-
-" flds 40(%%edx)\n\t"
-" fadds 56(%%edx)\n\t"
-" fistp 192(%%esi)\n\t"
-
-" flds 56(%%edx)\n\t"
-" fadds 36(%%edx)\n\t"
-" fistp 64(%%esi)\n\t"
-
-" flds 36(%%edx)\n\t"
-" fadds 52(%%edx)\n\t"
-" fistp 64(%%edi)\n\t"
-
-" flds 52(%%edx)\n\t"
-" fadds 44(%%edx)\n\t"
-" fistp 192(%%edi)\n\t"
-
-" flds 60(%%edx)\n\t"
-" fist 448(%%edi)\n\t"
-" fadds 44(%%edx)\n\t"
-" fistp 320(%%edi)\n\t"
-
-" flds 96(%%edx)\n\t"
-" fadds 112(%%edx)\n\t"
-" fld %%st(0)\n\t"
-" fadds 64(%%edx)\n\t"
-" fistp 480(%%esi)\n\t"
-" fadds 80(%%edx)\n\t"
-" fistp 416(%%esi)\n\t"
-
-" flds 112(%%edx)\n\t"
-" fadds 104(%%edx)\n\t"
-" fld %%st(0)\n\t"
-" fadds 80(%%edx)\n\t"
-" fistp 352(%%esi)\n\t"
-" fadds 72(%%edx)\n\t"
-" fistp 288(%%esi)\n\t"
-
-" flds 104(%%edx)\n\t"
-" fadds 120(%%edx)\n\t"
-" fld %%st(0)\n\t"
-" fadds 72(%%edx)\n\t"
-" fistp 224(%%esi)\n\t"
-" fadds 88(%%edx)\n\t"
-" fistp 160(%%esi)\n\t"
-
-" flds 120(%%edx)\n\t"
-" fadds 100(%%edx)\n\t"
-" fld %%st(0)\n\t"
-" fadds 88(%%edx)\n\t"
-" fistp 96(%%esi)\n\t"
-" fadds 68(%%edx)\n\t"
-" fistp 32(%%esi)\n\t"
-
-" flds 100(%%edx)\n\t"
-" fadds 116(%%edx)\n\t"
-" fld %%st(0)\n\t"
-" fadds 68(%%edx)\n\t"
-" fistp 32(%%edi)\n\t"
-" fadds 84(%%edx)\n\t"
-" fistp 96(%%edi)\n\t"
-
-" flds 116(%%edx)\n\t"
-" fadds 108(%%edx)\n\t"
-" fld %%st(0)\n\t"
-" fadds 84(%%edx)\n\t"
-" fistp 160(%%edi)\n\t"
-" fadds 76(%%edx)\n\t"
-" fistp 224(%%edi)\n\t"
-
-" flds 108(%%edx)\n\t"
-" fadds 124(%%edx)\n\t"
-" fld %%st(0)\n\t"
-" fadds 76(%%edx)\n\t"
-" fistp 288(%%edi)\n\t"
-" fadds 92(%%edx)\n\t"
-" fistp 352(%%edi)\n\t"
-
-" flds 124(%%edx)\n\t"
-" fist 480(%%edi)\n\t"
-" fadds 92(%%edx)\n\t"
-" fistp 416(%%edi)\n\t"
-" movsw\n\t"
+" flds 32(%%edx)\n\t"
+" fadds 48(%%edx)\n\t"
+" fistp 448(%%esi)\n\t"
+
+" flds 48(%%edx)\n\t"
+" fadds 40(%%edx)\n\t"
+" fistp 320(%%esi)\n\t"
+
+" flds 40(%%edx)\n\t"
+" fadds 56(%%edx)\n\t"
+" fistp 192(%%esi)\n\t"
+
+" flds 56(%%edx)\n\t"
+" fadds 36(%%edx)\n\t"
+" fistp 64(%%esi)\n\t"
+
+" flds 36(%%edx)\n\t"
+" fadds 52(%%edx)\n\t"
+" fistp 64(%%edi)\n\t"
+
+" flds 52(%%edx)\n\t"
+" fadds 44(%%edx)\n\t"
+" fistp 192(%%edi)\n\t"
+
+" flds 60(%%edx)\n\t"
+" fist 448(%%edi)\n\t"
+" fadds 44(%%edx)\n\t"
+" fistp 320(%%edi)\n\t"
+
+" flds 96(%%edx)\n\t"
+" fadds 112(%%edx)\n\t"
+" fld %%st(0)\n\t"
+" fadds 64(%%edx)\n\t"
+" fistp 480(%%esi)\n\t"
+" fadds 80(%%edx)\n\t"
+" fistp 416(%%esi)\n\t"
+
+" flds 112(%%edx)\n\t"
+" fadds 104(%%edx)\n\t"
+" fld %%st(0)\n\t"
+" fadds 80(%%edx)\n\t"
+" fistp 352(%%esi)\n\t"
+" fadds 72(%%edx)\n\t"
+" fistp 288(%%esi)\n\t"
+
+" flds 104(%%edx)\n\t"
+" fadds 120(%%edx)\n\t"
+" fld %%st(0)\n\t"
+" fadds 72(%%edx)\n\t"
+" fistp 224(%%esi)\n\t"
+" fadds 88(%%edx)\n\t"
+" fistp 160(%%esi)\n\t"
+
+" flds 120(%%edx)\n\t"
+" fadds 100(%%edx)\n\t"
+" fld %%st(0)\n\t"
+" fadds 88(%%edx)\n\t"
+" fistp 96(%%esi)\n\t"
+" fadds 68(%%edx)\n\t"
+" fistp 32(%%esi)\n\t"
+
+" flds 100(%%edx)\n\t"
+" fadds 116(%%edx)\n\t"
+" fld %%st(0)\n\t"
+" fadds 68(%%edx)\n\t"
+" fistp 32(%%edi)\n\t"
+" fadds 84(%%edx)\n\t"
+" fistp 96(%%edi)\n\t"
+
+" flds 116(%%edx)\n\t"
+" fadds 108(%%edx)\n\t"
+" fld %%st(0)\n\t"
+" fadds 84(%%edx)\n\t"
+" fistp 160(%%edi)\n\t"
+" fadds 76(%%edx)\n\t"
+" fistp 224(%%edi)\n\t"
+
+" flds 108(%%edx)\n\t"
+" fadds 124(%%edx)\n\t"
+" fld %%st(0)\n\t"
+" fadds 76(%%edx)\n\t"
+" fistp 288(%%edi)\n\t"
+" fadds 92(%%edx)\n\t"
+" fistp 352(%%edi)\n\t"
+
+" flds 124(%%edx)\n\t"
+" fist 480(%%edi)\n\t"
+" fadds 92(%%edx)\n\t"
+" fistp 416(%%edi)\n\t"
+" movsw\n\t"
".L_bye:"
- :
- :"m"(a),"m"(b),"m"(c),"m"(tmp[0])
- :"memory","%eax","%ebx","%ecx","%edx","%esi","%edi");
+ :
+ :"m"(a),"m"(b),"m"(c),"m"(tmp[0])
+ :"memory","%eax","%ebx","%ecx","%edx","%esi","%edi");
}
diff --git a/mp3lib/decod386.c b/mp3lib/decod386.c
index a2cfb56ce8..82657aedc3 100644
--- a/mp3lib/decod386.c
+++ b/mp3lib/decod386.c
@@ -22,10 +22,10 @@
#if 0
/* old WRITE_SAMPLE */
/* is portable */
-#define WRITE_SAMPLE(samples,sum,clip) { \
- if( (sum) > 32767.0) { *(samples) = 0x7fff; (clip)++; } \
+#define WRITE_SAMPLE(samples,sum,clip) { \
+ if( (sum) > 32767.0) { *(samples) = 0x7fff; (clip)++; } \
else if( (sum) < -32768.0) { *(samples) = -0x8000; (clip)++; }\
- else { *(samples) = sum; } \
+ else { *(samples) = sum; } \
}
#else
/* new WRITE_SAMPLE */
@@ -55,9 +55,9 @@
* it doesn't work for you, just enable the "old WRITE_SAMPLE" macro.
*/
#if HAVE_BIGENDIAN
-#define MANTISSA_OFFSET 1
+#define MANTISSA_OFFSET 1
#else
-#define MANTISSA_OFFSET 0
+#define MANTISSA_OFFSET 0
#endif
/* sizeof(int) == 4 */
diff --git a/mp3lib/decode_i586.c b/mp3lib/decode_i586.c
index d4cea638c1..83933d7ad4 100644
--- a/mp3lib/decode_i586.c
+++ b/mp3lib/decode_i586.c
@@ -311,8 +311,8 @@ int synth_1to1_pent(real *bandPtr, int channel, short *samples)
" jnz .L68\n\t"
" movl %%edi,%%eax\n\t"
" movl "MANGLE(saved_ebp)",%%ebp\n\t"
- :"=a"(retval)
- :"m"(bandPtr),"m"(channel),"m"(samples),"m"(tmp[0])
- :"memory","%edi","%esi","%ebx","%ecx","%edx");
+ :"=a"(retval)
+ :"m"(bandPtr),"m"(channel),"m"(samples),"m"(tmp[0])
+ :"memory","%edi","%esi","%ebx","%ecx","%edx");
return retval;
}
diff --git a/mp3lib/decode_mmx.c b/mp3lib/decode_mmx.c
index 211630f219..3027657421 100644
--- a/mp3lib/decode_mmx.c
+++ b/mp3lib/decode_mmx.c
@@ -15,37 +15,37 @@ static const unsigned long long attribute_used __attribute__((aligned(8))) null_
static const unsigned long long attribute_used __attribute__((aligned(8))) one_null = 0xffff0000ffff0000ULL;
const unsigned int __attribute__((aligned(16))) costab_mmx[] =
{
- 1056974725,
- 1057056395,
- 1057223771,
- 1057485416,
- 1057855544,
- 1058356026,
- 1059019886,
- 1059897405,
- 1061067246,
- 1062657950,
- 1064892987,
- 1066774581,
- 1069414683,
- 1073984175,
- 1079645762,
- 1092815430,
- 1057005197,
- 1057342072,
- 1058087743,
- 1059427869,
- 1061799040,
- 1065862217,
- 1071413542,
- 1084439708,
- 1057128951,
- 1058664893,
- 1063675095,
- 1076102863,
- 1057655764,
- 1067924853,
- 1060439283,
+ 1056974725,
+ 1057056395,
+ 1057223771,
+ 1057485416,
+ 1057855544,
+ 1058356026,
+ 1059019886,
+ 1059897405,
+ 1061067246,
+ 1062657950,
+ 1064892987,
+ 1066774581,
+ 1069414683,
+ 1073984175,
+ 1079645762,
+ 1092815430,
+ 1057005197,
+ 1057342072,
+ 1058087743,
+ 1059427869,
+ 1061799040,
+ 1065862217,
+ 1071413542,
+ 1084439708,
+ 1057128951,
+ 1058664893,
+ 1063675095,
+ 1076102863,
+ 1057655764,
+ 1067924853,
+ 1060439283,
};
/**
@@ -55,134 +55,134 @@ const unsigned int __attribute__((aligned(16))) costab_mmx[] =
*/
static const short __attribute__((aligned(8))) mp3lib_decwins[] =
{
- 0, 7, 54, 114, 510, 1288, 1644, 9372,
- 18760, -9373, 1644, -1289, 510, -115, 54, -8,
- 0, 7, 54, 114, 510, 1288, 1644, 9372,
- 18760, -9373, 1644, -1289, 510, -115, 54, -8,
- 0, 7, 55, 129, 500, 1379, 1490, 9834,
- 18748, -8910, 1784, -1197, 516, -101, 52, -7,
- 0, 7, 55, 129, 500, 1379, 1490, 9834,
- 18748, -8910, 1784, -1197, 516, -101, 52, -7,
- 0, 8, 56, 145, 488, 1469, 1322, 10294,
- 18714, -8448, 1910, -1107, 520, -87, 51, -6,
- 0, 8, 56, 145, 488, 1469, 1322, 10294,
- 18714, -8448, 1910, -1107, 520, -87, 51, -6,
- 0, 9, 57, 161, 474, 1559, 1141, 10751,
- 18658, -7987, 2023, -1016, 522, -74, 49, -6,
- 0, 9, 57, 161, 474, 1559, 1141, 10751,
- 18658, -7987, 2023, -1016, 522, -74, 49, -6,
- 0, 10, 57, 177, 456, 1647, 944, 11205,
- 18579, -7528, 2123, -927, 522, -61, 48, -5,
- 0, 10, 57, 177, 456, 1647, 944, 11205,
- 18579, -7528, 2123, -927, 522, -61, 48, -5,
- 0, 11, 57, 194, 435, 1733, 734, 11654,
- 18477, -7073, 2210, -838, 519, -50, 46, -5,
- 0, 11, 57, 194, 435, 1733, 734, 11654,
- 18477, -7073, 2210, -838, 519, -50, 46, -5,
- 0, 12, 57, 212, 411, 1817, 510, 12097,
- 18354, -6621, 2285, -751, 515, -39, 44, -4,
- 0, 12, 57, 212, 411, 1817, 510, 12097,
- 18354, -6621, 2285, -751, 515, -39, 44, -4,
- 0, 13, 57, 229, 384, 1899, 271, 12534,
- 18209, -6174, 2348, -666, 508, -28, 43, -4,
- 0, 13, 57, 229, 384, 1899, 271, 12534,
- 18209, -6174, 2348, -666, 508, -28, 43, -4,
- 0, 14, 56, 247, 354, 1977, 18, 12963,
- 18043, -5733, 2398, -583, 501, -18, 41, -4,
- 0, 14, 56, 247, 354, 1977, 18, 12963,
- 18043, -5733, 2398, -583, 501, -18, 41, -4,
- 0, 15, 56, 266, 320, 2052, -249, 13383,
- 17855, -5298, 2438, -502, 491, -9, 39, -3,
- 0, 15, 56, 266, 320, 2052, -249, 13383,
- 17855, -5298, 2438, -502, 491, -9, 39, -3,
- 0, 17, 54, 284, 283, 2122, -530, 13794,
- 17648, -4870, 2466, -423, 480, -1, 37, -3,
- 0, 17, 54, 284, 283, 2122, -530, 13794,
- 17648, -4870, 2466, -423, 480, -1, 37, -3,
- 0, 18, 52, 302, 243, 2188, -825, 14194,
- 17420, -4450, 2484, -347, 468, 7, 35, -3,
- 0, 18, 52, 302, 243, 2188, -825, 14194,
- 17420, -4450, 2484, -347, 468, 7, 35, -3,
- 0, 19, 50, 320, 199, 2249, -1133, 14583,
- 17173, -4039, 2492, -274, 455, 14, 33, -2,
- 0, 19, 50, 320, 199, 2249, -1133, 14583,
- 17173, -4039, 2492, -274, 455, 14, 33, -2,
- -1, 21, 48, 339, 152, 2304, -1454, 14959,
- 16908, -3637, 2490, -204, 440, 20, 32, -2,
- -1, 21, 48, 339, 152, 2304, -1454, 14959,
- 16908, -3637, 2490, -204, 440, 20, 32, -2,
- -1, 22, 45, 357, 101, 2354, -1788, 15322,
- 16624, -3245, 2479, -137, 425, 26, 30, -2,
- -1, 22, 45, 357, 101, 2354, -1788, 15322,
- 16624, -3245, 2479, -137, 425, 26, 30, -2,
- -1, 24, 41, 374, 47, 2396, -2135, 15671,
- 16323, -2864, 2460, -72, 409, 31, 28, -2,
- -1, 24, 41, 374, 47, 2396, -2135, 15671,
- 16323, -2864, 2460, -72, 409, 31, 28, -2,
- -1, 26, 37, 391, -11, 2431, -2493, 16004,
- 16005, -2494, 2432, -12, 392, 36, 26, -2,
- -1, 26, 37, 391, -11, 2431, -2493, 16004,
- 16005, -2494, 2432, -12, 392, 36, 26, -2,
- -2, -28, 31, -409, -72, -2460, -2864, -16323,
- 15671, 2135, 2396, -47, 374, -41, 24, 1,
- -2, -28, 31, -409, -72, -2460, -2864, -16323,
- 15671, 2135, 2396, -47, 374, -41, 24, 1,
- -2, -30, 26, -425, -137, -2479, -3245, -16624,
- 15322, 1788, 2354, -101, 357, -45, 22, 1,
- -2, -30, 26, -425, -137, -2479, -3245, -16624,
- 15322, 1788, 2354, -101, 357, -45, 22, 1,
- -2, -32, 20, -440, -204, -2490, -3637, -16908,
- 14959, 1454, 2304, -152, 339, -48, 21, 1,
- -2, -32, 20, -440, -204, -2490, -3637, -16908,
- 14959, 1454, 2304, -152, 339, -48, 21, 1,
- -2, -33, 14, -455, -274, -2492, -4039, -17173,
- 14583, 1133, 2249, -199, 320, -50, 19, 0,
- -2, -33, 14, -455, -274, -2492, -4039, -17173,
- 14583, 1133, 2249, -199, 320, -50, 19, 0,
- -3, -35, 7, -468, -347, -2484, -4450, -17420,
- 14194, 825, 2188, -243, 302, -52, 18, 0,
- -3, -35, 7, -468, -347, -2484, -4450, -17420,
- 14194, 825, 2188, -243, 302, -52, 18, 0,
- -3, -37, -1, -480, -423, -2466, -4870, -17648,
- 13794, 530, 2122, -283, 284, -54, 17, 0,
- -3, -37, -1, -480, -423, -2466, -4870, -17648,
- 13794, 530, 2122, -283, 284, -54, 17, 0,
- -3, -39, -9, -491, -502, -2438, -5298, -17855,
- 13383, 249, 2052, -320, 266, -56, 15, 0,
- -3, -39, -9, -491, -502, -2438, -5298, -17855,
- 13383, 249, 2052, -320, 266, -56, 15, 0,
- -4, -41, -18, -501, -583, -2398, -5733, -18043,
- 12963, -18, 1977, -354, 247, -56, 14, 0,
- -4, -41, -18, -501, -583, -2398, -5733, -18043,
- 12963, -18, 1977, -354, 247, -56, 14, 0,
- -4, -43, -28, -508, -666, -2348, -6174, -18209,
- 12534, -271, 1899, -384, 229, -57, 13, 0,
- -4, -43, -28, -508, -666, -2348, -6174, -18209,
- 12534, -271, 1899, -384, 229, -57, 13, 0,
- -4, -44, -39, -515, -751, -2285, -6621, -18354,
- 12097, -510, 1817, -411, 212, -57, 12, 0,
- -4, -44, -39, -515, -751, -2285, -6621, -18354,
- 12097, -510, 1817, -411, 212, -57, 12, 0,
- -5, -46, -50, -519, -838, -2210, -7073, -18477,
- 11654, -734, 1733, -435, 194, -57, 11, 0,
- -5, -46, -50, -519, -838, -2210, -7073, -18477,
- 11654, -734, 1733, -435, 194, -57, 11, 0,
- -5, -48, -61, -522, -927, -2123, -7528, -18579,
- 11205, -944, 1647, -456, 177, -57, 10, 0,
- -5, -48, -61, -522, -927, -2123, -7528, -18579,
- 11205, -944, 1647, -456, 177, -57, 10, 0,
- -6, -49, -74, -522, -1016, -2023, -7987, -18658,
- 10751, -1141, 1559, -474, 161, -57, 9, 0,
- -6, -49, -74, -522, -1016, -2023, -7987, -18658,
- 10751, -1141, 1559, -474, 161, -57, 9, 0,
- -6, -51, -87, -520, -1107, -1910, -8448, -18714,
- 10294, -1322, 1469, -488, 145, -56, 8, 0,
- -6, -51, -87, -520, -1107, -1910, -8448, -18714,
- 10294, -1322, 1469, -488, 145, -56, 8, 0,
- -7, -52, -101, -516, -1197, -1784, -8910, -18748,
- 9834, -1490, 1379, -500, 129, -55, 7, 0,
- -7, -52, -101, -516, -1197, -1784, -8910, -18748,
- 9834, -1490, 1379, -500, 129, -55, 7, 0,
+ 0, 7, 54, 114, 510, 1288, 1644, 9372,
+ 18760, -9373, 1644, -1289, 510, -115, 54, -8,
+ 0, 7, 54, 114, 510, 1288, 1644, 9372,
+ 18760, -9373, 1644, -1289, 510, -115, 54, -8,
+ 0, 7, 55, 129, 500, 1379, 1490, 9834,
+ 18748, -8910, 1784, -1197, 516, -101, 52, -7,
+ 0, 7, 55, 129, 500, 1379, 1490, 9834,
+ 18748, -8910, 1784, -1197, 516, -101, 52, -7,
+ 0, 8, 56, 145, 488, 1469, 1322, 10294,
+ 18714, -8448, 1910, -1107, 520, -87, 51, -6,
+ 0, 8, 56, 145, 488, 1469, 1322, 10294,
+ 18714, -8448, 1910, -1107, 520, -87, 51, -6,
+ 0, 9, 57, 161, 474, 1559, 1141, 10751,
+ 18658, -7987, 2023, -1016, 522, -74, 49, -6,
+ 0, 9, 57, 161, 474, 1559, 1141, 10751,
+ 18658, -7987, 2023, -1016, 522, -74, 49, -6,
+ 0, 10, 57, 177, 456, 1647, 944, 11205,
+ 18579, -7528, 2123, -927, 522, -61, 48, -5,
+ 0, 10, 57, 177, 456, 1647, 944, 11205,
+ 18579, -7528, 2123, -927, 522, -61, 48, -5,
+ 0, 11, 57, 194, 435, 1733, 734, 11654,
+ 18477, -7073, 2210, -838, 519, -50, 46, -5,
+ 0, 11, 57, 194, 435, 1733, 734, 11654,
+ 18477, -7073, 2210, -838, 519, -50, 46, -5,
+ 0, 12, 57, 212, 411, 1817, 510, 12097,
+ 18354, -6621, 2285, -751, 515, -39, 44, -4,
+ 0, 12, 57, 212, 411, 1817, 510, 12097,
+ 18354, -6621, 2285, -751, 515, -39, 44, -4,
+ 0, 13, 57, 229, 384, 1899, 271, 12534,
+ 18209, -6174, 2348, -666, 508, -28, 43, -4,
+ 0, 13, 57, 229, 384, 1899, 271, 12534,
+ 18209, -6174, 2348, -666, 508, -28, 43, -4,
+ 0, 14, 56, 247, 354, 1977, 18, 12963,
+ 18043, -5733, 2398, -583, 501, -18, 41, -4,
+ 0, 14, 56, 247, 354, 1977, 18, 12963,
+ 18043, -5733, 2398, -583, 501, -18, 41, -4,
+ 0, 15, 56, 266, 320, 2052, -249, 13383,
+ 17855, -5298, 2438, -502, 491, -9, 39, -3,
+ 0, 15, 56, 266, 320, 2052, -249, 13383,
+ 17855, -5298, 2438, -502, 491, -9, 39, -3,
+ 0, 17, 54, 284, 283, 2122, -530, 13794,
+ 17648, -4870, 2466, -423, 480, -1, 37, -3,
+ 0, 17, 54, 284, 283, 2122, -530, 13794,
+ 17648, -4870, 2466, -423, 480, -1, 37, -3,
+ 0, 18, 52, 302, 243, 2188, -825, 14194,
+ 17420, -4450, 2484, -347, 468, 7, 35, -3,
+ 0, 18, 52, 302, 243, 2188, -825, 14194,
+ 17420, -4450, 2484, -347, 468, 7, 35, -3,
+ 0, 19, 50, 320, 199, 2249, -1133, 14583,
+ 17173, -4039, 2492, -274, 455, 14, 33, -2,
+ 0, 19, 50, 320, 199, 2249, -1133, 14583,
+ 17173, -4039, 2492, -274, 455, 14, 33, -2,
+ -1, 21, 48, 339, 152, 2304, -1454, 14959,
+ 16908, -3637, 2490, -204, 440, 20, 32, -2,
+ -1, 21, 48, 339, 152, 2304, -1454, 14959,
+ 16908, -3637, 2490, -204, 440, 20, 32, -2,
+ -1, 22, 45, 357, 101, 2354, -1788, 15322,
+ 16624, -3245, 2479, -137, 425, 26, 30, -2,
+ -1, 22, 45, 357, 101, 2354, -1788, 15322,
+ 16624, -3245, 2479, -137, 425, 26, 30, -2,
+ -1, 24, 41, 374, 47, 2396, -2135, 15671,
+ 16323, -2864, 2460, -72, 409, 31, 28, -2,
+ -1, 24, 41, 374, 47, 2396, -2135, 15671,
+ 16323, -2864, 2460, -72, 409, 31, 28, -2,
+ -1, 26, 37, 391, -11, 2431, -2493, 16004,
+ 16005, -2494, 2432, -12, 392, 36, 26, -2,
+ -1, 26, 37, 391, -11, 2431, -2493, 16004,
+ 16005, -2494, 2432, -12, 392, 36, 26, -2,
+ -2, -28, 31, -409, -72, -2460, -2864, -16323,
+ 15671, 2135, 2396, -47, 374, -41, 24, 1,
+ -2, -28, 31, -409, -72, -2460, -2864, -16323,
+ 15671, 2135, 2396, -47, 374, -41, 24, 1,
+ -2, -30, 26, -425, -137, -2479, -3245, -16624,
+ 15322, 1788, 2354, -101, 357, -45, 22, 1,
+ -2, -30, 26, -425, -137, -2479, -3245, -16624,
+ 15322, 1788, 2354, -101, 357, -45, 22, 1,
+ -2, -32, 20, -440, -204, -2490, -3637, -16908,
+ 14959, 1454, 2304, -152, 339, -48, 21, 1,
+ -2, -32, 20, -440, -204, -2490, -3637, -16908,
+ 14959, 1454, 2304, -152, 339, -48, 21, 1,
+ -2, -33, 14, -455, -274, -2492, -4039, -17173,
+ 14583, 1133, 2249, -199, 320, -50, 19, 0,
+ -2, -33, 14, -455, -274, -2492, -4039, -17173,
+ 14583, 1133, 2249, -199, 320, -50, 19, 0,
+ -3, -35, 7, -468, -347, -2484, -4450, -17420,
+ 14194, 825, 2188, -243, 302, -52, 18, 0,
+ -3, -35, 7, -468, -347, -2484, -4450, -17420,
+ 14194, 825, 2188, -243, 302, -52, 18, 0,
+ -3, -37, -1, -480, -423, -2466, -4870, -17648,
+ 13794, 530, 2122, -283, 284, -54, 17, 0,
+ -3, -37, -1, -480, -423, -2466, -4870, -17648,
+ 13794, 530, 2122, -283, 284, -54, 17, 0,
+ -3, -39, -9, -491, -502, -2438, -5298, -17855,
+ 13383, 249, 2052, -320, 266, -56, 15, 0,
+ -3, -39, -9, -491, -502, -2438, -5298, -17855,
+ 13383, 249, 2052, -320, 266, -56, 15, 0,
+ -4, -41, -18, -501, -583, -2398, -5733, -18043,
+ 12963, -18, 1977, -354, 247, -56, 14, 0,
+ -4, -41, -18, -501, -583, -2398, -5733, -18043,
+ 12963, -18, 1977, -354, 247, -56, 14, 0,
+ -4, -43, -28, -508, -666, -2348, -6174, -18209,
+ 12534, -271, 1899, -384, 229, -57, 13, 0,
+ -4, -43, -28, -508, -666, -2348, -6174, -18209,
+ 12534, -271, 1899, -384, 229, -57, 13, 0,
+ -4, -44, -39, -515, -751, -2285, -6621, -18354,
+ 12097, -510, 1817, -411, 212, -57, 12, 0,
+ -4, -44, -39, -515, -751, -2285, -6621, -18354,
+ 12097, -510, 1817, -411, 212, -57, 12, 0,
+ -5, -46, -50, -519, -838, -2210, -7073, -18477,
+ 11654, -734, 1733, -435, 194, -57, 11, 0,
+ -5, -46, -50, -519, -838, -2210, -7073, -18477,
+ 11654, -734, 1733, -435, 194, -57, 11, 0,
+ -5, -48, -61, -522, -927, -2123, -7528, -18579,
+ 11205, -944, 1647, -456, 177, -57, 10, 0,
+ -5, -48, -61, -522, -927, -2123, -7528, -18579,
+ 11205, -944, 1647, -456, 177, -57, 10, 0,
+ -6, -49, -74, -522, -1016, -2023, -7987, -18658,
+ 10751, -1141, 1559, -474, 161, -57, 9, 0,
+ -6, -49, -74, -522, -1016, -2023, -7987, -18658,
+ 10751, -1141, 1559, -474, 161, -57, 9, 0,
+ -6, -51, -87, -520, -1107, -1910, -8448, -18714,
+ 10294, -1322, 1469, -488, 145, -56, 8, 0,
+ -6, -51, -87, -520, -1107, -1910, -8448, -18714,
+ 10294, -1322, 1469, -488, 145, -56, 8, 0,
+ -7, -52, -101, -516, -1197, -1784, -8910, -18748,
+ 9834, -1490, 1379, -500, 129, -55, 7, 0,
+ -7, -52, -101, -516, -1197, -1784, -8910, -18748,
+ 9834, -1490, 1379, -500, 129, -55, 7, 0,
};
int synth_1to1_MMX(real *bandPtr, int channel, short *samples)
@@ -194,23 +194,23 @@ int synth_1to1_MMX(real *bandPtr, int channel, short *samples)
int bo1, i = 8;
if (channel == 0) {
- bo = (bo - 1) & 0xf;
- buf = buffs[1];
+ bo = (bo - 1) & 0xf;
+ buf = buffs[1];
} else {
- samples++;
- buf = buffs[0];
+ samples++;
+ buf = buffs[0];
}
if (bo & 1) {
- b0 = buf[1];
- bo1 = bo + 1;
- a = buf[0] + bo;
- b = buf[1] + ((bo + 1) & 0xf);
+ b0 = buf[1];
+ bo1 = bo + 1;
+ a = buf[0] + bo;
+ b = buf[1] + ((bo + 1) & 0xf);
} else {
- b0 = buf[0];
- bo1 = bo;
- b = buf[0] + bo;
- a = buf[1] + ((bo + 1) & 0xf);
+ b0 = buf[0];
+ bo1 = bo;
+ b = buf[0] + bo;
+ a = buf[1] + ((bo + 1) & 0xf);
}
dct64_MMX_func(a, b, bandPtr);
@@ -252,18 +252,18 @@ ASMALIGN(4)
"packssdw %%mm0,%%mm0\n\t"
"packssdw %%mm4,%%mm4\n\t"
- "movq (%3), %%mm1\n\t"
- "punpckldq %%mm4, %%mm0\n\t"
- "pand "MANGLE(one_null)", %%mm1\n\t"
- "pand "MANGLE(null_one)", %%mm0\n\t"
- "por %%mm0, %%mm1\n\t"
- "movq %%mm1,(%3)\n\t"
+ "movq (%3), %%mm1\n\t"
+ "punpckldq %%mm4, %%mm0\n\t"
+ "pand "MANGLE(one_null)", %%mm1\n\t"
+ "pand "MANGLE(null_one)", %%mm0\n\t"
+ "por %%mm0, %%mm1\n\t"
+ "movq %%mm1,(%3)\n\t"
"add $64,%2\n\t"
"add $128,%1\n\t"
"add $8,%3\n\t"
- "decl %0\n\t"
+ "decl %0\n\t"
"jnz 0b\n\t"
"movq (%1),%%mm0\n\t"
@@ -283,7 +283,7 @@ ASMALIGN(4)
"psrad $13,%%mm0\n\t"
"packssdw %%mm0,%%mm0\n\t"
"movd %%mm0,%%eax\n\t"
- "movw %%ax, (%3)\n\t"
+ "movw %%ax, (%3)\n\t"
"sub $32,%2\n\t"
"add $64,%1\n\t"
"add $4,%3\n\t"
@@ -328,18 +328,18 @@ ASMALIGN(4)
"psubsw %%mm1,%%mm0\n\t"
"psubsw %%mm5,%%mm4\n\t"
- "movq (%3), %%mm1\n\t"
- "punpckldq %%mm4, %%mm0\n\t"
- "pand "MANGLE(one_null)", %%mm1\n\t"
- "pand "MANGLE(null_one)", %%mm0\n\t"
- "por %%mm0, %%mm1\n\t"
- "movq %%mm1,(%3)\n\t"
+ "movq (%3), %%mm1\n\t"
+ "punpckldq %%mm4, %%mm0\n\t"
+ "pand "MANGLE(one_null)", %%mm1\n\t"
+ "pand "MANGLE(null_one)", %%mm0\n\t"
+ "por %%mm0, %%mm1\n\t"
+ "movq %%mm1,(%3)\n\t"
"sub $64,%2\n\t"
"add $128,%1\n\t"
"add $8,%3\n\t"
"decl %0\n\t"
- "jnz 1b\n\t"
+ "jnz 1b\n\t"
"movq (%1),%%mm0\n\t"
"pmaddwd (%2),%%mm0\n\t"
@@ -360,10 +360,10 @@ ASMALIGN(4)
"psubd %%mm0,%%mm0\n\t"
"psubsw %%mm1,%%mm0\n\t"
"movd %%mm0,%%eax\n\t"
- "movw %%ax,(%3)\n\t"
- "emms\n\t"
- :"+r"(i), "+r"(window), "+r"(b0), "+r"(samples)
- :
- :"memory", "%eax");
+ "movw %%ax,(%3)\n\t"
+ "emms\n\t"
+ :"+r"(i), "+r"(window), "+r"(b0), "+r"(samples)
+ :
+ :"memory", "%eax");
return 0;
}
diff --git a/mp3lib/equalizer.c b/mp3lib/equalizer.c
index 78db17ef67..1c1a3f38ed 100644
--- a/mp3lib/equalizer.c
+++ b/mp3lib/equalizer.c
@@ -2,78 +2,77 @@
void init_spline(float *x, float *y, int n, float *y2)
{
+ int i, k;
+ float p, qn, sig, un, *u;
+ u = malloc(n * sizeof (float));
- int i, k;
- float p, qn, sig, un, *u;
- u = malloc(n * sizeof (float));
+ y2[0] = u[0] = 0.0;
- y2[0] = u[0] = 0.0;
+ for (i = 1; i < n - 1; i++)
+ {
+ sig = ((float) x[i] - x[i - 1]) / ((float) x[i + 1] - x[i - 1]);
+ p = sig * y2[i - 1] + 2.0;
+ y2[i] = (sig - 1.0) / p;
+ u[i] = (((float) y[i + 1] - y[i]) / (x[i + 1] - x[i])) -
+ (((float) y[i] - y[i - 1]) / (x[i] - x[i - 1]));
+ u[i] = (6.0 * u[i] / (x[i + 1] - x[i - 1]) - sig * u[i - 1]) / p;
+ }
+ qn = un = 0.0;
- for (i = 1; i < n - 1; i++)
- {
- sig = ((float) x[i] - x[i - 1]) / ((float) x[i + 1] - x[i - 1]);
- p = sig * y2[i - 1] + 2.0;
- y2[i] = (sig - 1.0) / p;
- u[i] = (((float) y[i + 1] - y[i]) / (x[i + 1] - x[i])) -
- (((float) y[i] - y[i - 1]) / (x[i] - x[i - 1]));
- u[i] = (6.0 * u[i] / (x[i + 1] - x[i - 1]) - sig * u[i - 1]) / p;
- }
- qn = un = 0.0;
-
- y2[n - 1] = (un - qn * u[n - 2]) / (qn * y2[n - 2] + 1.0);
- for (k = n - 2; k >= 0; k--)
- y2[k] = y2[k] * y2[k + 1] + u[k];
- free(u);
+ y2[n - 1] = (un - qn * u[n - 2]) / (qn * y2[n - 2] + 1.0);
+ for (k = n - 2; k >= 0; k--)
+ y2[k] = y2[k] * y2[k + 1] + u[k];
+ free(u);
}
float eval_spline(float xa[], float ya[], float y2a[], int n, float x)
{
- int klo, khi, k;
- float h, b, a;
+ int klo, khi, k;
+ float h, b, a;
- klo = 0;
- khi = n - 1;
- while (khi - klo > 1)
- {
- k = (khi + klo) >> 1;
- if (xa[k] > x)
- khi = k;
- else
- klo = k;
- }
- h = xa[khi] - xa[klo];
- a = (xa[khi] - x) / h;
- b = (x - xa[klo]) / h;
- return (a * ya[klo] + b * ya[khi] + ((a * a * a - a) * y2a[klo] + (b * b * b - b) * y2a[khi])
- * (h * h) / 6.0);
+ klo = 0;
+ khi = n - 1;
+ while (khi - klo > 1)
+ {
+ k = (khi + klo) >> 1;
+ if (xa[k] > x)
+ khi = k;
+ else
+ klo = k;
+ }
+ h = xa[khi] - xa[klo];
+ a = (xa[khi] - x) / h;
+ b = (x - xa[klo]) / h;
+ return (a * ya[klo] + b * ya[khi] + ((a * a * a - a) * y2a[klo] + (b * b * b - b) * y2a[khi])
+ * (h * h) / 6.0);
}
void mpg123_set_eq(int on, float preamp, float *b)
{
- float x[] =
- {0, 1, 2, 3, 4, 5, 6, 7, 8, 9}, yf[10], val, band[10];
- int bands[] =
- {0, 4, 8, 16, 26, 78, 157, 313, 366, 418};
- int i, j;
+ float x[] =
+ {0, 1, 2, 3, 4, 5, 6, 7, 8, 9}, yf[10], val, band[10];
+ int bands[] =
+ {0, 4, 8, 16, 26, 78, 157, 313, 366, 418};
+ int i, j;
- mpg123_info->eq_active = on;
- if (mpg123_info->eq_active)
- {
- for (i = 0; i < 10; i++)
- {
- band[i] = b[i] + preamp;
- }
+ mpg123_info->eq_active = on;
+ if (mpg123_info->eq_active)
+ {
+ for (i = 0; i < 10; i++)
+ {
+ band[i] = b[i] + preamp;
+ }
- init_spline(x, band, 10, yf);
- for (i = 0; i < 9; i++)
- {
- for (j = bands[i]; j < bands[i + 1]; j++)
- {
- val = eval_spline(x, band, yf, 10, i + ((float) (j - bands[i]) * (1.0 / (bands[i + 1] - bands[i]))));
- mpg123_info->eq_mul[j] = pow(2, val / 10.0);
- }
- }
- for (i = bands[9]; i < 576; i++)
- mpg123_info->eq_mul[i] = mpg123_info->eq_mul[bands[9] - 1];
- }
+ init_spline(x, band, 10, yf);
+ for (i = 0; i < 9; i++)
+ {
+ for (j = bands[i]; j < bands[i + 1]; j++)
+ {
+ val = eval_spline(x, band, yf, 10, i + ((float) (j - bands[i]) * (1.0 / (bands[i + 1] - bands[i]))));
+ mpg123_info->eq_mul[j] = pow(2, val / 10.0);
+ }
+ }
+ for (i = bands[9]; i < 576; i++)
+ mpg123_info->eq_mul[i] = mpg123_info->eq_mul[bands[9] - 1];
+ }
}
diff --git a/mp3lib/l2tables.h b/mp3lib/l2tables.h
index cf6299e88d..feef3d1cdb 100644
--- a/mp3lib/l2tables.h
+++ b/mp3lib/l2tables.h
@@ -17,143 +17,143 @@
*/
static struct al_table alloc_0[] = {
- {4,0},{5,3},{3,-3},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},{9,-255},{10,-511},
- {11,-1023},{12,-2047},{13,-4095},{14,-8191},{15,-16383},{16,-32767},
- {4,0},{5,3},{3,-3},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},{9,-255},{10,-511},
- {11,-1023},{12,-2047},{13,-4095},{14,-8191},{15,-16383},{16,-32767},
- {4,0},{5,3},{3,-3},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},{9,-255},{10,-511},
- {11,-1023},{12,-2047},{13,-4095},{14,-8191},{15,-16383},{16,-32767},
- {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
- {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
- {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
- {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
- {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
- {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
- {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
- {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
- {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
- {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
- {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
- {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
- {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
- {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
- {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
- {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
- {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
- {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
- {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
- {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
- {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
- {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
- {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
- {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
- {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
- {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
- {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
- {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
- {2,0},{5,3},{7,5},{16,-32767},
- {2,0},{5,3},{7,5},{16,-32767},
- {2,0},{5,3},{7,5},{16,-32767},
- {2,0},{5,3},{7,5},{16,-32767} };
+ {4,0},{5,3},{3,-3},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},{9,-255},{10,-511},
+ {11,-1023},{12,-2047},{13,-4095},{14,-8191},{15,-16383},{16,-32767},
+ {4,0},{5,3},{3,-3},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},{9,-255},{10,-511},
+ {11,-1023},{12,-2047},{13,-4095},{14,-8191},{15,-16383},{16,-32767},
+ {4,0},{5,3},{3,-3},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},{9,-255},{10,-511},
+ {11,-1023},{12,-2047},{13,-4095},{14,-8191},{15,-16383},{16,-32767},
+ {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
+ {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
+ {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
+ {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
+ {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
+ {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
+ {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
+ {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
+ {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
+ {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
+ {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
+ {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
+ {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
+ {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
+ {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
+ {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
+ {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
+ {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
+ {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
+ {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
+ {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
+ {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
+ {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
+ {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
+ {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
+ {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
+ {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
+ {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
+ {2,0},{5,3},{7,5},{16,-32767},
+ {2,0},{5,3},{7,5},{16,-32767},
+ {2,0},{5,3},{7,5},{16,-32767},
+ {2,0},{5,3},{7,5},{16,-32767} };
static struct al_table alloc_1[] = {
- {4,0},{5,3},{3,-3},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},{9,-255},{10,-511},
- {11,-1023},{12,-2047},{13,-4095},{14,-8191},{15,-16383},{16,-32767},
- {4,0},{5,3},{3,-3},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},{9,-255},{10,-511},
- {11,-1023},{12,-2047},{13,-4095},{14,-8191},{15,-16383},{16,-32767},
- {4,0},{5,3},{3,-3},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},{9,-255},{10,-511},
- {11,-1023},{12,-2047},{13,-4095},{14,-8191},{15,-16383},{16,-32767},
- {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
- {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
- {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
- {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
- {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
- {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
- {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
- {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
- {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
- {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
- {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
- {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
- {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
- {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
- {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
- {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
- {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
- {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
- {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
- {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
- {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
- {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
- {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
- {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
- {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
- {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
- {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
- {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
- {2,0},{5,3},{7,5},{16,-32767},
- {2,0},{5,3},{7,5},{16,-32767},
- {2,0},{5,3},{7,5},{16,-32767},
- {2,0},{5,3},{7,5},{16,-32767},
- {2,0},{5,3},{7,5},{16,-32767},
- {2,0},{5,3},{7,5},{16,-32767},
- {2,0},{5,3},{7,5},{16,-32767} };
+ {4,0},{5,3},{3,-3},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},{9,-255},{10,-511},
+ {11,-1023},{12,-2047},{13,-4095},{14,-8191},{15,-16383},{16,-32767},
+ {4,0},{5,3},{3,-3},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},{9,-255},{10,-511},
+ {11,-1023},{12,-2047},{13,-4095},{14,-8191},{15,-16383},{16,-32767},
+ {4,0},{5,3},{3,-3},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},{9,-255},{10,-511},
+ {11,-1023},{12,-2047},{13,-4095},{14,-8191},{15,-16383},{16,-32767},
+ {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
+ {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
+ {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
+ {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
+ {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
+ {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
+ {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
+ {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
+ {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
+ {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
+ {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
+ {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
+ {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
+ {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
+ {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
+ {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{16,-32767},
+ {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
+ {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
+ {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
+ {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
+ {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
+ {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
+ {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
+ {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
+ {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
+ {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
+ {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
+ {3,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{16,-32767},
+ {2,0},{5,3},{7,5},{16,-32767},
+ {2,0},{5,3},{7,5},{16,-32767},
+ {2,0},{5,3},{7,5},{16,-32767},
+ {2,0},{5,3},{7,5},{16,-32767},
+ {2,0},{5,3},{7,5},{16,-32767},
+ {2,0},{5,3},{7,5},{16,-32767},
+ {2,0},{5,3},{7,5},{16,-32767} };
static struct al_table alloc_2[] = {
- {4,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},{9,-255},
- {10,-511},{11,-1023},{12,-2047},{13,-4095},{14,-8191},{15,-16383},
- {4,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},{9,-255},
- {10,-511},{11,-1023},{12,-2047},{13,-4095},{14,-8191},{15,-16383},
- {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
- {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
- {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
- {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
- {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
- {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63} };
+ {4,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},{9,-255},
+ {10,-511},{11,-1023},{12,-2047},{13,-4095},{14,-8191},{15,-16383},
+ {4,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},{9,-255},
+ {10,-511},{11,-1023},{12,-2047},{13,-4095},{14,-8191},{15,-16383},
+ {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
+ {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
+ {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
+ {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
+ {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
+ {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63} };
static struct al_table alloc_3[] = {
- {4,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},{9,-255},
- {10,-511},{11,-1023},{12,-2047},{13,-4095},{14,-8191},{15,-16383},
- {4,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},{9,-255},
- {10,-511},{11,-1023},{12,-2047},{13,-4095},{14,-8191},{15,-16383},
- {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
- {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
- {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
- {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
- {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
- {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
- {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
- {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
- {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
- {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63} };
+ {4,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},{9,-255},
+ {10,-511},{11,-1023},{12,-2047},{13,-4095},{14,-8191},{15,-16383},
+ {4,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},{9,-255},
+ {10,-511},{11,-1023},{12,-2047},{13,-4095},{14,-8191},{15,-16383},
+ {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
+ {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
+ {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
+ {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
+ {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
+ {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
+ {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
+ {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
+ {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
+ {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63} };
static struct al_table alloc_4[] = {
- {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
- {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{14,-8191},
- {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
- {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{14,-8191},
- {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
- {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{14,-8191},
- {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
- {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{14,-8191},
- {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
- {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
- {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
- {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
- {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
- {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
- {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
- {2,0},{5,3},{7,5},{10,9},
- {2,0},{5,3},{7,5},{10,9},
- {2,0},{5,3},{7,5},{10,9},
- {2,0},{5,3},{7,5},{10,9},
- {2,0},{5,3},{7,5},{10,9},
- {2,0},{5,3},{7,5},{10,9},
- {2,0},{5,3},{7,5},{10,9},
- {2,0},{5,3},{7,5},{10,9},
- {2,0},{5,3},{7,5},{10,9},
- {2,0},{5,3},{7,5},{10,9},
- {2,0},{5,3},{7,5},{10,9},
+ {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
+ {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{14,-8191},
+ {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
+ {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{14,-8191},
+ {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
+ {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{14,-8191},
+ {4,0},{5,3},{7,5},{3,-3},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},{8,-127},
+ {9,-255},{10,-511},{11,-1023},{12,-2047},{13,-4095},{14,-8191},
+ {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
+ {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
+ {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
+ {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
+ {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
+ {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
+ {3,0},{5,3},{7,5},{10,9},{4,-7},{5,-15},{6,-31},{7,-63},
+ {2,0},{5,3},{7,5},{10,9},
+ {2,0},{5,3},{7,5},{10,9},
+ {2,0},{5,3},{7,5},{10,9},
+ {2,0},{5,3},{7,5},{10,9},
+ {2,0},{5,3},{7,5},{10,9},
+ {2,0},{5,3},{7,5},{10,9},
+ {2,0},{5,3},{7,5},{10,9},
+ {2,0},{5,3},{7,5},{10,9},
+ {2,0},{5,3},{7,5},{10,9},
+ {2,0},{5,3},{7,5},{10,9},
+ {2,0},{5,3},{7,5},{10,9},
{2,0},{5,3},{7,5},{10,9},
{2,0},{5,3},{7,5},{10,9},
{2,0},{5,3},{7,5},{10,9},
diff --git a/mp3lib/layer1.c b/mp3lib/layer1.c
index d53c628314..a4be24677a 100644
--- a/mp3lib/layer1.c
+++ b/mp3lib/layer1.c
@@ -61,7 +61,7 @@ static void I_step_one(unsigned int balloc[], unsigned int scale_index[2][SBLIMI
}
static void I_step_two(real fraction[2][SBLIMIT],unsigned int balloc[2*SBLIMIT],
- unsigned int scale_index[2][SBLIMIT],struct frame *fr)
+ unsigned int scale_index[2][SBLIMIT],struct frame *fr)
{
int i,n;
int smpb[2*SBLIMIT]; /* values: 0-65535 */
diff --git a/mp3lib/layer2.c b/mp3lib/layer2.c
index 867da2f2dc..f86d716882 100644
--- a/mp3lib/layer2.c
+++ b/mp3lib/layer2.c
@@ -18,7 +18,7 @@ static int grp_3tab[32 * 3] = { 0, }; /* used: 27 */
static int grp_5tab[128 * 3] = { 0, }; /* used: 125 */
static int grp_9tab[1024 * 3] = { 0, }; /* used: 729 */
-static real muls[27][64]; /* also used by layer 1 */
+static real muls[27][64]; /* also used by layer 1 */
static void init_layer2(void)
{
@@ -59,7 +59,7 @@ static void init_layer2(void)
if(_has_mmx)
{
for(j=3,i=0;i<63;i++,j--)
- *table++ = 16384 * m * pow(2.0,(double) j / 3.0);
+ *table++ = 16384 * m * pow(2.0,(double) j / 3.0);
}
else
for(j=3,i=0;i<63;i++,j--)
@@ -189,7 +189,7 @@ static void II_step_two(unsigned int *bit_alloc,real fraction[2][4][SBLIMIT],int
for (i=jsbound;i<sblimit;i++,alloc1+=(1<<step))
{
step = alloc1->bits;
- bita++; /* channel 1 and channel 2 bitalloc are the same */
+ bita++; /* channel 1 and channel 2 bitalloc are the same */
if ( (ba=*bita++) )
{
k=(alloc2 = alloc1+ba)->bits;
diff --git a/mp3lib/layer3.c b/mp3lib/layer3.c
index 16dfb06bb8..91943a8f18 100644
--- a/mp3lib/layer3.c
+++ b/mp3lib/layer3.c
@@ -25,7 +25,7 @@
#define CUT_HF
#endif
-# define REAL_MUL(x, y) ((x) * (y))
+#define REAL_MUL(x, y) ((x) * (y))
static real ispow[8207];
static real aa_ca[8],aa_cs[8];
@@ -734,8 +734,8 @@ static int III_dequantize_sample(real xr[SBLIMIT][SSLIMIT],int *scf,
mask <<= 1;
}
if(part2remain+num <= 0) {
- num -= part2remain+num;
- break;
+ num -= part2remain+num;
+ break;
}
for(i=0;i<4;i++) {
@@ -851,7 +851,7 @@ static int III_dequantize_sample(real xr[SBLIMIT][SSLIMIT],int *scf,
if (x == 15 && h->linbits) {
max = cb;
- REFRESH_MASK;
+ REFRESH_MASK;
x += ((unsigned long) mask) >> (BITSHIFT+8-h->linbits);
num -= h->linbits+1;
mask <<= h->linbits;
@@ -875,7 +875,7 @@ static int III_dequantize_sample(real xr[SBLIMIT][SSLIMIT],int *scf,
if (y == 15 && h->linbits) {
max = cb;
- REFRESH_MASK;
+ REFRESH_MASK;
y += ((unsigned long) mask) >> (BITSHIFT+8-h->linbits);
num -= h->linbits+1;
mask <<= h->linbits;
@@ -914,7 +914,7 @@ static int III_dequantize_sample(real xr[SBLIMIT][SSLIMIT],int *scf,
mask <<= 1;
}
if(part2remain+num <= 0) {
- num -= part2remain+num;
+ num -= part2remain+num;
break;
}
@@ -1003,7 +1003,7 @@ static void III_i_stereo(real xr_buf[2][SBLIMIT][SSLIMIT],int *scalefac,
#if 0
if(lsf) {
int p = gr_info->scalefac_compress & 0x1;
- if(ms_stereo) {
+ if(ms_stereo) {
tab1 = pow1_2[p]; tab2 = pow2_2[p];
}
else {
@@ -1329,17 +1329,17 @@ static int do_layer3(struct frame *fr,int single){
for(ch=0;ch<stereo1;ch++) {
struct gr_info_s *gr_info = &(sideinfo.ch[ch].gr[gr]);
- III_antialias(hybridIn[ch],gr_info);
- III_hybrid(hybridIn[ch], hybridOut[ch], ch,gr_info);
+ III_antialias(hybridIn[ch],gr_info);
+ III_hybrid(hybridIn[ch], hybridOut[ch], ch,gr_info);
}
for(ss=0;ss<SSLIMIT;ss++) {
if(single >= 0) {
- clip += (fr->synth_mono)(hybridOut[0][ss],pcm_sample,&pcm_point);
- } else {
- int p1 = pcm_point;
- clip += (fr->synth)(hybridOut[0][ss],0,pcm_sample,&p1);
- clip += (fr->synth)(hybridOut[1][ss],1,pcm_sample,&pcm_point);
+ clip += (fr->synth_mono)(hybridOut[0][ss],pcm_sample,&pcm_point);
+ } else {
+ int p1 = pcm_point;
+ clip += (fr->synth)(hybridOut[0][ss],0,pcm_sample,&p1);
+ clip += (fr->synth)(hybridOut[1][ss],1,pcm_sample,&pcm_point);
}
}
diff --git a/mp3lib/mpg123.h b/mp3lib/mpg123.h
index 5a7548250a..0b9f781f80 100644
--- a/mp3lib/mpg123.h
+++ b/mp3lib/mpg123.h
@@ -15,10 +15,10 @@
#include "config.h"
#ifndef M_PI
-#define M_PI 3.141592653589793238462
+#define M_PI 3.141592653589793238462
#endif
#ifndef M_SQRT2
-#define M_SQRT2 1.414213562373095048802
+#define M_SQRT2 1.414213562373095048802
#endif
#define REAL_IS_FLOAT
#define NEW_DCT9
diff --git a/mp3lib/sr1.c b/mp3lib/sr1.c
index 694961ebc0..caed5f8c90 100644
--- a/mp3lib/sr1.c
+++ b/mp3lib/sr1.c
@@ -412,34 +412,34 @@ void MP3_Init(void){
#if HAVE_MMX
if (gCpuCaps.hasMMX)
{
- _has_mmx = 1;
- synth_func = synth_1to1_MMX;
+ _has_mmx = 1;
+ synth_func = synth_1to1_MMX;
}
#endif
#if HAVE_AMD3DNOWEXT
if (gCpuCaps.has3DNowExt)
{
- dct36_func=dct36_3dnowex;
- dct64_MMX_func= dct64_MMX_3dnowex;
- mp_msg(MSGT_DECAUDIO,MSGL_V,"mp3lib: using 3DNow!Ex optimized decore!\n");
+ dct36_func=dct36_3dnowex;
+ dct64_MMX_func= dct64_MMX_3dnowex;
+ mp_msg(MSGT_DECAUDIO,MSGL_V,"mp3lib: using 3DNow!Ex optimized decore!\n");
}
else
#endif
#if HAVE_AMD3DNOW
if (gCpuCaps.has3DNow)
{
- dct36_func = dct36_3dnow;
- dct64_MMX_func = dct64_MMX_3dnow;
- mp_msg(MSGT_DECAUDIO,MSGL_V,"mp3lib: using 3DNow! optimized decore!\n");
+ dct36_func = dct36_3dnow;
+ dct64_MMX_func = dct64_MMX_3dnow;
+ mp_msg(MSGT_DECAUDIO,MSGL_V,"mp3lib: using 3DNow! optimized decore!\n");
}
else
#endif
#if HAVE_SSE
if (gCpuCaps.hasSSE)
{
- dct64_MMX_func = dct64_sse;
- mp_msg(MSGT_DECAUDIO,MSGL_V,"mp3lib: using SSE optimized decore!\n");
+ dct64_MMX_func = dct64_sse;
+ mp_msg(MSGT_DECAUDIO,MSGL_V,"mp3lib: using SSE optimized decore!\n");
}
else
#endif
@@ -447,28 +447,28 @@ void MP3_Init(void){
#if HAVE_MMX
if (gCpuCaps.hasMMX)
{
- dct64_MMX_func = dct64_MMX;
- mp_msg(MSGT_DECAUDIO,MSGL_V,"mp3lib: using MMX optimized decore!\n");
+ dct64_MMX_func = dct64_MMX;
+ mp_msg(MSGT_DECAUDIO,MSGL_V,"mp3lib: using MMX optimized decore!\n");
}
else
#endif
if (gCpuCaps.cpuType >= CPUTYPE_I586)
{
- synth_func = synth_1to1_pent;
- mp_msg(MSGT_DECAUDIO,MSGL_V,"mp3lib: using Pentium optimized decore!\n");
+ synth_func = synth_1to1_pent;
+ mp_msg(MSGT_DECAUDIO,MSGL_V,"mp3lib: using Pentium optimized decore!\n");
}
else
#endif /* ARCH_X86_32 */
#if HAVE_ALTIVEC
if (gCpuCaps.hasAltiVec)
{
- mp_msg(MSGT_DECAUDIO,MSGL_V,"mp3lib: using AltiVec optimized decore!\n");
+ mp_msg(MSGT_DECAUDIO,MSGL_V,"mp3lib: using AltiVec optimized decore!\n");
}
else
#endif
{
- synth_func = NULL; /* use default c version */
- mp_msg(MSGT_DECAUDIO,MSGL_V,"mp3lib: using generic C decore!\n");
+ synth_func = NULL; /* use default c version */
+ mp_msg(MSGT_DECAUDIO,MSGL_V,"mp3lib: using generic C decore!\n");
}
#ifdef CONFIG_FAKE_MONO
@@ -535,7 +535,7 @@ int MP3_DecodeFrame(unsigned char *hova,short single){
case 3: do_layer3(&fr,single);break;
case 1: do_layer1(&fr,single);break;
default:
- return 0; // unsupported
+ return 0; // unsupported
}
// ++MP3_frames;
return pcm_point ? pcm_point : 2;