1
mirror of https://github.com/mpv-player/mpv synced 2025-01-05 03:06:28 +01:00

Make the 3DNow! and MMX code compile on 64-bit (a purely mechanical search-and-replace).

They are still not compiled or enabled on 64-bit, though: they are vastly
slower, yet would be selected by default if they were enabled.


git-svn-id: svn://svn.mplayerhq.hu/mplayer/trunk@31281 b3059339-0415-0410-9bf9-f77b7e298cf2
This commit is contained in:
reimar 2010-05-30 10:01:40 +00:00
parent 8829003b51
commit 8830acfc73
4 changed files with 1748 additions and 1744 deletions

View File

@ -30,6 +30,7 @@
#include "config.h"
#include "mangle.h"
#include "mpg123.h"
#include "libavutil/x86_cpu.h"
#ifdef DCT36_OPTIMIZE_FOR_K7
void dct36_3dnowex(real *inbuf, real *o1,
@ -40,123 +41,123 @@ void dct36_3dnow(real *inbuf, real *o1,
#endif
{
__asm__ volatile(
"movq (%%eax),%%mm0\n\t"
"movq 4(%%eax),%%mm1\n\t"
"movq (%%"REG_a"),%%mm0\n\t"
"movq 4(%%"REG_a"),%%mm1\n\t"
"pfadd %%mm1,%%mm0\n\t"
"movq %%mm0,4(%%eax)\n\t"
"movq %%mm0,4(%%"REG_a")\n\t"
"psrlq $32,%%mm1\n\t"
"movq 12(%%eax),%%mm2\n\t"
"movq 12(%%"REG_a"),%%mm2\n\t"
"punpckldq %%mm2,%%mm1\n\t"
"pfadd %%mm2,%%mm1\n\t"
"movq %%mm1,12(%%eax)\n\t"
"movq %%mm1,12(%%"REG_a")\n\t"
"psrlq $32,%%mm2\n\t"
"movq 20(%%eax),%%mm3\n\t"
"movq 20(%%"REG_a"),%%mm3\n\t"
"punpckldq %%mm3,%%mm2\n\t"
"pfadd %%mm3,%%mm2\n\t"
"movq %%mm2,20(%%eax)\n\t"
"movq %%mm2,20(%%"REG_a")\n\t"
"psrlq $32,%%mm3\n\t"
"movq 28(%%eax),%%mm4\n\t"
"movq 28(%%"REG_a"),%%mm4\n\t"
"punpckldq %%mm4,%%mm3\n\t"
"pfadd %%mm4,%%mm3\n\t"
"movq %%mm3,28(%%eax)\n\t"
"movq %%mm3,28(%%"REG_a")\n\t"
"psrlq $32,%%mm4\n\t"
"movq 36(%%eax),%%mm5\n\t"
"movq 36(%%"REG_a"),%%mm5\n\t"
"punpckldq %%mm5,%%mm4\n\t"
"pfadd %%mm5,%%mm4\n\t"
"movq %%mm4,36(%%eax)\n\t"
"movq %%mm4,36(%%"REG_a")\n\t"
"psrlq $32,%%mm5\n\t"
"movq 44(%%eax),%%mm6\n\t"
"movq 44(%%"REG_a"),%%mm6\n\t"
"punpckldq %%mm6,%%mm5\n\t"
"pfadd %%mm6,%%mm5\n\t"
"movq %%mm5,44(%%eax)\n\t"
"movq %%mm5,44(%%"REG_a")\n\t"
"psrlq $32,%%mm6\n\t"
"movq 52(%%eax),%%mm7\n\t"
"movq 52(%%"REG_a"),%%mm7\n\t"
"punpckldq %%mm7,%%mm6\n\t"
"pfadd %%mm7,%%mm6\n\t"
"movq %%mm6,52(%%eax)\n\t"
"movq %%mm6,52(%%"REG_a")\n\t"
"psrlq $32,%%mm7\n\t"
"movq 60(%%eax),%%mm0\n\t"
"movq 60(%%"REG_a"),%%mm0\n\t"
"punpckldq %%mm0,%%mm7\n\t"
"pfadd %%mm0,%%mm7\n\t"
"movq %%mm7,60(%%eax)\n\t"
"movq %%mm7,60(%%"REG_a")\n\t"
"psrlq $32,%%mm0\n\t"
"movd 68(%%eax),%%mm1\n\t"
"movd 68(%%"REG_a"),%%mm1\n\t"
"pfadd %%mm1,%%mm0\n\t"
"movd %%mm0,68(%%eax)\n\t"
"movd 4(%%eax),%%mm0\n\t"
"movd 12(%%eax),%%mm1\n\t"
"movd %%mm0,68(%%"REG_a")\n\t"
"movd 4(%%"REG_a"),%%mm0\n\t"
"movd 12(%%"REG_a"),%%mm1\n\t"
"punpckldq %%mm1,%%mm0\n\t"
"punpckldq 20(%%eax),%%mm1\n\t"
"punpckldq 20(%%"REG_a"),%%mm1\n\t"
"pfadd %%mm1,%%mm0\n\t"
"movd %%mm0,12(%%eax)\n\t"
"movd %%mm0,12(%%"REG_a")\n\t"
"psrlq $32,%%mm0\n\t"
"movd %%mm0,20(%%eax)\n\t"
"movd %%mm0,20(%%"REG_a")\n\t"
"psrlq $32,%%mm1\n\t"
"movd 28(%%eax),%%mm2\n\t"
"movd 28(%%"REG_a"),%%mm2\n\t"
"punpckldq %%mm2,%%mm1\n\t"
"punpckldq 36(%%eax),%%mm2\n\t"
"punpckldq 36(%%"REG_a"),%%mm2\n\t"
"pfadd %%mm2,%%mm1\n\t"
"movd %%mm1,28(%%eax)\n\t"
"movd %%mm1,28(%%"REG_a")\n\t"
"psrlq $32,%%mm1\n\t"
"movd %%mm1,36(%%eax)\n\t"
"movd %%mm1,36(%%"REG_a")\n\t"
"psrlq $32,%%mm2\n\t"
"movd 44(%%eax),%%mm3\n\t"
"movd 44(%%"REG_a"),%%mm3\n\t"
"punpckldq %%mm3,%%mm2\n\t"
"punpckldq 52(%%eax),%%mm3\n\t"
"punpckldq 52(%%"REG_a"),%%mm3\n\t"
"pfadd %%mm3,%%mm2\n\t"
"movd %%mm2,44(%%eax)\n\t"
"movd %%mm2,44(%%"REG_a")\n\t"
"psrlq $32,%%mm2\n\t"
"movd %%mm2,52(%%eax)\n\t"
"movd %%mm2,52(%%"REG_a")\n\t"
"psrlq $32,%%mm3\n\t"
"movd 60(%%eax),%%mm4\n\t"
"movd 60(%%"REG_a"),%%mm4\n\t"
"punpckldq %%mm4,%%mm3\n\t"
"punpckldq 68(%%eax),%%mm4\n\t"
"punpckldq 68(%%"REG_a"),%%mm4\n\t"
"pfadd %%mm4,%%mm3\n\t"
"movd %%mm3,60(%%eax)\n\t"
"movd %%mm3,60(%%"REG_a")\n\t"
"psrlq $32,%%mm3\n\t"
"movd %%mm3,68(%%eax)\n\t"
"movd %%mm3,68(%%"REG_a")\n\t"
"movq 24(%%eax),%%mm0\n\t"
"movq 48(%%eax),%%mm1\n\t"
"movq 24(%%"REG_a"),%%mm0\n\t"
"movq 48(%%"REG_a"),%%mm1\n\t"
"movd "MANGLE(COS9)"+12,%%mm2\n\t"
"punpckldq %%mm2,%%mm2\n\t"
"movd "MANGLE(COS9)"+24,%%mm3\n\t"
"punpckldq %%mm3,%%mm3\n\t"
"pfmul %%mm2,%%mm0\n\t"
"pfmul %%mm3,%%mm1\n\t"
"pushl %%eax\n\t"
"push %%"REG_a"\n\t"
"movl $1,%%eax\n\t"
"movd %%eax,%%mm7\n\t"
"pi2fd %%mm7,%%mm7\n\t"
"popl %%eax\n\t"
"movq 8(%%eax),%%mm2\n\t"
"pop %%"REG_a"\n\t"
"movq 8(%%"REG_a"),%%mm2\n\t"
"movd "MANGLE(COS9)"+4,%%mm3\n\t"
"punpckldq %%mm3,%%mm3\n\t"
"pfmul %%mm3,%%mm2\n\t"
"pfadd %%mm0,%%mm2\n\t"
"movq 40(%%eax),%%mm3\n\t"
"movq 40(%%"REG_a"),%%mm3\n\t"
"movd "MANGLE(COS9)"+20,%%mm4\n\t"
"punpckldq %%mm4,%%mm4\n\t"
"pfmul %%mm4,%%mm3\n\t"
"pfadd %%mm3,%%mm2\n\t"
"movq 56(%%eax),%%mm3\n\t"
"movq 56(%%"REG_a"),%%mm3\n\t"
"movd "MANGLE(COS9)"+28,%%mm4\n\t"
"punpckldq %%mm4,%%mm4\n\t"
"pfmul %%mm4,%%mm3\n\t"
"pfadd %%mm3,%%mm2\n\t"
"movq (%%eax),%%mm3\n\t"
"movq 16(%%eax),%%mm4\n\t"
"movq (%%"REG_a"),%%mm3\n\t"
"movq 16(%%"REG_a"),%%mm4\n\t"
"movd "MANGLE(COS9)"+8,%%mm5\n\t"
"punpckldq %%mm5,%%mm5\n\t"
"pfmul %%mm5,%%mm4\n\t"
"pfadd %%mm4,%%mm3\n\t"
"movq 32(%%eax),%%mm4\n\t"
"movq 32(%%"REG_a"),%%mm4\n\t"
"movd "MANGLE(COS9)"+16,%%mm5\n\t"
"punpckldq %%mm5,%%mm5\n\t"
"pfmul %%mm5,%%mm4\n\t"
"pfadd %%mm4,%%mm3\n\t"
"pfadd %%mm1,%%mm3\n\t"
"movq 64(%%eax),%%mm4\n\t"
"movq 64(%%"REG_a"),%%mm4\n\t"
"movd "MANGLE(COS9)"+32,%%mm5\n\t"
"punpckldq %%mm5,%%mm5\n\t"
"pfmul %%mm5,%%mm4\n\t"
@ -168,30 +169,30 @@ void dct36_3dnow(real *inbuf, real *o1,
"pfmul %%mm5,%%mm4\n\t"
"movq %%mm4,%%mm5\n\t"
"pfacc %%mm5,%%mm5\n\t"
"movd 108(%%edx),%%mm6\n\t"
"punpckldq 104(%%edx),%%mm6\n\t"
"movd 108(%%"REG_d"),%%mm6\n\t"
"punpckldq 104(%%"REG_d"),%%mm6\n\t"
"pfmul %%mm6,%%mm5\n\t"
#ifdef DCT36_OPTIMIZE_FOR_K7
"pswapd %%mm5,%%mm5\n\t"
"movq %%mm5,32(%%ecx)\n\t"
"movq %%mm5,32(%%"REG_c")\n\t"
#else
"movd %%mm5,36(%%ecx)\n\t"
"movd %%mm5,36(%%"REG_c")\n\t"
"psrlq $32,%%mm5\n\t"
"movd %%mm5,32(%%ecx)\n\t"
"movd %%mm5,32(%%"REG_c")\n\t"
#endif
"movq %%mm4,%%mm6\n\t"
"punpckldq %%mm6,%%mm5\n\t"
"pfsub %%mm6,%%mm5\n\t"
"punpckhdq %%mm5,%%mm5\n\t"
"movd 32(%%edx),%%mm6\n\t"
"punpckldq 36(%%edx),%%mm6\n\t"
"movd 32(%%"REG_d"),%%mm6\n\t"
"punpckldq 36(%%"REG_d"),%%mm6\n\t"
"pfmul %%mm6,%%mm5\n\t"
"movd 32(%%esi),%%mm6\n\t"
"punpckldq 36(%%esi),%%mm6\n\t"
"movd 32(%%"REG_S"),%%mm6\n\t"
"punpckldq 36(%%"REG_S"),%%mm6\n\t"
"pfadd %%mm6,%%mm5\n\t"
"movd %%mm5,1024(%%edi)\n\t"
"movd %%mm5,1024(%%"REG_D")\n\t"
"psrlq $32,%%mm5\n\t"
"movd %%mm5,1152(%%edi)\n\t"
"movd %%mm5,1152(%%"REG_D")\n\t"
"movq %%mm3,%%mm4\n\t"
"pfsub %%mm2,%%mm4\n\t"
"movq %%mm7,%%mm5\n\t"
@ -199,44 +200,44 @@ void dct36_3dnow(real *inbuf, real *o1,
"pfmul %%mm5,%%mm4\n\t"
"movq %%mm4,%%mm5\n\t"
"pfacc %%mm5,%%mm5\n\t"
"movd 140(%%edx),%%mm6\n\t"
"punpckldq 72(%%edx),%%mm6\n\t"
"movd 140(%%"REG_d"),%%mm6\n\t"
"punpckldq 72(%%"REG_d"),%%mm6\n\t"
"pfmul %%mm6,%%mm5\n\t"
"movd %%mm5,68(%%ecx)\n\t"
"movd %%mm5,68(%%"REG_c")\n\t"
"psrlq $32,%%mm5\n\t"
"movd %%mm5,0(%%ecx)\n\t"
"movd %%mm5,0(%%"REG_c")\n\t"
"movq %%mm4,%%mm6\n\t"
"punpckldq %%mm6,%%mm5\n\t"
"pfsub %%mm6,%%mm5\n\t"
"punpckhdq %%mm5,%%mm5\n\t"
"movd 0(%%edx),%%mm6\n\t"
"punpckldq 68(%%edx),%%mm6\n\t"
"movd 0(%%"REG_d"),%%mm6\n\t"
"punpckldq 68(%%"REG_d"),%%mm6\n\t"
"pfmul %%mm6,%%mm5\n\t"
"movd 0(%%esi),%%mm6\n\t"
"punpckldq 68(%%esi),%%mm6\n\t"
"movd 0(%%"REG_S"),%%mm6\n\t"
"punpckldq 68(%%"REG_S"),%%mm6\n\t"
"pfadd %%mm6,%%mm5\n\t"
"movd %%mm5,0(%%edi)\n\t"
"movd %%mm5,0(%%"REG_D")\n\t"
"psrlq $32,%%mm5\n\t"
"movd %%mm5,2176(%%edi)\n\t"
"movq 8(%%eax),%%mm2\n\t"
"movq 40(%%eax),%%mm3\n\t"
"movd %%mm5,2176(%%"REG_D")\n\t"
"movq 8(%%"REG_a"),%%mm2\n\t"
"movq 40(%%"REG_a"),%%mm3\n\t"
"pfsub %%mm3,%%mm2\n\t"
"movq 56(%%eax),%%mm3\n\t"
"movq 56(%%"REG_a"),%%mm3\n\t"
"pfsub %%mm3,%%mm2\n\t"
"movd "MANGLE(COS9)"+12,%%mm3\n\t"
"punpckldq %%mm3,%%mm3\n\t"
"pfmul %%mm3,%%mm2\n\t"
"movq 16(%%eax),%%mm3\n\t"
"movq 32(%%eax),%%mm4\n\t"
"movq 16(%%"REG_a"),%%mm3\n\t"
"movq 32(%%"REG_a"),%%mm4\n\t"
"pfsub %%mm4,%%mm3\n\t"
"movq 64(%%eax),%%mm4\n\t"
"movq 64(%%"REG_a"),%%mm4\n\t"
"pfsub %%mm4,%%mm3\n\t"
"movd "MANGLE(COS9)"+24,%%mm4\n\t"
"punpckldq %%mm4,%%mm4\n\t"
"pfmul %%mm4,%%mm3\n\t"
"movq 48(%%eax),%%mm4\n\t"
"movq 48(%%"REG_a"),%%mm4\n\t"
"pfsub %%mm4,%%mm3\n\t"
"movq (%%eax),%%mm4\n\t"
"movq (%%"REG_a"),%%mm4\n\t"
"pfadd %%mm4,%%mm3\n\t"
"movq %%mm2,%%mm4\n\t"
"pfadd %%mm3,%%mm4\n\t"
@ -245,25 +246,25 @@ void dct36_3dnow(real *inbuf, real *o1,
"pfmul %%mm5,%%mm4\n\t"
"movq %%mm4,%%mm5\n\t"
"pfacc %%mm5,%%mm5\n\t"
"movd 112(%%edx),%%mm6\n\t"
"punpckldq 100(%%edx),%%mm6\n\t"
"movd 112(%%"REG_d"),%%mm6\n\t"
"punpckldq 100(%%"REG_d"),%%mm6\n\t"
"pfmul %%mm6,%%mm5\n\t"
"movd %%mm5,40(%%ecx)\n\t"
"movd %%mm5,40(%%"REG_c")\n\t"
"psrlq $32,%%mm5\n\t"
"movd %%mm5,28(%%ecx)\n\t"
"movd %%mm5,28(%%"REG_c")\n\t"
"movq %%mm4,%%mm6\n\t"
"punpckldq %%mm6,%%mm5\n\t"
"pfsub %%mm6,%%mm5\n\t"
"punpckhdq %%mm5,%%mm5\n\t"
"movd 28(%%edx),%%mm6\n\t"
"punpckldq 40(%%edx),%%mm6\n\t"
"movd 28(%%"REG_d"),%%mm6\n\t"
"punpckldq 40(%%"REG_d"),%%mm6\n\t"
"pfmul %%mm6,%%mm5\n\t"
"movd 28(%%esi),%%mm6\n\t"
"punpckldq 40(%%esi),%%mm6\n\t"
"movd 28(%%"REG_S"),%%mm6\n\t"
"punpckldq 40(%%"REG_S"),%%mm6\n\t"
"pfadd %%mm6,%%mm5\n\t"
"movd %%mm5,896(%%edi)\n\t"
"movd %%mm5,896(%%"REG_D")\n\t"
"psrlq $32,%%mm5\n\t"
"movd %%mm5,1280(%%edi)\n\t"
"movd %%mm5,1280(%%"REG_D")\n\t"
"movq %%mm3,%%mm4\n\t"
"pfsub %%mm2,%%mm4\n\t"
"movq %%mm7,%%mm5\n\t"
@ -271,54 +272,54 @@ void dct36_3dnow(real *inbuf, real *o1,
"pfmul %%mm5,%%mm4\n\t"
"movq %%mm4,%%mm5\n\t"
"pfacc %%mm5,%%mm5\n\t"
"movd 136(%%edx),%%mm6\n\t"
"punpckldq 76(%%edx),%%mm6\n\t"
"movd 136(%%"REG_d"),%%mm6\n\t"
"punpckldq 76(%%"REG_d"),%%mm6\n\t"
"pfmul %%mm6,%%mm5\n\t"
"movd %%mm5,64(%%ecx)\n\t"
"movd %%mm5,64(%%"REG_c")\n\t"
"psrlq $32,%%mm5\n\t"
"movd %%mm5,4(%%ecx)\n\t"
"movd %%mm5,4(%%"REG_c")\n\t"
"movq %%mm4,%%mm6\n\t"
"punpckldq %%mm6,%%mm5\n\t"
"pfsub %%mm6,%%mm5\n\t"
"punpckhdq %%mm5,%%mm5\n\t"
"movd 4(%%edx),%%mm6\n\t"
"punpckldq 64(%%edx),%%mm6\n\t"
"movd 4(%%"REG_d"),%%mm6\n\t"
"punpckldq 64(%%"REG_d"),%%mm6\n\t"
"pfmul %%mm6,%%mm5\n\t"
"movd 4(%%esi),%%mm6\n\t"
"punpckldq 64(%%esi),%%mm6\n\t"
"movd 4(%%"REG_S"),%%mm6\n\t"
"punpckldq 64(%%"REG_S"),%%mm6\n\t"
"pfadd %%mm6,%%mm5\n\t"
"movd %%mm5,128(%%edi)\n\t"
"movd %%mm5,128(%%"REG_D")\n\t"
"psrlq $32,%%mm5\n\t"
"movd %%mm5,2048(%%edi)\n\t"
"movd %%mm5,2048(%%"REG_D")\n\t"
"movq 8(%%eax),%%mm2\n\t"
"movq 8(%%"REG_a"),%%mm2\n\t"
"movd "MANGLE(COS9)"+20,%%mm3\n\t"
"punpckldq %%mm3,%%mm3\n\t"
"pfmul %%mm3,%%mm2\n\t"
"pfsub %%mm0,%%mm2\n\t"
"movq 40(%%eax),%%mm3\n\t"
"movq 40(%%"REG_a"),%%mm3\n\t"
"movd "MANGLE(COS9)"+28,%%mm4\n\t"
"punpckldq %%mm4,%%mm4\n\t"
"pfmul %%mm4,%%mm3\n\t"
"pfsub %%mm3,%%mm2\n\t"
"movq 56(%%eax),%%mm3\n\t"
"movq 56(%%"REG_a"),%%mm3\n\t"
"movd "MANGLE(COS9)"+4,%%mm4\n\t"
"punpckldq %%mm4,%%mm4\n\t"
"pfmul %%mm4,%%mm3\n\t"
"pfadd %%mm3,%%mm2\n\t"
"movq (%%eax),%%mm3\n\t"
"movq 16(%%eax),%%mm4\n\t"
"movq (%%"REG_a"),%%mm3\n\t"
"movq 16(%%"REG_a"),%%mm4\n\t"
"movd "MANGLE(COS9)"+32,%%mm5\n\t"
"punpckldq %%mm5,%%mm5\n\t"
"pfmul %%mm5,%%mm4\n\t"
"pfsub %%mm4,%%mm3\n\t"
"movq 32(%%eax),%%mm4\n\t"
"movq 32(%%"REG_a"),%%mm4\n\t"
"movd "MANGLE(COS9)"+8,%%mm5\n\t"
"punpckldq %%mm5,%%mm5\n\t"
"pfmul %%mm5,%%mm4\n\t"
"pfsub %%mm4,%%mm3\n\t"
"pfadd %%mm1,%%mm3\n\t"
"movq 64(%%eax),%%mm4\n\t"
"movq 64(%%"REG_a"),%%mm4\n\t"
"movd "MANGLE(COS9)"+16,%%mm5\n\t"
"punpckldq %%mm5,%%mm5\n\t"
"pfmul %%mm5,%%mm4\n\t"
@ -330,25 +331,25 @@ void dct36_3dnow(real *inbuf, real *o1,
"pfmul %%mm5,%%mm4\n\t"
"movq %%mm4,%%mm5\n\t"
"pfacc %%mm5,%%mm5\n\t"
"movd 116(%%edx),%%mm6\n\t"
"punpckldq 96(%%edx),%%mm6\n\t"
"movd 116(%%"REG_d"),%%mm6\n\t"
"punpckldq 96(%%"REG_d"),%%mm6\n\t"
"pfmul %%mm6,%%mm5\n\t"
"movd %%mm5,44(%%ecx)\n\t"
"movd %%mm5,44(%%"REG_c")\n\t"
"psrlq $32,%%mm5\n\t"
"movd %%mm5,24(%%ecx)\n\t"
"movd %%mm5,24(%%"REG_c")\n\t"
"movq %%mm4,%%mm6\n\t"
"punpckldq %%mm6,%%mm5\n\t"
"pfsub %%mm6,%%mm5\n\t"
"punpckhdq %%mm5,%%mm5\n\t"
"movd 24(%%edx),%%mm6\n\t"
"punpckldq 44(%%edx),%%mm6\n\t"
"movd 24(%%"REG_d"),%%mm6\n\t"
"punpckldq 44(%%"REG_d"),%%mm6\n\t"
"pfmul %%mm6,%%mm5\n\t"
"movd 24(%%esi),%%mm6\n\t"
"punpckldq 44(%%esi),%%mm6\n\t"
"movd 24(%%"REG_S"),%%mm6\n\t"
"punpckldq 44(%%"REG_S"),%%mm6\n\t"
"pfadd %%mm6,%%mm5\n\t"
"movd %%mm5,768(%%edi)\n\t"
"movd %%mm5,768(%%"REG_D")\n\t"
"psrlq $32,%%mm5\n\t"
"movd %%mm5,1408(%%edi)\n\t"
"movd %%mm5,1408(%%"REG_D")\n\t"
"movq %%mm3,%%mm4\n\t"
"pfsub %%mm2,%%mm4\n\t"
"movq %%mm7,%%mm5\n\t"
@ -356,53 +357,53 @@ void dct36_3dnow(real *inbuf, real *o1,
"pfmul %%mm5,%%mm4\n\t"
"movq %%mm4,%%mm5\n\t"
"pfacc %%mm5,%%mm5\n\t"
"movd 132(%%edx),%%mm6\n\t"
"punpckldq 80(%%edx),%%mm6\n\t"
"movd 132(%%"REG_d"),%%mm6\n\t"
"punpckldq 80(%%"REG_d"),%%mm6\n\t"
"pfmul %%mm6,%%mm5\n\t"
"movd %%mm5,60(%%ecx)\n\t"
"movd %%mm5,60(%%"REG_c")\n\t"
"psrlq $32,%%mm5\n\t"
"movd %%mm5,8(%%ecx)\n\t"
"movd %%mm5,8(%%"REG_c")\n\t"
"movq %%mm4,%%mm6\n\t"
"punpckldq %%mm6,%%mm5\n\t"
"pfsub %%mm6,%%mm5\n\t"
"punpckhdq %%mm5,%%mm5\n\t"
"movd 8(%%edx),%%mm6\n\t"
"punpckldq 60(%%edx),%%mm6\n\t"
"movd 8(%%"REG_d"),%%mm6\n\t"
"punpckldq 60(%%"REG_d"),%%mm6\n\t"
"pfmul %%mm6,%%mm5\n\t"
"movd 8(%%esi),%%mm6\n\t"
"punpckldq 60(%%esi),%%mm6\n\t"
"movd 8(%%"REG_S"),%%mm6\n\t"
"punpckldq 60(%%"REG_S"),%%mm6\n\t"
"pfadd %%mm6,%%mm5\n\t"
"movd %%mm5,256(%%edi)\n\t"
"movd %%mm5,256(%%"REG_D")\n\t"
"psrlq $32,%%mm5\n\t"
"movd %%mm5,1920(%%edi)\n\t"
"movq 8(%%eax),%%mm2\n\t"
"movd %%mm5,1920(%%"REG_D")\n\t"
"movq 8(%%"REG_a"),%%mm2\n\t"
"movd "MANGLE(COS9)"+28,%%mm3\n\t"
"punpckldq %%mm3,%%mm3\n\t"
"pfmul %%mm3,%%mm2\n\t"
"pfsub %%mm0,%%mm2\n\t"
"movq 40(%%eax),%%mm3\n\t"
"movq 40(%%"REG_a"),%%mm3\n\t"
"movd "MANGLE(COS9)"+4,%%mm4\n\t"
"punpckldq %%mm4,%%mm4\n\t"
"pfmul %%mm4,%%mm3\n\t"
"pfadd %%mm3,%%mm2\n\t"
"movq 56(%%eax),%%mm3\n\t"
"movq 56(%%"REG_a"),%%mm3\n\t"
"movd "MANGLE(COS9)"+20,%%mm4\n\t"
"punpckldq %%mm4,%%mm4\n\t"
"pfmul %%mm4,%%mm3\n\t"
"pfsub %%mm3,%%mm2\n\t"
"movq (%%eax),%%mm3\n\t"
"movq 16(%%eax),%%mm4\n\t"
"movq (%%"REG_a"),%%mm3\n\t"
"movq 16(%%"REG_a"),%%mm4\n\t"
"movd "MANGLE(COS9)"+16,%%mm5\n\t"
"punpckldq %%mm5,%%mm5\n\t"
"pfmul %%mm5,%%mm4\n\t"
"pfsub %%mm4,%%mm3\n\t"
"movq 32(%%eax),%%mm4\n\t"
"movq 32(%%"REG_a"),%%mm4\n\t"
"movd "MANGLE(COS9)"+32,%%mm5\n\t"
"punpckldq %%mm5,%%mm5\n\t"
"pfmul %%mm5,%%mm4\n\t"
"pfadd %%mm4,%%mm3\n\t"
"pfadd %%mm1,%%mm3\n\t"
"movq 64(%%eax),%%mm4\n\t"
"movq 64(%%"REG_a"),%%mm4\n\t"
"movd "MANGLE(COS9)"+8,%%mm5\n\t"
"punpckldq %%mm5,%%mm5\n\t"
"pfmul %%mm5,%%mm4\n\t"
@ -414,25 +415,25 @@ void dct36_3dnow(real *inbuf, real *o1,
"pfmul %%mm5,%%mm4\n\t"
"movq %%mm4,%%mm5\n\t"
"pfacc %%mm5,%%mm5\n\t"
"movd 120(%%edx),%%mm6\n\t"
"punpckldq 92(%%edx),%%mm6\n\t"
"movd 120(%%"REG_d"),%%mm6\n\t"
"punpckldq 92(%%"REG_d"),%%mm6\n\t"
"pfmul %%mm6,%%mm5\n\t"
"movd %%mm5,48(%%ecx)\n\t"
"movd %%mm5,48(%%"REG_c")\n\t"
"psrlq $32,%%mm5\n\t"
"movd %%mm5,20(%%ecx)\n\t"
"movd %%mm5,20(%%"REG_c")\n\t"
"movq %%mm4,%%mm6\n\t"
"punpckldq %%mm6,%%mm5\n\t"
"pfsub %%mm6,%%mm5\n\t"
"punpckhdq %%mm5,%%mm5\n\t"
"movd 20(%%edx),%%mm6\n\t"
"punpckldq 48(%%edx),%%mm6\n\t"
"movd 20(%%"REG_d"),%%mm6\n\t"
"punpckldq 48(%%"REG_d"),%%mm6\n\t"
"pfmul %%mm6,%%mm5\n\t"
"movd 20(%%esi),%%mm6\n\t"
"punpckldq 48(%%esi),%%mm6\n\t"
"movd 20(%%"REG_S"),%%mm6\n\t"
"punpckldq 48(%%"REG_S"),%%mm6\n\t"
"pfadd %%mm6,%%mm5\n\t"
"movd %%mm5,640(%%edi)\n\t"
"movd %%mm5,640(%%"REG_D")\n\t"
"psrlq $32,%%mm5\n\t"
"movd %%mm5,1536(%%edi)\n\t"
"movd %%mm5,1536(%%"REG_D")\n\t"
"movq %%mm3,%%mm4\n\t"
"pfsub %%mm2,%%mm4\n\t"
"movq %%mm7,%%mm5\n\t"
@ -440,59 +441,59 @@ void dct36_3dnow(real *inbuf, real *o1,
"pfmul %%mm5,%%mm4\n\t"
"movq %%mm4,%%mm5\n\t"
"pfacc %%mm5,%%mm5\n\t"
"movd 128(%%edx),%%mm6\n\t"
"punpckldq 84(%%edx),%%mm6\n\t"
"movd 128(%%"REG_d"),%%mm6\n\t"
"punpckldq 84(%%"REG_d"),%%mm6\n\t"
"pfmul %%mm6,%%mm5\n\t"
"movd %%mm5,56(%%ecx)\n\t"
"movd %%mm5,56(%%"REG_c")\n\t"
"psrlq $32,%%mm5\n\t"
"movd %%mm5,12(%%ecx)\n\t"
"movd %%mm5,12(%%"REG_c")\n\t"
"movq %%mm4,%%mm6\n\t"
"punpckldq %%mm6,%%mm5\n\t"
"pfsub %%mm6,%%mm5\n\t"
"punpckhdq %%mm5,%%mm5\n\t"
"movd 12(%%edx),%%mm6\n\t"
"punpckldq 56(%%edx),%%mm6\n\t"
"movd 12(%%"REG_d"),%%mm6\n\t"
"punpckldq 56(%%"REG_d"),%%mm6\n\t"
"pfmul %%mm6,%%mm5\n\t"
"movd 12(%%esi),%%mm6\n\t"
"punpckldq 56(%%esi),%%mm6\n\t"
"movd 12(%%"REG_S"),%%mm6\n\t"
"punpckldq 56(%%"REG_S"),%%mm6\n\t"
"pfadd %%mm6,%%mm5\n\t"
"movd %%mm5,384(%%edi)\n\t"
"movd %%mm5,384(%%"REG_D")\n\t"
"psrlq $32,%%mm5\n\t"
"movd %%mm5,1792(%%edi)\n\t"
"movd %%mm5,1792(%%"REG_D")\n\t"
"movq (%%eax),%%mm4\n\t"
"movq 16(%%eax),%%mm3\n\t"
"movq (%%"REG_a"),%%mm4\n\t"
"movq 16(%%"REG_a"),%%mm3\n\t"
"pfsub %%mm3,%%mm4\n\t"
"movq 32(%%eax),%%mm3\n\t"
"movq 32(%%"REG_a"),%%mm3\n\t"
"pfadd %%mm3,%%mm4\n\t"
"movq 48(%%eax),%%mm3\n\t"
"movq 48(%%"REG_a"),%%mm3\n\t"
"pfsub %%mm3,%%mm4\n\t"
"movq 64(%%eax),%%mm3\n\t"
"movq 64(%%"REG_a"),%%mm3\n\t"
"pfadd %%mm3,%%mm4\n\t"
"movq %%mm7,%%mm5\n\t"
"punpckldq "MANGLE(tfcos36)"+16,%%mm5\n\t"
"pfmul %%mm5,%%mm4\n\t"
"movq %%mm4,%%mm5\n\t"
"pfacc %%mm5,%%mm5\n\t"
"movd 124(%%edx),%%mm6\n\t"
"punpckldq 88(%%edx),%%mm6\n\t"
"movd 124(%%"REG_d"),%%mm6\n\t"
"punpckldq 88(%%"REG_d"),%%mm6\n\t"
"pfmul %%mm6,%%mm5\n\t"
"movd %%mm5,52(%%ecx)\n\t"
"movd %%mm5,52(%%"REG_c")\n\t"
"psrlq $32,%%mm5\n\t"
"movd %%mm5,16(%%ecx)\n\t"
"movd %%mm5,16(%%"REG_c")\n\t"
"movq %%mm4,%%mm6\n\t"
"punpckldq %%mm6,%%mm5\n\t"
"pfsub %%mm6,%%mm5\n\t"
"punpckhdq %%mm5,%%mm5\n\t"
"movd 16(%%edx),%%mm6\n\t"
"punpckldq 52(%%edx),%%mm6\n\t"
"movd 16(%%"REG_d"),%%mm6\n\t"
"punpckldq 52(%%"REG_d"),%%mm6\n\t"
"pfmul %%mm6,%%mm5\n\t"
"movd 16(%%esi),%%mm6\n\t"
"punpckldq 52(%%esi),%%mm6\n\t"
"movd 16(%%"REG_S"),%%mm6\n\t"
"punpckldq 52(%%"REG_S"),%%mm6\n\t"
"pfadd %%mm6,%%mm5\n\t"
"movd %%mm5,512(%%edi)\n\t"
"movd %%mm5,512(%%"REG_D")\n\t"
"psrlq $32,%%mm5\n\t"
"movd %%mm5,1664(%%edi)\n\t"
"movd %%mm5,1664(%%"REG_D")\n\t"
"femms\n\t"
:

File diff suppressed because it is too large Load Diff

File diff suppressed because it is too large Load Diff

File diff suppressed because it is too large Load Diff