[Mplayer-cvslog] CVS: main/mp3lib dct64_k7.c,1.4,1.5

Atmosfear atmos4 at mplayerhq.hu
Sat Sep 7 15:57:59 CEST 2002


Update of /cvsroot/mplayer/main/mp3lib
In directory mail:/var/tmp.root/cvs-serv2278

Modified Files:
	dct64_k7.c 
Log Message:
Minor speedup by nick kurshev.


Index: dct64_k7.c
===================================================================
RCS file: /cvsroot/mplayer/main/mp3lib/dct64_k7.c,v
retrieving revision 1.4
retrieving revision 1.5
diff -u -r1.4 -r1.5
--- dct64_k7.c	24 May 2002 01:56:01 -0000	1.4
+++ dct64_k7.c	7 Sep 2002 13:57:41 -0000	1.5
@@ -31,10 +31,8 @@
 "	movq	8(%%eax), %%mm4\n\t"
 "	movq	%%mm0, %%mm3\n\t"
 "	movq	%%mm4, %%mm7\n\t"
-"	movq	120(%%eax), %%mm1\n\t"
-"	movq	112(%%eax), %%mm5\n\t"
-"	pswapd	%%mm1, %%mm1\n\t"
-"	pswapd	%%mm5, %%mm5\n\t"
+"	pshufw	$78, 120(%%eax), %%mm1\n\t"
+"	pshufw	$78, 112(%%eax), %%mm5\n\t"
 "	pfadd	%%mm1, %%mm0\n\t"
 "	pfadd	%%mm5, %%mm4\n\t"
 "	movq	%%mm0, (%%edx)\n\t"
@@ -52,10 +50,8 @@
 "	movq	24(%%eax), %%mm4\n\t"
 "	movq	%%mm0, %%mm3\n\t"
 "	movq	%%mm4, %%mm7\n\t"
-"	movq	104(%%eax), %%mm1\n\t"
-"	movq	96(%%eax), %%mm5\n\t"
-"	pswapd	%%mm1, %%mm1\n\t"
-"	pswapd	%%mm5, %%mm5\n\t"
+"	pshufw	$78, 104(%%eax), %%mm1\n\t"
+"	pshufw	$78, 96(%%eax), %%mm5\n\t"
 "	pfadd	%%mm1, %%mm0\n\t"
 "	pfadd	%%mm5, %%mm4\n\t"
 "	movq	%%mm0, 16(%%edx)\n\t"
@@ -73,10 +69,8 @@
 "	movq	40(%%eax), %%mm4\n\t"
 "	movq	%%mm0, %%mm3\n\t"
 "	movq	%%mm4, %%mm7\n\t"
-"	movq	88(%%eax), %%mm1\n\t"
-"	movq	80(%%eax), %%mm5\n\t"
-"	pswapd	%%mm1, %%mm1\n\t"
-"	pswapd	%%mm5, %%mm5\n\t"
+"	pshufw	$78, 88(%%eax), %%mm1\n\t"
+"	pshufw	$78, 80(%%eax), %%mm5\n\t"
 "	pfadd	%%mm1, %%mm0\n\t"
 "	pfadd	%%mm5, %%mm4\n\t"
 "	movq	%%mm0, 32(%%edx)\n\t"
@@ -94,10 +88,8 @@
 "	movq	56(%%eax), %%mm4\n\t"
 "	movq	%%mm0, %%mm3\n\t"
 "	movq	%%mm4, %%mm7\n\t"
-"	movq	72(%%eax), %%mm1\n\t"
-"	movq	64(%%eax), %%mm5\n\t"
-"	pswapd	%%mm1, %%mm1\n\t"
-"	pswapd	%%mm5, %%mm5\n\t"
+"	pshufw	$78, 72(%%eax), %%mm1\n\t"
+"	pshufw	$78, 64(%%eax), %%mm5\n\t"
 "	pfadd	%%mm1, %%mm0\n\t"
 "	pfadd	%%mm5, %%mm4\n\t"
 "	movq	%%mm0, 48(%%edx)\n\t"
@@ -117,10 +109,8 @@
 "	movq	8(%%edx), %%mm4\n\t"
 "	movq	%%mm0, %%mm3\n\t"
 "	movq	%%mm4, %%mm7\n\t"
-"	movq	56(%%edx), %%mm1\n\t"
-"	movq	48(%%edx), %%mm5\n\t"
-"	pswapd	%%mm1, %%mm1\n\t"
-"	pswapd	%%mm5, %%mm5\n\t"
+"	pshufw	$78, 56(%%edx), %%mm1\n\t"
+"	pshufw	$78, 48(%%edx), %%mm5\n\t"
 "	pfadd	%%mm1, %%mm0\n\t"
 "	pfadd	%%mm5, %%mm4\n\t"
 "	movq	%%mm0, (%%ecx)\n\t"
@@ -138,10 +128,8 @@
 "	movq	24(%%edx), %%mm4\n\t"
 "	movq	%%mm0, %%mm3\n\t"
 "	movq	%%mm4, %%mm7\n\t"
-"	movq	40(%%edx), %%mm1\n\t"
-"	movq	32(%%edx), %%mm5\n\t"
-"	pswapd	%%mm1, %%mm1\n\t"
-"	pswapd	%%mm5, %%mm5\n\t"
+"	pshufw	$78, 40(%%edx), %%mm1\n\t"
+"	pshufw	$78, 32(%%edx), %%mm5\n\t"
 "	pfadd	%%mm1, %%mm0\n\t"
 "	pfadd	%%mm5, %%mm4\n\t"
 "	movq	%%mm0, 16(%%ecx)\n\t"
@@ -161,10 +149,8 @@
 "	movq	72(%%edx), %%mm4\n\t"
 "	movq	%%mm0, %%mm3\n\t"
 "	movq	%%mm4, %%mm7\n\t"
-"	movq	120(%%edx), %%mm1\n\t"
-"	movq	112(%%edx), %%mm5\n\t"
-"	pswapd	%%mm1, %%mm1\n\t"
-"	pswapd	%%mm5, %%mm5\n\t"
+"	pshufw	$78, 120(%%edx), %%mm1\n\t"
+"	pshufw	$78, 112(%%edx), %%mm5\n\t"
 "	pfadd	%%mm1, %%mm0\n\t"
 "	pfadd	%%mm5, %%mm4\n\t"
 "	movq	%%mm0, 64(%%ecx)\n\t"
@@ -182,10 +168,8 @@
 "	movq	88(%%edx), %%mm4\n\t"
 "	movq	%%mm0, %%mm3\n\t"
 "	movq	%%mm4, %%mm7\n\t"
-"	movq	104(%%edx), %%mm1\n\t"
-"	movq	96(%%edx), %%mm5\n\t"
-"	pswapd	%%mm1, %%mm1\n\t"
-"	pswapd	%%mm5, %%mm5\n\t"
+"	pshufw	$78, 104(%%edx), %%mm1\n\t"
+"	pshufw	$78, 96(%%edx), %%mm5\n\t"
 "	pfadd	%%mm1, %%mm0\n\t"
 "	pfadd	%%mm5, %%mm4\n\t"
 "	movq	%%mm0, 80(%%ecx)\n\t"
@@ -208,10 +192,8 @@
 "	movq	8(%%ecx), %%mm4\n\t"
 "	movq	%%mm0, %%mm3\n\t"
 "	movq	%%mm4, %%mm7\n\t"
-"	movq	24(%%ecx), %%mm1\n\t"
-"	movq	16(%%ecx), %%mm5\n\t"
-"	pswapd	%%mm1, %%mm1\n\t"
-"	pswapd	%%mm5, %%mm5\n\t"
+"	pshufw	$78, 24(%%ecx), %%mm1\n\t"
+"	pshufw	$78, 16(%%ecx), %%mm5\n\t"
 "	pfadd	%%mm1, %%mm0\n\t"
 "	pfadd	%%mm5, %%mm4\n\t"
 "	movq	%%mm0, (%%edx)\n\t"
@@ -229,10 +211,8 @@
 "	movq	40(%%ecx), %%mm4\n\t"
 "	movq	%%mm0, %%mm3\n\t"
 "	movq	%%mm4, %%mm7\n\t"
-"	movq	56(%%ecx), %%mm1\n\t"
-"	movq	48(%%ecx), %%mm5\n\t"
-"	pswapd	%%mm1, %%mm1\n\t"
-"	pswapd	%%mm5, %%mm5\n\t"
+"	pshufw	$78, 56(%%ecx), %%mm1\n\t"
+"	pshufw	$78, 48(%%ecx), %%mm5\n\t"
 "	pfadd	%%mm1, %%mm0\n\t"
 "	pfadd	%%mm5, %%mm4\n\t"
 "	movq	%%mm0, 32(%%edx)\n\t"
@@ -250,10 +230,8 @@
 "	movq	72(%%ecx), %%mm4\n\t"
 "	movq	%%mm0, %%mm3\n\t"
 "	movq	%%mm4, %%mm7\n\t"
-"	movq	88(%%ecx), %%mm1\n\t"
-"	movq	80(%%ecx), %%mm5\n\t"
-"	pswapd	%%mm1, %%mm1\n\t"
-"	pswapd	%%mm5, %%mm5\n\t"
+"	pshufw	$78, 88(%%ecx), %%mm1\n\t"
+"	pshufw	$78, 80(%%ecx), %%mm5\n\t"
 "	pfadd	%%mm1, %%mm0\n\t"
 "	pfadd	%%mm5, %%mm4\n\t"
 "	movq	%%mm0, 64(%%edx)\n\t"
@@ -271,10 +249,8 @@
 "	movq	104(%%ecx), %%mm4\n\t"
 "	movq	%%mm0, %%mm3\n\t"
 "	movq	%%mm4, %%mm7\n\t"
-"	movq	120(%%ecx), %%mm1\n\t"
-"	movq	112(%%ecx), %%mm5\n\t"
-"	pswapd	%%mm1, %%mm1\n\t"
-"	pswapd	%%mm5, %%mm5\n\t"
+"	pshufw	$78, 120(%%ecx), %%mm1\n\t"
+"	pshufw	$78, 112(%%ecx), %%mm5\n\t"
 "	pfadd	%%mm1, %%mm0\n\t"
 "	pfadd	%%mm5, %%mm4\n\t"
 "	movq	%%mm0, 96(%%edx)\n\t"
@@ -296,10 +272,8 @@
 "	movq	16(%%edx), %%mm4\n\t"
 "	movq	%%mm0, %%mm3\n\t"
 "	movq	%%mm4, %%mm7\n\t"
-"	movq	8(%%edx), %%mm1\n\t"
-"	movq	24(%%edx), %%mm5\n\t"
-"	pswapd	%%mm1, %%mm1\n\t"
-"	pswapd	%%mm5, %%mm5\n\t"
+"	pshufw	$78, 8(%%edx), %%mm1\n\t"
+"	pshufw	$78, 24(%%edx), %%mm5\n\t"
 "	pfadd	%%mm1, %%mm0\n\t"
 "	pfadd	%%mm5, %%mm4\n\t"
 "	movq	%%mm0, (%%ecx)\n\t"
@@ -317,10 +291,8 @@
 "	movq	48(%%edx), %%mm4\n\t"
 "	movq	%%mm0, %%mm3\n\t"
 "	movq	%%mm4, %%mm7\n\t"
-"	movq	40(%%edx), %%mm1\n\t"
-"	movq	56(%%edx), %%mm5\n\t"
-"	pswapd	%%mm1, %%mm1\n\t"
-"	pswapd	%%mm5, %%mm5\n\t"
+"	pshufw	$78, 40(%%edx), %%mm1\n\t"
+"	pshufw	$78, 56(%%edx), %%mm5\n\t"
 "	pfadd	%%mm1, %%mm0\n\t"
 "	pfadd	%%mm5, %%mm4\n\t"
 "	movq	%%mm0, 32(%%ecx)\n\t"
@@ -338,10 +310,8 @@
 "	movq	80(%%edx), %%mm4\n\t"
 "	movq	%%mm0, %%mm3\n\t"
 "	movq	%%mm4, %%mm7\n\t"
-"	movq	72(%%edx), %%mm1\n\t"
-"	movq	88(%%edx), %%mm5\n\t"
-"	pswapd	%%mm1, %%mm1\n\t"
-"	pswapd	%%mm5, %%mm5\n\t"
+"	pshufw	$78, 72(%%edx), %%mm1\n\t"
+"	pshufw	$78, 88(%%edx), %%mm5\n\t"
 "	pfadd	%%mm1, %%mm0\n\t"
 "	pfadd	%%mm5, %%mm4\n\t"
 "	movq	%%mm0, 64(%%ecx)\n\t"
@@ -359,10 +329,8 @@
 "	movq	112(%%edx), %%mm4\n\t"
 "	movq	%%mm0, %%mm3\n\t"
 "	movq	%%mm4, %%mm7\n\t"
-"	movq	104(%%edx), %%mm1\n\t"
-"	movq	120(%%edx), %%mm5\n\t"
-"	pswapd	%%mm1, %%mm1\n\t"
-"	pswapd	%%mm5, %%mm5\n\t"
+"	pshufw	$78, 104(%%edx), %%mm1\n\t"
+"	pshufw	$78, 120(%%edx), %%mm5\n\t"
 "	pfadd	%%mm1, %%mm0\n\t"
 "	pfadd	%%mm5, %%mm4\n\t"
 "	movq	%%mm0, 96(%%ecx)\n\t"




More information about the MPlayer-cvslog mailing list