[FFmpeg-devel] [PATCH] x86/sbrdsp: remove an unnecessary mova in sbr_autocorrelate
James Almer
jamrial at gmail.com
Tue Aug 4 00:26:15 CEST 2015
Signed-off-by: James Almer <jamrial at gmail.com>
---
libavcodec/x86/sbrdsp.asm | 34 +++++++++++++++++-----------------
1 file changed, 17 insertions(+), 17 deletions(-)
diff --git a/libavcodec/x86/sbrdsp.asm b/libavcodec/x86/sbrdsp.asm
index 083461a..a96451f 100644
--- a/libavcodec/x86/sbrdsp.asm
+++ b/libavcodec/x86/sbrdsp.asm
@@ -515,42 +515,42 @@ align 16
jl .loop
movlhps m1, m1
- mulps m4, m1, m2
+ mulps m2, m1
mulps m1, m1
- addps m4, m6 ; real_sum1 + x[38][0] * x[39][0], x[38][1] * x[39][1]; imag_sum1 + x[38][0] * x[39][1], x[38][1] * x[39][0];
+ addps m2, m6 ; real_sum1 + x[38][0] * x[39][0], x[38][1] * x[39][1]; imag_sum1 + x[38][0] * x[39][1], x[38][1] * x[39][0];
addps m1, m7 ; real_sum0 + x[38][0] * x[38][0], x[38][1] * x[38][1];
addps m6, [rsp ] ; real_sum1 + x[ 0][0] * x[ 1][0], x[ 0][1] * x[ 1][1]; imag_sum1 + x[ 0][0] * x[ 1][1], x[ 0][1] * x[ 1][0];
addps m7, [rsp+16] ; real_sum0 + x[ 0][0] * x[ 0][0], x[ 0][1] * x[ 0][1];
- xorps m4, [ps_mask3]
+ xorps m2, [ps_mask3]
xorps m5, [ps_mask3]
xorps m6, [ps_mask3]
%if cpuflag(sse3)
- movshdup m2, m1
- haddps m4, m5
+ movshdup m0, m1
+ haddps m2, m5
haddps m7, m6
- addss m1, m2
+ addss m1, m0
%else
- movaps m3, m4
- movaps m2, m5
- movaps m0, m6
+ movaps m3, m2
+ movaps m0, m5
+ movaps m4, m6
shufps m3, m3, q0301
- shufps m2, m2, q0301
shufps m0, m0, q0301
- addps m4, m3
- addps m5, m2
- addps m6, m0
+ shufps m4, m4, q0301
+ addps m2, m3
+ addps m5, m0
+ addps m6, m4
- movss m2, m7
+ movss m0, m7
movss m3, m1
shufps m7, m7, q0001
shufps m1, m1, q0001
- addss m7, m2
+ addss m7, m0
addss m1, m3
- shufps m4, m5, q2020
+ shufps m2, m5, q2020
shufps m7, m6, q2020
%endif
- movaps [phiq ], m4
+ movaps [phiq ], m2
movhps [phiq+0x18], m7
movss [phiq+0x28], m7
movss [phiq+0x10], m1
--
2.5.0
More information about the ffmpeg-devel mailing list