[FFmpeg-cvslog] x86/tx_float: fix stray change in 15xM FFT and replace imul->lea

Lynne git at videolan.org
Mon Nov 28 18:03:31 EET 2022


ffmpeg | branch: master | Lynne <dev at lynne.ee> | Mon Nov 28 04:15:36 2022 +0100| [90c17a05aab798199f3cdafb7cab61f666f132be] | committer: Hendrik Leppkes

x86/tx_float: fix stray change in 15xM FFT and replace imul->lea

Thanks to rorgoroth for bisecting and kurosu for the lea suggestion.

> http://git.videolan.org/gitweb.cgi/ffmpeg.git/?a=commit;h=90c17a05aab798199f3cdafb7cab61f666f132be
---

 libavutil/x86/tx_float.asm | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/libavutil/x86/tx_float.asm b/libavutil/x86/tx_float.asm
index 2ad84c2885..e1533a8595 100644
--- a/libavutil/x86/tx_float.asm
+++ b/libavutil/x86/tx_float.asm
@@ -1772,7 +1772,7 @@ IMDCT_FN avx2
 %macro PFA_15_FN 2
 INIT_YMM %1
 %if %2
-cglobal fft_pfa_15xM_asm_float, 0, 8, 0, ctx, out, in, stride, len, lut, buf, map, tgt, tmp, \
+cglobal fft_pfa_15xM_asm_float, 0, 0, 0, ctx, out, in, stride, len, lut, buf, map, tgt, tmp, \
                                          tgt5, stride3, stride5, btmp
 %else
 cglobal fft_pfa_15xM_float, 4, 14, 16, 320, ctx, out, in, stride, len, lut, buf, map, tgt, tmp, \
@@ -1892,7 +1892,7 @@ cglobal fft_pfa_15xM_float, 4, 14, 16, 320, ctx, out, in, stride, len, lut, buf,
     mov stride5q, lenq
     mov tgt5q, btmpq
     POP strideq
-    imul tmpq, strideq, 3
+    lea tmpq, [strideq + 2*strideq]
 
 .post:
     LOAD64_LUT m0, inq, stride3q, 0, tmpq, m8, m9



More information about the ffmpeg-cvslog mailing list