[FFmpeg-cvslog] x86/tx_float: fix stray change in 15xM FFT and replace imul->lea
Lynne
git at videolan.org
Mon Nov 28 18:03:31 EET 2022
ffmpeg | branch: master | Lynne <dev at lynne.ee> | Mon Nov 28 04:15:36 2022 +0100| [90c17a05aab798199f3cdafb7cab61f666f132be] | committer: Hendrik Leppkes
x86/tx_float: fix stray change in 15xM FFT and replace imul->lea
Thanks to rorgoroth for bisecting and kurosu for the lea suggestion.
> http://git.videolan.org/gitweb.cgi/ffmpeg.git/?a=commit;h=90c17a05aab798199f3cdafb7cab61f666f132be
---
libavutil/x86/tx_float.asm | 4 ++--
1 file changed, 2 insertions(+), 2 deletions(-)
diff --git a/libavutil/x86/tx_float.asm b/libavutil/x86/tx_float.asm
index 2ad84c2885..e1533a8595 100644
--- a/libavutil/x86/tx_float.asm
+++ b/libavutil/x86/tx_float.asm
@@ -1772,7 +1772,7 @@ IMDCT_FN avx2
%macro PFA_15_FN 2
INIT_YMM %1
%if %2
-cglobal fft_pfa_15xM_asm_float, 0, 8, 0, ctx, out, in, stride, len, lut, buf, map, tgt, tmp, \
+cglobal fft_pfa_15xM_asm_float, 0, 0, 0, ctx, out, in, stride, len, lut, buf, map, tgt, tmp, \
tgt5, stride3, stride5, btmp
%else
cglobal fft_pfa_15xM_float, 4, 14, 16, 320, ctx, out, in, stride, len, lut, buf, map, tgt, tmp, \
@@ -1892,7 +1892,7 @@ cglobal fft_pfa_15xM_float, 4, 14, 16, 320, ctx, out, in, stride, len, lut, buf,
mov stride5q, lenq
mov tgt5q, btmpq
POP strideq
- imul tmpq, strideq, 3
+ lea tmpq, [strideq + 2*strideq]
.post:
LOAD64_LUT m0, inq, stride3q, 0, tmpq, m8, m9
More information about the ffmpeg-cvslog mailing list