[FFmpeg-devel] [PATCH] lavc/audiodsp: unroll RISC-V clip functions
Rémi Denis-Courmont
remi at remlab.net
Thu Sep 28 18:07:22 EEST 2023
audiodsp.vector_clip_int32_c: 17500.7
audiodsp.vector_clip_int32_rvv_i32: 8404.7 (m1)
audiodsp.vector_clip_int32_rvv_i32: 2689.9 (m8)
audiodsp.vector_clipf_c: 33679.7
audiodsp.vector_clipf_rvf: 7019.7
audiodsp.vector_clipf_rvv_f32: 8328.0 (m1)
audiodsp.vector_clipf_rvv_f32: 2209.4 (m8)
---
libavcodec/riscv/audiodsp_rvv.S | 4 ++--
1 file changed, 2 insertions(+), 2 deletions(-)
diff --git a/libavcodec/riscv/audiodsp_rvv.S b/libavcodec/riscv/audiodsp_rvv.S
index f7eba2114f..f0b23bab5e 100644
--- a/libavcodec/riscv/audiodsp_rvv.S
+++ b/libavcodec/riscv/audiodsp_rvv.S
@@ -42,7 +42,7 @@ endfunc
func ff_vector_clip_int32_rvv, zve32x
1:
- vsetvli t0, a4, e32, m1, ta, ma
+ vsetvli t0, a4, e32, m8, ta, ma
vle32.v v8, (a1)
sub a4, a4, t0
vmax.vx v8, v8, a2
@@ -59,7 +59,7 @@ func ff_vector_clipf_rvv, zve32f
NOHWF fmv.w.x fa0, a3
NOHWF fmv.w.x fa1, a4
1:
- vsetvli t0, a2, e32, m1, ta, ma
+ vsetvli t0, a2, e32, m8, ta, ma
vle32.v v8, (a1)
sub a2, a2, t0
vfmax.vf v8, v8, fa0
--
2.40.1
More information about the ffmpeg-devel
mailing list