[FFmpeg-devel] [PATCH] Fix the tail handling in R-V V sad

uk7b at foxmail.com uk7b at foxmail.com
Mon Dec 23 17:01:32 EET 2024


From: sunyuechi <sunyuechi at iscas.ac.cn>

---
 libavcodec/riscv/h26x/asm.S    | 36 +++++++++++++++++-----------------
 libavcodec/riscv/vvc/sad_rvv.S |  2 +-
 2 files changed, 19 insertions(+), 19 deletions(-)

diff --git a/libavcodec/riscv/h26x/asm.S b/libavcodec/riscv/h26x/asm.S
index d99690d9a0..0c9ebbdaad 100644
--- a/libavcodec/riscv/h26x/asm.S
+++ b/libavcodec/riscv/h26x/asm.S
@@ -20,46 +20,46 @@
 
 #include "libavutil/riscv/asm.S"
 
-.macro vsetvlstatic w, vlen, en, mn1, mn2, mn3, mn4, mn5, mn6
+.macro vsetvlstatic w, vlen, en, mn1, mn2, mn3, mn4, mn5, mn6, vta=ta
         .if \w == 2 && \vlen == 128
-                vsetivli        zero, \w, \en, \mn1, ta, ma
+                vsetivli        zero, \w, \en, \mn1, \vta, ma
         .elseif \w <= 4 && \vlen == 128
-                vsetivli        zero, \w, \en, \mn2, ta, ma
+                vsetivli        zero, \w, \en, \mn2, \vta, ma
         .elseif \w <= 8 && \vlen == 128
-                vsetivli        zero, \w, \en, \mn3, ta, ma
+                vsetivli        zero, \w, \en, \mn3, \vta, ma
         .elseif \w <= 16 && \vlen == 128
-                vsetivli        zero, \w, \en, \mn4, ta, ma
+                vsetivli        zero, \w, \en, \mn4, \vta, ma
         .elseif \w <= 32 && \vlen == 128
                 li              t0, \w
-                vsetvli         zero, t0, \en, \mn5, ta, ma
+                vsetvli         zero, t0, \en, \mn5, \vta, ma
         .elseif \w <= 4 && \vlen == 256
-                vsetivli        zero, \w, \en, \mn1, ta, ma
+                vsetivli        zero, \w, \en, \mn1, \vta, ma
         .elseif \w <= 8 && \vlen == 256
-                vsetivli        zero, \w, \en, \mn2, ta, ma
+                vsetivli        zero, \w, \en, \mn2, \vta, ma
         .elseif \w <= 16 && \vlen == 256
-                vsetivli        zero, \w, \en, \mn3, ta, ma
+                vsetivli        zero, \w, \en, \mn3, \vta, ma
         .elseif \w <= 32 && \vlen == 256
                 li              t0, \w
-                vsetvli         zero, t0, \en, \mn4, ta, ma
+                vsetvli         zero, t0, \en, \mn4, \vta, ma
         .elseif \w <= 64 && \vlen == 256
                 li              t0, \w
-                vsetvli         zero, t0, \en, \mn5, ta, ma
+                vsetvli         zero, t0, \en, \mn5, \vta, ma
         .else
                 li              t0, \w
-                vsetvli         zero, t0, \en, \mn6, ta, ma
+                vsetvli         zero, t0, \en, \mn6, \vta, ma
         .endif
 .endm
 
-.macro vsetvlstatic8 w, vlen
-        vsetvlstatic \w, \vlen, e8, mf8, mf4, mf2, m1, m2, m4
+.macro vsetvlstatic8 w, vlen, vta
+        vsetvlstatic \w, \vlen, e8, mf8, mf4, mf2, m1, m2, m4, \vta
 .endm
 
-.macro vsetvlstatic16 w, vlen
-        vsetvlstatic \w, \vlen, e16, mf4, mf2, m1, m2, m4, m8
+.macro vsetvlstatic16 w, vlen, vta
+        vsetvlstatic \w, \vlen, e16, mf4, mf2, m1, m2, m4, m8, \vta
 .endm
 
-.macro vsetvlstatic32 w, vlen
-        vsetvlstatic \w, \vlen, e32, mf2, m1, m2, m4, m8, m8
+.macro vsetvlstatic32 w, vlen, vta
+        vsetvlstatic \w, \vlen, e32, mf2, m1, m2, m4, m8, m8, \vta
 .endm
 
 .macro POW2_JMP_TABLE id, vlen
diff --git a/libavcodec/riscv/vvc/sad_rvv.S b/libavcodec/riscv/vvc/sad_rvv.S
index 341167be1f..bb613cc340 100644
--- a/libavcodec/riscv/vvc/sad_rvv.S
+++ b/libavcodec/riscv/vvc/sad_rvv.S
@@ -37,7 +37,7 @@ SADVSET\vlen\w:
         vsetvlstatic32    \w, \vlen
         vmv.v.i           v0, 0
         vmv.s.x           v24, zero
-        vsetvlstatic16    \w, \vlen
+        vsetvlstatic16    \w, \vlen, tu
 SAD\vlen\w:
         addi              a5, a5, -2
         vle16.v           v8, (a0)
-- 
2.47.1



More information about the ffmpeg-devel mailing list