about | summary | refs | log | tree | commit | diff | stats
path: root/libavcodec
diff options
context:
space:
mode:
author: Rémi Denis-Courmont <remi@remlab.net> 2023-07-15 23:30:59 +0300
committer: Rémi Denis-Courmont <remi@remlab.net> 2023-07-19 19:29:35 +0300
commit: 2eb55157aab49076eb581c99227ee81ef5d06b6e (patch)
tree: 4d2906929cf66fda8de7907b325af7084cabe78d /libavcodec
parent: be7ac511a6b4dd9883c0a6dd8323b04f651193f4 (diff)
download: ffmpeg-2eb55157aab49076eb581c99227ee81ef5d06b6e.tar.gz
lavc/aacpsdsp: unroll RISC-V V add_squares
This slightly improves performance with the Device Under Test.
Diffstat (limited to 'libavcodec')
-rw-r--r-- libavcodec/riscv/aacpsdsp_rvv.S | 4
1 file changed, 2 insertions, 2 deletions
diff --git a/libavcodec/riscv/aacpsdsp_rvv.S b/libavcodec/riscv/aacpsdsp_rvv.S
index 80bd19f6ad..b581383f77 100644
--- a/libavcodec/riscv/aacpsdsp_rvv.S
+++ b/libavcodec/riscv/aacpsdsp_rvv.S
@@ -22,13 +22,13 @@
func ff_ps_add_squares_rvv, zve32f
1:
- vsetvli t0, a2, e32, m1, ta, ma
+ vsetvli t0, a2, e32, m4, ta, ma
vlseg2e32.v v24, (a1)
sub a2, a2, t0
vle32.v v16, (a0)
sh3add a1, t0, a1
vfmacc.vv v16, v24, v24
- vfmacc.vv v16, v25, v25
+ vfmacc.vv v16, v28, v28
vse32.v v16, (a0)
sh2add a0, t0, a0
bnez a2, 1b