diff options
author | Rémi Denis-Courmont <remi@remlab.net> | 2023-07-15 23:30:59 +0300 |
---|---|---|
committer | Rémi Denis-Courmont <remi@remlab.net> | 2023-07-19 19:29:35 +0300 |
commit | 2eb55157aab49076eb581c99227ee81ef5d06b6e (patch) | |
tree | 4d2906929cf66fda8de7907b325af7084cabe78d /libavcodec | |
parent | be7ac511a6b4dd9883c0a6dd8323b04f651193f4 (diff) | |
download | ffmpeg-2eb55157aab49076eb581c99227ee81ef5d06b6e.tar.gz |
lavc/aacpsdsp: unroll RISC-V V add_squares
This slightly improves performance with the Device Under Test.
Diffstat (limited to 'libavcodec')
-rw-r--r-- | libavcodec/riscv/aacpsdsp_rvv.S | 4 |
1 files changed, 2 insertions, 2 deletions
diff --git a/libavcodec/riscv/aacpsdsp_rvv.S b/libavcodec/riscv/aacpsdsp_rvv.S index 80bd19f6ad..b581383f77 100644 --- a/libavcodec/riscv/aacpsdsp_rvv.S +++ b/libavcodec/riscv/aacpsdsp_rvv.S @@ -22,13 +22,13 @@ func ff_ps_add_squares_rvv, zve32f 1: - vsetvli t0, a2, e32, m1, ta, ma + vsetvli t0, a2, e32, m4, ta, ma vlseg2e32.v v24, (a1) sub a2, a2, t0 vle32.v v16, (a0) sh3add a1, t0, a1 vfmacc.vv v16, v24, v24 - vfmacc.vv v16, v25, v25 + vfmacc.vv v16, v28, v28 vse32.v v16, (a0) sh2add a0, t0, a0 bnez a2, 1b |