diff options
author | Martin Storsjö <martin@martin.st> | 2019-02-01 00:00:58 +0200 |
---|---|---|
committer | Martin Storsjö <martin@martin.st> | 2019-02-19 11:46:24 +0200 |
commit | 49f9c4272c4029b57ff300d908ba03c6332fc9c4 (patch) | |
tree | ab9517198a99dba3e430b786ac6db5fa8f05fc98 | |
parent | 37394ef01b040605f8e1c98e73aa12b1c0bcba07 (diff) | |
download | ffmpeg-49f9c4272c4029b57ff300d908ba03c6332fc9c4.tar.gz |
aarch64: vp8: Skip saturating in shrn in ff_vp8_idct_add_neon
The original arm version didn't do saturation here. This probably
doesn't make any difference for performance, but it reduces the
differences between the arm and aarch64 versions.
Signed-off-by: Martin Storsjö <martin@martin.st>
-rw-r--r-- | libavcodec/aarch64/vp8dsp_neon.S | 8 |
1 file changed, 4 insertions, 4 deletions
diff --git a/libavcodec/aarch64/vp8dsp_neon.S b/libavcodec/aarch64/vp8dsp_neon.S
index 139b380fa4..cac4558ab2 100644
--- a/libavcodec/aarch64/vp8dsp_neon.S
+++ b/libavcodec/aarch64/vp8dsp_neon.S
@@ -92,8 +92,8 @@ function ff_vp8_idct_add_neon, export=1
         smull           v27.4s,  v3.4h,  v4.h[0]
         sqdmulh         v20.4h,  v1.4h,  v4.h[1]
         sqdmulh         v23.4h,  v3.4h,  v4.h[1]
-        sqshrn          v21.4h,  v26.4s, #16
-        sqshrn          v22.4h,  v27.4s, #16
+        shrn            v21.4h,  v26.4s, #16
+        shrn            v22.4h,  v27.4s, #16
         add             v21.4h,  v21.4h, v1.4h
         add             v22.4h,  v22.4h, v3.4h
 
@@ -117,8 +117,8 @@ function ff_vp8_idct_add_neon, export=1
         st1             {v29.16b}, [x1]
         sqdmulh         v21.4h,  v1.4h,  v4.h[1]
         sqdmulh         v23.4h,  v3.4h,  v4.h[1]
-        sqshrn          v20.4h,  v26.4s, #16
-        sqshrn          v22.4h,  v27.4s, #16
+        shrn            v20.4h,  v26.4s, #16
+        shrn            v22.4h,  v27.4s, #16
         add             v20.4h,  v20.4h, v1.4h
         add             v22.4h,  v22.4h, v3.4h
         add             v16.4h,  v0.4h,  v2.4h