summary | refs | log | tree | commit | diff | stats
path: root/libavcodec/aarch64
diff options
context:
space:
mode:
author: Martin Storsjö <martin@martin.st> 2019-02-01 00:00:58 +0200
committer: Martin Storsjö <martin@martin.st> 2019-02-19 11:46:24 +0200
commit: 49f9c4272c4029b57ff300d908ba03c6332fc9c4 (patch)
tree: ab9517198a99dba3e430b786ac6db5fa8f05fc98 /libavcodec/aarch64
parent: 37394ef01b040605f8e1c98e73aa12b1c0bcba07 (diff)
downloadffmpeg-streaming-49f9c4272c4029b57ff300d908ba03c6332fc9c4.zip
ffmpeg-streaming-49f9c4272c4029b57ff300d908ba03c6332fc9c4.tar.gz
aarch64: vp8: Skip saturating in shrn in ff_vp8_idct_add_neon
The original arm version didn't do saturation here.

This probably doesn't make any difference for performance, but reduces the differences.

Signed-off-by: Martin Storsjö <martin@martin.st>
Diffstat (limited to 'libavcodec/aarch64')
-rw-r--r-- libavcodec/aarch64/vp8dsp_neon.S | 8
1 file changed, 4 insertions, 4 deletions
diff --git a/libavcodec/aarch64/vp8dsp_neon.S b/libavcodec/aarch64/vp8dsp_neon.S
index 139b380..cac4558 100644
--- a/libavcodec/aarch64/vp8dsp_neon.S
+++ b/libavcodec/aarch64/vp8dsp_neon.S
@@ -92,8 +92,8 @@ function ff_vp8_idct_add_neon, export=1
smull v27.4s, v3.4h, v4.h[0]
sqdmulh v20.4h, v1.4h, v4.h[1]
sqdmulh v23.4h, v3.4h, v4.h[1]
- sqshrn v21.4h, v26.4s, #16
- sqshrn v22.4h, v27.4s, #16
+ shrn v21.4h, v26.4s, #16
+ shrn v22.4h, v27.4s, #16
add v21.4h, v21.4h, v1.4h
add v22.4h, v22.4h, v3.4h
@@ -117,8 +117,8 @@ function ff_vp8_idct_add_neon, export=1
st1 {v29.16b}, [x1]
sqdmulh v21.4h, v1.4h, v4.h[1]
sqdmulh v23.4h, v3.4h, v4.h[1]
- sqshrn v20.4h, v26.4s, #16
- sqshrn v22.4h, v27.4s, #16
+ shrn v20.4h, v26.4s, #16
+ shrn v22.4h, v27.4s, #16
add v20.4h, v20.4h, v1.4h
add v22.4h, v22.4h, v3.4h
add v16.4h, v0.4h, v2.4h
OpenPOWER on IntegriCloud