summary | refs | log | tree | commit | diff | stats
path: root/libavcodec
diff options
context:
space:
mode:
author: Alexandra Hájková <alexandra.khirnova@gmail.com> 2017-05-04 10:49:16 +0200
committer: Martin Storsjö <martin@martin.st> 2017-05-04 14:08:27 +0200
commit: 118dd4a321a2d67f67c21b076abd0b4d939ab642 (patch)
tree: 793360c630ef465fc228d572f9dbd1ea09fa540b /libavcodec
parent: 504403ab28688588fb85817ad58964482f67f29f (diff)
download: ffmpeg-streaming-118dd4a321a2d67f67c21b076abd0b4d939ab642.zip
ffmpeg-streaming-118dd4a321a2d67f67c21b076abd0b4d939ab642.tar.gz
hevc: 16x16 NEON idct: Use the right element size for loads/stores
This doesn't change the actual behaviour of the code but improves readability.

Signed-off-by: Martin Storsjö <martin@martin.st>
Diffstat (limited to 'libavcodec')
-rw-r--r-- libavcodec/arm/hevc_idct.S | 16
1 file changed, 8 insertions, 8 deletions
diff --git a/libavcodec/arm/hevc_idct.S b/libavcodec/arm/hevc_idct.S
index fac5758..eeb81e3 100644
--- a/libavcodec/arm/hevc_idct.S
+++ b/libavcodec/arm/hevc_idct.S
@@ -536,10 +536,10 @@ endfunc
butterfly q10, q14, q2, q5
butterfly q11, q15, q3, q4
add r4, sp, #512
- vst1.s16 {q0-q1}, [r4, :128]!
- vst1.s16 {q2-q3}, [r4, :128]!
- vst1.s16 {q4-q5}, [r4, :128]!
- vst1.s16 {q6-q7}, [r4, :128]
+ vst1.s32 {q0-q1}, [r4, :128]!
+ vst1.s32 {q2-q3}, [r4, :128]!
+ vst1.s32 {q4-q5}, [r4, :128]!
+ vst1.s32 {q6-q7}, [r4, :128]
.endm
.macro load16 in0, in1, in2, in3, in4, in5, in6, in7
@@ -631,8 +631,8 @@ function func_tr_16x4_\name
add_member d7, d1[3], d1[2], d1[1], d1[0], d0[3], d0[2], d0[1], d0[0], +, -, +, -, +, -, +, -
add r4, sp, #512
- vld1.s16 {q0-q1}, [r4, :128]!
- vld1.s16 {q2-q3}, [r4, :128]!
+ vld1.s32 {q0-q1}, [r4, :128]!
+ vld1.s32 {q2-q3}, [r4, :128]!
butterfly16 q0, q5, q1, q6, q2, q7, q3, q8
scale d26, d27, d28, d29, d30, d31, d16, d17, q4, q0, q5, q1, q6, q2, q7, q3, \shift
@@ -645,8 +645,8 @@ function func_tr_16x4_\name
store16 d26, d27, d28, d29, d30, d31, d16, d17
add r4, sp, #576
- vld1.s16 {q0-q1}, [r4, :128]!
- vld1.s16 {q2-q3}, [r4, :128]
+ vld1.s32 {q0-q1}, [r4, :128]!
+ vld1.s32 {q2-q3}, [r4, :128]
butterfly16 q0, q9, q1, q10, q2, q11, q3, q12
scale d26, d27, d28, d29, d30, d31, d8, d9, q4, q0, q9, q1, q10, q2, q11, q3, \shift
transpose8_4x4 d26, d28, d30, d8
OpenPOWER on IntegriCloud