From 8fb306575cef9c1882cfc693b1c47e68e27fc71a Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?Martin=20Storsj=C3=B6?=
Date: Sun, 9 Feb 2020 23:14:22 +0200
Subject: arm: looprestoration: Improve scheduling in box3/5_h slightly

Set flags further from the branch instructions that use them.
---
 src/arm/32/looprestoration.S | 4 ++--
 src/arm/64/looprestoration.S | 4 ++--
 2 files changed, 4 insertions(+), 4 deletions(-)

(limited to 'src/arm')

diff --git a/src/arm/32/looprestoration.S b/src/arm/32/looprestoration.S
index 066f77a..be3533f 100644
--- a/src/arm/32/looprestoration.S
+++ b/src/arm/32/looprestoration.S
@@ -925,11 +925,11 @@ L(box3_variable_shift_tbl):
         vmull.u8 q6, d9, d9
 
         add3 4
+        subs r5, r5, #4
         vst1.16 {d6}, [r1, :64]!
         vst1.16 {d14}, [r11, :64]!
         vst1.32 {q12}, [r0, :128]!
         vst1.32 {q8}, [r10, :128]!
-        subs r5, r5, #4
         ble 9f
         vext.8 q0, q0, q0, #4
         vext.8 q1, q1, q2, #8
@@ -1215,11 +1215,11 @@ L(box5_variable_shift_tbl):
         vmull.u8 q6, d9, d9
 
         add5 4
+        subs r5, r5, #4
         vst1.16 {d6}, [r1, :64]!
         vst1.16 {d14}, [r11, :64]!
         vst1.32 {q12}, [r0, :128]!
         vst1.32 {q10}, [r10, :128]!
-        subs r5, r5, #4
         ble 9f
         vext.8 q0, q0, q0, #4
         vext.8 q1, q1, q2, #8
diff --git a/src/arm/64/looprestoration.S b/src/arm/64/looprestoration.S
index c6a6ef7..af0ec1b 100644
--- a/src/arm/64/looprestoration.S
+++ b/src/arm/64/looprestoration.S
@@ -844,11 +844,11 @@ L(box3_variable_shift_tbl):
         umull2 v6.8h, v4.16b, v4.16b
 
         add3 4
+        subs w5, w5, #4
         st1 {v3.4h}, [x1], #8
         st1 {v7.4h}, [x11], #8
         st1 {v26.4s}, [x0], #16
         st1 {v28.4s}, [x10], #16
-        subs w5, w5, #4
         b.le 9f
         ext v0.16b, v0.16b, v0.16b, #4
         ext v4.16b, v4.16b, v4.16b, #4
@@ -1114,11 +1114,11 @@ L(box5_variable_shift_tbl):
         umull2 v6.8h, v4.16b, v4.16b
 
         add5 4
+        subs w5, w5, #4
         st1 {v3.4h}, [x1], #8
         st1 {v7.4h}, [x11], #8
         st1 {v26.4s}, [x0], #16
         st1 {v28.4s}, [x10], #16
-        subs w5, w5, #4
         b.le 9f
         ext v0.16b, v0.16b, v0.16b, #4
         ext v1.16b, v1.16b, v2.16b, #8
-- 
cgit v1.2.3