ref: 5769713608fa804c8f974644ba540a48186069bf
parent: 4f5815290cbbdf001c98d26c3218a7e70a9aa3b1
parent: 7fd5d8e6a4b52752c2787c84fef15ee6ac3a58a6
author: Frank Galligan <[email protected]>
date: Thu Jul 18 06:21:21 EDT 2013
Merge "Fix horz loopfilter loops"
--- a/vp9/common/arm/neon/vp9_loopfilter_neon.asm
+++ b/vp9/common/arm/neon/vp9_loopfilter_neon.asm
@@ -38,6 +38,7 @@
push {lr}
ldr r12, [sp,#8] ; load count
+ add r1, r1, r1 ; double pitch
cmp r12, #0
beq end_vp9_lf_h_edge
@@ -47,9 +48,8 @@
vld1.8 {d2[]}, [r2] ; duplicate *thresh
count_lf_h_loop
- sub r2, r0, r1, lsl #2 ; move src pointer down by 4 lines
- add r3, r2, r1
- add r1, r1, r1
+ sub r2, r0, r1, lsl #1 ; move src pointer down by 4 lines
+ add r3, r2, r1, lsr #1 ; set to 3 lines down
vld1.u8 {d3}, [r2@64], r1 ; p3
vld1.u8 {d4}, [r3@64], r1 ; p2
@@ -278,6 +278,7 @@
push {r4-r5, lr}
ldr r12, [sp,#16] ; load count
+ add r1, r1, r1 ; double pitch
cmp r12, #0
beq end_vp9_mblf_h_edge
@@ -287,9 +288,8 @@
vld1.8 {d2[]}, [r2] ; duplicate *thresh
count_mblf_h_loop
- sub r3, r0, r1, lsl #2 ; move src pointer down by 4 lines
- add r2, r3, r1
- add r1, r1, r1
+ sub r3, r0, r1, lsl #1 ; move src pointer down by 4 lines
+ add r2, r3, r1, lsr #1 ; set to 3 lines down
vld1.u8 {d3}, [r3@64], r1 ; p3
vld1.u8 {d4}, [r2@64], r1 ; p2