st1 {v1.16b}, [x0], x1
st1 {v2.16b}, [x0], x1
st1 {v3.16b}, [x0], x1
- bgt 1b
+ b.gt 1b
ret
endfunc
st1 {v0.d}[1], [x0], x1
st1 {v1.8b}, [x0], x1
st1 {v1.d}[1], [x0], x1
- bgt 1b
+ b.gt 1b
ret
endfunc
st1 {v1.1d - v2.1d}, [x0], x1
st1 {v3.1d - v4.1d}, [x0], x1
subs x4, x4, #2
- bne 1b
+ b.ne 1b
ret
endfunc
st1 {v1.16b}, [x0], x1
subs w4, w4, #1
- bne 1b
+ b.ne 1b
ret
endfunc
vp8_epel16_h6 v1, v1, v2
st1 {v1.16b}, [x7], #16
subs x16, x16, #1
- bne 1b
+ b.ne 1b
// second pass (vertical):
st1 {v2.16b}, [x0], x1
subs x4, x4, #1
- bne 2b
+ b.ne 2b
add sp, sp, #336+16
ret
st1 {v1.8b}, [x7], #8
subs x16, x16, #1
- bne 1b
+ b.ne 1b
// second pass (vertical):
sxtw x6, w6
st1 {v1.8b}, [x0], x1
st1 {v2.8b}, [x0], x1
subs x4, x4, #2
- bne 2b
+ b.ne 2b
add sp, sp, #168+16
ret
st1 {v1.8b}, [x7], #8
subs x16, x16, #1
- bne 1b
+ b.ne 1b
// second pass (vertical):
sxtw x6, w6
st1 {v1.8b}, [x0], x1
st1 {v2.8b}, [x0], x1
subs x4, x4, #2
- bne 2b
+ b.ne 2b
add sp, sp, #168+16
ret
st1 {v1.8b}, [x7], #8
subs x16, x16, #1
- bne 1b
+ b.ne 1b
// second pass (vertical):
sxtw x6, w6
st1 {v1.d}[0], [x0], x1
st1 {v1.d}[1], [x0], x1
subs x4, x4, #2
- bne 2b
+ b.ne 2b
add sp, sp, #168+16
ret
st1 {v1.8b}, [x7], #8
subs x16, x16, #1
- bne 1b
+ b.ne 1b
// second pass (vertical):
sxtw x6, w6
st1 {v1.d}[0], [x0], x1
st1 {v1.d}[1], [x0], x1
subs x4, x4, #2
- bne 2b
+ b.ne 2b
add sp, sp, #168+16
ret