Lines Matching refs:v16
115 ld1 {v16.s}[0], [x5] //D16[0] contains cliptab
118 tbl v14.8b, {v16.16b}, v12.8b //
121 dup v16.16b, w3 //Q8 contains beta
129 cmhs v24.16b, v24.16b, v16.16b
130 cmhs v26.16b, v26.16b, v16.16b
131 cmhi v20.16b, v16.16b , v28.16b //Q10=(Ap<Beta)
132 cmhi v22.16b, v16.16b , v30.16b //Q11=(Aq<Beta)
146 urhadd v16.16b, v6.16b , v0.16b //Q8 = ((p0+q0+1) >> 1)
147 mov v17.d[0], v16.d[1]
156 uaddl v10.8h, v16.8b, v10.8b //Q14,Q5 = p2 + (p0+q0+1)>>1
160 uaddl v4.8h, v16.8b, v4.8b //Q15,Q2 = q2 + (p0+q0+1)>>1
161 ushll v16.8h, v8.8b, #1 //Q13,Q8 = (p1<<1)
164 sub v10.8h, v10.8h , v16.8h //
165 ushll v16.8h, v2.8b, #1 //
170 sub v4.8h, v4.8h , v16.8h //
179 uqadd v16.16b, v6.16b , v18.16b //Q8 = p0 + delta
186 bif v16.16b, v6.16b , v24.16b //Q8 = (i_macro >= 0 ) ? (p0+delta) : (p0-delta)
190 st1 {v16.16b}, [x7], x1 //writing back filtered value of p0
265 uabd v16.16b , v10.16b, v6.16b
268 cmhs v16.16b, v16.16b , v2.16b //ABS(q1 - q0) >= Beta
273 …orr v18.16b, v18.16b , v16.16b //ABS(p0 - q0) >= Alpha || ABS(q1 - q0) >= Beta || ABS(p1 - p…
285 add v16.8h, v28.8h , v28.8h //2*(p0+q0+q1)L
287 uaddw v16.8h, v16.8h , v14.8b //2*(p0+q0+q1)+q2 L
289 uaddw v16.8h, v16.8h , v10.8b //2*(p0+q0+q1)+q2 +p1 L
291 rshrn v12.8b, v16.8h, #3 //(2*(p0+q0+q1)+q2 +p1 +4)>> 3 L [q0']
295 uaddl v16.8h, v8.8b, v8.8b //2*q1 L
297 uaddw v16.8h, v16.8h , v4.8b //2*q1+q0 L
299 uaddw v16.8h, v16.8h , v10.8b //2*q1+q0+p1 L
301 rshrn v16.8b, v16.8h, #2 //(2*q1+q0+p1+2)>>2 L [q0"]
303 mov v16.d[1] , v17.d[0]
308 bit v16.16b, v12.16b , v22.16b //choosing between q0' and q0" depending on condn
315 bif v4.16b, v16.16b , v18.16b //choose q0 or filtered q0
317 uaddl v16.8h, v14.8b, v0.8b //q2+q3,L
319 add v28.8h, v28.8h , v16.8h //p0+q0+q1+2*q2+q3 L
322 add v28.8h, v28.8h , v16.8h //p0+q0+q1+3*q2+2*q3 L
331 uabd v16.16b , v30.16b, v6.16b
337 cmhi v16.16b, v2.16b , v16.16b //Ap < Beta
341 and v20.16b, v20.16b , v16.16b //((Ap < Beta) && (ABS(p0 - q0) <((Alpha >>2) + 2)))
353 uaddl v16.8h, v7.8b, v9.8b //p0+q1 H
354 umlal v16.8h, v11.8b, v0.8b //2*p1+p0+q1 H
363 rshrn v3.8b, v16.8h, #2 //(2*p1+p0+q1+2)>>2,p0" H
366 uaddl v16.8h, v31.8b, v25.8b //p2+p3 H
368 mla v4.8h, v16.8h , v1.h[0] //(p0+q0+p1)+3*p2+2*p3 H
369 …bic v16.16b, v20.16b , v18.16b //((ABS(p0 - q0) >= Alpha || ABS(q1 - q0) >= Beta || ABS(p1 …
370 mov v17.d[0] , v16.d[1] //&& (Ap < Beta && ABS(p0 - q0) <((Alpha >>2) + 2))
377 bit v10.16b, v26.16b , v16.16b //choosing between p1 and p1'
378 bit v30.16b, v12.16b , v16.16b //choosing between p2 and p2'
447 ld1 {v16.s}[0], [x14] //D16[0] contains cliptab
452 tbl v16.8b, {v16.16b}, v18.8b //puc_ClipTab[uc_Bs]
455 uxtl v16.4s, v16.4h //
459 sli v16.4s, v16.4s, #8 //
463 sli v16.4s, v16.4s, #16
574 smin v24.16b, v24.16b , v16.16b //min(deltap1 ,C0)
576 neg v30.16b, v16.16b //-C0
595 smin v18.16b, v18.16b , v16.16b //min(deltaq1,C0)
601 sub v16.16b, v16.16b , v22.16b //C0 + (Ap < Beta)
611 sub v16.16b, v16.16b , v20.16b //C0 + (Ap < Beta) + (Aq < Beta)
616 umin v30.16b, v30.16b , v16.16b //min(abs(delta),C)
868 uaddl v16.8h, v6.8b, v8.8b //p0+q0 L
876 uaddw v20.8h, v16.8h , v4.8b //p0+q0+p1 L
883 uaddw v16.8h, v20.8h , v2.8b //p0+q0+p1+p2 L
886 rshrn v20.8b, v16.8h, #2 //((p2 + p1 + p0 + q0 + 2) >> 2) L p1'
921 add v16.8h, v16.8h , v30.8h //(X2(p3) + X3(p2) + p1 + p0 + q0) L
925 rshrn v16.8b, v16.8h, #3 //((X2(p3) + X3(p2) + p1 + p0 + q0 + 4) >> 3); L p2'
927 mov v16.d[1] , v17.d[0]
945 bit v2.16b, v16.16b , v14.16b //final p2
952 uaddl v16.8h, v9.8b, v5.8b //q0+p1 H
953 umlal v16.8h, v11.8b, v28.8b //X2(q1) + q0 + p1 H
960 rshrn v25.8b, v16.8h, #2 //(X2(q1) + q0 + p1 + 2) >> 2; H q0'
964 rshrn v16.8b, v14.8h, #3 //(p1 + X2(p0) + X2(q0) + X2(q1) + q2 + 4) >> 3 L q0"
967 mov v16.d[1] , v17.d[0]
971 bit v24.16b, v16.16b , v30.16b //q0' or q0"
983 uaddl v16.8h, v12.8b, v14.8b //q2+q3 L
991 mla v18.8h, v16.8h , v28.8h //X2(q3) + X3(q2) + q1 + q0 + p0 L