Lines Matching refs:v16
116 ld1 {v16.s}[0], [x5] //D16[0] contains cliptab
119 tbl v14.8b, {v16.16b}, v12.8b //
122 dup v16.16b, w3 //Q8 contains beta
130 cmhs v24.16b, v24.16b, v16.16b
131 cmhs v26.16b, v26.16b, v16.16b
132 cmhi v20.16b, v16.16b , v28.16b //Q10=(Ap<Beta)
133 cmhi v22.16b, v16.16b , v30.16b //Q11=(Aq<Beta)
147 urhadd v16.16b, v6.16b , v0.16b //Q8 = ((p0+q0+1) >> 1)
148 mov v17.d[0], v16.d[1]
157 uaddl v10.8h, v16.8b, v10.8b //Q14,Q5 = p2 + (p0+q0+1)>>1
161 uaddl v4.8h, v16.8b, v4.8b //Q15,Q2 = q2 + (p0+q0+1)>>1
162 ushll v16.8h, v8.8b, #1 //Q13,Q8 = (p1<<1)
165 sub v10.8h, v10.8h , v16.8h //
166 ushll v16.8h, v2.8b, #1 //
171 sub v4.8h, v4.8h , v16.8h //
180 uqadd v16.16b, v6.16b , v18.16b //Q8 = p0 + delta
187 bif v16.16b, v6.16b , v24.16b //Q8 = (i_macro >= 0 ) ? (p0+delta) : (p0-delta)
191 st1 {v16.16b}, [x7], x1 //writing back filtered value of p0
267 uabd v16.16b , v10.16b, v6.16b
270 cmhs v16.16b, v16.16b , v2.16b //ABS(q1 - q0) >= Beta
275 …orr v18.16b, v18.16b , v16.16b //ABS(p0 - q0) >= Alpha || ABS(q1 - q0) >= Beta || ABS(p1 - p…
287 add v16.8h, v28.8h , v28.8h //2*(p0+q0+q1)L
289 uaddw v16.8h, v16.8h , v14.8b //2*(p0+q0+q1)+q2 L
291 uaddw v16.8h, v16.8h , v10.8b //2*(p0+q0+q1)+q2 +p1 L
293 rshrn v12.8b, v16.8h, #3 //(2*(p0+q0+q1)+q2 +p1 +4)>> 3 L [q0']
297 uaddl v16.8h, v8.8b, v8.8b //2*q1 L
299 uaddw v16.8h, v16.8h , v4.8b //2*q1+q0 L
301 uaddw v16.8h, v16.8h , v10.8b //2*q1+q0+p1 L
303 rshrn v16.8b, v16.8h, #2 //(2*q1+q0+p1+2)>>2 L [q0"]
305 mov v16.d[1] , v17.d[0]
310 bit v16.16b, v12.16b , v22.16b //choosing between q0' and q0" depending on condn
317 bif v4.16b, v16.16b , v18.16b //choose q0 or filtered q0
319 uaddl v16.8h, v14.8b, v0.8b //q2+q3,L
321 add v28.8h, v28.8h , v16.8h //p0+q0+q1+2*q2+q3 L
324 add v28.8h, v28.8h , v16.8h //p0+q0+q1+3*q2+2*q3 L
333 uabd v16.16b , v30.16b, v6.16b
339 cmhi v16.16b, v2.16b , v16.16b //Ap < Beta
343 and v20.16b, v20.16b , v16.16b //((Ap < Beta) && (ABS(p0 - q0) <((Alpha >>2) + 2)))
355 uaddl v16.8h, v7.8b, v9.8b //p0+q1 H
356 umlal v16.8h, v11.8b, v0.8b //2*p1+p0+q1 H
365 rshrn v3.8b, v16.8h, #2 //(2*p1+p0+q1+2)>>2,p0" H
368 uaddl v16.8h, v31.8b, v25.8b //p2+p3 H
370 mla v4.8h, v16.8h , v1.h[0] //(p0+q0+p1)+3*p2+2*p3 H
371 …bic v16.16b, v20.16b , v18.16b //((ABS(p0 - q0) >= Alpha || ABS(q1 - q0) >= Beta || ABS(p1 …
372 mov v17.d[0] , v16.d[1] //&& (Ap < Beta && ABS(p0 - q0) <((Alpha >>2) + 2))
379 bit v10.16b, v26.16b , v16.16b //choosing between p1 and p1'
380 bit v30.16b, v12.16b , v16.16b //choosing between p2 and p2'
450 ld1 {v16.s}[0], [x14] //D16[0] contains cliptab
455 tbl v16.8b, {v16.16b}, v18.8b //puc_ClipTab[uc_Bs]
458 uxtl v16.4s, v16.4h //
462 sli v16.4s, v16.4s, #8 //
466 sli v16.4s, v16.4s, #16
577 smin v24.16b, v24.16b , v16.16b //min(deltap1 ,C0)
579 neg v30.16b, v16.16b //-C0
598 smin v18.16b, v18.16b , v16.16b //min(deltaq1,C0)
604 sub v16.16b, v16.16b , v22.16b //C0 + (Ap < Beta)
614 sub v16.16b, v16.16b , v20.16b //C0 + (Ap < Beta) + (Aq < Beta)
619 umin v30.16b, v30.16b , v16.16b //min(abs(delta),C)
871 uaddl v16.8h, v6.8b, v8.8b //p0+q0 L
879 uaddw v20.8h, v16.8h , v4.8b //p0+q0+p1 L
886 uaddw v16.8h, v20.8h , v2.8b //p0+q0+p1+p2 L
889 rshrn v20.8b, v16.8h, #2 //((p2 + p1 + p0 + q0 + 2) >> 2) L p1'
924 add v16.8h, v16.8h , v30.8h //(X2(p3) + X3(p2) + p1 + p0 + q0) L
928 rshrn v16.8b, v16.8h, #3 //((X2(p3) + X3(p2) + p1 + p0 + q0 + 4) >> 3); L p2'
930 mov v16.d[1] , v17.d[0]
948 bit v2.16b, v16.16b , v14.16b //final p2
955 uaddl v16.8h, v9.8b, v5.8b //q0+p1 H
956 umlal v16.8h, v11.8b, v28.8b //X2(q1) + q0 + p1 H
963 rshrn v25.8b, v16.8h, #2 //(X2(q1) + q0 + p1 + 2) >> 2; H q0'
967 rshrn v16.8b, v14.8h, #3 //(p1 + X2(p0) + X2(q0) + X2(q1) + q2 + 4) >> 3 L q0"
970 mov v16.d[1] , v17.d[0]
974 bit v24.16b, v16.16b , v30.16b //q0' or q0"
986 uaddl v16.8h, v12.8b, v14.8b //q2+q3 L
994 mla v18.8h, v16.8h , v28.8h //X2(q3) + X3(q2) + q1 + q0 + p0 L