• Home
  • Raw
  • Download

Lines Matching refs:v4

301     ld1 {v2.8b, v3.8b, v4.8b}, [x0], x1 //only use 21(16+5); v2=src[-2]
304 ext v5.16b, v2.16b, v4.16b, #1 //v5=src[-1]
305 ext v6.16b, v2.16b, v4.16b, #2 //v6=src[0]
306 ext v7.16b, v2.16b, v4.16b, #3 //v7=src[1]
307 ext v16.16b, v2.16b, v4.16b, #4 //v16=src[2]
308 ext v17.16b, v2.16b, v4.16b, #5 //v17=src[3]
348 …VEC4_UADDL_8BITS v16, v17, v20, v21, v24, v25, v28, v29, v0, v2, v4, v6 //v0/v2/v4/v6=src[-2]+sr…
350 …VEC4_MLS_16BITS v1, v9, v3, v9, v5, v9, v7, v9, v0, v2, v4, v6 //v0/v2/v4/v6 -= 5*(src[-1]+src[2])
366 … VEC4_MLA_16BITS v1, v8, v3, v8, v5, v8, v7, v8, v0, v2, v4, v6 //v0/v2/v4/v6+=20*(src[0]+src[1])
368 VEC4_SQRSHRUN_16BITS_SHIFT5 v0, v2, v4, v6, v1, v3, v5, v7
392 zip1 v4.4s, v2.4s, v3.4s // v4=src[-2] 1st:2nd
393 ext v17.16b, v4.16b, v4.16b, #8 // v17=src[2:5] 1st:2nd
395 ext v2.16b, v2.16b, v4.16b, #1 //1st row src[-1:6]
396 ext v3.16b, v3.16b, v4.16b, #1 //2nd row src[-1:6]
398 ext v7.16b, v5.16b, v4.16b, #8 //v7=src[3:6] 1st:2nd
400 ext v2.16b, v2.16b, v4.16b, #1 //1st row src[0:6]
401 ext v3.16b, v3.16b, v4.16b, #1 //2nd row src[0:6]
404 ext v2.16b, v2.16b, v4.16b, #1 //1st row src[1:6]
405 ext v3.16b, v3.16b, v4.16b, #1 //2nd row src[1:6]
408 FILTER_6TAG_8BITS1 v4, v5, v6, v16, v17, v7, v20, v0, v1
426 ld1 {v2.8b, v3.8b, v4.8b}, [x0], x1 //only use 21(16+5); v2=src[-2]
429 ext v5.16b, v2.16b, v4.16b, #1 //v5=src[-1]
430 ext v6.16b, v2.16b, v4.16b, #2 //v6=src[0]
431 ext v7.16b, v2.16b, v4.16b, #3 //v7=src[1]
432 ext v16.16b, v2.16b, v4.16b, #4 //v16=src[2]
433 ext v17.16b, v2.16b, v4.16b, #5 //v17=src[3]
474 …VEC4_UADDL_8BITS v16, v17, v20, v21, v24, v25, v28, v29, v0, v2, v4, v6 //v0/v2/v4/v6=src[-2]+sr…
476 …VEC4_MLS_16BITS v1, v9, v3, v9, v5, v9, v7, v9, v0, v2, v4, v6 //v0/v2/v4/v6 -= 5*(src[-1]+src[2])
492 … VEC4_MLA_16BITS v1, v8, v3, v8, v5, v8, v7, v8, v0, v2, v4, v6 //v0/v2/v4/v6+=20*(src[0]+src[1])
493 VEC4_SQRSHRUN_16BITS_SHIFT5 v0, v2, v4, v6, v1, v3, v5, v7
495 VEC4_UADDL_8BITS v1, v18, v3, v22, v5, v26, v7, v30, v0, v2, v4, v6 //average with src[0]
496 VEC4_RSHRN_16BITS_SHIFT1 v0, v2, v4, v6, v1, v3, v5, v7
520 zip1 v4.4s, v2.4s, v3.4s // v4=src[-2] 1st:2nd
521 ext v17.16b, v4.16b, v4.16b, #8 // v17=src[2:5] 1st:2nd
523 ext v2.16b, v2.16b, v4.16b, #1 //1st row src[-1:6]
524 ext v3.16b, v3.16b, v4.16b, #1 //2nd row src[-1:6]
526 ext v7.16b, v5.16b, v4.16b, #8 //v7=src[3:6] 1st:2nd
528 ext v2.16b, v2.16b, v4.16b, #1 //1st row src[0:6]
529 ext v3.16b, v3.16b, v4.16b, #1 //2nd row src[0:6]
532 ext v2.16b, v2.16b, v4.16b, #1 //1st row src[1:6]
533 ext v3.16b, v3.16b, v4.16b, #1 //2nd row src[1:6]
536 FILTER_6TAG_8BITS1_AVERAGE_WITH_0 v4, v5, v6, v16, v17, v7, v20, v0, v1
554 ld1 {v2.8b, v3.8b, v4.8b}, [x0], x1 //only use 21(16+5); v2=src[-2]
557 ext v5.16b, v2.16b, v4.16b, #1 //v5=src[-1]
558 ext v6.16b, v2.16b, v4.16b, #2 //v6=src[0]
559 ext v7.16b, v2.16b, v4.16b, #3 //v7=src[1]
560 ext v16.16b, v2.16b, v4.16b, #4 //v16=src[2]
561 ext v17.16b, v2.16b, v4.16b, #5 //v17=src[3]
602 …VEC4_UADDL_8BITS v16, v17, v20, v21, v24, v25, v28, v29, v0, v2, v4, v6 //v0/v2/v4/v6=src[-2]+sr…
604 …VEC4_MLS_16BITS v1, v9, v3, v9, v5, v9, v7, v9, v0, v2, v4, v6 //v0/v2/v4/v6 -= 5*(src[-1]+src[2])
620 … VEC4_MLA_16BITS v1, v8, v3, v8, v5, v8, v7, v8, v0, v2, v4, v6 //v0/v2/v4/v6+=20*(src[0]+src[1])
621 VEC4_SQRSHRUN_16BITS_SHIFT5 v0, v2, v4, v6, v1, v3, v5, v7
623 VEC4_UADDL_8BITS v1, v19, v3, v23, v5, v27, v7, v31, v0, v2, v4, v6 //average with src[1]
624 VEC4_RSHRN_16BITS_SHIFT1 v0, v2, v4, v6, v1, v3, v5, v7
648 zip1 v4.4s, v2.4s, v3.4s // v4=src[-2] 1st:2nd
649 ext v17.16b, v4.16b, v4.16b, #8 // v17=src[2:5] 1st:2nd
651 ext v2.16b, v2.16b, v4.16b, #1 //1st row src[-1:6]
652 ext v3.16b, v3.16b, v4.16b, #1 //2nd row src[-1:6]
654 ext v7.16b, v5.16b, v4.16b, #8 //v7=src[3:6] 1st:2nd
656 ext v2.16b, v2.16b, v4.16b, #1 //1st row src[0:6]
657 ext v3.16b, v3.16b, v4.16b, #1 //2nd row src[0:6]
660 ext v2.16b, v2.16b, v4.16b, #1 //1st row src[1:6]
661 ext v3.16b, v3.16b, v4.16b, #1 //2nd row src[1:6]
664 FILTER_6TAG_8BITS1_AVERAGE_WITH_1 v4, v5, v6, v16, v17, v7, v20, v0, v1
688 ld1 {v4.16b}, [x0], x1 // v4=src[0*stride]
698 FILTER_6TAG_8BITS1_AVERAGE_WITH_0 v2, v3, v4, v5, v6, v7, v20, v0, v1
699 FILTER_6TAG_8BITS2_AVERAGE_WITH_0 v2, v3, v4, v5, v6, v7, v20, v0, v1
705 FILTER_6TAG_8BITS1_AVERAGE_WITH_0 v3, v4, v5, v6, v7, v2, v20, v0, v1
706 FILTER_6TAG_8BITS2_AVERAGE_WITH_0 v3, v4, v5, v6, v7, v2, v20, v0, v1
712 FILTER_6TAG_8BITS1_AVERAGE_WITH_0 v4, v5, v6, v7, v2, v3, v20, v0, v1
713 FILTER_6TAG_8BITS2_AVERAGE_WITH_0 v4, v5, v6, v7, v2, v3, v20, v0, v1
718 ld1 {v4.16b}, [x0], x1 // v4=src[3*stride]
719 FILTER_6TAG_8BITS1_AVERAGE_WITH_0 v5, v6, v7, v2, v3, v4, v20, v0, v1
720 FILTER_6TAG_8BITS2_AVERAGE_WITH_0 v5, v6, v7, v2, v3, v4, v20, v0, v1
726 FILTER_6TAG_8BITS1_AVERAGE_WITH_0 v6, v7, v2, v3, v4, v5, v20, v0, v1
727 FILTER_6TAG_8BITS2_AVERAGE_WITH_0 v6, v7, v2, v3, v4, v5, v20, v0, v1
733 FILTER_6TAG_8BITS1_AVERAGE_WITH_0 v7, v2, v3, v4, v5, v6, v20, v0, v1
734 FILTER_6TAG_8BITS2_AVERAGE_WITH_0 v7, v2, v3, v4, v5, v6, v20, v0, v1
739 FILTER_6TAG_8BITS1_AVERAGE_WITH_0 v2, v3, v4, v5, v6, v7, v20, v0, v1
740 FILTER_6TAG_8BITS2_AVERAGE_WITH_0 v2, v3, v4, v5, v6, v7, v20, v0, v1
745 FILTER_6TAG_8BITS1_AVERAGE_WITH_0 v3, v4, v5, v6, v7, v2, v20, v0, v1
746 FILTER_6TAG_8BITS2_AVERAGE_WITH_0 v3, v4, v5, v6, v7, v2, v20, v0, v1
752 mov v2.16b, v4.16b
753 mov v4.16b, v6.16b
781 …VEC4_UADDL_8BITS v16, v21, v17, v22, v18, v23, v19, v24, v0, v2, v4, v6 //v0/v2/v4/v6 =src[-2]+src…
783 …VEC4_MLS_16BITS v1, v31, v3, v31, v5, v31, v7, v31, v0, v2, v4, v6 //v0/v2/v4/v6 -=5*(src[-1]+src…
785 …VEC4_MLA_16BITS v1, v30, v3, v30, v5, v30, v7, v30, v0, v2, v4, v6 //v0/v2/v4/v6 += 20*(src[0]+sr…
786 VEC4_SQRSHRUN_16BITS_SHIFT5 v0, v2, v4, v6, v1, v3, v5, v7
788 …VEC4_UADDL_8BITS v1, v18, v3, v19, v5, v20, v7, v21, v0, v2, v4, v6 //v0/v2/v4/v6 = average with s…
789 VEC4_RSHRN_16BITS_SHIFT1 v0, v2, v4, v6, v1, v3, v5, v7
820 ld1 {v4.s}[0], [x0], x1 // v4=src[0*stride]
821 mov v3.s[1], v4.s[0]
824 mov v4.s[1], v5.s[0]
835 FILTER_6TAG_8BITS1_AVERAGE_WITH_0 v2, v3, v4, v5, v6, v7, v20, v0, v1
845 FILTER_6TAG_8BITS1_AVERAGE_WITH_0 v4, v5, v6, v7, v2, v3, v20, v0, v1
848 mov v4.s[0], v3.s[1]
851 mov v6.8b, v4.8b
852 mov v4.8b, v2.8b
879 ld1 {v4.16b}, [x0], x1 // v4=src[0*stride]
889 FILTER_6TAG_8BITS1_AVERAGE_WITH_1 v2, v3, v4, v5, v6, v7, v20, v0, v1
890 FILTER_6TAG_8BITS2_AVERAGE_WITH_1 v2, v3, v4, v5, v6, v7, v20, v0, v1
896 FILTER_6TAG_8BITS1_AVERAGE_WITH_1 v3, v4, v5, v6, v7, v2, v20, v0, v1
897 FILTER_6TAG_8BITS2_AVERAGE_WITH_1 v3, v4, v5, v6, v7, v2, v20, v0, v1
903 FILTER_6TAG_8BITS1_AVERAGE_WITH_1 v4, v5, v6, v7, v2, v3, v20, v0, v1
904 FILTER_6TAG_8BITS2_AVERAGE_WITH_1 v4, v5, v6, v7, v2, v3, v20, v0, v1
909 ld1 {v4.16b}, [x0], x1 // v4=src[3*stride]
910 FILTER_6TAG_8BITS1_AVERAGE_WITH_1 v5, v6, v7, v2, v3, v4, v20, v0, v1
911 FILTER_6TAG_8BITS2_AVERAGE_WITH_1 v5, v6, v7, v2, v3, v4, v20, v0, v1
917 FILTER_6TAG_8BITS1_AVERAGE_WITH_1 v6, v7, v2, v3, v4, v5, v20, v0, v1
918 FILTER_6TAG_8BITS2_AVERAGE_WITH_1 v6, v7, v2, v3, v4, v5, v20, v0, v1
924 FILTER_6TAG_8BITS1_AVERAGE_WITH_1 v7, v2, v3, v4, v5, v6, v20, v0, v1
925 FILTER_6TAG_8BITS2_AVERAGE_WITH_1 v7, v2, v3, v4, v5, v6, v20, v0, v1
930 FILTER_6TAG_8BITS1_AVERAGE_WITH_1 v2, v3, v4, v5, v6, v7, v20, v0, v1
931 FILTER_6TAG_8BITS2_AVERAGE_WITH_1 v2, v3, v4, v5, v6, v7, v20, v0, v1
936 FILTER_6TAG_8BITS1_AVERAGE_WITH_1 v3, v4, v5, v6, v7, v2, v20, v0, v1
937 FILTER_6TAG_8BITS2_AVERAGE_WITH_1 v3, v4, v5, v6, v7, v2, v20, v0, v1
943 mov v2.16b, v4.16b
944 mov v4.16b, v6.16b
972 …VEC4_UADDL_8BITS v16, v21, v17, v22, v18, v23, v19, v24, v0, v2, v4, v6 //v0/v2/v4/v6 =src[-2]+src…
974 …VEC4_MLS_16BITS v1, v31, v3, v31, v5, v31, v7, v31, v0, v2, v4, v6 //v0/v2/v4/v6 -=5*(src[-1]+src…
976 …VEC4_MLA_16BITS v1, v30, v3, v30, v5, v30, v7, v30, v0, v2, v4, v6 //v0/v2/v4/v6 += 20*(src[0]+sr…
977 VEC4_SQRSHRUN_16BITS_SHIFT5 v0, v2, v4, v6, v1, v3, v5, v7
979 …VEC4_UADDL_8BITS v1, v19, v3, v20, v5, v21, v7, v22, v0, v2, v4, v6 //v0/v2/v4/v6 = average with s…
980 VEC4_RSHRN_16BITS_SHIFT1 v0, v2, v4, v6, v1, v3, v5, v7
1011 ld1 {v4.s}[0], [x0], x1 // v4=src[0*stride]
1012 mov v3.s[1], v4.s[0]
1015 mov v4.s[1], v5.s[0]
1026 FILTER_6TAG_8BITS1_AVERAGE_WITH_1 v2, v3, v4, v5, v6, v7, v20, v0, v1
1036 FILTER_6TAG_8BITS1_AVERAGE_WITH_1 v4, v5, v6, v7, v2, v3, v20, v0, v1
1039 mov v4.s[0], v3.s[1]
1042 mov v6.8b, v4.8b
1043 mov v4.8b, v2.8b
1070 ld1 {v4.16b}, [x0], x1 // v4=src[0*stride]
1080 FILTER_6TAG_8BITS1 v2, v3, v4, v5, v6, v7, v20, v0, v1
1081 FILTER_6TAG_8BITS2 v2, v3, v4, v5, v6, v7, v20, v0, v1
1087 FILTER_6TAG_8BITS1 v3, v4, v5, v6, v7, v2, v20, v0, v1
1088 FILTER_6TAG_8BITS2 v3, v4, v5, v6, v7, v2, v20, v0, v1
1094 FILTER_6TAG_8BITS1 v4, v5, v6, v7, v2, v3, v20, v0, v1
1095 FILTER_6TAG_8BITS2 v4, v5, v6, v7, v2, v3, v20, v0, v1
1100 ld1 {v4.16b}, [x0], x1 // v4=src[3*stride]
1101 FILTER_6TAG_8BITS1 v5, v6, v7, v2, v3, v4, v20, v0, v1
1102 FILTER_6TAG_8BITS2 v5, v6, v7, v2, v3, v4, v20, v0, v1
1108 FILTER_6TAG_8BITS1 v6, v7, v2, v3, v4, v5, v20, v0, v1
1109 FILTER_6TAG_8BITS2 v6, v7, v2, v3, v4, v5, v20, v0, v1
1115 FILTER_6TAG_8BITS1 v7, v2, v3, v4, v5, v6, v20, v0, v1
1116 FILTER_6TAG_8BITS2 v7, v2, v3, v4, v5, v6, v20, v0, v1
1121 FILTER_6TAG_8BITS1 v2, v3, v4, v5, v6, v7, v20, v0, v1
1122 FILTER_6TAG_8BITS2 v2, v3, v4, v5, v6, v7, v20, v0, v1
1127 FILTER_6TAG_8BITS1 v3, v4, v5, v6, v7, v2, v20, v0, v1
1128 FILTER_6TAG_8BITS2 v3, v4, v5, v6, v7, v2, v20, v0, v1
1134 mov v2.16b, v4.16b
1135 mov v4.16b, v6.16b
1163 …VEC4_UADDL_8BITS v16, v21, v17, v22, v18, v23, v19, v24, v0, v2, v4, v6 //v0/v2/v4/v6 =src[-2]+src…
1165 …VEC4_MLS_16BITS v1, v31, v3, v31, v5, v31, v7, v31, v0, v2, v4, v6 //v0/v2/v4/v6 -=5*(src[-1]+src…
1167 …VEC4_MLA_16BITS v1, v30, v3, v30, v5, v30, v7, v30, v0, v2, v4, v6 //v0/v2/v4/v6 += 20*(src[0]+sr…
1168 VEC4_SQRSHRUN_16BITS_SHIFT5 v0, v2, v4, v6, v1, v3, v5, v7
1198 ld1 {v4.s}[0], [x0], x1 // v4=src[0*stride]
1199 mov v3.s[1], v4.s[0]
1202 mov v4.s[1], v5.s[0]
1213 FILTER_6TAG_8BITS1 v2, v3, v4, v5, v6, v7, v20, v0, v1
1223 FILTER_6TAG_8BITS1 v4, v5, v6, v7, v2, v3, v20, v0, v1
1226 mov v4.s[0], v3.s[1]
1229 mov v6.8b, v4.8b
1230 mov v4.8b, v2.8b
1258 ld1 {v2.8b, v3.8b, v4.8b}, [x0], x1 // v2=src[-2*stride]
1278 FILTER_6TAG_8BITS_TO_16BITS1 v4, v7, v10, v13, v16, v19, v22, v0, v1
1284 ld1 {v2.8b, v3.8b, v4.8b}, [x0], x1 // v2=src[3*stride]
1292 FILTER_6TAG_8BITS_TO_16BITS1 v7, v10, v13, v16, v19, v4, v22, v0, v1
1306 FILTER_6TAG_8BITS_TO_16BITS1 v10, v13, v16, v19, v4, v7, v22, v0, v1
1320 FILTER_6TAG_8BITS_TO_16BITS1 v13, v16, v19, v4, v7, v10, v22, v0, v1
1334 FILTER_6TAG_8BITS_TO_16BITS1 v16, v19, v4, v7, v10, v13, v22, v0, v1
1348 FILTER_6TAG_8BITS_TO_16BITS1 v19, v4, v7, v10, v13, v16, v22, v0, v1
1362 FILTER_6TAG_8BITS_TO_16BITS1 v4, v7, v10, v13, v16, v19, v22, v0, v1
1368 ld1 {v2.8b, v3.8b, v4.8b}, [x0], x1 // v2=src[3*stride]
1376 FILTER_6TAG_8BITS_TO_16BITS1 v7, v10, v13, v16, v19, v4, v22, v0, v1
1397 mov v30.16b, v4.16b
1398 mov v4.16b, v10.16b
1428 ld1 {v4.16b}, [x0], x1 // v4=src[0*stride]
1438 FILTER_6TAG_8BITS_TO_16BITS1 v2, v3, v4, v5, v6, v7, v20, v0, v1
1439 FILTER_6TAG_8BITS_TO_16BITS2 v2, v3, v4, v5, v6, v7, v21, v0, v1
1448 FILTER_6TAG_8BITS_TO_16BITS1 v3, v4, v5, v6, v7, v2, v20, v0, v1
1449 FILTER_6TAG_8BITS_TO_16BITS2 v3, v4, v5, v6, v7, v2, v21, v0, v1
1458 FILTER_6TAG_8BITS_TO_16BITS1 v4, v5, v6, v7, v2, v3, v20, v0, v1
1459 FILTER_6TAG_8BITS_TO_16BITS2 v4, v5, v6, v7, v2, v3, v21, v0, v1
1466 ld1 {v4.16b}, [x0], x1 // v4=src[3*stride]
1468 FILTER_6TAG_8BITS_TO_16BITS1 v5, v6, v7, v2, v3, v4, v20, v0, v1
1469 FILTER_6TAG_8BITS_TO_16BITS2 v5, v6, v7, v2, v3, v4, v21, v0, v1
1480 mov v6.16b, v4.16b
1481 mov v4.16b, v30.16b
1504 ld1 {v4.16b}, [x0], x1 // v4=src[0*stride]
1514 FILTER_6TAG_8BITS_TO_16BITS1 v2, v3, v4, v5, v6, v7, v20, v0, v1
1515 FILTER_6TAG_8BITS_TO_16BITS2 v2, v3, v4, v5, v6, v7, v21, v0, v1
1519 FILTER_6TAG_8BITS_TO_16BITS1 v3, v4, v5, v6, v7, v2, v22, v0, v1
1520 FILTER_6TAG_8BITS_TO_16BITS2 v3, v4, v5, v6, v7, v2, v23, v0, v1
1535 FILTER_6TAG_8BITS_TO_16BITS1 v4, v5, v6, v7, v2, v3, v20, v0, v1
1536 FILTER_6TAG_8BITS_TO_16BITS2 v4, v5, v6, v7, v2, v3, v21, v0, v1
1538 ld1 {v4.16b}, [x0], x1 // v4=src[6*stride]
1539 FILTER_6TAG_8BITS_TO_16BITS1 v5, v6, v7, v2, v3, v4, v22, v0, v1
1540 FILTER_6TAG_8BITS_TO_16BITS2 v5, v6, v7, v2, v3, v4, v23, v0, v1
1555 mov v6.16b, v4.16b
1556 mov v4.16b, v30.16b
1628 ld1 {v4.16b}, [x2], x3 //read 16Byte : src0: 2 line
1642 AVERAGE_TWO_8BITS1 v16, v4, v5
1643 AVERAGE_TWO_8BITS2 v16, v4, v5
1674 ld1 {v4.8b}, [x2], x3 //read 8Byte : src0: 2 line
1687 AVERAGE_TWO_8BITS1 v16, v4, v5
1716 ld1 {v4.16b}, [x2], x3 //read 16Byte : src0: 2 line
1732 AVERAGE_TWO_8BITS1 v16, v4, v5
1733 AVERAGE_TWO_8BITS2 v16, v4, v5
1763 ld1 {v4.8b}, [x2], x3 //read 8Byte : src0: 2 line
1776 AVERAGE_TWO_8BITS1 v16, v4, v5
1835 umull v4.8h, v20.8b, v28.8b
1840 umlal v4.8h, v21.8b, v29.8b
1845 umlal v4.8h, v22.8b, v30.8b
1850 umlal v4.8h, v23.8b, v31.8b
1859 rshrn v5.8b, v4.8h, #6
1876 ld4r {v4.8b, v5.8b, v6.8b, v7.8b}, [x4] //load A/B/C/D
1890 umull v16.8h, v0.8b, v4.8b
1954 ext v5.16b, v2.16b, v4.16b, #1 //v5=src[-1]
1955 ext v6.16b, v2.16b, v4.16b, #2 //v6=src[0]
1956 ext v7.16b, v2.16b, v4.16b, #3 //v7=src[1]
1957 ext v16.16b, v2.16b, v4.16b, #4 //v16=src[2]
1958 ext v17.16b, v2.16b, v4.16b, #5 //v17=src[3]
1985 ext v5.16b, v2.16b, v4.16b, #1 //v5=src[-1]
1986 ext v6.16b, v2.16b, v4.16b, #2 //v6=src[0]
1987 ext v7.16b, v2.16b, v4.16b, #3 //v7=src[1]
1988 ext v16.16b, v2.16b, v4.16b, #4 //v16=src[2]
1989 ext v17.16b, v2.16b, v4.16b, #5 //v17=src[3]
2021 ld1 {v2.8b, v3.8b, v4.8b}, [x0], x1 // v2=src[-2*stride]
2041 FILTER_6TAG_8BITS_TO_16BITS1 v4, v7, v10, v13, v16, v19, v22, v0, v1
2049 ld1 {v2.8b, v3.8b, v4.8b}, [x0], x1 // v2=src[4*stride]
2057 FILTER_6TAG_8BITS_TO_16BITS1 v7, v10, v13, v16, v19, v4, v22, v0, v1
2073 FILTER_6TAG_8BITS_TO_16BITS1 v10, v13, v16, v19, v4, v7, v22, v0, v1
2089 FILTER_6TAG_8BITS_TO_16BITS1 v13, v16, v19, v4, v7, v10, v22, v0, v1
2105 FILTER_6TAG_8BITS_TO_16BITS1 v16, v19, v4, v7, v10, v13, v22, v0, v1
2121 FILTER_6TAG_8BITS_TO_16BITS1 v19, v4, v7, v10, v13, v16, v22, v0, v1
2137 FILTER_6TAG_8BITS_TO_16BITS1 v4, v7, v10, v13, v16, v19, v22, v0, v1
2145 ld1 {v2.8b, v3.8b, v4.8b}, [x0], x1 // v2=src[10*stride]
2153 FILTER_6TAG_8BITS_TO_16BITS1 v7, v10, v13, v16, v19, v4, v22, v0, v1
2176 mov v30.16b, v4.16b
2177 mov v4.16b, v10.16b
2193 FILTER_6TAG_8BITS_TO_16BITS1 v4, v7, v10, v13, v16, v19, v22, v0, v1
2227 ld1 {v4.16b}, [x0], x1 // v4=src[0*stride]
2237 FILTER_6TAG_8BITS_TO_16BITS1 v2, v3, v4, v5, v6, v7, v20, v0, v1
2238 FILTER_6TAG_8BITS_TO_16BITS2 v2, v3, v4, v5, v6, v7, v21, v0, v1
2249 FILTER_6TAG_8BITS_TO_16BITS1 v3, v4, v5, v6, v7, v2, v20, v0, v1
2250 FILTER_6TAG_8BITS_TO_16BITS2 v3, v4, v5, v6, v7, v2, v21, v0, v1
2261 FILTER_6TAG_8BITS_TO_16BITS1 v4, v5, v6, v7, v2, v3, v20, v0, v1
2262 FILTER_6TAG_8BITS_TO_16BITS2 v4, v5, v6, v7, v2, v3, v21, v0, v1
2271 ld1 {v4.16b}, [x0], x1 // v4=src[6*stride]
2273 FILTER_6TAG_8BITS_TO_16BITS1 v5, v6, v7, v2, v3, v4, v20, v0, v1
2274 FILTER_6TAG_8BITS_TO_16BITS2 v5, v6, v7, v2, v3, v4, v21, v0, v1
2287 mov v6.16b, v4.16b
2288 mov v4.16b, v30.16b
2296 FILTER_6TAG_8BITS_TO_16BITS1 v2, v3, v4, v5, v6, v7, v20, v0, v1
2297 FILTER_6TAG_8BITS_TO_16BITS2 v2, v3, v4, v5, v6, v7, v21, v0, v1
2327 ld1 {v4.16b}, [x0], x1 // v4=src[0*stride]
2337 FILTER_6TAG_8BITS_TO_16BITS1 v2, v3, v4, v5, v6, v7, v20, v0, v1
2338 FILTER_6TAG_8BITS_TO_16BITS2 v2, v3, v4, v5, v6, v7, v21, v0, v1
2348 FILTER_6TAG_8BITS_TO_16BITS1 v3, v4, v5, v6, v7, v2, v20, v0, v1
2349 FILTER_6TAG_8BITS_TO_16BITS2 v3, v4, v5, v6, v7, v2, v21, v0, v1
2359 FILTER_6TAG_8BITS_TO_16BITS1 v4, v5, v6, v7, v2, v3, v20, v0, v1
2360 FILTER_6TAG_8BITS_TO_16BITS2 v4, v5, v6, v7, v2, v3, v21, v0, v1
2368 ld1 {v4.16b}, [x0], x1 // v4=src[6*stride]
2370 FILTER_6TAG_8BITS_TO_16BITS1 v5, v6, v7, v2, v3, v4, v20, v0, v1
2371 FILTER_6TAG_8BITS_TO_16BITS2 v5, v6, v7, v2, v3, v4, v21, v0, v1
2383 mov v6.16b, v4.16b
2384 mov v4.16b, v30.16b
2392 FILTER_6TAG_8BITS_TO_16BITS1 v2, v3, v4, v5, v6, v7, v20, v0, v1
2393 FILTER_6TAG_8BITS_TO_16BITS2 v2, v3, v4, v5, v6, v7, v21, v0, v1
2418 ld1 {v4.16b}, [x0], x1 // v4=src[0*stride]
2428 FILTER_6TAG_8BITS1 v2, v3, v4, v5, v6, v7, v20, v0, v1
2429 FILTER_6TAG_8BITS2 v2, v3, v4, v5, v6, v7, v20, v0, v1
2435 FILTER_6TAG_8BITS1 v3, v4, v5, v6, v7, v2, v20, v0, v1
2436 FILTER_6TAG_8BITS2 v3, v4, v5, v6, v7, v2, v20, v0, v1
2442 FILTER_6TAG_8BITS1 v4, v5, v6, v7, v2, v3, v20, v0, v1
2443 FILTER_6TAG_8BITS2 v4, v5, v6, v7, v2, v3, v20, v0, v1
2448 ld1 {v4.16b}, [x0], x1 // v4=src[6*stride]
2449 FILTER_6TAG_8BITS1 v5, v6, v7, v2, v3, v4, v20, v0, v1
2450 FILTER_6TAG_8BITS2 v5, v6, v7, v2, v3, v4, v20, v0, v1
2456 FILTER_6TAG_8BITS1 v6, v7, v2, v3, v4, v5, v20, v0, v1
2457 FILTER_6TAG_8BITS2 v6, v7, v2, v3, v4, v5, v20, v0, v1
2463 FILTER_6TAG_8BITS1 v7, v2, v3, v4, v5, v6, v20, v0, v1
2464 FILTER_6TAG_8BITS2 v7, v2, v3, v4, v5, v6, v20, v0, v1
2469 FILTER_6TAG_8BITS1 v2, v3, v4, v5, v6, v7, v20, v0, v1
2470 FILTER_6TAG_8BITS2 v2, v3, v4, v5, v6, v7, v20, v0, v1
2475 FILTER_6TAG_8BITS1 v3, v4, v5, v6, v7, v2, v20, v0, v1
2476 FILTER_6TAG_8BITS2 v3, v4, v5, v6, v7, v2, v20, v0, v1
2482 mov v2.16b, v4.16b
2483 mov v4.16b, v6.16b
2490 FILTER_6TAG_8BITS1 v2, v3, v4, v5, v6, v7, v20, v0, v1
2491 FILTER_6TAG_8BITS2 v2, v3, v4, v5, v6, v7, v20, v0, v1
2511 ld1 {v4.8b}, [x0], x1 // v4=src[0*stride]
2520 FILTER_6TAG_8BITS1 v2, v3, v4, v5, v6, v7, v20, v0, v1
2525 FILTER_6TAG_8BITS1 v3, v4, v5, v6, v7, v2, v20, v0, v1
2530 FILTER_6TAG_8BITS1 v4, v5, v6, v7, v2, v3, v20, v0, v1
2534 ld1 {v4.8b}, [x0], x1 // v4=src[6*stride]
2535 FILTER_6TAG_8BITS1 v5, v6, v7, v2, v3, v4, v20, v0, v1
2542 mov v6.16b, v4.16b
2543 mov v4.16b, v7.16b
2549 FILTER_6TAG_8BITS1 v2, v3, v4, v5, v6, v7, v20, v0, v1
2570 ld1 {v4.8b}, [x0], x1 // v4=src[0*stride]
2579 FILTER_6TAG_8BITS1 v2, v3, v4, v5, v6, v7, v20, v0, v1
2584 FILTER_6TAG_8BITS1 v3, v4, v5, v6, v7, v2, v20, v0, v1
2589 FILTER_6TAG_8BITS1 v4, v5, v6, v7, v2, v3, v20, v0, v1
2593 ld1 {v4.8b}, [x0], x1 // v4=src[6*stride]
2594 FILTER_6TAG_8BITS1 v5, v6, v7, v2, v3, v4, v20, v0, v1
2601 mov v6.16b, v4.16b
2602 mov v4.16b, v7.16b
2608 FILTER_6TAG_8BITS1 v2, v3, v4, v5, v6, v7, v20, v0, v1