Lines Matching refs:H
43 ld1 {v5.8H}, [x16], #16 // load 8x16-bit filter values, part 1
45 ld1 {v7.8H}, [x12], #16 // load 8x16-bit at filter+filterSize
46 uxtl v4.8H, v4.8B // unpack part 1 to 16-bit
47 …smlal v0.4S, v4.4H, v5.4H // v0 accumulates srcp[filterPos[0] + {0..3}] * fi…
48 …smlal2 v0.4S, v4.8H, v5.8H // v0 accumulates srcp[filterPos[0] + {4..7}] * fi…
50 ld1 {v17.8H}, [x13], #16 // load 8x16-bit at filter+2*filterSize
51 uxtl v6.8H, v6.8B // unpack part 2 to 16-bit
52 …smlal v1.4S, v6.4H, v7.4H // v1 accumulates srcp[filterPos[1] + {0..3}] * fi…
53 uxtl v16.8H, v16.8B // unpack part 3 to 16-bit
54 …smlal v2.4S, v16.4H, v17.4H // v2 accumulates srcp[filterPos[2] + {0..3}] * fi…
55 …smlal2 v2.4S, v16.8H, v17.8H // v2 accumulates srcp[filterPos[2] + {4..7}] * fi…
57 …smlal2 v1.4S, v6.8H, v7.8H // v1 accumulates srcp[filterPos[1] + {4..7}] * fi…
58 ld1 {v19.8H}, [x4], #16 // load 8x16-bit at filter+3*filterSize
60 uxtl v18.8H, v18.8B // unpack part 4 to 16-bit
61 …smlal v3.4S, v18.4H, v19.4H // v3 accumulates srcp[filterPos[3] + {0..3}] * fi…
62 …smlal2 v3.4S, v18.8H, v19.8H // v3 accumulates srcp[filterPos[3] + {4..7}] * fi…
76 sqshrn v0.4H, v0.4S, #7 // shift and clip the 4x16-bit final values
77 st1 {v0.4H}, [x1], #8 // write to destination part0123