Lines Matching refs:va0
64 const int8x8_t va0 = vld1_s8(a0); a0 += 8; in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup() local
83 …prod0x0123c0 = vmull_s8(vb0123c0, vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va0), 0))); in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup()
84 …prod0x0123c1 = vmull_s8(vb0123c1, vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va0), 1))); in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup()
85 …prod0x0123c2 = vmull_s8(vb0123c2, vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va0), 2))); in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup()
86 …prod0x0123c3 = vmull_s8(vb0123c3, vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va0), 3))); in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup()
91 …prod0x4567c0 = vmull_s8(vb4567c0, vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va0), 0))); in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup()
92 …prod0x4567c1 = vmull_s8(vb4567c1, vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va0), 1))); in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup()
93 …prod0x4567c2 = vmull_s8(vb4567c2, vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va0), 2))); in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup()
94 …prod0x4567c3 = vmull_s8(vb4567c3, vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va0), 3))); in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup()
99 …prod0x89ABc0 = vmull_s8(vb89ABc0, vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va0), 0))); in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup()
100 …prod0x89ABc1 = vmull_s8(vb89ABc1, vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va0), 1))); in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup()
101 …prod0x89ABc2 = vmull_s8(vb89ABc2, vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va0), 2))); in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup()
102 …prod0x89ABc3 = vmull_s8(vb89ABc3, vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va0), 3))); in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup()
107 …prod0xCDEFc0 = vmull_s8(vbCDEFc0, vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va0), 0))); in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup()
108 …prod0xCDEFc1 = vmull_s8(vbCDEFc1, vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va0), 1))); in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup()
109 …prod0xCDEFc2 = vmull_s8(vbCDEFc2, vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va0), 2))); in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup()
110 …prod0xCDEFc3 = vmull_s8(vbCDEFc3, vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va0), 3))); in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup()
120 const int8x8_t va0 = vld1_s8(a0); a0 = (const int8_t*) ((uintptr_t) a0 + k); in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup() local
127 …prod0x0123c0 = vmull_s8(vb0123c0, vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va0), 0))); in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup()
129 …prod0x4567c0 = vmull_s8(vb4567c0, vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va0), 0))); in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup()
131 …prod0x89ABc0 = vmull_s8(vb89ABc0, vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va0), 0))); in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup()
133 …prod0xCDEFc0 = vmull_s8(vbCDEFc0, vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va0), 0))); in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup()
142 …prod0x0123c1 = vmull_s8(vb0123c1, vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va0), 1))); in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup()
144 …prod0x4567c1 = vmull_s8(vb4567c1, vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va0), 1))); in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup()
146 …prod0x89ABc1 = vmull_s8(vb89ABc1, vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va0), 1))); in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup()
148 …prod0xCDEFc1 = vmull_s8(vbCDEFc1, vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va0), 1))); in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup()
157 …prod0x0123c2 = vmull_s8(vb0123c2, vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va0), 2))); in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup()
159 …prod0x4567c2 = vmull_s8(vb4567c2, vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va0), 2))); in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup()
161 …prod0x89ABc2 = vmull_s8(vb89ABc2, vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va0), 2))); in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup()
163 …prod0xCDEFc2 = vmull_s8(vbCDEFc2, vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va0), 2))); in xnn_qs8_igemm_minmax_ukernel_1x16c2__neon_mull_padal_dup()