/external/XNNPACK/src/qu8-gemm/gen/ |
D | 4x8c4-minmax-rndnu-neondot.c | 78 uint32x2_t vnacc3 = vmov_n_u32(0); in xnn_qu8_gemm_minmax_rndnu_ukernel_4x8c4__neondot() local 112 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_gemm_minmax_rndnu_ukernel_4x8c4__neondot() 142 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_gemm_minmax_rndnu_ukernel_4x8c4__neondot() 160 vnacc3 = vpadd_u32(vnacc3, vnacc3); in xnn_qu8_gemm_minmax_rndnu_ukernel_4x8c4__neondot() 161 const uint32x4_t vnacc3x0123 = vcombine_u32(vnacc3, vnacc3); in xnn_qu8_gemm_minmax_rndnu_ukernel_4x8c4__neondot()
|
D | 5x8c4-minmax-rndnu-neondot.c | 86 uint32x2_t vnacc3 = vmov_n_u32(0); in xnn_qu8_gemm_minmax_rndnu_ukernel_5x8c4__neondot() local 122 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_gemm_minmax_rndnu_ukernel_5x8c4__neondot() 158 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_gemm_minmax_rndnu_ukernel_5x8c4__neondot() 179 vnacc3 = vpadd_u32(vnacc3, vnacc3); in xnn_qu8_gemm_minmax_rndnu_ukernel_5x8c4__neondot() 180 const uint32x4_t vnacc3x0123 = vcombine_u32(vnacc3, vnacc3); in xnn_qu8_gemm_minmax_rndnu_ukernel_5x8c4__neondot()
|
D | 6x8c4-minmax-rndnu-neondot.c | 94 uint32x2_t vnacc3 = vmov_n_u32(0); in xnn_qu8_gemm_minmax_rndnu_ukernel_6x8c4__neondot() local 132 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_gemm_minmax_rndnu_ukernel_6x8c4__neondot() 174 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_gemm_minmax_rndnu_ukernel_6x8c4__neondot() 198 vnacc3 = vpadd_u32(vnacc3, vnacc3); in xnn_qu8_gemm_minmax_rndnu_ukernel_6x8c4__neondot() 199 const uint32x4_t vnacc3x0123 = vcombine_u32(vnacc3, vnacc3); in xnn_qu8_gemm_minmax_rndnu_ukernel_6x8c4__neondot()
|
D | 4x16c4-minmax-fp32-neondot.c | 87 uint32x2_t vnacc3 = vmov_n_u32(0); in xnn_qu8_gemm_minmax_fp32_ukernel_4x16c4__neondot() local 137 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_gemm_minmax_fp32_ukernel_4x16c4__neondot() 179 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_gemm_minmax_fp32_ukernel_4x16c4__neondot() 205 vnacc3 = vpadd_u32(vnacc3, vnacc3); in xnn_qu8_gemm_minmax_fp32_ukernel_4x16c4__neondot() 206 const uint32x4_t vnacc3x0123 = vcombine_u32(vnacc3, vnacc3); in xnn_qu8_gemm_minmax_fp32_ukernel_4x16c4__neondot()
|
D | 4x16c4-minmax-rndnu-neondot.c | 86 uint32x2_t vnacc3 = vmov_n_u32(0); in xnn_qu8_gemm_minmax_rndnu_ukernel_4x16c4__neondot() local 136 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_gemm_minmax_rndnu_ukernel_4x16c4__neondot() 178 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_gemm_minmax_rndnu_ukernel_4x16c4__neondot() 204 vnacc3 = vpadd_u32(vnacc3, vnacc3); in xnn_qu8_gemm_minmax_rndnu_ukernel_4x16c4__neondot() 205 const uint32x4_t vnacc3x0123 = vcombine_u32(vnacc3, vnacc3); in xnn_qu8_gemm_minmax_rndnu_ukernel_4x16c4__neondot()
|
D | 8x8c4-minmax-rndnu-neondot.c | 110 uint32x2_t vnacc3 = vmov_n_u32(0); in xnn_qu8_gemm_minmax_rndnu_ukernel_8x8c4__neondot() local 152 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_gemm_minmax_rndnu_ukernel_8x8c4__neondot() 206 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_gemm_minmax_rndnu_ukernel_8x8c4__neondot() 236 vnacc3 = vpadd_u32(vnacc3, vnacc3); in xnn_qu8_gemm_minmax_rndnu_ukernel_8x8c4__neondot() 237 const uint32x4_t vnacc3x0123 = vcombine_u32(vnacc3, vnacc3); in xnn_qu8_gemm_minmax_rndnu_ukernel_8x8c4__neondot()
|
D | 5x16c4-minmax-rndnu-neondot.c | 96 uint32x2_t vnacc3 = vmov_n_u32(0); in xnn_qu8_gemm_minmax_rndnu_ukernel_5x16c4__neondot() local 148 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_gemm_minmax_rndnu_ukernel_5x16c4__neondot() 200 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_gemm_minmax_rndnu_ukernel_5x16c4__neondot() 231 vnacc3 = vpadd_u32(vnacc3, vnacc3); in xnn_qu8_gemm_minmax_rndnu_ukernel_5x16c4__neondot() 232 const uint32x4_t vnacc3x0123 = vcombine_u32(vnacc3, vnacc3); in xnn_qu8_gemm_minmax_rndnu_ukernel_5x16c4__neondot()
|
D | 6x16c4-minmax-rndnu-neondot.c | 106 uint32x2_t vnacc3 = vmov_n_u32(0); in xnn_qu8_gemm_minmax_rndnu_ukernel_6x16c4__neondot() local 160 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_gemm_minmax_rndnu_ukernel_6x16c4__neondot() 222 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_gemm_minmax_rndnu_ukernel_6x16c4__neondot() 258 vnacc3 = vpadd_u32(vnacc3, vnacc3); in xnn_qu8_gemm_minmax_rndnu_ukernel_6x16c4__neondot() 259 const uint32x4_t vnacc3x0123 = vcombine_u32(vnacc3, vnacc3); in xnn_qu8_gemm_minmax_rndnu_ukernel_6x16c4__neondot()
|
D | 8x16c4-minmax-rndnu-neondot.c | 126 uint32x2_t vnacc3 = vmov_n_u32(0); in xnn_qu8_gemm_minmax_rndnu_ukernel_8x16c4__neondot() local 184 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_gemm_minmax_rndnu_ukernel_8x16c4__neondot() 266 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_gemm_minmax_rndnu_ukernel_8x16c4__neondot() 312 vnacc3 = vpadd_u32(vnacc3, vnacc3); in xnn_qu8_gemm_minmax_rndnu_ukernel_8x16c4__neondot() 313 const uint32x4_t vnacc3x0123 = vcombine_u32(vnacc3, vnacc3); in xnn_qu8_gemm_minmax_rndnu_ukernel_8x16c4__neondot()
|
/external/XNNPACK/src/qu8-igemm/gen/ |
D | 4x8c4-minmax-rndnu-neondot.c | 74 uint32x2_t vnacc3 = vmov_n_u32(0); in xnn_qu8_igemm_minmax_rndnu_ukernel_4x8c4__neondot() local 128 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_igemm_minmax_rndnu_ukernel_4x8c4__neondot() 158 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_igemm_minmax_rndnu_ukernel_4x8c4__neondot() 178 vnacc3 = vpadd_u32(vnacc3, vnacc3); in xnn_qu8_igemm_minmax_rndnu_ukernel_4x8c4__neondot() 179 const uint32x4_t vnacc3x0123 = vcombine_u32(vnacc3, vnacc3); in xnn_qu8_igemm_minmax_rndnu_ukernel_4x8c4__neondot()
|
D | 5x8c4-minmax-rndnu-neondot.c | 80 uint32x2_t vnacc3 = vmov_n_u32(0); in xnn_qu8_igemm_minmax_rndnu_ukernel_5x8c4__neondot() local 140 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_igemm_minmax_rndnu_ukernel_5x8c4__neondot() 176 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_igemm_minmax_rndnu_ukernel_5x8c4__neondot() 199 vnacc3 = vpadd_u32(vnacc3, vnacc3); in xnn_qu8_igemm_minmax_rndnu_ukernel_5x8c4__neondot() 200 const uint32x4_t vnacc3x0123 = vcombine_u32(vnacc3, vnacc3); in xnn_qu8_igemm_minmax_rndnu_ukernel_5x8c4__neondot()
|
D | 6x8c4-minmax-rndnu-neondot.c | 86 uint32x2_t vnacc3 = vmov_n_u32(0); in xnn_qu8_igemm_minmax_rndnu_ukernel_6x8c4__neondot() local 152 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_igemm_minmax_rndnu_ukernel_6x8c4__neondot() 194 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_igemm_minmax_rndnu_ukernel_6x8c4__neondot() 220 vnacc3 = vpadd_u32(vnacc3, vnacc3); in xnn_qu8_igemm_minmax_rndnu_ukernel_6x8c4__neondot() 221 const uint32x4_t vnacc3x0123 = vcombine_u32(vnacc3, vnacc3); in xnn_qu8_igemm_minmax_rndnu_ukernel_6x8c4__neondot()
|
D | 4x16c4-minmax-fp32-neondot.c | 83 uint32x2_t vnacc3 = vmov_n_u32(0); in xnn_qu8_igemm_minmax_fp32_ukernel_4x16c4__neondot() local 153 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_igemm_minmax_fp32_ukernel_4x16c4__neondot() 195 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_igemm_minmax_fp32_ukernel_4x16c4__neondot() 223 vnacc3 = vpadd_u32(vnacc3, vnacc3); in xnn_qu8_igemm_minmax_fp32_ukernel_4x16c4__neondot() 224 const uint32x4_t vnacc3x0123 = vcombine_u32(vnacc3, vnacc3); in xnn_qu8_igemm_minmax_fp32_ukernel_4x16c4__neondot()
|
D | 4x16c4-minmax-rndnu-neondot.c | 82 uint32x2_t vnacc3 = vmov_n_u32(0); in xnn_qu8_igemm_minmax_rndnu_ukernel_4x16c4__neondot() local 152 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_igemm_minmax_rndnu_ukernel_4x16c4__neondot() 194 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_igemm_minmax_rndnu_ukernel_4x16c4__neondot() 222 vnacc3 = vpadd_u32(vnacc3, vnacc3); in xnn_qu8_igemm_minmax_rndnu_ukernel_4x16c4__neondot() 223 const uint32x4_t vnacc3x0123 = vcombine_u32(vnacc3, vnacc3); in xnn_qu8_igemm_minmax_rndnu_ukernel_4x16c4__neondot()
|
D | 8x8c4-minmax-rndnu-neondot.c | 98 uint32x2_t vnacc3 = vmov_n_u32(0); in xnn_qu8_igemm_minmax_rndnu_ukernel_8x8c4__neondot() local 176 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_igemm_minmax_rndnu_ukernel_8x8c4__neondot() 230 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_igemm_minmax_rndnu_ukernel_8x8c4__neondot() 262 vnacc3 = vpadd_u32(vnacc3, vnacc3); in xnn_qu8_igemm_minmax_rndnu_ukernel_8x8c4__neondot() 263 const uint32x4_t vnacc3x0123 = vcombine_u32(vnacc3, vnacc3); in xnn_qu8_igemm_minmax_rndnu_ukernel_8x8c4__neondot()
|
D | 5x16c4-minmax-rndnu-neondot.c | 90 uint32x2_t vnacc3 = vmov_n_u32(0); in xnn_qu8_igemm_minmax_rndnu_ukernel_5x16c4__neondot() local 166 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_igemm_minmax_rndnu_ukernel_5x16c4__neondot() 218 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_igemm_minmax_rndnu_ukernel_5x16c4__neondot() 251 vnacc3 = vpadd_u32(vnacc3, vnacc3); in xnn_qu8_igemm_minmax_rndnu_ukernel_5x16c4__neondot() 252 const uint32x4_t vnacc3x0123 = vcombine_u32(vnacc3, vnacc3); in xnn_qu8_igemm_minmax_rndnu_ukernel_5x16c4__neondot()
|
D | 6x16c4-minmax-rndnu-neondot.c | 98 uint32x2_t vnacc3 = vmov_n_u32(0); in xnn_qu8_igemm_minmax_rndnu_ukernel_6x16c4__neondot() local 180 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_igemm_minmax_rndnu_ukernel_6x16c4__neondot() 242 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_igemm_minmax_rndnu_ukernel_6x16c4__neondot() 280 vnacc3 = vpadd_u32(vnacc3, vnacc3); in xnn_qu8_igemm_minmax_rndnu_ukernel_6x16c4__neondot() 281 const uint32x4_t vnacc3x0123 = vcombine_u32(vnacc3, vnacc3); in xnn_qu8_igemm_minmax_rndnu_ukernel_6x16c4__neondot()
|
D | 8x16c4-minmax-rndnu-neondot.c | 114 uint32x2_t vnacc3 = vmov_n_u32(0); in xnn_qu8_igemm_minmax_rndnu_ukernel_8x16c4__neondot() local 208 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_igemm_minmax_rndnu_ukernel_8x16c4__neondot() 290 vnacc3 = vdot_u32(vnacc3, va_zero_point, va3x01234567); in xnn_qu8_igemm_minmax_rndnu_ukernel_8x16c4__neondot() 338 vnacc3 = vpadd_u32(vnacc3, vnacc3); in xnn_qu8_igemm_minmax_rndnu_ukernel_8x16c4__neondot() 339 const uint32x4_t vnacc3x0123 = vcombine_u32(vnacc3, vnacc3); in xnn_qu8_igemm_minmax_rndnu_ukernel_8x16c4__neondot()
|