Home
last modified time | relevance | path

Searched refs:vprod0x0 (Results 1 – 25 of 63) sorted by relevance

123

/external/XNNPACK/src/qs8-gemm/gen/
D1x8c8-minmax-neon-mlal-padal.c69 int16x8_t vprod0x0 = vmull_s8(vb0x0, va0x0); in xnn_qs8_gemm_minmax_ukernel_1x8c8__neon_mlal_padal() local
70 vprod0x0 = vmlal_s8(vprod0x0, vb0x1, va0x1); in xnn_qs8_gemm_minmax_ukernel_1x8c8__neon_mlal_padal()
71 vacc0x0 = vpadalq_s16(vacc0x0, vprod0x0); in xnn_qs8_gemm_minmax_ukernel_1x8c8__neon_mlal_padal()
109 const int16x8_t vprod0x0 = vmull_s8(vb0, va0); in xnn_qs8_gemm_minmax_ukernel_1x8c8__neon_mlal_padal() local
110 vacc0x0 = vpadalq_s16(vacc0x0, vprod0x0); in xnn_qs8_gemm_minmax_ukernel_1x8c8__neon_mlal_padal()
D1x4c8-minmax-wasmsimd-ld64.c58 const v128_t vprod0x0 = wasm_i16x8_mul(vxa0, vxb0); in xnn_qs8_gemm_minmax_ukernel_1x4c8__wasmsimd_ld64() local
59 vacc0x0 = wasm_i32x4_add(vacc0x0, wasm_i32x4_widen_low_i16x8(vprod0x0)); in xnn_qs8_gemm_minmax_ukernel_1x4c8__wasmsimd_ld64()
60 vacc0x0 = wasm_i32x4_add(vacc0x0, wasm_i32x4_widen_high_i16x8(vprod0x0)); in xnn_qs8_gemm_minmax_ukernel_1x4c8__wasmsimd_ld64()
D1x4c8-minmax-wasmsimd-ld128.c60 const v128_t vprod0x0 = wasm_i16x8_mul(vxb0, vxa0); in xnn_qs8_gemm_minmax_ukernel_1x4c8__wasmsimd_ld128() local
61 vacc0x0 = wasm_i32x4_add(vacc0x0, wasm_i32x4_widen_low_i16x8(vprod0x0)); in xnn_qs8_gemm_minmax_ukernel_1x4c8__wasmsimd_ld128()
65 vacc0x0 = wasm_i32x4_add(vacc0x0, wasm_i32x4_widen_high_i16x8(vprod0x0)); in xnn_qs8_gemm_minmax_ukernel_1x4c8__wasmsimd_ld128()
D1x4c8-xw-minmax-wasmsimd.c58 const v128_t vprod0x0 = wasm_i16x8_mul(vxa0, vxb0); in xnn_qs8_gemm_xw_minmax_ukernel_1x4c8__wasmsimd() local
59 vacc0x0 = wasm_i32x4_add(vacc0x0, wasm_i32x4_widen_low_i16x8(vprod0x0)); in xnn_qs8_gemm_xw_minmax_ukernel_1x4c8__wasmsimd()
60 vacc0x0 = wasm_i32x4_add(vacc0x0, wasm_i32x4_widen_high_i16x8(vprod0x0)); in xnn_qs8_gemm_xw_minmax_ukernel_1x4c8__wasmsimd()
D1x8c16-minmax-neon-mlal-padal.c67 int16x8_t vprod0x0 = vmull_s8(vget_low_s8(vb0), vget_low_s8(va0)); in xnn_qs8_gemm_minmax_ukernel_1x8c16__neon_mlal_padal() local
68 vprod0x0 = vmlal_s8(vprod0x0, vget_high_s8(vb0), vget_high_s8(va0)); in xnn_qs8_gemm_minmax_ukernel_1x8c16__neon_mlal_padal()
69 vacc0x0 = vpadalq_s16(vacc0x0, vprod0x0); in xnn_qs8_gemm_minmax_ukernel_1x8c16__neon_mlal_padal()
D2x8c8-minmax-neon-mlal-padal.c85 int16x8_t vprod0x0 = vmull_s8(vb0x0, va0x0); in xnn_qs8_gemm_minmax_ukernel_2x8c8__neon_mlal_padal() local
87 vprod0x0 = vmlal_s8(vprod0x0, vb0x1, va0x1); in xnn_qs8_gemm_minmax_ukernel_2x8c8__neon_mlal_padal()
89 vacc0x0 = vpadalq_s16(vacc0x0, vprod0x0); in xnn_qs8_gemm_minmax_ukernel_2x8c8__neon_mlal_padal()
150 const int16x8_t vprod0x0 = vmull_s8(vb0, va0); in xnn_qs8_gemm_minmax_ukernel_2x8c8__neon_mlal_padal() local
152 vacc0x0 = vpadalq_s16(vacc0x0, vprod0x0); in xnn_qs8_gemm_minmax_ukernel_2x8c8__neon_mlal_padal()
D2x4c8-xw-minmax-wasmsimd.c70 const v128_t vprod0x0 = wasm_i16x8_mul(vxa0, vxb0); in xnn_qs8_gemm_xw_minmax_ukernel_2x4c8__wasmsimd() local
71 vacc0x0 = wasm_i32x4_add(vacc0x0, wasm_i32x4_widen_low_i16x8(vprod0x0)); in xnn_qs8_gemm_xw_minmax_ukernel_2x4c8__wasmsimd()
72 vacc0x0 = wasm_i32x4_add(vacc0x0, wasm_i32x4_widen_high_i16x8(vprod0x0)); in xnn_qs8_gemm_xw_minmax_ukernel_2x4c8__wasmsimd()
D2x4c8-minmax-wasmsimd-ld128.c72 const v128_t vprod0x0 = wasm_i16x8_mul(vxb0, vxa0); in xnn_qs8_gemm_minmax_ukernel_2x4c8__wasmsimd_ld128() local
73 vacc0x0 = wasm_i32x4_add(vacc0x0, wasm_i32x4_widen_low_i16x8(vprod0x0)); in xnn_qs8_gemm_minmax_ukernel_2x4c8__wasmsimd_ld128()
79 vacc0x0 = wasm_i32x4_add(vacc0x0, wasm_i32x4_widen_high_i16x8(vprod0x0)); in xnn_qs8_gemm_minmax_ukernel_2x4c8__wasmsimd_ld128()
D2x4c8-minmax-wasmsimd-ld64.c70 const v128_t vprod0x0 = wasm_i16x8_mul(vxa0, vxb0); in xnn_qs8_gemm_minmax_ukernel_2x4c8__wasmsimd_ld64() local
71 vacc0x0 = wasm_i32x4_add(vacc0x0, wasm_i32x4_widen_low_i16x8(vprod0x0)); in xnn_qs8_gemm_minmax_ukernel_2x4c8__wasmsimd_ld64()
72 vacc0x0 = wasm_i32x4_add(vacc0x0, wasm_i32x4_widen_high_i16x8(vprod0x0)); in xnn_qs8_gemm_minmax_ukernel_2x4c8__wasmsimd_ld64()
D1x16c8-minmax-neon-mlal-padal.c85 int16x8_t vprod0x0 = vmull_s8(vb0x0, va0x0); in xnn_qs8_gemm_minmax_ukernel_1x16c8__neon_mlal_padal() local
86 vprod0x0 = vmlal_s8(vprod0x0, vb0x1, va0x1); in xnn_qs8_gemm_minmax_ukernel_1x16c8__neon_mlal_padal()
87 vacc0x0 = vpadalq_s16(vacc0x0, vprod0x0); in xnn_qs8_gemm_minmax_ukernel_1x16c8__neon_mlal_padal()
157 const int16x8_t vprod0x0 = vmull_s8(vb0, va0); in xnn_qs8_gemm_minmax_ukernel_1x16c8__neon_mlal_padal() local
158 vacc0x0 = vpadalq_s16(vacc0x0, vprod0x0); in xnn_qs8_gemm_minmax_ukernel_1x16c8__neon_mlal_padal()
D3x8c8-minmax-neon-mlal-padal.c101 int16x8_t vprod0x0 = vmull_s8(vb0x0, va0x0); in xnn_qs8_gemm_minmax_ukernel_3x8c8__neon_mlal_padal() local
104 vprod0x0 = vmlal_s8(vprod0x0, vb0x1, va0x1); in xnn_qs8_gemm_minmax_ukernel_3x8c8__neon_mlal_padal()
107 vacc0x0 = vpadalq_s16(vacc0x0, vprod0x0); in xnn_qs8_gemm_minmax_ukernel_3x8c8__neon_mlal_padal()
191 const int16x8_t vprod0x0 = vmull_s8(vb0, va0); in xnn_qs8_gemm_minmax_ukernel_3x8c8__neon_mlal_padal() local
194 vacc0x0 = vpadalq_s16(vacc0x0, vprod0x0); in xnn_qs8_gemm_minmax_ukernel_3x8c8__neon_mlal_padal()
D2x8c16-minmax-neon-mlal-padal.c82 int16x8_t vprod0x0 = vmull_s8(vget_low_s8(vb0), vget_low_s8(va0)); in xnn_qs8_gemm_minmax_ukernel_2x8c16__neon_mlal_padal() local
84 vprod0x0 = vmlal_s8(vprod0x0, vget_high_s8(vb0), vget_high_s8(va0)); in xnn_qs8_gemm_minmax_ukernel_2x8c16__neon_mlal_padal()
86 vacc0x0 = vpadalq_s16(vacc0x0, vprod0x0); in xnn_qs8_gemm_minmax_ukernel_2x8c16__neon_mlal_padal()
D3x4c8-xw-minmax-wasmsimd.c82 const v128_t vprod0x0 = wasm_i16x8_mul(vxa0, vxb0); in xnn_qs8_gemm_xw_minmax_ukernel_3x4c8__wasmsimd() local
83 vacc0x0 = wasm_i32x4_add(vacc0x0, wasm_i32x4_widen_low_i16x8(vprod0x0)); in xnn_qs8_gemm_xw_minmax_ukernel_3x4c8__wasmsimd()
84 vacc0x0 = wasm_i32x4_add(vacc0x0, wasm_i32x4_widen_high_i16x8(vprod0x0)); in xnn_qs8_gemm_xw_minmax_ukernel_3x4c8__wasmsimd()
D3x4c8-minmax-wasmsimd-ld128.c84 const v128_t vprod0x0 = wasm_i16x8_mul(vxb0, vxa0); in xnn_qs8_gemm_minmax_ukernel_3x4c8__wasmsimd_ld128() local
85 vacc0x0 = wasm_i32x4_add(vacc0x0, wasm_i32x4_widen_low_i16x8(vprod0x0)); in xnn_qs8_gemm_minmax_ukernel_3x4c8__wasmsimd_ld128()
93 vacc0x0 = wasm_i32x4_add(vacc0x0, wasm_i32x4_widen_high_i16x8(vprod0x0)); in xnn_qs8_gemm_minmax_ukernel_3x4c8__wasmsimd_ld128()
/external/XNNPACK/src/qs8-igemm/gen/
D1x8c8-minmax-neon-mlal-padal.c80 int16x8_t vprod0x0 = vmull_s8(vb0x0, va0x0); in xnn_qs8_igemm_minmax_ukernel_1x8c8__neon_mlal_padal() local
81 vprod0x0 = vmlal_s8(vprod0x0, vb0x1, va0x1); in xnn_qs8_igemm_minmax_ukernel_1x8c8__neon_mlal_padal()
82 vacc0x0 = vpadalq_s16(vacc0x0, vprod0x0); in xnn_qs8_igemm_minmax_ukernel_1x8c8__neon_mlal_padal()
120 const int16x8_t vprod0x0 = vmull_s8(vb0, va0); in xnn_qs8_igemm_minmax_ukernel_1x8c8__neon_mlal_padal() local
121 vacc0x0 = vpadalq_s16(vacc0x0, vprod0x0); in xnn_qs8_igemm_minmax_ukernel_1x8c8__neon_mlal_padal()
D1x4c8-minmax-wasmsimd-ld64.c69 const v128_t vprod0x0 = wasm_i16x8_mul(vxa0, vxb0); in xnn_qs8_igemm_minmax_ukernel_1x4c8__wasmsimd_ld64() local
70 vacc0x0 = wasm_i32x4_add(vacc0x0, wasm_i32x4_widen_low_i16x8(vprod0x0)); in xnn_qs8_igemm_minmax_ukernel_1x4c8__wasmsimd_ld64()
71 vacc0x0 = wasm_i32x4_add(vacc0x0, wasm_i32x4_widen_high_i16x8(vprod0x0)); in xnn_qs8_igemm_minmax_ukernel_1x4c8__wasmsimd_ld64()
D1x4c8-minmax-wasmsimd-ld128.c71 const v128_t vprod0x0 = wasm_i16x8_mul(vxb0, vxa0); in xnn_qs8_igemm_minmax_ukernel_1x4c8__wasmsimd_ld128() local
72 vacc0x0 = wasm_i32x4_add(vacc0x0, wasm_i32x4_widen_low_i16x8(vprod0x0)); in xnn_qs8_igemm_minmax_ukernel_1x4c8__wasmsimd_ld128()
76 vacc0x0 = wasm_i32x4_add(vacc0x0, wasm_i32x4_widen_high_i16x8(vprod0x0)); in xnn_qs8_igemm_minmax_ukernel_1x4c8__wasmsimd_ld128()
D1x8c16-minmax-neon-mlal-padal.c78 int16x8_t vprod0x0 = vmull_s8(vget_low_s8(vb0), vget_low_s8(va0)); in xnn_qs8_igemm_minmax_ukernel_1x8c16__neon_mlal_padal() local
79 vprod0x0 = vmlal_s8(vprod0x0, vget_high_s8(vb0), vget_high_s8(va0)); in xnn_qs8_igemm_minmax_ukernel_1x8c16__neon_mlal_padal()
80 vacc0x0 = vpadalq_s16(vacc0x0, vprod0x0); in xnn_qs8_igemm_minmax_ukernel_1x8c16__neon_mlal_padal()
D2x8c8-minmax-neon-mlal-padal.c98 int16x8_t vprod0x0 = vmull_s8(vb0x0, va0x0); in xnn_qs8_igemm_minmax_ukernel_2x8c8__neon_mlal_padal() local
100 vprod0x0 = vmlal_s8(vprod0x0, vb0x1, va0x1); in xnn_qs8_igemm_minmax_ukernel_2x8c8__neon_mlal_padal()
102 vacc0x0 = vpadalq_s16(vacc0x0, vprod0x0); in xnn_qs8_igemm_minmax_ukernel_2x8c8__neon_mlal_padal()
163 const int16x8_t vprod0x0 = vmull_s8(vb0, va0); in xnn_qs8_igemm_minmax_ukernel_2x8c8__neon_mlal_padal() local
165 vacc0x0 = vpadalq_s16(vacc0x0, vprod0x0); in xnn_qs8_igemm_minmax_ukernel_2x8c8__neon_mlal_padal()
D2x4c8-minmax-wasmsimd-ld128.c85 const v128_t vprod0x0 = wasm_i16x8_mul(vxb0, vxa0); in xnn_qs8_igemm_minmax_ukernel_2x4c8__wasmsimd_ld128() local
86 vacc0x0 = wasm_i32x4_add(vacc0x0, wasm_i32x4_widen_low_i16x8(vprod0x0)); in xnn_qs8_igemm_minmax_ukernel_2x4c8__wasmsimd_ld128()
92 vacc0x0 = wasm_i32x4_add(vacc0x0, wasm_i32x4_widen_high_i16x8(vprod0x0)); in xnn_qs8_igemm_minmax_ukernel_2x4c8__wasmsimd_ld128()
D2x4c8-minmax-wasmsimd-ld64.c83 const v128_t vprod0x0 = wasm_i16x8_mul(vxa0, vxb0); in xnn_qs8_igemm_minmax_ukernel_2x4c8__wasmsimd_ld64() local
84 vacc0x0 = wasm_i32x4_add(vacc0x0, wasm_i32x4_widen_low_i16x8(vprod0x0)); in xnn_qs8_igemm_minmax_ukernel_2x4c8__wasmsimd_ld64()
85 vacc0x0 = wasm_i32x4_add(vacc0x0, wasm_i32x4_widen_high_i16x8(vprod0x0)); in xnn_qs8_igemm_minmax_ukernel_2x4c8__wasmsimd_ld64()
D1x16c8-minmax-neon-mlal-padal.c96 int16x8_t vprod0x0 = vmull_s8(vb0x0, va0x0); in xnn_qs8_igemm_minmax_ukernel_1x16c8__neon_mlal_padal() local
97 vprod0x0 = vmlal_s8(vprod0x0, vb0x1, va0x1); in xnn_qs8_igemm_minmax_ukernel_1x16c8__neon_mlal_padal()
98 vacc0x0 = vpadalq_s16(vacc0x0, vprod0x0); in xnn_qs8_igemm_minmax_ukernel_1x16c8__neon_mlal_padal()
168 const int16x8_t vprod0x0 = vmull_s8(vb0, va0); in xnn_qs8_igemm_minmax_ukernel_1x16c8__neon_mlal_padal() local
169 vacc0x0 = vpadalq_s16(vacc0x0, vprod0x0); in xnn_qs8_igemm_minmax_ukernel_1x16c8__neon_mlal_padal()
D2x8c16-minmax-neon-mlal-padal.c95 int16x8_t vprod0x0 = vmull_s8(vget_low_s8(vb0), vget_low_s8(va0)); in xnn_qs8_igemm_minmax_ukernel_2x8c16__neon_mlal_padal() local
97 vprod0x0 = vmlal_s8(vprod0x0, vget_high_s8(vb0), vget_high_s8(va0)); in xnn_qs8_igemm_minmax_ukernel_2x8c16__neon_mlal_padal()
99 vacc0x0 = vpadalq_s16(vacc0x0, vprod0x0); in xnn_qs8_igemm_minmax_ukernel_2x8c16__neon_mlal_padal()
D3x4c8-minmax-wasmsimd-ld128.c99 const v128_t vprod0x0 = wasm_i16x8_mul(vxb0, vxa0); in xnn_qs8_igemm_minmax_ukernel_3x4c8__wasmsimd_ld128() local
100 vacc0x0 = wasm_i32x4_add(vacc0x0, wasm_i32x4_widen_low_i16x8(vprod0x0)); in xnn_qs8_igemm_minmax_ukernel_3x4c8__wasmsimd_ld128()
108 vacc0x0 = wasm_i32x4_add(vacc0x0, wasm_i32x4_widen_high_i16x8(vprod0x0)); in xnn_qs8_igemm_minmax_ukernel_3x4c8__wasmsimd_ld128()
D3x4c8-minmax-wasmsimd-ld64.c97 const v128_t vprod0x0 = wasm_i16x8_mul(vxa0, vxb0); in xnn_qs8_igemm_minmax_ukernel_3x4c8__wasmsimd_ld64() local
98 vacc0x0 = wasm_i32x4_add(vacc0x0, wasm_i32x4_widen_low_i16x8(vprod0x0)); in xnn_qs8_igemm_minmax_ukernel_3x4c8__wasmsimd_ld64()
99 vacc0x0 = wasm_i32x4_add(vacc0x0, wasm_i32x4_widen_high_i16x8(vprod0x0)); in xnn_qs8_igemm_minmax_ukernel_3x4c8__wasmsimd_ld64()

123