Home
last modified time | relevance | path

Searched refs:vb0123c2x1 (Results 1 – 25 of 160) sorted by relevance

1234567

/external/XNNPACK/src/qs8-igemm/gen/
D4x8c2s4-minmax-rndnu-neon-mlal.c180 const int8x8_t vb0123c2x1 = vld1_s8(w); w = (const int8_t*) w + 8; in xnn_qs8_igemm_minmax_rndnu_ukernel_4x8c2s4__neon_mlal() local
181 vprod0x0123c2 = vmlal_s8(vprod0x0123c2, vb0123c2x1, va0x1); in xnn_qs8_igemm_minmax_rndnu_ukernel_4x8c2s4__neon_mlal()
182 vprod1x0123c2 = vmlal_s8(vprod1x0123c2, vb0123c2x1, va1x1); in xnn_qs8_igemm_minmax_rndnu_ukernel_4x8c2s4__neon_mlal()
183 vprod2x0123c2 = vmlal_s8(vprod2x0123c2, vb0123c2x1, va2x1); in xnn_qs8_igemm_minmax_rndnu_ukernel_4x8c2s4__neon_mlal()
184 vprod3x0123c2 = vmlal_s8(vprod3x0123c2, vb0123c2x1, va3x1); in xnn_qs8_igemm_minmax_rndnu_ukernel_4x8c2s4__neon_mlal()
D3x8c2s4-minmax-rndnu-neon-mlal.c151 const int8x8_t vb0123c2x1 = vld1_s8(w); w = (const int8_t*) w + 8; in xnn_qs8_igemm_minmax_rndnu_ukernel_3x8c2s4__neon_mlal() local
152 vprod0x0123c2 = vmlal_s8(vprod0x0123c2, vb0123c2x1, va0x1); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x8c2s4__neon_mlal()
153 vprod1x0123c2 = vmlal_s8(vprod1x0123c2, vb0123c2x1, va1x1); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x8c2s4__neon_mlal()
154 vprod2x0123c2 = vmlal_s8(vprod2x0123c2, vb0123c2x1, va2x1); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x8c2s4__neon_mlal()
D2x8c2s4-minmax-fp32-neonv8-mlal.c123 const int8x8_t vb0123c2x1 = vld1_s8(w); w = (const int8_t*) w + 8; in xnn_qs8_igemm_minmax_fp32_ukernel_2x8c2s4__neonv8_mlal() local
124 vprod0x0123c2 = vmlal_s8(vprod0x0123c2, vb0123c2x1, va0x1); in xnn_qs8_igemm_minmax_fp32_ukernel_2x8c2s4__neonv8_mlal()
125 vprod1x0123c2 = vmlal_s8(vprod1x0123c2, vb0123c2x1, va1x1); in xnn_qs8_igemm_minmax_fp32_ukernel_2x8c2s4__neonv8_mlal()
D2x8c2s4-minmax-rndnu-neon-mlal.c122 const int8x8_t vb0123c2x1 = vld1_s8(w); w = (const int8_t*) w + 8; in xnn_qs8_igemm_minmax_rndnu_ukernel_2x8c2s4__neon_mlal() local
123 vprod0x0123c2 = vmlal_s8(vprod0x0123c2, vb0123c2x1, va0x1); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x8c2s4__neon_mlal()
124 vprod1x0123c2 = vmlal_s8(vprod1x0123c2, vb0123c2x1, va1x1); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x8c2s4__neon_mlal()
D2x8c2s4-minmax-fp32-neon-mlal.c122 const int8x8_t vb0123c2x1 = vld1_s8(w); w = (const int8_t*) w + 8; in xnn_qs8_igemm_minmax_fp32_ukernel_2x8c2s4__neon_mlal() local
123 vprod0x0123c2 = vmlal_s8(vprod0x0123c2, vb0123c2x1, va0x1); in xnn_qs8_igemm_minmax_fp32_ukernel_2x8c2s4__neon_mlal()
124 vprod1x0123c2 = vmlal_s8(vprod1x0123c2, vb0123c2x1, va1x1); in xnn_qs8_igemm_minmax_fp32_ukernel_2x8c2s4__neon_mlal()
D1x8c2s4-minmax-fp32-neonv8-mlal.c94 const int8x8_t vb0123c2x1 = vld1_s8(w); w = (const int8_t*) w + 8; in xnn_qs8_igemm_minmax_fp32_ukernel_1x8c2s4__neonv8_mlal() local
95 vprod0x0123c2 = vmlal_s8(vprod0x0123c2, vb0123c2x1, va0x1); in xnn_qs8_igemm_minmax_fp32_ukernel_1x8c2s4__neonv8_mlal()
D1x8c2s4-minmax-rndnu-neon-mlal.c93 const int8x8_t vb0123c2x1 = vld1_s8(w); w = (const int8_t*) w + 8; in xnn_qs8_igemm_minmax_rndnu_ukernel_1x8c2s4__neon_mlal() local
94 vprod0x0123c2 = vmlal_s8(vprod0x0123c2, vb0123c2x1, va0x1); in xnn_qs8_igemm_minmax_rndnu_ukernel_1x8c2s4__neon_mlal()
D1x8c2s4-minmax-fp32-neon-mlal.c93 const int8x8_t vb0123c2x1 = vld1_s8(w); w = (const int8_t*) w + 8; in xnn_qs8_igemm_minmax_fp32_ukernel_1x8c2s4__neon_mlal() local
94 vprod0x0123c2 = vmlal_s8(vprod0x0123c2, vb0123c2x1, va0x1); in xnn_qs8_igemm_minmax_fp32_ukernel_1x8c2s4__neon_mlal()
/external/XNNPACK/src/qs8-gemm/gen/
D4x8c2s4-minmax-rndnu-neon-mlal.c163 const int8x8_t vb0123c2x1 = vld1_s8(w); w = (const int8_t*) w + 8; in xnn_qs8_gemm_minmax_rndnu_ukernel_4x8c2s4__neon_mlal() local
164 vprod0x0123c2 = vmlal_s8(vprod0x0123c2, vb0123c2x1, va0x1); in xnn_qs8_gemm_minmax_rndnu_ukernel_4x8c2s4__neon_mlal()
165 vprod1x0123c2 = vmlal_s8(vprod1x0123c2, vb0123c2x1, va1x1); in xnn_qs8_gemm_minmax_rndnu_ukernel_4x8c2s4__neon_mlal()
166 vprod2x0123c2 = vmlal_s8(vprod2x0123c2, vb0123c2x1, va2x1); in xnn_qs8_gemm_minmax_rndnu_ukernel_4x8c2s4__neon_mlal()
167 vprod3x0123c2 = vmlal_s8(vprod3x0123c2, vb0123c2x1, va3x1); in xnn_qs8_gemm_minmax_rndnu_ukernel_4x8c2s4__neon_mlal()
D3x8c2s4-minmax-rndnu-neon-mlal.c136 const int8x8_t vb0123c2x1 = vld1_s8(w); w = (const int8_t*) w + 8; in xnn_qs8_gemm_minmax_rndnu_ukernel_3x8c2s4__neon_mlal() local
137 vprod0x0123c2 = vmlal_s8(vprod0x0123c2, vb0123c2x1, va0x1); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x8c2s4__neon_mlal()
138 vprod1x0123c2 = vmlal_s8(vprod1x0123c2, vb0123c2x1, va1x1); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x8c2s4__neon_mlal()
139 vprod2x0123c2 = vmlal_s8(vprod2x0123c2, vb0123c2x1, va2x1); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x8c2s4__neon_mlal()
D2x8c2s4-minmax-rndnu-neon-mlal.c109 const int8x8_t vb0123c2x1 = vld1_s8(w); w = (const int8_t*) w + 8; in xnn_qs8_gemm_minmax_rndnu_ukernel_2x8c2s4__neon_mlal() local
110 vprod0x0123c2 = vmlal_s8(vprod0x0123c2, vb0123c2x1, va0x1); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x8c2s4__neon_mlal()
111 vprod1x0123c2 = vmlal_s8(vprod1x0123c2, vb0123c2x1, va1x1); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x8c2s4__neon_mlal()
D2x8c2s4-minmax-fp32-neonv8-mlal.c110 const int8x8_t vb0123c2x1 = vld1_s8(w); w = (const int8_t*) w + 8; in xnn_qs8_gemm_minmax_fp32_ukernel_2x8c2s4__neonv8_mlal() local
111 vprod0x0123c2 = vmlal_s8(vprod0x0123c2, vb0123c2x1, va0x1); in xnn_qs8_gemm_minmax_fp32_ukernel_2x8c2s4__neonv8_mlal()
112 vprod1x0123c2 = vmlal_s8(vprod1x0123c2, vb0123c2x1, va1x1); in xnn_qs8_gemm_minmax_fp32_ukernel_2x8c2s4__neonv8_mlal()
D2x8c2s4-minmax-fp32-neon-mlal.c109 const int8x8_t vb0123c2x1 = vld1_s8(w); w = (const int8_t*) w + 8; in xnn_qs8_gemm_minmax_fp32_ukernel_2x8c2s4__neon_mlal() local
110 vprod0x0123c2 = vmlal_s8(vprod0x0123c2, vb0123c2x1, va0x1); in xnn_qs8_gemm_minmax_fp32_ukernel_2x8c2s4__neon_mlal()
111 vprod1x0123c2 = vmlal_s8(vprod1x0123c2, vb0123c2x1, va1x1); in xnn_qs8_gemm_minmax_fp32_ukernel_2x8c2s4__neon_mlal()
D1x8c2s4-minmax-fp32-neon-mlal.c82 const int8x8_t vb0123c2x1 = vld1_s8(w); w = (const int8_t*) w + 8; in xnn_qs8_gemm_minmax_fp32_ukernel_1x8c2s4__neon_mlal() local
83 vprod0x0123c2 = vmlal_s8(vprod0x0123c2, vb0123c2x1, va0x1); in xnn_qs8_gemm_minmax_fp32_ukernel_1x8c2s4__neon_mlal()
D1x8c2s4-minmax-fp32-neonv8-mlal.c83 const int8x8_t vb0123c2x1 = vld1_s8(w); w = (const int8_t*) w + 8; in xnn_qs8_gemm_minmax_fp32_ukernel_1x8c2s4__neonv8_mlal() local
84 vprod0x0123c2 = vmlal_s8(vprod0x0123c2, vb0123c2x1, va0x1); in xnn_qs8_gemm_minmax_fp32_ukernel_1x8c2s4__neonv8_mlal()
D1x8c2s4-minmax-rndnu-neon-mlal.c82 const int8x8_t vb0123c2x1 = vld1_s8(w); w = (const int8_t*) w + 8; in xnn_qs8_gemm_minmax_rndnu_ukernel_1x8c2s4__neon_mlal() local
83 vprod0x0123c2 = vmlal_s8(vprod0x0123c2, vb0123c2x1, va0x1); in xnn_qs8_gemm_minmax_rndnu_ukernel_1x8c2s4__neon_mlal()
D4x8c2-minmax-rndnu-neon-mlal-ld4r.c173 … const int8x8_t vb0123c2x1 = vld1_s8(w); w = (const void*) ((uintptr_t) w + 8 * sizeof(int8_t)); in xnn_qs8_gemm_minmax_rndnu_ukernel_4x8c2__neon_mlal_ld4r() local
174 vprod0x0123c2 = vmlal_s8(vprod0x0123c2, vb0123c2x1, va0c2x1); in xnn_qs8_gemm_minmax_rndnu_ukernel_4x8c2__neon_mlal_ld4r()
175 vprod1x0123c2 = vmlal_s8(vprod1x0123c2, vb0123c2x1, va1c2x1); in xnn_qs8_gemm_minmax_rndnu_ukernel_4x8c2__neon_mlal_ld4r()
176 vprod2x0123c2 = vmlal_s8(vprod2x0123c2, vb0123c2x1, va2c2x1); in xnn_qs8_gemm_minmax_rndnu_ukernel_4x8c2__neon_mlal_ld4r()
177 vprod3x0123c2 = vmlal_s8(vprod3x0123c2, vb0123c2x1, va3c2x1); in xnn_qs8_gemm_minmax_rndnu_ukernel_4x8c2__neon_mlal_ld4r()
/external/XNNPACK/src/qc8-gemm/gen/
D2x8c2s4-minmax-fp32-neon-mlal.c109 const int8x8_t vb0123c2x1 = vld1_s8(w); w = (const int8_t*) w + 8; in xnn_qc8_gemm_minmax_fp32_ukernel_2x8c2s4__neon_mlal() local
110 vprod0x0123c2 = vmlal_s8(vprod0x0123c2, vb0123c2x1, va0x1); in xnn_qc8_gemm_minmax_fp32_ukernel_2x8c2s4__neon_mlal()
111 vprod1x0123c2 = vmlal_s8(vprod1x0123c2, vb0123c2x1, va1x1); in xnn_qc8_gemm_minmax_fp32_ukernel_2x8c2s4__neon_mlal()
D2x8c2s4-minmax-fp32-neonv8-mlal.c110 const int8x8_t vb0123c2x1 = vld1_s8(w); w = (const int8_t*) w + 8; in xnn_qc8_gemm_minmax_fp32_ukernel_2x8c2s4__neonv8_mlal() local
111 vprod0x0123c2 = vmlal_s8(vprod0x0123c2, vb0123c2x1, va0x1); in xnn_qc8_gemm_minmax_fp32_ukernel_2x8c2s4__neonv8_mlal()
112 vprod1x0123c2 = vmlal_s8(vprod1x0123c2, vb0123c2x1, va1x1); in xnn_qc8_gemm_minmax_fp32_ukernel_2x8c2s4__neonv8_mlal()
D1x8c2s4-minmax-fp32-neonv8-mlal.c83 const int8x8_t vb0123c2x1 = vld1_s8(w); w = (const int8_t*) w + 8; in xnn_qc8_gemm_minmax_fp32_ukernel_1x8c2s4__neonv8_mlal() local
84 vprod0x0123c2 = vmlal_s8(vprod0x0123c2, vb0123c2x1, va0x1); in xnn_qc8_gemm_minmax_fp32_ukernel_1x8c2s4__neonv8_mlal()
D1x8c2s4-minmax-fp32-neon-mlal.c82 const int8x8_t vb0123c2x1 = vld1_s8(w); w = (const int8_t*) w + 8; in xnn_qc8_gemm_minmax_fp32_ukernel_1x8c2s4__neon_mlal() local
83 vprod0x0123c2 = vmlal_s8(vprod0x0123c2, vb0123c2x1, va0x1); in xnn_qc8_gemm_minmax_fp32_ukernel_1x8c2s4__neon_mlal()
/external/XNNPACK/src/qc8-igemm/gen/
D2x8c2s4-minmax-fp32-neon-mlal.c122 const int8x8_t vb0123c2x1 = vld1_s8(w); w = (const int8_t*) w + 8; in xnn_qc8_igemm_minmax_fp32_ukernel_2x8c2s4__neon_mlal() local
123 vprod0x0123c2 = vmlal_s8(vprod0x0123c2, vb0123c2x1, va0x1); in xnn_qc8_igemm_minmax_fp32_ukernel_2x8c2s4__neon_mlal()
124 vprod1x0123c2 = vmlal_s8(vprod1x0123c2, vb0123c2x1, va1x1); in xnn_qc8_igemm_minmax_fp32_ukernel_2x8c2s4__neon_mlal()
D2x8c2s4-minmax-fp32-neonv8-mlal.c123 const int8x8_t vb0123c2x1 = vld1_s8(w); w = (const int8_t*) w + 8; in xnn_qc8_igemm_minmax_fp32_ukernel_2x8c2s4__neonv8_mlal() local
124 vprod0x0123c2 = vmlal_s8(vprod0x0123c2, vb0123c2x1, va0x1); in xnn_qc8_igemm_minmax_fp32_ukernel_2x8c2s4__neonv8_mlal()
125 vprod1x0123c2 = vmlal_s8(vprod1x0123c2, vb0123c2x1, va1x1); in xnn_qc8_igemm_minmax_fp32_ukernel_2x8c2s4__neonv8_mlal()
D1x8c2s4-minmax-fp32-neonv8-mlal.c94 const int8x8_t vb0123c2x1 = vld1_s8(w); w = (const int8_t*) w + 8; in xnn_qc8_igemm_minmax_fp32_ukernel_1x8c2s4__neonv8_mlal() local
95 vprod0x0123c2 = vmlal_s8(vprod0x0123c2, vb0123c2x1, va0x1); in xnn_qc8_igemm_minmax_fp32_ukernel_1x8c2s4__neonv8_mlal()
D1x8c2s4-minmax-fp32-neon-mlal.c93 const int8x8_t vb0123c2x1 = vld1_s8(w); w = (const int8_t*) w + 8; in xnn_qc8_igemm_minmax_fp32_ukernel_1x8c2s4__neon_mlal() local
94 vprod0x0123c2 = vmlal_s8(vprod0x0123c2, vb0123c2x1, va0x1); in xnn_qc8_igemm_minmax_fp32_ukernel_1x8c2s4__neon_mlal()

1234567