| /external/XNNPACK/src/qs8-gemm/gen/ |
| D | 2x8c2-minmax-rndnu-neon-mull-ld2r.c | 84 const int8x8_t va1c1 = vreinterpret_s8_s16(va10.val[1]); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x8c2__neon_mull_ld2r() local 147 const int8x8_t va1c1 = vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va1), 1)); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x8c2__neon_mull_ld2r() local
|
| D | 2x8c2-minmax-rndnu-neon-mull-ld4r.c | 82 const int8x8_t va1c1 = vreinterpret_s8_s16(va1.val[1]); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x8c2__neon_mull_ld4r() local 145 const int8x8_t va1c1 = vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va1), 1)); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x8c2__neon_mull_ld4r() local
|
| D | 2x8c2-minmax-rndnu-neon-mull-dup.c | 82 const int8x8_t va1c1 = vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va1), 1)); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x8c2__neon_mull_dup() local 145 const int8x8_t va1c1 = vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va1), 1)); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x8c2__neon_mull_dup() local
|
| D | 2x8c2-minmax-rndnu-neon-mull-ld1r.c | 88 const int8x8_t va1c1 = vreinterpret_s8_s16(va11); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x8c2__neon_mull_ld1r() local 151 const int8x8_t va1c1 = vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va1), 1)); in xnn_qs8_gemm_minmax_rndnu_ukernel_2x8c2__neon_mull_ld1r() local
|
| D | 3x8c2-minmax-rndnu-neon-mull-dup.c | 96 const int8x8_t va1c1 = vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va1), 1)); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x8c2__neon_mull_dup() local 180 const int8x8_t va1c1 = vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va1), 1)); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x8c2__neon_mull_dup() local
|
| D | 3x8c2-minmax-rndnu-neon-mull-ld2r.c | 99 const int8x8_t va1c1 = vreinterpret_s8_s16(va10.val[1]); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x8c2__neon_mull_ld2r() local 183 const int8x8_t va1c1 = vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va1), 1)); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x8c2__neon_mull_ld2r() local
|
| D | 3x8c2-minmax-rndnu-neon-mull-ld4r.c | 96 const int8x8_t va1c1 = vreinterpret_s8_s16(va1.val[1]); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x8c2__neon_mull_ld4r() local 180 const int8x8_t va1c1 = vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va1), 1)); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x8c2__neon_mull_ld4r() local
|
| D | 3x8c2-minmax-rndnu-neon-mull-ld1r.c | 105 const int8x8_t va1c1 = vreinterpret_s8_s16(va11); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x8c2__neon_mull_ld1r() local 189 const int8x8_t va1c1 = vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va1), 1)); in xnn_qs8_gemm_minmax_rndnu_ukernel_3x8c2__neon_mull_ld1r() local
|
| /external/XNNPACK/src/qs8-igemm/gen/ |
| D | 2x8c2-minmax-rndnu-neon-mull-dup.c | 95 const int8x8_t va1c1 = vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va1), 1)); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x8c2__neon_mull_dup() local 158 const int8x8_t va1c1 = vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va1), 1)); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x8c2__neon_mull_dup() local
|
| D | 2x8c2-minmax-rndnu-neon-mull-ld4r.c | 95 const int8x8_t va1c1 = vreinterpret_s8_s16(va1.val[1]); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x8c2__neon_mull_ld4r() local 158 const int8x8_t va1c1 = vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va1), 1)); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x8c2__neon_mull_ld4r() local
|
| D | 2x8c2-minmax-rndnu-neon-mull-ld1r.c | 101 const int8x8_t va1c1 = vreinterpret_s8_s16(va11); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x8c2__neon_mull_ld1r() local 164 const int8x8_t va1c1 = vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va1), 1)); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x8c2__neon_mull_ld1r() local
|
| D | 2x8c2-minmax-rndnu-neon-mull-ld2r.c | 97 const int8x8_t va1c1 = vreinterpret_s8_s16(va10.val[1]); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x8c2__neon_mull_ld2r() local 160 const int8x8_t va1c1 = vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va1), 1)); in xnn_qs8_igemm_minmax_rndnu_ukernel_2x8c2__neon_mull_ld2r() local
|
| D | 3x8c2-minmax-rndnu-neon-mull-dup.c | 111 const int8x8_t va1c1 = vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va1), 1)); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x8c2__neon_mull_dup() local 195 const int8x8_t va1c1 = vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va1), 1)); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x8c2__neon_mull_dup() local
|
| D | 3x8c2-minmax-rndnu-neon-mull-ld4r.c | 111 const int8x8_t va1c1 = vreinterpret_s8_s16(va1.val[1]); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x8c2__neon_mull_ld4r() local 195 const int8x8_t va1c1 = vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va1), 1)); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x8c2__neon_mull_ld4r() local
|
| D | 3x8c2-minmax-rndnu-neon-mull-ld2r.c | 114 const int8x8_t va1c1 = vreinterpret_s8_s16(va10.val[1]); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x8c2__neon_mull_ld2r() local 198 const int8x8_t va1c1 = vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va1), 1)); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x8c2__neon_mull_ld2r() local
|
| D | 3x8c2-minmax-rndnu-neon-mull-ld1r.c | 120 const int8x8_t va1c1 = vreinterpret_s8_s16(va11); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x8c2__neon_mull_ld1r() local 204 const int8x8_t va1c1 = vreinterpret_s8_s16(vdup_lane_s16(vreinterpret_s16_s8(va1), 1)); in xnn_qs8_igemm_minmax_rndnu_ukernel_3x8c2__neon_mull_ld1r() local
|
| /external/XNNPACK/src/f32-gemm/gen/ |
| D | 4x2-minmax-neonfma-lane-ld64.c | 99 const float32x2_t va1c1 = vdup_lane_f32(va1, 1); in xnn_f32_gemm_minmax_ukernel_4x2__neonfma_lane_ld64() local
|
| D | 3x8-wasmsimd-splat.c | 85 const v128_t va1c1 = wasm_v32x4_shuffle(va1, va1, 1, 1, 1, 1); in xnn_f32_gemm_ukernel_3x8__wasmsimd_splat() local
|
| D | 3x8-wasmrelaxedsimd-fma-splat.c | 85 const v128_t va1c1 = wasm_v32x4_shuffle(va1, va1, 1, 1, 1, 1); in xnn_f32_gemm_ukernel_3x8__wasmrelaxedsimd_fma_splat() local
|
| D | 3x8-relu-wasmrelaxedsimd-fma-splat.c | 85 const v128_t va1c1 = wasm_v32x4_shuffle(va1, va1, 1, 1, 1, 1); in xnn_f32_gemm_relu_ukernel_3x8__wasmrelaxedsimd_fma_splat() local
|
| D | 3x8-relu-wasmsimd-splat.c | 85 const v128_t va1c1 = wasm_v32x4_shuffle(va1, va1, 1, 1, 1, 1); in xnn_f32_gemm_relu_ukernel_3x8__wasmsimd_splat() local
|
| D | 3x8-minmax-wasmrelaxedsimd-fma-splat.c | 87 const v128_t va1c1 = wasm_v32x4_shuffle(va1, va1, 1, 1, 1, 1); in xnn_f32_gemm_minmax_ukernel_3x8__wasmrelaxedsimd_fma_splat() local
|
| /external/XNNPACK/src/f32-igemm/gen/ |
| D | 4x2-minmax-neonfma-lane-ld64.c | 121 const float32x2_t va1c1 = vdup_lane_f32(va1, 1); in xnn_f32_igemm_minmax_ukernel_4x2__neonfma_lane_ld64() local
|
| /external/XNNPACK/src/f32-gemm/gen-inc/ |
| D | 3x8inc-minmax-wasmsimd-arm-splat.c | 89 const v128_t va1c1 = wasm_v32x4_shuffle(va1, va1, 1, 1, 1, 1); in xnn_f32_gemminc_minmax_ukernel_3x8__wasmsimd_arm_splat() local
|
| D | 3x8inc-minmax-wasmrelaxedsimd-splat.c | 89 const v128_t va1c1 = wasm_v32x4_shuffle(va1, va1, 1, 1, 1, 1); in xnn_f32_gemminc_minmax_ukernel_3x8__wasmrelaxedsimd_splat() local
|