/external/XNNPACK/src/f32-spmm/gen/ |
D | 32x1-minmax-wasmsimd-x86.c | 80 v128_t voutSTUV = wasm_v128_bitselect(vaccSTUV, vmax, wasm_f32x4_le(vaccSTUV, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86() local 88 voutSTUV = wasm_v128_bitselect(vmin, voutSTUV, wasm_f32x4_lt(voutSTUV, vmin)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86() 96 wasm_v128_store(output + 28, voutSTUV); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86()
|
D | 32x1-minmax-wasmsimd-x86-pipelined.c | 94 v128_t voutSTUV = wasm_v128_bitselect(vaccSTUV, vmax, wasm_f32x4_le(vaccSTUV, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_pipelined() local 102 voutSTUV = wasm_v128_bitselect(vmin, voutSTUV, wasm_f32x4_lt(voutSTUV, vmin)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_pipelined() 110 wasm_v128_store(output + 28, voutSTUV); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_pipelined()
|
D | 32x1-minmax-neon.c | 83 float32x4_t voutSTUV = vminq_f32(vaccSTUV, vmax); in xnn_f32_spmm_minmax_ukernel_32x1__neon() local 91 voutSTUV = vmaxq_f32(voutSTUV, vmin); in xnn_f32_spmm_minmax_ukernel_32x1__neon() 99 vst1q_f32(output + 28, voutSTUV); in xnn_f32_spmm_minmax_ukernel_32x1__neon()
|
D | 32x1-minmax-neonfma.c | 83 float32x4_t voutSTUV = vminq_f32(vaccSTUV, vmax); in xnn_f32_spmm_minmax_ukernel_32x1__neonfma() local 91 voutSTUV = vmaxq_f32(voutSTUV, vmin); in xnn_f32_spmm_minmax_ukernel_32x1__neonfma() 99 vst1q_f32(output + 28, voutSTUV); in xnn_f32_spmm_minmax_ukernel_32x1__neonfma()
|
D | 32x1-minmax-wasmsimd-arm-pipelined.c | 94 v128_t voutSTUV = wasm_f32x4_min(vaccSTUV, vmax); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_arm_pipelined() local 102 voutSTUV = wasm_f32x4_max(voutSTUV, vmin); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_arm_pipelined() 110 wasm_v128_store(output + 28, voutSTUV); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_arm_pipelined()
|
D | 32x1-minmax-wasmsimd-arm.c | 80 v128_t voutSTUV = wasm_f32x4_min(vaccSTUV, vmax); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_arm() local 88 voutSTUV = wasm_f32x4_max(voutSTUV, vmin); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_arm() 96 wasm_v128_store(output + 28, voutSTUV); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_arm()
|
D | 32x1-minmax-neon-pipelined.c | 94 float32x4_t voutSTUV = vminq_f32(vaccSTUV, vmax); in xnn_f32_spmm_minmax_ukernel_32x1__neon_pipelined() local 102 voutSTUV = vmaxq_f32(voutSTUV, vmin); in xnn_f32_spmm_minmax_ukernel_32x1__neon_pipelined() 110 vst1q_f32(output + 28, voutSTUV); in xnn_f32_spmm_minmax_ukernel_32x1__neon_pipelined()
|
D | 32x1-minmax-neonfma-pipelined.c | 94 float32x4_t voutSTUV = vminq_f32(vaccSTUV, vmax); in xnn_f32_spmm_minmax_ukernel_32x1__neonfma_pipelined() local 102 voutSTUV = vmaxq_f32(voutSTUV, vmin); in xnn_f32_spmm_minmax_ukernel_32x1__neonfma_pipelined() 110 vst1q_f32(output + 28, voutSTUV); in xnn_f32_spmm_minmax_ukernel_32x1__neonfma_pipelined()
|
D | 32x1-minmax-sse.c | 80 __m128 voutSTUV = _mm_min_ps(vaccSTUV, vmax); in xnn_f32_spmm_minmax_ukernel_32x1__sse() local 88 voutSTUV = _mm_max_ps(voutSTUV, vmin); in xnn_f32_spmm_minmax_ukernel_32x1__sse() 96 _mm_storeu_ps(output + 28, voutSTUV); in xnn_f32_spmm_minmax_ukernel_32x1__sse()
|
D | 32x1-minmax-wasmsimd-x86-pipelined-x2.c | 134 v128_t voutSTUV = wasm_v128_bitselect(vaccSTUV, vmax, wasm_f32x4_le(vaccSTUV, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_pipelined_x2() local 142 voutSTUV = wasm_v128_bitselect(vmin, voutSTUV, wasm_f32x4_lt(voutSTUV, vmin)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_pipelined_x2() 150 wasm_v128_store(output + 28, voutSTUV); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_pipelined_x2()
|
D | 32x1-minmax-wasmsimd-x86-x2.c | 149 v128_t voutSTUV = wasm_v128_bitselect(vaccSTUV, vmax, wasm_f32x4_le(vaccSTUV, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_x2() local 157 voutSTUV = wasm_v128_bitselect(vmin, voutSTUV, wasm_f32x4_lt(voutSTUV, vmin)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_x2() 165 wasm_v128_store(output + 28, voutSTUV); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_x2()
|
D | 32x1-minmax-wasmsimd-arm-pipelined-x2.c | 134 v128_t voutSTUV = wasm_f32x4_min(vaccSTUV, vmax); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_arm_pipelined_x2() local 142 voutSTUV = wasm_f32x4_max(voutSTUV, vmin); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_arm_pipelined_x2() 150 wasm_v128_store(output + 28, voutSTUV); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_arm_pipelined_x2()
|
D | 32x1-minmax-neon-x2.c | 154 float32x4_t voutSTUV = vminq_f32(vaccSTUV, vmax); in xnn_f32_spmm_minmax_ukernel_32x1__neon_x2() local 162 voutSTUV = vmaxq_f32(voutSTUV, vmin); in xnn_f32_spmm_minmax_ukernel_32x1__neon_x2() 170 vst1q_f32(output + 28, voutSTUV); in xnn_f32_spmm_minmax_ukernel_32x1__neon_x2()
|
D | 32x1-minmax-neonfma-x2.c | 154 float32x4_t voutSTUV = vminq_f32(vaccSTUV, vmax); in xnn_f32_spmm_minmax_ukernel_32x1__neonfma_x2() local 162 voutSTUV = vmaxq_f32(voutSTUV, vmin); in xnn_f32_spmm_minmax_ukernel_32x1__neonfma_x2() 170 vst1q_f32(output + 28, voutSTUV); in xnn_f32_spmm_minmax_ukernel_32x1__neonfma_x2()
|
D | 32x1-minmax-wasmsimd-arm-x2.c | 149 v128_t voutSTUV = wasm_f32x4_min(vaccSTUV, vmax); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_arm_x2() local 157 voutSTUV = wasm_f32x4_max(voutSTUV, vmin); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_arm_x2() 165 wasm_v128_store(output + 28, voutSTUV); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_arm_x2()
|
D | 32x1-minmax-wasmsimd-x86-x4.c | 221 v128_t voutSTUV = wasm_v128_bitselect(vaccSTUV, vmax, wasm_f32x4_le(vaccSTUV, vmax)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_x4() local 229 voutSTUV = wasm_v128_bitselect(vmin, voutSTUV, wasm_f32x4_lt(voutSTUV, vmin)); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_x4() 237 wasm_v128_store(output + 28, voutSTUV); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_x86_x4()
|
D | 32x1-minmax-wasmsimd-arm-x4.c | 221 v128_t voutSTUV = wasm_f32x4_min(vaccSTUV, vmax); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_arm_x4() local 229 voutSTUV = wasm_f32x4_max(voutSTUV, vmin); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_arm_x4() 237 wasm_v128_store(output + 28, voutSTUV); in xnn_f32_spmm_minmax_ukernel_32x1__wasmsimd_arm_x4()
|
D | 32x2-minmax-neonfma.c | 192 float32x4_t voutSTUV = vminq_f32(vaccSTUV, vmax); in xnn_f32_spmm_minmax_ukernel_32x2__neonfma() local 201 voutSTUV = vmaxq_f32(voutSTUV, vmin); in xnn_f32_spmm_minmax_ukernel_32x2__neonfma() 210 vst1q_f32(output + 28, voutSTUV); in xnn_f32_spmm_minmax_ukernel_32x2__neonfma()
|
D | 32x4-minmax-neonfma.c | 274 float32x4_t voutSTUV = vminq_f32(vaccSTUV, vmax); in xnn_f32_spmm_minmax_ukernel_32x4__neonfma() local 283 voutSTUV = vmaxq_f32(voutSTUV, vmin); in xnn_f32_spmm_minmax_ukernel_32x4__neonfma() 292 vst1q_f32(output + 28, voutSTUV); in xnn_f32_spmm_minmax_ukernel_32x4__neonfma()
|