/external/XNNPACK/src/f32-vbinary/gen/ |
D | vmax-wasmsimd-x86-x8.c | 42 const v128_t vm4567 = wasm_f32x4_le(va4567, vb4567); in xnn_f32_vmax_ukernel__wasmsimd_x86_x8() local 45 v128_t vy4567 = wasm_v128_bitselect(vb4567, va4567, vm4567); in xnn_f32_vmax_ukernel__wasmsimd_x86_x8()
|
D | vmin-wasmsimd-x86-x8.c | 42 const v128_t vm4567 = wasm_f32x4_lt(va4567, vb4567); in xnn_f32_vmin_ukernel__wasmsimd_x86_x8() local 45 v128_t vy4567 = wasm_v128_bitselect(va4567, vb4567, vm4567); in xnn_f32_vmin_ukernel__wasmsimd_x86_x8()
|
D | vmax-wasmsimd-x86-x16.c | 46 const v128_t vm4567 = wasm_f32x4_le(va4567, vb4567); in xnn_f32_vmax_ukernel__wasmsimd_x86_x16() local 51 v128_t vy4567 = wasm_v128_bitselect(vb4567, va4567, vm4567); in xnn_f32_vmax_ukernel__wasmsimd_x86_x16()
|
D | vmin-wasmsimd-x86-x16.c | 46 const v128_t vm4567 = wasm_f32x4_lt(va4567, vb4567); in xnn_f32_vmin_ukernel__wasmsimd_x86_x16() local 51 v128_t vy4567 = wasm_v128_bitselect(va4567, vb4567, vm4567); in xnn_f32_vmin_ukernel__wasmsimd_x86_x16()
|
/external/XNNPACK/src/f32-velu/gen/ |
D | velu-sse2-rr2-p6-x8.c | 95 …const __m128 vm4567 = _mm_castsi128_ps(_mm_cmpgt_epi32(_mm_setzero_si128(), _mm_castps_si128(vx456… in xnn_f32_velu_ukernel__sse2_rr2_p6_x8() local 99 const __m128 vy4567 = _mm_or_ps(_mm_and_ps(ve4567, vm4567), _mm_andnot_ps(vm4567, vx4567)); in xnn_f32_velu_ukernel__sse2_rr2_p6_x8()
|
D | velu-sse2-rr2-p6-x12.c | 111 …const __m128 vm4567 = _mm_castsi128_ps(_mm_cmpgt_epi32(_mm_setzero_si128(), _mm_castps_si128(vx456… in xnn_f32_velu_ukernel__sse2_rr2_p6_x12() local 117 const __m128 vy4567 = _mm_or_ps(_mm_and_ps(ve4567, vm4567), _mm_andnot_ps(vm4567, vx4567)); in xnn_f32_velu_ukernel__sse2_rr2_p6_x12()
|
D | velu-sse2-rr2-p6-x16.c | 127 …const __m128 vm4567 = _mm_castsi128_ps(_mm_cmpgt_epi32(_mm_setzero_si128(), _mm_castps_si128(vx456… in xnn_f32_velu_ukernel__sse2_rr2_p6_x16() local 135 const __m128 vy4567 = _mm_or_ps(_mm_and_ps(ve4567, vm4567), _mm_andnot_ps(vm4567, vx4567)); in xnn_f32_velu_ukernel__sse2_rr2_p6_x16()
|
D | velu-neonfma-rr1-p6-x8.c | 89 const uint32x4_t vm4567 = vcltq_f32(vx4567, vmovq_n_f32(0.0f)); in xnn_f32_velu_ukernel__neonfma_rr1_p6_x8() local 93 const float32x4_t vy4567 = vbslq_f32(vm4567, ve4567, vx4567); in xnn_f32_velu_ukernel__neonfma_rr1_p6_x8()
|
D | velu-neon-rr2-p6-x8.c | 93 const uint32x4_t vm4567 = vcltq_f32(vx4567, vmovq_n_f32(0.0f)); in xnn_f32_velu_ukernel__neon_rr2_p6_x8() local 97 const float32x4_t vy4567 = vbslq_f32(vm4567, ve4567, vx4567); in xnn_f32_velu_ukernel__neon_rr2_p6_x8()
|
D | velu-sse2-rr2-p6-x20.c | 143 …const __m128 vm4567 = _mm_castsi128_ps(_mm_cmpgt_epi32(_mm_setzero_si128(), _mm_castps_si128(vx456… in xnn_f32_velu_ukernel__sse2_rr2_p6_x20() local 153 const __m128 vy4567 = _mm_or_ps(_mm_and_ps(ve4567, vm4567), _mm_andnot_ps(vm4567, vx4567)); in xnn_f32_velu_ukernel__sse2_rr2_p6_x20()
|
D | velu-sse2-rr2-lut16-p3-x8.c | 134 …const __m128 vm4567 = _mm_castsi128_ps(_mm_cmpgt_epi32(_mm_setzero_si128(), _mm_castps_si128(vx456… in xnn_f32_velu_ukernel__sse2_rr2_lut16_p3_x8() local 138 const __m128 vy4567 = _mm_or_ps(_mm_and_ps(ve4567, vm4567), _mm_andnot_ps(vm4567, vx4567)); in xnn_f32_velu_ukernel__sse2_rr2_lut16_p3_x8()
|
/external/XNNPACK/src/f32-vsigmoid/gen/ |
D | vsigmoid-sse2-rr2-p5-div-x8.c | 89 …const __m128 vm4567 = _mm_castsi128_ps(_mm_cmpgt_epi32(_mm_setzero_si128(), _mm_castps_si128(vx456… in xnn_f32_vsigmoid_ukernel__sse2_rr2_p5_div_x8() local 92 vf4567 = _mm_or_ps(_mm_and_ps(vf4567, vm4567), _mm_andnot_ps(vm4567, _mm_sub_ps(vone, vf4567))); in xnn_f32_vsigmoid_ukernel__sse2_rr2_p5_div_x8()
|
D | vsigmoid-sse2-rr2-p5-div-x12.c | 105 …const __m128 vm4567 = _mm_castsi128_ps(_mm_cmpgt_epi32(_mm_setzero_si128(), _mm_castps_si128(vx456… in xnn_f32_vsigmoid_ukernel__sse2_rr2_p5_div_x12() local 109 vf4567 = _mm_or_ps(_mm_and_ps(vf4567, vm4567), _mm_andnot_ps(vm4567, _mm_sub_ps(vone, vf4567))); in xnn_f32_vsigmoid_ukernel__sse2_rr2_p5_div_x12()
|
D | vsigmoid-sse2-rr2-p5-div-x16.c | 121 …const __m128 vm4567 = _mm_castsi128_ps(_mm_cmpgt_epi32(_mm_setzero_si128(), _mm_castps_si128(vx456… in xnn_f32_vsigmoid_ukernel__sse2_rr2_p5_div_x16() local 126 vf4567 = _mm_or_ps(_mm_and_ps(vf4567, vm4567), _mm_andnot_ps(vm4567, _mm_sub_ps(vone, vf4567))); in xnn_f32_vsigmoid_ukernel__sse2_rr2_p5_div_x16()
|
D | vsigmoid-neonfma-rr1-p5-div-x8.c | 84 const uint32x4_t vm4567 = vcltq_f32(vx4567, vmovq_n_f32(0.0f)); in xnn_f32_vsigmoid_ukernel__neonfma_rr1_p5_div_x8() local 87 vf4567 = vbslq_f32(vm4567, vf4567, vsubq_f32(vone, vf4567)); in xnn_f32_vsigmoid_ukernel__neonfma_rr1_p5_div_x8()
|
D | vsigmoid-sse2-rr2-p5-div-x20.c | 137 …const __m128 vm4567 = _mm_castsi128_ps(_mm_cmpgt_epi32(_mm_setzero_si128(), _mm_castps_si128(vx456… in xnn_f32_vsigmoid_ukernel__sse2_rr2_p5_div_x20() local 143 vf4567 = _mm_or_ps(_mm_and_ps(vf4567, vm4567), _mm_andnot_ps(vm4567, _mm_sub_ps(vone, vf4567))); in xnn_f32_vsigmoid_ukernel__sse2_rr2_p5_div_x20()
|
D | vsigmoid-neonfma-rr1-p5-nr2recps-x8.c | 93 const uint32x4_t vm4567 = vcltq_f32(vx4567, vmovq_n_f32(0.0f)); in xnn_f32_vsigmoid_ukernel__neonfma_rr1_p5_nr2recps_x8() local 96 vf4567 = vbslq_f32(vm4567, vf4567, vsubq_f32(vone, vf4567)); in xnn_f32_vsigmoid_ukernel__neonfma_rr1_p5_nr2recps_x8()
|
D | vsigmoid-sse2-rr2-lut64-p2-div-x8.c | 127 …const __m128 vm4567 = _mm_castsi128_ps(_mm_cmpgt_epi32(_mm_setzero_si128(), _mm_castps_si128(vx456… in xnn_f32_vsigmoid_ukernel__sse2_rr2_lut64_p2_div_x8() local 130 vf4567 = _mm_or_ps(_mm_and_ps(vf4567, vm4567), _mm_andnot_ps(vm4567, _mm_sub_ps(vone, vf4567))); in xnn_f32_vsigmoid_ukernel__sse2_rr2_lut64_p2_div_x8()
|
D | vsigmoid-neonfma-rr1-lut64-p2-div-x8.c | 97 const uint32x4_t vm4567 = vcltq_f32(vx4567, vmovq_n_f32(0.0f)); in xnn_f32_vsigmoid_ukernel__neonfma_rr1_lut64_p2_div_x8() local 100 vf4567 = vbslq_f32(vm4567, vf4567, vsubq_f32(vone, vf4567)); in xnn_f32_vsigmoid_ukernel__neonfma_rr1_lut64_p2_div_x8()
|
D | vsigmoid-neonfma-rr1-lut2048-p1-div-x8.c | 93 const uint32x4_t vm4567 = vcltq_f32(vx4567, vmovq_n_f32(0.0f)); in xnn_f32_vsigmoid_ukernel__neonfma_rr1_lut2048_p1_div_x8() local 96 vf4567 = vbslq_f32(vm4567, vf4567, vsubq_f32(vone, vf4567)); in xnn_f32_vsigmoid_ukernel__neonfma_rr1_lut2048_p1_div_x8()
|
D | vsigmoid-neon-rr2-p5-nr2recps-x8.c | 97 const uint32x4_t vm4567 = vcltq_f32(vx4567, vmovq_n_f32(0.0f)); in xnn_f32_vsigmoid_ukernel__neon_rr2_p5_nr2recps_x8() local 100 vf4567 = vbslq_f32(vm4567, vf4567, vsubq_f32(vone, vf4567)); in xnn_f32_vsigmoid_ukernel__neon_rr2_p5_nr2recps_x8()
|
D | vsigmoid-neonfma-rr1-p5-nr1recps1fma-x8.c | 93 const uint32x4_t vm4567 = vcltq_f32(vx4567, vmovq_n_f32(0.0f)); in xnn_f32_vsigmoid_ukernel__neonfma_rr1_p5_nr1recps1fma_x8() local 96 vf4567 = vbslq_f32(vm4567, vf4567, vsubq_f32(vone, vf4567)); in xnn_f32_vsigmoid_ukernel__neonfma_rr1_p5_nr1recps1fma_x8()
|
D | vsigmoid-neonfma-rr1-p5-div-x12.c | 99 const uint32x4_t vm4567 = vcltq_f32(vx4567, vmovq_n_f32(0.0f)); in xnn_f32_vsigmoid_ukernel__neonfma_rr1_p5_div_x12() local 103 vf4567 = vbslq_f32(vm4567, vf4567, vsubq_f32(vone, vf4567)); in xnn_f32_vsigmoid_ukernel__neonfma_rr1_p5_div_x12()
|
D | vsigmoid-neonfma-rr1-p5-nr2fma-x8.c | 93 const uint32x4_t vm4567 = vcltq_f32(vx4567, vmovq_n_f32(0.0f)); in xnn_f32_vsigmoid_ukernel__neonfma_rr1_p5_nr2fma_x8() local 96 vf4567 = vbslq_f32(vm4567, vf4567, vsubq_f32(vone, vf4567)); in xnn_f32_vsigmoid_ukernel__neonfma_rr1_p5_nr2fma_x8()
|
D | vsigmoid-sse2-rr2-p5-div-x24.c | 153 …const __m128 vm4567 = _mm_castsi128_ps(_mm_cmpgt_epi32(_mm_setzero_si128(), _mm_castps_si128(vx456… in xnn_f32_vsigmoid_ukernel__sse2_rr2_p5_div_x24() local 160 vf4567 = _mm_or_ps(_mm_and_ps(vf4567, vm4567), _mm_andnot_ps(vm4567, _mm_sub_ps(vone, vf4567))); in xnn_f32_vsigmoid_ukernel__sse2_rr2_p5_div_x24()
|