/external/XNNPACK/src/f32-velu/gen/ |
D | velu-sse41-rr2-lut16-p3-x8.c | 67 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_velu_ukernel__sse41_rr2_lut16_p3_x8() local 84 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_velu_ukernel__sse41_rr2_lut16_p3_x8() local
|
D | velu-sse2-rr2-lut16-p3-x8.c | 69 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_velu_ukernel__sse2_rr2_lut16_p3_x8() local 90 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_velu_ukernel__sse2_rr2_lut16_p3_x8() local
|
D | velu-sse41-rr2-lut16-p3-x12.c | 72 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_velu_ukernel__sse41_rr2_lut16_p3_x12() local 96 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_velu_ukernel__sse41_rr2_lut16_p3_x12() local
|
D | velu-sse2-rr2-lut16-p3-x12.c | 74 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_velu_ukernel__sse2_rr2_lut16_p3_x12() local 104 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_velu_ukernel__sse2_rr2_lut16_p3_x12() local
|
D | velu-sse41-rr2-lut16-p3-x16.c | 77 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_velu_ukernel__sse41_rr2_lut16_p3_x16() local 108 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_velu_ukernel__sse41_rr2_lut16_p3_x16() local
|
D | velu-sse41-rr2-lut16-p3-x20.c | 82 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_velu_ukernel__sse41_rr2_lut16_p3_x20() local 120 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_velu_ukernel__sse41_rr2_lut16_p3_x20() local
|
D | velu-sse2-rr2-lut16-p3-x16.c | 79 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_velu_ukernel__sse2_rr2_lut16_p3_x16() local 118 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_velu_ukernel__sse2_rr2_lut16_p3_x16() local
|
D | velu-neon-rr2-lut16-p3-x8.c | 65 const int32x4_t vl0123 = vcombine_s32(vl01, vl23); in xnn_f32_velu_ukernel__neon_rr2_lut16_p3_x8() local
|
D | velu-neonfma-rr1-lut16-p3-x8.c | 64 const int32x4_t vl0123 = vcombine_s32(vl01, vl23); in xnn_f32_velu_ukernel__neonfma_rr1_lut16_p3_x8() local
|
D | velu-sse41-rr2-lut16-p3-x24.c | 87 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_velu_ukernel__sse41_rr2_lut16_p3_x24() local 132 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_velu_ukernel__sse41_rr2_lut16_p3_x24() local
|
/external/XNNPACK/src/f32-vsigmoid/gen/ |
D | vsigmoid-sse41-rr2-lut64-p2-div-x8.c | 62 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_vsigmoid_ukernel__sse41_rr2_lut64_p2_div_x8() local 79 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_vsigmoid_ukernel__sse41_rr2_lut64_p2_div_x8() local
|
D | vsigmoid-sse2-rr2-lut64-p2-div-x8.c | 64 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_vsigmoid_ukernel__sse2_rr2_lut64_p2_div_x8() local 85 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_vsigmoid_ukernel__sse2_rr2_lut64_p2_div_x8() local
|
D | vsigmoid-sse41-rr2-lut64-p2-div-x12.c | 67 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_vsigmoid_ukernel__sse41_rr2_lut64_p2_div_x12() local 91 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_vsigmoid_ukernel__sse41_rr2_lut64_p2_div_x12() local
|
D | vsigmoid-sse2-rr2-lut64-p2-div-x12.c | 69 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_vsigmoid_ukernel__sse2_rr2_lut64_p2_div_x12() local 99 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_vsigmoid_ukernel__sse2_rr2_lut64_p2_div_x12() local
|
D | vsigmoid-sse41-rr2-lut64-p2-div-x16.c | 72 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_vsigmoid_ukernel__sse41_rr2_lut64_p2_div_x16() local 103 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_vsigmoid_ukernel__sse41_rr2_lut64_p2_div_x16() local
|
D | vsigmoid-sse2-rr2-lut64-p2-div-x16.c | 74 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_vsigmoid_ukernel__sse2_rr2_lut64_p2_div_x16() local 113 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_vsigmoid_ukernel__sse2_rr2_lut64_p2_div_x16() local
|
D | vsigmoid-sse41-rr2-lut64-p2-div-x20.c | 77 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_vsigmoid_ukernel__sse41_rr2_lut64_p2_div_x20() local 115 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_vsigmoid_ukernel__sse41_rr2_lut64_p2_div_x20() local
|
D | vsigmoid-neonfma-rr1-lut64-p2-div-x8.c | 64 const float32x4_t vl0123 = vcombine_f32(vl01, vl23); in xnn_f32_vsigmoid_ukernel__neonfma_rr1_lut64_p2_div_x8() local
|
D | vsigmoid-neonfma-rr1-lut2048-p1-div-x8.c | 63 const float32x4_t vl0123 = vcombine_f32(vl01, vl23); in xnn_f32_vsigmoid_ukernel__neonfma_rr1_lut2048_p1_div_x8() local
|
D | vsigmoid-sse41-rr2-lut64-p2-div-x24.c | 82 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_vsigmoid_ukernel__sse41_rr2_lut64_p2_div_x24() local 127 const __m128i vl0123 = _mm_unpacklo_epi64(vl01, vl23); in xnn_f32_vsigmoid_ukernel__sse41_rr2_lut64_p2_div_x24() local
|
D | vsigmoid-neonfma-rr1-lut2048-p1-nr2recps-x8.c | 63 const float32x4_t vl0123 = vcombine_f32(vl01, vl23); in xnn_f32_vsigmoid_ukernel__neonfma_rr1_lut2048_p1_nr2recps_x8() local
|
/external/XNNPACK/src/f32-raddstoreexpminusmax/gen/ |
D | neonfma-rr1-lut64-p2-x8.c | 66 const float32x4_t vl0123 = vcombine_f32(vl01, vl23); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_rr1_lut64_p2_x8() local
|
D | neon-rr2-lut64-p2-x8-acc2.c | 68 const float32x4_t vl0123 = vcombine_f32(vl01, vl23); in xnn_f32_raddstoreexpminusmax_ukernel__neon_rr2_lut64_p2_x8_acc2() local
|
D | neonfma-rr1-lut64-p2-x8-acc2.c | 67 const float32x4_t vl0123 = vcombine_f32(vl01, vl23); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_rr1_lut64_p2_x8_acc2() local
|
D | neon-rr2-lut64-p2-x8.c | 67 const float32x4_t vl0123 = vcombine_f32(vl01, vl23); in xnn_f32_raddstoreexpminusmax_ukernel__neon_rr2_lut64_p2_x8() local
|