Home
last modified time | relevance | path

Searched refs:vp89AB (Results 1 – 25 of 126) sorted by relevance

123456

/external/XNNPACK/src/f32-sigmoid/gen/
Dpsimd-p5-div-x12.c94 psimd_f32 vp89AB = psimd_qfma_f32(vc4, vt89AB, vc5); in xnn_f32_sigmoid_ukernel__psimd_p5_div_x12() local
98 vp89AB = psimd_qfma_f32(vc3, vt89AB, vp89AB); in xnn_f32_sigmoid_ukernel__psimd_p5_div_x12()
102 vp89AB = psimd_qfma_f32(vc2, vt89AB, vp89AB); in xnn_f32_sigmoid_ukernel__psimd_p5_div_x12()
106 vp89AB = psimd_qfma_f32(vc1, vt89AB, vp89AB); in xnn_f32_sigmoid_ukernel__psimd_p5_div_x12()
118 const psimd_f32 ve89AB = psimd_qfma_f32(vs89AB, vt89AB, vp89AB); in xnn_f32_sigmoid_ukernel__psimd_p5_div_x12()
Dneonfma-rr1-p5-div-x12.c85 float32x4_t vp89AB = vfmaq_f32(vc4, vc5, vt89AB); in xnn_f32_sigmoid_ukernel__neonfma_rr1_p5_div_x12() local
89 vp89AB = vfmaq_f32(vc3, vp89AB, vt89AB); in xnn_f32_sigmoid_ukernel__neonfma_rr1_p5_div_x12()
93 vp89AB = vfmaq_f32(vc2, vp89AB, vt89AB); in xnn_f32_sigmoid_ukernel__neonfma_rr1_p5_div_x12()
97 vp89AB = vfmaq_f32(vc1, vp89AB, vt89AB); in xnn_f32_sigmoid_ukernel__neonfma_rr1_p5_div_x12()
109 float32x4_t ve89AB = vfmaq_f32(vs89AB, vp89AB, vt89AB); in xnn_f32_sigmoid_ukernel__neonfma_rr1_p5_div_x12()
Dpsimd-p5-div-x16.c101 psimd_f32 vp89AB = psimd_qfma_f32(vc4, vt89AB, vc5); in xnn_f32_sigmoid_ukernel__psimd_p5_div_x16() local
106 vp89AB = psimd_qfma_f32(vc3, vt89AB, vp89AB); in xnn_f32_sigmoid_ukernel__psimd_p5_div_x16()
111 vp89AB = psimd_qfma_f32(vc2, vt89AB, vp89AB); in xnn_f32_sigmoid_ukernel__psimd_p5_div_x16()
116 vp89AB = psimd_qfma_f32(vc1, vt89AB, vp89AB); in xnn_f32_sigmoid_ukernel__psimd_p5_div_x16()
130 const psimd_f32 ve89AB = psimd_qfma_f32(vs89AB, vt89AB, vp89AB); in xnn_f32_sigmoid_ukernel__psimd_p5_div_x16()
Dsse41-p5-div-x12.c93 __m128 vp89AB = _mm_add_ps(_mm_mul_ps(vc5, vt89AB), vc4); in xnn_f32_sigmoid_ukernel__sse41_p5_div_x12() local
97 vp89AB = _mm_add_ps(_mm_mul_ps(vp89AB, vt89AB), vc3); in xnn_f32_sigmoid_ukernel__sse41_p5_div_x12()
101 vp89AB = _mm_add_ps(_mm_mul_ps(vp89AB, vt89AB), vc2); in xnn_f32_sigmoid_ukernel__sse41_p5_div_x12()
105 vp89AB = _mm_add_ps(_mm_mul_ps(vp89AB, vt89AB), vc1); in xnn_f32_sigmoid_ukernel__sse41_p5_div_x12()
117 __m128 ve89AB = _mm_add_ps(_mm_mul_ps(vt89AB, vp89AB), vs89AB); in xnn_f32_sigmoid_ukernel__sse41_p5_div_x12()
Dneonfma-rr1-p5-div-x16.c91 float32x4_t vp89AB = vfmaq_f32(vc4, vc5, vt89AB); in xnn_f32_sigmoid_ukernel__neonfma_rr1_p5_div_x16() local
96 vp89AB = vfmaq_f32(vc3, vp89AB, vt89AB); in xnn_f32_sigmoid_ukernel__neonfma_rr1_p5_div_x16()
101 vp89AB = vfmaq_f32(vc2, vp89AB, vt89AB); in xnn_f32_sigmoid_ukernel__neonfma_rr1_p5_div_x16()
106 vp89AB = vfmaq_f32(vc1, vp89AB, vt89AB); in xnn_f32_sigmoid_ukernel__neonfma_rr1_p5_div_x16()
120 float32x4_t ve89AB = vfmaq_f32(vs89AB, vp89AB, vt89AB); in xnn_f32_sigmoid_ukernel__neonfma_rr1_p5_div_x16()
Dneonfma-rr1-p5-nr2fma-x12.c85 float32x4_t vp89AB = vfmaq_f32(vc4, vc5, vt89AB); in xnn_f32_sigmoid_ukernel__neonfma_rr1_p5_nr2fma_x12() local
89 vp89AB = vfmaq_f32(vc3, vp89AB, vt89AB); in xnn_f32_sigmoid_ukernel__neonfma_rr1_p5_nr2fma_x12()
93 vp89AB = vfmaq_f32(vc2, vp89AB, vt89AB); in xnn_f32_sigmoid_ukernel__neonfma_rr1_p5_nr2fma_x12()
97 vp89AB = vfmaq_f32(vc1, vp89AB, vt89AB); in xnn_f32_sigmoid_ukernel__neonfma_rr1_p5_nr2fma_x12()
109 float32x4_t ve89AB = vfmaq_f32(vs89AB, vp89AB, vt89AB); in xnn_f32_sigmoid_ukernel__neonfma_rr1_p5_nr2fma_x12()
Dneonfma-rr1-p5-nr2recps-x12.c85 float32x4_t vp89AB = vfmaq_f32(vc4, vc5, vt89AB); in xnn_f32_sigmoid_ukernel__neonfma_rr1_p5_nr2recps_x12() local
89 vp89AB = vfmaq_f32(vc3, vp89AB, vt89AB); in xnn_f32_sigmoid_ukernel__neonfma_rr1_p5_nr2recps_x12()
93 vp89AB = vfmaq_f32(vc2, vp89AB, vt89AB); in xnn_f32_sigmoid_ukernel__neonfma_rr1_p5_nr2recps_x12()
97 vp89AB = vfmaq_f32(vc1, vp89AB, vt89AB); in xnn_f32_sigmoid_ukernel__neonfma_rr1_p5_nr2recps_x12()
109 float32x4_t ve89AB = vfmaq_f32(vs89AB, vp89AB, vt89AB); in xnn_f32_sigmoid_ukernel__neonfma_rr1_p5_nr2recps_x12()
Dneon-rr2-p5-nr2recps-x12.c92 float32x4_t vp89AB = vmlaq_f32(vc4, vc5, vt89AB); in xnn_f32_sigmoid_ukernel__neon_rr2_p5_nr2recps_x12() local
96 vp89AB = vmlaq_f32(vc3, vp89AB, vt89AB); in xnn_f32_sigmoid_ukernel__neon_rr2_p5_nr2recps_x12()
100 vp89AB = vmlaq_f32(vc2, vp89AB, vt89AB); in xnn_f32_sigmoid_ukernel__neon_rr2_p5_nr2recps_x12()
104 vp89AB = vmlaq_f32(vc1, vp89AB, vt89AB); in xnn_f32_sigmoid_ukernel__neon_rr2_p5_nr2recps_x12()
116 float32x4_t ve89AB = vmlaq_f32(vs89AB, vp89AB, vt89AB); in xnn_f32_sigmoid_ukernel__neon_rr2_p5_nr2recps_x12()
/external/XNNPACK/src/f32-raddstoreexpminusmax/gen/
Dpsimd-p5-x12.c85 psimd_f32 vp89AB = psimd_qfma_f32(vc4, vc5, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x12() local
89 vp89AB = psimd_qfma_f32(vc3, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x12()
93 vp89AB = psimd_qfma_f32(vc2, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x12()
97 vp89AB = psimd_qfma_f32(vc1, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x12()
109 psimd_f32 vf89AB = psimd_qfma_f32(vs89AB, vt89AB, vp89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x12()
Dpsimd-p5-x12-acc2.c86 psimd_f32 vp89AB = psimd_qfma_f32(vc4, vc5, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x12_acc2() local
90 vp89AB = psimd_qfma_f32(vc3, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x12_acc2()
94 vp89AB = psimd_qfma_f32(vc2, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x12_acc2()
98 vp89AB = psimd_qfma_f32(vc1, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x12_acc2()
110 psimd_f32 vf89AB = psimd_qfma_f32(vs89AB, vt89AB, vp89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x12_acc2()
Dpsimd-p5-x12-acc3.c87 psimd_f32 vp89AB = psimd_qfma_f32(vc4, vc5, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x12_acc3() local
91 vp89AB = psimd_qfma_f32(vc3, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x12_acc3()
95 vp89AB = psimd_qfma_f32(vc2, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x12_acc3()
99 vp89AB = psimd_qfma_f32(vc1, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x12_acc3()
111 psimd_f32 vf89AB = psimd_qfma_f32(vs89AB, vt89AB, vp89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x12_acc3()
Dsse2-p5-x12.c85 __m128 vp89AB = _mm_add_ps(_mm_mul_ps(vc5, vt89AB), vc4); in xnn_f32_raddstoreexpminusmax_ukernel__sse2_p5_x12() local
89 vp89AB = _mm_add_ps(_mm_mul_ps(vp89AB, vt89AB), vc3); in xnn_f32_raddstoreexpminusmax_ukernel__sse2_p5_x12()
93 vp89AB = _mm_add_ps(_mm_mul_ps(vp89AB, vt89AB), vc2); in xnn_f32_raddstoreexpminusmax_ukernel__sse2_p5_x12()
97 vp89AB = _mm_add_ps(_mm_mul_ps(vp89AB, vt89AB), vc1); in xnn_f32_raddstoreexpminusmax_ukernel__sse2_p5_x12()
109 __m128 vf89AB = _mm_add_ps(_mm_mul_ps(vt89AB, vp89AB), vs89AB); in xnn_f32_raddstoreexpminusmax_ukernel__sse2_p5_x12()
Dneon-p5-x12.c89 float32x4_t vp89AB = vmlaq_f32(vc4, vc5, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neon_p5_x12() local
93 vp89AB = vmlaq_f32(vc3, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neon_p5_x12()
97 vp89AB = vmlaq_f32(vc2, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neon_p5_x12()
101 vp89AB = vmlaq_f32(vc1, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neon_p5_x12()
113 float32x4_t vf89AB = vmlaq_f32(vs89AB, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neon_p5_x12()
Dneonfma-p5-x12.c88 float32x4_t vp89AB = vfmaq_f32(vc4, vc5, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_p5_x12() local
92 vp89AB = vfmaq_f32(vc3, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_p5_x12()
96 vp89AB = vfmaq_f32(vc2, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_p5_x12()
100 vp89AB = vfmaq_f32(vc1, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_p5_x12()
112 float32x4_t vf89AB = vfmaq_f32(vs89AB, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_p5_x12()
Dneonfma-p5-x12-acc2.c89 float32x4_t vp89AB = vfmaq_f32(vc4, vc5, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_p5_x12_acc2() local
93 vp89AB = vfmaq_f32(vc3, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_p5_x12_acc2()
97 vp89AB = vfmaq_f32(vc2, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_p5_x12_acc2()
101 vp89AB = vfmaq_f32(vc1, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_p5_x12_acc2()
113 float32x4_t vf89AB = vfmaq_f32(vs89AB, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_p5_x12_acc2()
Dneon-p5-x12-acc2.c90 float32x4_t vp89AB = vmlaq_f32(vc4, vc5, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neon_p5_x12_acc2() local
94 vp89AB = vmlaq_f32(vc3, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neon_p5_x12_acc2()
98 vp89AB = vmlaq_f32(vc2, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neon_p5_x12_acc2()
102 vp89AB = vmlaq_f32(vc1, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neon_p5_x12_acc2()
114 float32x4_t vf89AB = vmlaq_f32(vs89AB, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neon_p5_x12_acc2()
Dpsimd-p5-x16-acc2.c93 psimd_f32 vp89AB = psimd_qfma_f32(vc4, vc5, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x16_acc2() local
98 vp89AB = psimd_qfma_f32(vc3, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x16_acc2()
103 vp89AB = psimd_qfma_f32(vc2, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x16_acc2()
108 vp89AB = psimd_qfma_f32(vc1, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x16_acc2()
122 psimd_f32 vf89AB = psimd_qfma_f32(vs89AB, vt89AB, vp89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x16_acc2()
Dsse2-p5-x12-acc3.c87 __m128 vp89AB = _mm_add_ps(_mm_mul_ps(vc5, vt89AB), vc4); in xnn_f32_raddstoreexpminusmax_ukernel__sse2_p5_x12_acc3() local
91 vp89AB = _mm_add_ps(_mm_mul_ps(vp89AB, vt89AB), vc3); in xnn_f32_raddstoreexpminusmax_ukernel__sse2_p5_x12_acc3()
95 vp89AB = _mm_add_ps(_mm_mul_ps(vp89AB, vt89AB), vc2); in xnn_f32_raddstoreexpminusmax_ukernel__sse2_p5_x12_acc3()
99 vp89AB = _mm_add_ps(_mm_mul_ps(vp89AB, vt89AB), vc1); in xnn_f32_raddstoreexpminusmax_ukernel__sse2_p5_x12_acc3()
111 __m128 vf89AB = _mm_add_ps(_mm_mul_ps(vt89AB, vp89AB), vs89AB); in xnn_f32_raddstoreexpminusmax_ukernel__sse2_p5_x12_acc3()
Dpsimd-p5-x16.c92 psimd_f32 vp89AB = psimd_qfma_f32(vc4, vc5, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x16() local
97 vp89AB = psimd_qfma_f32(vc3, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x16()
102 vp89AB = psimd_qfma_f32(vc2, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x16()
107 vp89AB = psimd_qfma_f32(vc1, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x16()
121 psimd_f32 vf89AB = psimd_qfma_f32(vs89AB, vt89AB, vp89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x16()
Dpsimd-p5-x16-acc4.c95 psimd_f32 vp89AB = psimd_qfma_f32(vc4, vc5, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x16_acc4() local
100 vp89AB = psimd_qfma_f32(vc3, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x16_acc4()
105 vp89AB = psimd_qfma_f32(vc2, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x16_acc4()
110 vp89AB = psimd_qfma_f32(vc1, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x16_acc4()
124 psimd_f32 vf89AB = psimd_qfma_f32(vs89AB, vt89AB, vp89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x16_acc4()
Dneonfma-p5-x12-acc3.c90 float32x4_t vp89AB = vfmaq_f32(vc4, vc5, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_p5_x12_acc3() local
94 vp89AB = vfmaq_f32(vc3, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_p5_x12_acc3()
98 vp89AB = vfmaq_f32(vc2, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_p5_x12_acc3()
102 vp89AB = vfmaq_f32(vc1, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_p5_x12_acc3()
114 float32x4_t vf89AB = vfmaq_f32(vs89AB, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_p5_x12_acc3()
Dneon-p5-x12-acc3.c91 float32x4_t vp89AB = vmlaq_f32(vc4, vc5, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neon_p5_x12_acc3() local
95 vp89AB = vmlaq_f32(vc3, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neon_p5_x12_acc3()
99 vp89AB = vmlaq_f32(vc2, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neon_p5_x12_acc3()
103 vp89AB = vmlaq_f32(vc1, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neon_p5_x12_acc3()
115 float32x4_t vf89AB = vmlaq_f32(vs89AB, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neon_p5_x12_acc3()
Dsse2-p5-x12-acc2.c86 __m128 vp89AB = _mm_add_ps(_mm_mul_ps(vc5, vt89AB), vc4); in xnn_f32_raddstoreexpminusmax_ukernel__sse2_p5_x12_acc2() local
90 vp89AB = _mm_add_ps(_mm_mul_ps(vp89AB, vt89AB), vc3); in xnn_f32_raddstoreexpminusmax_ukernel__sse2_p5_x12_acc2()
94 vp89AB = _mm_add_ps(_mm_mul_ps(vp89AB, vt89AB), vc2); in xnn_f32_raddstoreexpminusmax_ukernel__sse2_p5_x12_acc2()
98 vp89AB = _mm_add_ps(_mm_mul_ps(vp89AB, vt89AB), vc1); in xnn_f32_raddstoreexpminusmax_ukernel__sse2_p5_x12_acc2()
110 __m128 vf89AB = _mm_add_ps(_mm_mul_ps(vt89AB, vp89AB), vs89AB); in xnn_f32_raddstoreexpminusmax_ukernel__sse2_p5_x12_acc2()
Dneonfma-p5-x16-acc4.c98 float32x4_t vp89AB = vfmaq_f32(vc4, vc5, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_p5_x16_acc4() local
103 vp89AB = vfmaq_f32(vc3, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_p5_x16_acc4()
108 vp89AB = vfmaq_f32(vc2, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_p5_x16_acc4()
113 vp89AB = vfmaq_f32(vc1, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_p5_x16_acc4()
127 float32x4_t vf89AB = vfmaq_f32(vs89AB, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_p5_x16_acc4()
Dpsimd-p5-x20-acc2.c100 psimd_f32 vp89AB = psimd_qfma_f32(vc4, vc5, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x20_acc2() local
106 vp89AB = psimd_qfma_f32(vc3, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x20_acc2()
112 vp89AB = psimd_qfma_f32(vc2, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x20_acc2()
118 vp89AB = psimd_qfma_f32(vc1, vp89AB, vt89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x20_acc2()
134 psimd_f32 vf89AB = psimd_qfma_f32(vs89AB, vt89AB, vp89AB); in xnn_f32_raddstoreexpminusmax_ukernel__psimd_p5_x20_acc2()

123456