Home
last modified time | relevance | path

Searched refs:vl01 (Results 1 – 25 of 85) sorted by relevance

1234

/external/XNNPACK/src/math/
Dexpminus-neonfma-lut2048-p1.c576 float32x2_t vl01 = vld1_dup_f32(&exp2_k_over_2048_table[(uint32_t) vidx01]); in xnn_math_f32_expminus__neonfma_lut2048_p1() local
578 vl01 = vld1_lane_f32(&exp2_k_over_2048_table[(uint32_t) (vidx01 >> 32)], vl01, 1); in xnn_math_f32_expminus__neonfma_lut2048_p1()
580 const float32x4_t vl = vcombine_f32(vl01, vl23); in xnn_math_f32_expminus__neonfma_lut2048_p1()
Dexpminus-neonfma-lut64-p2.c80 float32x2_t vl01 = vld1_dup_f32(&exp2_k_over_64_table[(uint32_t) vidx01]); in xnn_math_f32_expminus__neonfma_lut64_p2() local
82 vl01 = vld1_lane_f32(&exp2_k_over_64_table[(uint32_t) (vidx01 >> 32)], vl01, 1); in xnn_math_f32_expminus__neonfma_lut64_p2()
84 const float32x4_t vl = vcombine_f32(vl01, vl23); in xnn_math_f32_expminus__neonfma_lut64_p2()
Dsigmoid-neonfma-rr1-lut2048-p1-div.c74 float32x2_t vl01 = vld1_dup_f32(&xnn_table_exp2_k_over_2048[(uint32_t) vidx01]); in xnn_math_f32_sigmoid__neonfma_rr1_lut2048_p1_div() local
76 vl01 = vld1_lane_f32(&xnn_table_exp2_k_over_2048[(uint32_t) (vidx01 >> 32)], vl01, 1); in xnn_math_f32_sigmoid__neonfma_rr1_lut2048_p1_div()
78 const float32x4_t vl = vcombine_f32(vl01, vl23); in xnn_math_f32_sigmoid__neonfma_rr1_lut2048_p1_div()
Dsigmoid-neonfma-rr1-lut2048-p1-nr2recps.c74 float32x2_t vl01 = vld1_dup_f32(&xnn_table_exp2_k_over_2048[(uint32_t) vidx01]); in xnn_math_f32_sigmoid__neonfma_rr1_lut2048_p1_nr2recps() local
76 vl01 = vld1_lane_f32(&xnn_table_exp2_k_over_2048[(uint32_t) (vidx01 >> 32)], vl01, 1); in xnn_math_f32_sigmoid__neonfma_rr1_lut2048_p1_nr2recps()
78 const float32x4_t vl = vcombine_f32(vl01, vl23); in xnn_math_f32_sigmoid__neonfma_rr1_lut2048_p1_nr2recps()
Dsigmoid-neonfma-rr1-lut2048-p1-nr2fma.c74 float32x2_t vl01 = vld1_dup_f32(&xnn_table_exp2_k_over_2048[(uint32_t) vidx01]); in xnn_math_f32_sigmoid__neonfma_rr1_lut2048_p1_nr2fma() local
76 vl01 = vld1_lane_f32(&xnn_table_exp2_k_over_2048[(uint32_t) (vidx01 >> 32)], vl01, 1); in xnn_math_f32_sigmoid__neonfma_rr1_lut2048_p1_nr2fma()
78 const float32x4_t vl = vcombine_f32(vl01, vl23); in xnn_math_f32_sigmoid__neonfma_rr1_lut2048_p1_nr2fma()
Dsigmoid-neonfma-rr1-lut2048-p1-nr1recps1fma.c74 float32x2_t vl01 = vld1_dup_f32(&xnn_table_exp2_k_over_2048[(uint32_t) vidx01]); in xnn_math_f32_sigmoid__neonfma_rr1_lut2048_p1_nr1recps1fma() local
76 vl01 = vld1_lane_f32(&xnn_table_exp2_k_over_2048[(uint32_t) (vidx01 >> 32)], vl01, 1); in xnn_math_f32_sigmoid__neonfma_rr1_lut2048_p1_nr1recps1fma()
78 const float32x4_t vl = vcombine_f32(vl01, vl23); in xnn_math_f32_sigmoid__neonfma_rr1_lut2048_p1_nr1recps1fma()
Dsigmoid-neonfma-rr2-lut2048-p1-div.c75 float32x2_t vl01 = vld1_dup_f32(&xnn_table_exp2_k_over_2048[(uint32_t) vidx01]); in xnn_math_f32_sigmoid__neonfma_rr2_lut2048_p1_div() local
77 vl01 = vld1_lane_f32(&xnn_table_exp2_k_over_2048[(uint32_t) (vidx01 >> 32)], vl01, 1); in xnn_math_f32_sigmoid__neonfma_rr2_lut2048_p1_div()
79 const float32x4_t vl = vcombine_f32(vl01, vl23); in xnn_math_f32_sigmoid__neonfma_rr2_lut2048_p1_div()
Dsigmoid-neon-rr1-lut2048-p1-nr2recps.c74 float32x2_t vl01 = vld1_dup_f32(&xnn_table_exp2_k_over_2048[(uint32_t) vidx01]); in xnn_math_f32_sigmoid__neon_rr1_lut2048_p1_nr2recps() local
76 vl01 = vld1_lane_f32(&xnn_table_exp2_k_over_2048[(uint32_t) (vidx01 >> 32)], vl01, 1); in xnn_math_f32_sigmoid__neon_rr1_lut2048_p1_nr2recps()
78 const float32x4_t vl = vcombine_f32(vl01, vl23); in xnn_math_f32_sigmoid__neon_rr1_lut2048_p1_nr2recps()
Dsigmoid-neonfma-rr2-lut2048-p1-nr2fma.c75 float32x2_t vl01 = vld1_dup_f32(&xnn_table_exp2_k_over_2048[(uint32_t) vidx01]); in xnn_math_f32_sigmoid__neonfma_rr2_lut2048_p1_nr2fma() local
77 vl01 = vld1_lane_f32(&xnn_table_exp2_k_over_2048[(uint32_t) (vidx01 >> 32)], vl01, 1); in xnn_math_f32_sigmoid__neonfma_rr2_lut2048_p1_nr2fma()
79 const float32x4_t vl = vcombine_f32(vl01, vl23); in xnn_math_f32_sigmoid__neonfma_rr2_lut2048_p1_nr2fma()
Dsigmoid-neon-rr2-lut2048-p1-nr2recps.c76 float32x2_t vl01 = vld1_dup_f32(&xnn_table_exp2_k_over_2048[(uint32_t) vidx01]); in xnn_math_f32_sigmoid__neon_rr2_lut2048_p1_nr2recps() local
78 vl01 = vld1_lane_f32(&xnn_table_exp2_k_over_2048[(uint32_t) (vidx01 >> 32)], vl01, 1); in xnn_math_f32_sigmoid__neon_rr2_lut2048_p1_nr2recps()
80 const float32x4_t vl = vcombine_f32(vl01, vl23); in xnn_math_f32_sigmoid__neon_rr2_lut2048_p1_nr2recps()
Dsigmoid-neonfma-rr2-lut2048-p1-nr1recps1fma.c75 float32x2_t vl01 = vld1_dup_f32(&xnn_table_exp2_k_over_2048[(uint32_t) vidx01]); in xnn_math_f32_sigmoid__neonfma_rr2_lut2048_p1_nr1recps1fma() local
77 vl01 = vld1_lane_f32(&xnn_table_exp2_k_over_2048[(uint32_t) (vidx01 >> 32)], vl01, 1); in xnn_math_f32_sigmoid__neonfma_rr2_lut2048_p1_nr1recps1fma()
79 const float32x4_t vl = vcombine_f32(vl01, vl23); in xnn_math_f32_sigmoid__neonfma_rr2_lut2048_p1_nr1recps1fma()
Dsigmoid-neonfma-rr2-lut2048-p1-nr2recps.c75 float32x2_t vl01 = vld1_dup_f32(&xnn_table_exp2_k_over_2048[(uint32_t) vidx01]); in xnn_math_f32_sigmoid__neonfma_rr2_lut2048_p1_nr2recps() local
77 vl01 = vld1_lane_f32(&xnn_table_exp2_k_over_2048[(uint32_t) (vidx01 >> 32)], vl01, 1); in xnn_math_f32_sigmoid__neonfma_rr2_lut2048_p1_nr2recps()
79 const float32x4_t vl = vcombine_f32(vl01, vl23); in xnn_math_f32_sigmoid__neonfma_rr2_lut2048_p1_nr2recps()
Dexp-neonfma-lut64-p2.c88 float32x2_t vl01 = vld1_dup_f32(&exp2_table[(uint32_t) vidx01]); in xnn_math_f32_exp__neonfma_lut64_p2() local
90 vl01 = vld1_lane_f32(&exp2_table[(uint32_t) (vidx01 >> 32)], vl01, 1); in xnn_math_f32_exp__neonfma_lut64_p2()
92 float32x4_t vl = vcombine_f32(vl01, vl23); in xnn_math_f32_exp__neonfma_lut64_p2()
/external/XNNPACK/src/f32-raddstoreexpminusmax/gen/
Dneon-lut64-p2-x8-acc2.c85 float32x2_t vl01 = vld1_dup_f32(&xnn_table_exp2_k_over_64[(uint32_t) vidx01]); in xnn_f32_raddstoreexpminusmax_ukernel__neon_lut64_p2_x8_acc2() local
90 vl01 = vld1_lane_f32(&xnn_table_exp2_k_over_64[(uint32_t) (vidx01 >> 32)], vl01, 1); in xnn_f32_raddstoreexpminusmax_ukernel__neon_lut64_p2_x8_acc2()
92 const float32x4_t vl0123 = vcombine_f32(vl01, vl23); in xnn_f32_raddstoreexpminusmax_ukernel__neon_lut64_p2_x8_acc2()
Dneonfma-lut64-p2-x8-acc2.c84 float32x2_t vl01 = vld1_dup_f32(&xnn_table_exp2_k_over_64[(uint32_t) vidx01]); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_lut64_p2_x8_acc2() local
89 vl01 = vld1_lane_f32(&xnn_table_exp2_k_over_64[(uint32_t) (vidx01 >> 32)], vl01, 1); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_lut64_p2_x8_acc2()
91 const float32x4_t vl0123 = vcombine_f32(vl01, vl23); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_lut64_p2_x8_acc2()
Dneon-lut64-p2-x8.c84 float32x2_t vl01 = vld1_dup_f32(&xnn_table_exp2_k_over_64[(uint32_t) vidx01]); in xnn_f32_raddstoreexpminusmax_ukernel__neon_lut64_p2_x8() local
89 vl01 = vld1_lane_f32(&xnn_table_exp2_k_over_64[(uint32_t) (vidx01 >> 32)], vl01, 1); in xnn_f32_raddstoreexpminusmax_ukernel__neon_lut64_p2_x8()
91 const float32x4_t vl0123 = vcombine_f32(vl01, vl23); in xnn_f32_raddstoreexpminusmax_ukernel__neon_lut64_p2_x8()
Dneonfma-lut64-p2-x8.c83 float32x2_t vl01 = vld1_dup_f32(&xnn_table_exp2_k_over_64[(uint32_t) vidx01]); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_lut64_p2_x8() local
88 vl01 = vld1_lane_f32(&xnn_table_exp2_k_over_64[(uint32_t) (vidx01 >> 32)], vl01, 1); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_lut64_p2_x8()
90 const float32x4_t vl0123 = vcombine_f32(vl01, vl23); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_lut64_p2_x8()
/external/XNNPACK/src/f32-sigmoid/gen/
Dneonfma-rr1-lut64-p2-div-x8.c83 float32x2_t vl01 = vld1_dup_f32(&xnn_table_exp2_k_over_64[(uint32_t) vidx01]); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut64_p2_div_x8() local
90 vl01 = vld1_lane_f32(&xnn_table_exp2_k_over_64[(uint32_t) (vidx01 >> 32)], vl01, 1); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut64_p2_div_x8()
92 const float32x4_t vl0123 = vcombine_f32(vl01, vl23); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut64_p2_div_x8()
Dneonfma-rr1-lut2048-p1-div-x8.c83 float32x2_t vl01 = vld1_dup_f32(&xnn_table_exp2_k_over_2048[(uint32_t) vidx01]); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut2048_p1_div_x8() local
90 vl01 = vld1_lane_f32(&xnn_table_exp2_k_over_2048[(uint32_t) (vidx01 >> 32)], vl01, 1); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut2048_p1_div_x8()
92 const float32x4_t vl0123 = vcombine_f32(vl01, vl23); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut2048_p1_div_x8()
Dneonfma-rr1-lut2048-p1-nr1recps1fma-x8.c83 float32x2_t vl01 = vld1_dup_f32(&xnn_table_exp2_k_over_2048[(uint32_t) vidx01]); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut2048_p1_nr1recps1fma_x8() local
90 vl01 = vld1_lane_f32(&xnn_table_exp2_k_over_2048[(uint32_t) (vidx01 >> 32)], vl01, 1); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut2048_p1_nr1recps1fma_x8()
92 const float32x4_t vl0123 = vcombine_f32(vl01, vl23); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut2048_p1_nr1recps1fma_x8()
Dneonfma-rr1-lut2048-p1-nr2recps-x8.c83 float32x2_t vl01 = vld1_dup_f32(&xnn_table_exp2_k_over_2048[(uint32_t) vidx01]); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut2048_p1_nr2recps_x8() local
90 vl01 = vld1_lane_f32(&xnn_table_exp2_k_over_2048[(uint32_t) (vidx01 >> 32)], vl01, 1); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut2048_p1_nr2recps_x8()
92 const float32x4_t vl0123 = vcombine_f32(vl01, vl23); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut2048_p1_nr2recps_x8()
Dneonfma-rr1-lut64-p2-nr1recps1fma-x8.c83 float32x2_t vl01 = vld1_dup_f32(&xnn_table_exp2_k_over_64[(uint32_t) vidx01]); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut64_p2_nr1recps1fma_x8() local
90 vl01 = vld1_lane_f32(&xnn_table_exp2_k_over_64[(uint32_t) (vidx01 >> 32)], vl01, 1); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut64_p2_nr1recps1fma_x8()
92 const float32x4_t vl0123 = vcombine_f32(vl01, vl23); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut64_p2_nr1recps1fma_x8()
Dneonfma-rr1-lut64-p2-nr2recps-x8.c83 float32x2_t vl01 = vld1_dup_f32(&xnn_table_exp2_k_over_64[(uint32_t) vidx01]); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut64_p2_nr2recps_x8() local
90 vl01 = vld1_lane_f32(&xnn_table_exp2_k_over_64[(uint32_t) (vidx01 >> 32)], vl01, 1); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut64_p2_nr2recps_x8()
92 const float32x4_t vl0123 = vcombine_f32(vl01, vl23); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut64_p2_nr2recps_x8()
Dneonfma-rr1-lut2048-p1-nr2fma-x8.c83 float32x2_t vl01 = vld1_dup_f32(&xnn_table_exp2_k_over_2048[(uint32_t) vidx01]); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut2048_p1_nr2fma_x8() local
90 vl01 = vld1_lane_f32(&xnn_table_exp2_k_over_2048[(uint32_t) (vidx01 >> 32)], vl01, 1); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut2048_p1_nr2fma_x8()
92 const float32x4_t vl0123 = vcombine_f32(vl01, vl23); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut2048_p1_nr2fma_x8()
Dneon-rr2-lut2048-p1-nr2recps-x8.c85 float32x2_t vl01 = vld1_dup_f32(&xnn_table_exp2_k_over_2048[(uint32_t) vidx01]); in xnn_f32_sigmoid_ukernel__neon_rr2_lut2048_p1_nr2recps_x8() local
92 vl01 = vld1_lane_f32(&xnn_table_exp2_k_over_2048[(uint32_t) (vidx01 >> 32)], vl01, 1); in xnn_f32_sigmoid_ukernel__neon_rr2_lut2048_p1_nr2recps_x8()
94 const float32x4_t vl0123 = vcombine_f32(vl01, vl23); in xnn_f32_sigmoid_ukernel__neon_rr2_lut2048_p1_nr2recps_x8()

1234