/external/XNNPACK/src/f32-raddstoreexpminusmax/gen/ |
D | neonfma-lut64-p2-x16-acc4.c | 120 const float32x4_t vlCDEF = vcombine_f32(vlCD, vlEF); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_lut64_p2_x16_acc4() local 126 …const float32x4_t vsCDEF = vreinterpretq_f32_s32(vaddq_s32(vreinterpretq_s32_f32(vlCDEF), veCDEF)); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_lut64_p2_x16_acc4()
|
D | neon-lut64-p2-x16-acc2.c | 119 const float32x4_t vlCDEF = vcombine_f32(vlCD, vlEF); in xnn_f32_raddstoreexpminusmax_ukernel__neon_lut64_p2_x16_acc2() local 125 …const float32x4_t vsCDEF = vreinterpretq_f32_s32(vaddq_s32(vreinterpretq_s32_f32(vlCDEF), veCDEF)); in xnn_f32_raddstoreexpminusmax_ukernel__neon_lut64_p2_x16_acc2()
|
D | neon-lut64-p2-x16.c | 118 const float32x4_t vlCDEF = vcombine_f32(vlCD, vlEF); in xnn_f32_raddstoreexpminusmax_ukernel__neon_lut64_p2_x16() local 124 …const float32x4_t vsCDEF = vreinterpretq_f32_s32(vaddq_s32(vreinterpretq_s32_f32(vlCDEF), veCDEF)); in xnn_f32_raddstoreexpminusmax_ukernel__neon_lut64_p2_x16()
|
D | neonfma-lut64-p2-x16-acc2.c | 118 const float32x4_t vlCDEF = vcombine_f32(vlCD, vlEF); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_lut64_p2_x16_acc2() local 124 …const float32x4_t vsCDEF = vreinterpretq_f32_s32(vaddq_s32(vreinterpretq_s32_f32(vlCDEF), veCDEF)); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_lut64_p2_x16_acc2()
|
D | neon-lut64-p2-x16-acc4.c | 121 const float32x4_t vlCDEF = vcombine_f32(vlCD, vlEF); in xnn_f32_raddstoreexpminusmax_ukernel__neon_lut64_p2_x16_acc4() local 127 …const float32x4_t vsCDEF = vreinterpretq_f32_s32(vaddq_s32(vreinterpretq_s32_f32(vlCDEF), veCDEF)); in xnn_f32_raddstoreexpminusmax_ukernel__neon_lut64_p2_x16_acc4()
|
D | neonfma-lut64-p2-x16.c | 117 const float32x4_t vlCDEF = vcombine_f32(vlCD, vlEF); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_lut64_p2_x16() local 123 …const float32x4_t vsCDEF = vreinterpretq_f32_s32(vaddq_s32(vreinterpretq_s32_f32(vlCDEF), veCDEF)); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_lut64_p2_x16()
|
D | neonfma-lut64-p2-x20.c | 126 const float32x4_t vlCDEF = vcombine_f32(vlCD, vlEF); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_lut64_p2_x20() local 135 …const float32x4_t vsCDEF = vreinterpretq_f32_s32(vaddq_s32(vreinterpretq_s32_f32(vlCDEF), veCDEF)); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_lut64_p2_x20()
|
D | neonfma-lut64-p2-x20-acc5.c | 130 const float32x4_t vlCDEF = vcombine_f32(vlCD, vlEF); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_lut64_p2_x20_acc5() local 139 …const float32x4_t vsCDEF = vreinterpretq_f32_s32(vaddq_s32(vreinterpretq_s32_f32(vlCDEF), veCDEF)); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_lut64_p2_x20_acc5()
|
D | neonfma-lut64-p2-x20-acc2.c | 127 const float32x4_t vlCDEF = vcombine_f32(vlCD, vlEF); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_lut64_p2_x20_acc2() local 136 …const float32x4_t vsCDEF = vreinterpretq_f32_s32(vaddq_s32(vreinterpretq_s32_f32(vlCDEF), veCDEF)); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_lut64_p2_x20_acc2()
|
D | neon-lut64-p2-x20-acc2.c | 128 const float32x4_t vlCDEF = vcombine_f32(vlCD, vlEF); in xnn_f32_raddstoreexpminusmax_ukernel__neon_lut64_p2_x20_acc2() local 137 …const float32x4_t vsCDEF = vreinterpretq_f32_s32(vaddq_s32(vreinterpretq_s32_f32(vlCDEF), veCDEF)); in xnn_f32_raddstoreexpminusmax_ukernel__neon_lut64_p2_x20_acc2()
|
D | neon-lut64-p2-x20.c | 127 const float32x4_t vlCDEF = vcombine_f32(vlCD, vlEF); in xnn_f32_raddstoreexpminusmax_ukernel__neon_lut64_p2_x20() local 136 …const float32x4_t vsCDEF = vreinterpretq_f32_s32(vaddq_s32(vreinterpretq_s32_f32(vlCDEF), veCDEF)); in xnn_f32_raddstoreexpminusmax_ukernel__neon_lut64_p2_x20()
|
D | neon-lut64-p2-x20-acc5.c | 131 const float32x4_t vlCDEF = vcombine_f32(vlCD, vlEF); in xnn_f32_raddstoreexpminusmax_ukernel__neon_lut64_p2_x20_acc5() local 140 …const float32x4_t vsCDEF = vreinterpretq_f32_s32(vaddq_s32(vreinterpretq_s32_f32(vlCDEF), veCDEF)); in xnn_f32_raddstoreexpminusmax_ukernel__neon_lut64_p2_x20_acc5()
|
/external/XNNPACK/src/f32-sigmoid/gen/ |
D | neonfma-rr1-lut2048-p1-div-x16.c | 119 const float32x4_t vlCDEF = vcombine_f32(vlCD, vlEF); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut2048_p1_div_x16() local 125 …const float32x4_t vsCDEF = vreinterpretq_f32_s32(vaddq_s32(vreinterpretq_s32_f32(vlCDEF), veCDEF)); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut2048_p1_div_x16()
|
D | neonfma-rr1-lut64-p2-div-x16.c | 119 const float32x4_t vlCDEF = vcombine_f32(vlCD, vlEF); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut64_p2_div_x16() local 125 …const float32x4_t vsCDEF = vreinterpretq_f32_s32(vaddq_s32(vreinterpretq_s32_f32(vlCDEF), veCDEF)); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut64_p2_div_x16()
|
D | neonfma-rr1-lut2048-p1-nr2recps-x16.c | 119 const float32x4_t vlCDEF = vcombine_f32(vlCD, vlEF); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut2048_p1_nr2recps_x16() local 125 …const float32x4_t vsCDEF = vreinterpretq_f32_s32(vaddq_s32(vreinterpretq_s32_f32(vlCDEF), veCDEF)); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut2048_p1_nr2recps_x16()
|
D | neonfma-rr1-lut2048-p1-nr1recps1fma-x16.c | 119 const float32x4_t vlCDEF = vcombine_f32(vlCD, vlEF); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut2048_p1_nr1recps1fma_x16() local 125 …const float32x4_t vsCDEF = vreinterpretq_f32_s32(vaddq_s32(vreinterpretq_s32_f32(vlCDEF), veCDEF)); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut2048_p1_nr1recps1fma_x16()
|
D | neon-rr2-lut64-p2-nr2recps-x16.c | 121 const float32x4_t vlCDEF = vcombine_f32(vlCD, vlEF); in xnn_f32_sigmoid_ukernel__neon_rr2_lut64_p2_nr2recps_x16() local 127 …const float32x4_t vsCDEF = vreinterpretq_f32_s32(vaddq_s32(vreinterpretq_s32_f32(vlCDEF), veCDEF)); in xnn_f32_sigmoid_ukernel__neon_rr2_lut64_p2_nr2recps_x16()
|
D | neonfma-rr1-lut64-p2-nr2fma-x16.c | 119 const float32x4_t vlCDEF = vcombine_f32(vlCD, vlEF); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut64_p2_nr2fma_x16() local 125 …const float32x4_t vsCDEF = vreinterpretq_f32_s32(vaddq_s32(vreinterpretq_s32_f32(vlCDEF), veCDEF)); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut64_p2_nr2fma_x16()
|
D | neonfma-rr1-lut2048-p1-div-x20.c | 128 const float32x4_t vlCDEF = vcombine_f32(vlCD, vlEF); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut2048_p1_div_x20() local 137 …const float32x4_t vsCDEF = vreinterpretq_f32_s32(vaddq_s32(vreinterpretq_s32_f32(vlCDEF), veCDEF)); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut2048_p1_div_x20()
|
D | neonfma-rr1-lut64-p2-nr1recps1fma-x16.c | 119 const float32x4_t vlCDEF = vcombine_f32(vlCD, vlEF); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut64_p2_nr1recps1fma_x16() local 125 …const float32x4_t vsCDEF = vreinterpretq_f32_s32(vaddq_s32(vreinterpretq_s32_f32(vlCDEF), veCDEF)); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut64_p2_nr1recps1fma_x16()
|
D | neonfma-rr1-lut64-p2-nr2recps-x16.c | 119 const float32x4_t vlCDEF = vcombine_f32(vlCD, vlEF); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut64_p2_nr2recps_x16() local 125 …const float32x4_t vsCDEF = vreinterpretq_f32_s32(vaddq_s32(vreinterpretq_s32_f32(vlCDEF), veCDEF)); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut64_p2_nr2recps_x16()
|
D | neon-rr2-lut2048-p1-nr2recps-x16.c | 121 const float32x4_t vlCDEF = vcombine_f32(vlCD, vlEF); in xnn_f32_sigmoid_ukernel__neon_rr2_lut2048_p1_nr2recps_x16() local 127 …const float32x4_t vsCDEF = vreinterpretq_f32_s32(vaddq_s32(vreinterpretq_s32_f32(vlCDEF), veCDEF)); in xnn_f32_sigmoid_ukernel__neon_rr2_lut2048_p1_nr2recps_x16()
|
D | neonfma-rr1-lut2048-p1-nr2fma-x16.c | 119 const float32x4_t vlCDEF = vcombine_f32(vlCD, vlEF); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut2048_p1_nr2fma_x16() local 125 …const float32x4_t vsCDEF = vreinterpretq_f32_s32(vaddq_s32(vreinterpretq_s32_f32(vlCDEF), veCDEF)); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut2048_p1_nr2fma_x16()
|
D | neonfma-rr1-lut64-p2-div-x20.c | 128 const float32x4_t vlCDEF = vcombine_f32(vlCD, vlEF); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut64_p2_div_x20() local 137 …const float32x4_t vsCDEF = vreinterpretq_f32_s32(vaddq_s32(vreinterpretq_s32_f32(vlCDEF), veCDEF)); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut64_p2_div_x20()
|
D | neonfma-rr1-lut64-p2-nr1recps1fma-x20.c | 128 const float32x4_t vlCDEF = vcombine_f32(vlCD, vlEF); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut64_p2_nr1recps1fma_x20() local 137 …const float32x4_t vsCDEF = vreinterpretq_f32_s32(vaddq_s32(vreinterpretq_s32_f32(vlCDEF), veCDEF)); in xnn_f32_sigmoid_ukernel__neonfma_rr1_lut64_p2_nr1recps1fma_x20()
|