/external/XNNPACK/src/f32-raddstoreexpminusmax/gen/ |
D | neonfma-p5-x4.c | 94 float vacc_lo = vaddvq_f32(vacc); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_p5_x4() local 96 float32x2_t vacc_lo = vadd_f32(vget_high_f32(vacc), vget_low_f32(vacc)); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_p5_x4() local
|
D | neon-p5-x4.c | 95 float vacc_lo = vaddvq_f32(vacc); in xnn_f32_raddstoreexpminusmax_ukernel__neon_p5_x4() local 97 float32x2_t vacc_lo = vadd_f32(vget_high_f32(vacc), vget_low_f32(vacc)); in xnn_f32_raddstoreexpminusmax_ukernel__neon_p5_x4() local
|
D | neonfma-lut64-p2-x4.c | 113 float vacc_lo = vaddvq_f32(vacc); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_lut64_p2_x4() local 115 float32x2_t vacc_lo = vadd_f32(vget_high_f32(vacc), vget_low_f32(vacc)); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_lut64_p2_x4() local
|
D | neon-lut64-p2-x4.c | 114 float vacc_lo = vaddvq_f32(vacc); in xnn_f32_raddstoreexpminusmax_ukernel__neon_lut64_p2_x4() local 116 float32x2_t vacc_lo = vadd_f32(vget_high_f32(vacc), vget_low_f32(vacc)); in xnn_f32_raddstoreexpminusmax_ukernel__neon_lut64_p2_x4() local
|
D | neonfma-p5-x8-acc2.c | 170 float vacc_lo = vaddvq_f32(vacc); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_p5_x8_acc2() local 172 float32x2_t vacc_lo = vadd_f32(vget_high_f32(vacc), vget_low_f32(vacc)); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_p5_x8_acc2() local
|
D | neon-p5-x8.c | 168 float vacc_lo = vaddvq_f32(vacc); in xnn_f32_raddstoreexpminusmax_ukernel__neon_p5_x8() local 170 float32x2_t vacc_lo = vadd_f32(vget_high_f32(vacc), vget_low_f32(vacc)); in xnn_f32_raddstoreexpminusmax_ukernel__neon_p5_x8() local
|
D | neon-p5-x8-acc2.c | 171 float vacc_lo = vaddvq_f32(vacc); in xnn_f32_raddstoreexpminusmax_ukernel__neon_p5_x8_acc2() local 173 float32x2_t vacc_lo = vadd_f32(vget_high_f32(vacc), vget_low_f32(vacc)); in xnn_f32_raddstoreexpminusmax_ukernel__neon_p5_x8_acc2() local
|
D | neonfma-p5-x8.c | 167 float vacc_lo = vaddvq_f32(vacc); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_p5_x8() local 169 float32x2_t vacc_lo = vadd_f32(vget_high_f32(vacc), vget_low_f32(vacc)); in xnn_f32_raddstoreexpminusmax_ukernel__neonfma_p5_x8() local
|
/external/XNNPACK/src/f32-relu/ |
D | neon.c.in | 50 float32x2_t vacc_lo = vget_low_f32(vacc); variable
|
D | avx.c.in | 65 __m128 vacc_lo = _mm256_castps256_ps128(vacc); variable
|
/external/XNNPACK/src/f32-clamp/ |
D | neon.c.in | 56 float32x2_t vacc_lo = vget_low_f32(vacc); variable
|
D | avx.c.in | 71 __m128 vacc_lo = _mm256_castps256_ps128(vacc); variable
|
/external/XNNPACK/src/f16-relu/ |
D | neonfp16arith.c.in | 53 float16x4_t vacc_lo = vget_low_f16(vacc); variable
|
/external/XNNPACK/src/f32-vlrelu/ |
D | neon.c.in | 56 float32x2_t vacc_lo = vget_low_f32(vacc); variable
|
D | avx.c.in | 65 __m128 vacc_lo = _mm256_castps256_ps128(vacc); variable
|
/external/XNNPACK/src/qu8-vadd/ |
D | minmax-sse2.c | 52 …__m128i vacc_lo = _mm_add_epi32(vzero_point_product, _mm_unpacklo_epi16(va_product_lo, va_product_… in xnn_qu8_vadd_minmax_ukernel__sse2() local 94 …__m128i vacc_lo = _mm_add_epi32(vzero_point_product, _mm_unpacklo_epi16(va_product_lo, va_product_… in xnn_qu8_vadd_minmax_ukernel__sse2() local
|
/external/XNNPACK/src/f16-clamp/ |
D | neonfp16arith.c.in | 59 float16x4_t vacc_lo = vget_low_f16(vacc); variable
|
/external/XNNPACK/src/f32-hswish/ |
D | avx.c.in | 95 __m128 vacc_lo = _mm256_castps256_ps128(vacc); variable
|
D | neon.c.in | 69 float32x2_t vacc_lo = vget_low_f32(vacc); variable
|
/external/XNNPACK/src/f32-relu/gen/ |
D | neon-x4.c | 42 float32x2_t vacc_lo = vget_low_f32(vacc); in xnn_f32_relu_ukernel__neon_x4() local
|
D | avx-x8.c | 51 __m128 vacc_lo = _mm256_castps256_ps128(vacc); in xnn_f32_relu_ukernel__avx_x8() local
|
D | neon-x8.c | 50 float32x2_t vacc_lo = vget_low_f32(vacc); in xnn_f32_relu_ukernel__neon_x8() local
|
/external/XNNPACK/src/f32-clamp/gen/ |
D | neon-x4.c | 46 float32x2_t vacc_lo = vget_low_f32(vacc); in xnn_f32_clamp_ukernel__neon_x4() local
|
/external/XNNPACK/src/f16-relu/gen/ |
D | neonfp16arith-x8.c | 45 float16x4_t vacc_lo = vget_low_f16(vacc); in xnn_f16_relu_ukernel__neonfp16arith_x8() local
|
/external/XNNPACK/src/f16-hswish/ |
D | neonfp16arith.c.in | 72 float16x4_t vacc_lo = vget_low_f16(vacc); variable
|