Home
last modified time | relevance | path

Searched refs:vout_lo (Results 1 – 8 of 8) sorted by relevance

/external/XNNPACK/src/u8-maxpool/
D9p8x-neon-c16.c124 uint8x8_t vout_lo = vget_low_u8(vout); in xnn_u8_maxpool_ukernel_9p8x__neon_c16() local
126 vst1_u8(o, vout_lo); o += 8; in xnn_u8_maxpool_ukernel_9p8x__neon_c16()
127 vout_lo = vget_high_u8(vout); in xnn_u8_maxpool_ukernel_9p8x__neon_c16()
130 vst1_lane_u32(__builtin_assume_aligned(o, 1), vreinterpret_u32_u8(vout_lo), 0); o += 4; in xnn_u8_maxpool_ukernel_9p8x__neon_c16()
131 vout_lo = vext_u8(vout_lo, vout_lo, 4); in xnn_u8_maxpool_ukernel_9p8x__neon_c16()
134 vst1_lane_u16(__builtin_assume_aligned(o, 1), vreinterpret_u16_u8(vout_lo), 0); o += 2; in xnn_u8_maxpool_ukernel_9p8x__neon_c16()
135 vout_lo = vext_u8(vout_lo, vout_lo, 2); in xnn_u8_maxpool_ukernel_9p8x__neon_c16()
138 vst1_lane_u8(o, vout_lo, 0); o += 1; in xnn_u8_maxpool_ukernel_9p8x__neon_c16()
228 uint8x8_t vout_lo = vget_low_u8(vout); in xnn_u8_maxpool_ukernel_9p8x__neon_c16() local
230 vst1_u8(o, vout_lo); o += 8; in xnn_u8_maxpool_ukernel_9p8x__neon_c16()
[all …]
/external/XNNPACK/src/f32-gavgpool/
Dup7-neon.c103 float32x2_t vout_lo = vget_low_f32(vout); in xnn_f32_gavgpool_ukernel_up7__neon() local
105 vst1_f32(output, vout_lo); output += 2; in xnn_f32_gavgpool_ukernel_up7__neon()
106 vout_lo = vget_high_f32(vout); in xnn_f32_gavgpool_ukernel_up7__neon()
109 vst1_lane_f32(output, vout_lo, 0); in xnn_f32_gavgpool_ukernel_up7__neon()
Dmp7p7q-neon.c175 float32x2_t vout_lo = vget_low_f32(vout); in xnn_f32_gavgpool_ukernel_mp7p7q__neon() local
177 vst1_f32(output, vout_lo); output += 2; in xnn_f32_gavgpool_ukernel_mp7p7q__neon()
178 vout_lo = vget_high_f32(vout); in xnn_f32_gavgpool_ukernel_mp7p7q__neon()
181 vst1_lane_f32(output, vout_lo, 0); in xnn_f32_gavgpool_ukernel_mp7p7q__neon()
/external/XNNPACK/src/f32-avgpool/
Dup9-neon.c122 float32x2_t vout_lo = vget_low_f32(vout); in xnn_f32_avgpool_ukernel_up9__neon() local
124 vst1_f32(output, vout_lo); output += 2; in xnn_f32_avgpool_ukernel_up9__neon()
125 vout_lo = vget_high_f32(vout); in xnn_f32_avgpool_ukernel_up9__neon()
128 vst1_lane_f32(output, vout_lo, 0); output += 1; in xnn_f32_avgpool_ukernel_up9__neon()
Dmp9p8q-neon.c192 float32x2_t vout_lo = vget_low_f32(vout); in xnn_f32_avgpool_ukernel_mp9p8q__neon() local
194 vst1_f32(output, vout_lo); output += 2; in xnn_f32_avgpool_ukernel_mp9p8q__neon()
195 vout_lo = vget_high_f32(vout); in xnn_f32_avgpool_ukernel_mp9p8q__neon()
198 vst1_lane_f32(output, vout_lo, 0); output += 1; in xnn_f32_avgpool_ukernel_mp9p8q__neon()
/external/XNNPACK/src/f32-pavgpool/
Dup9-neon.c124 float32x2_t vout_lo = vget_low_f32(vout); in xnn_f32_pavgpool_ukernel_up9__neon() local
126 vst1_f32(output, vout_lo); output += 2; in xnn_f32_pavgpool_ukernel_up9__neon()
127 vout_lo = vget_high_f32(vout); in xnn_f32_pavgpool_ukernel_up9__neon()
130 vst1_lane_f32(output, vout_lo, 0); output += 1; in xnn_f32_pavgpool_ukernel_up9__neon()
Dmp9p8q-neon.c194 float32x2_t vout_lo = vget_low_f32(vout); in xnn_f32_pavgpool_ukernel_mp9p8q__neon() local
196 vst1_f32(output, vout_lo); output += 2; in xnn_f32_pavgpool_ukernel_mp9p8q__neon()
197 vout_lo = vget_high_f32(vout); in xnn_f32_pavgpool_ukernel_mp9p8q__neon()
200 vst1_lane_f32(output, vout_lo, 0); output += 1; in xnn_f32_pavgpool_ukernel_mp9p8q__neon()
/external/XNNPACK/src/q8-dwconv/
Dup8x9-sse2.c183 …const __m128i vout_lo = _mm_sub_epi32(_mm_sra_epi32(vq31prod_lo0123, vshift), _mm_cmpgt_epi32(vrem… in xnn_q8_dwconv_ukernel_up8x9__sse2() local
187 __m128i vout = _mm_adds_epi16(_mm_packs_epi32(vout_lo, vout_hi), voutput_zero_point); in xnn_q8_dwconv_ukernel_up8x9__sse2()
333 …const __m128i vout_lo = _mm_sub_epi32(_mm_sra_epi32(vq31prod_lo0123, vshift), _mm_cmpgt_epi32(vrem… in xnn_q8_dwconv_ukernel_up8x9__sse2() local
337 __m128i vout = _mm_adds_epi16(_mm_packs_epi32(vout_lo, vout_hi), voutput_zero_point); in xnn_q8_dwconv_ukernel_up8x9__sse2()