Home
last modified time | relevance | path

Searched refs:vsum89ABCDEF (Results 1 – 25 of 42) sorted by relevance

12

/external/XNNPACK/src/qs8-gavgpool/gen/
D7p7x-minmax-fp32-neon-c16.c52 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() local
57 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16()
61 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16()
65 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16()
69 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16()
71 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16()
75 const int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16()
76 const int32x4_t vaccCDEF = vaddw_s16(vinit_bias, vget_high_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16()
104 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() local
109 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16()
[all …]
D7p7x-minmax-rndnu-neon-c16.c52 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() local
57 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16()
61 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16()
65 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16()
69 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16()
71 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16()
75 const int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16()
76 const int32x4_t vaccCDEF = vaddw_s16(vinit_bias, vget_high_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16()
104 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() local
109 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16()
[all …]
D7p7x-minmax-fp32-neonv8-c16.c53 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() local
58 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16()
62 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16()
66 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16()
70 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16()
72 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16()
76 const int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16()
77 const int32x4_t vaccCDEF = vaddw_s16(vinit_bias, vget_high_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16()
105 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() local
110 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16()
[all …]
D7p7x-minmax-fp32-neon-c24.c54 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() local
61 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24()
67 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24()
73 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24()
79 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24()
83 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24()
88 const int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24()
89 const int32x4_t vaccCDEF = vaddw_s16(vinit_bias, vget_high_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24()
149 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() local
156 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24()
[all …]
D7p7x-minmax-fp32-neonv8-c24.c55 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() local
62 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24()
68 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24()
74 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24()
80 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24()
84 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24()
89 const int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24()
90 const int32x4_t vaccCDEF = vaddw_s16(vinit_bias, vget_high_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24()
150 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() local
157 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24()
[all …]
D7p7x-minmax-rndnu-neon-c24.c54 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() local
61 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24()
67 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24()
73 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24()
79 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24()
83 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24()
88 const int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24()
89 const int32x4_t vaccCDEF = vaddw_s16(vinit_bias, vget_high_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24()
149 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() local
156 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24()
[all …]
D7p7x-minmax-rndnu-neon-c32.c56 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() local
65 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32()
73 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32()
81 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32()
89 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32()
95 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32()
101 const int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32()
102 const int32x4_t vaccCDEF = vaddw_s16(vinit_bias, vget_high_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32()
168 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() local
177 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32()
[all …]
D7p7x-minmax-fp32-neonv8-c32.c57 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32() local
66 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32()
74 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32()
82 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32()
90 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32()
96 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32()
102 const int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32()
103 const int32x4_t vaccCDEF = vaddw_s16(vinit_bias, vget_high_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32()
169 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32() local
178 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32()
[all …]
D7p7x-minmax-fp32-neon-c32.c56 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32() local
65 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32()
73 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32()
81 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32()
89 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32()
95 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32()
101 const int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32()
102 const int32x4_t vaccCDEF = vaddw_s16(vinit_bias, vget_high_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32()
168 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32() local
177 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32()
[all …]
D7x-minmax-fp32-neonv8-c16.c71 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16() local
76 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16()
80 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16()
84 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16()
88 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16()
90 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16()
94 int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16()
95 int32x4_t vaccCDEF = vaddw_s16(vinit_bias, vget_high_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16()
D7x-minmax-fp32-neon-c16.c71 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neon_c16() local
76 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neon_c16()
80 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neon_c16()
84 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neon_c16()
88 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neon_c16()
90 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neon_c16()
94 int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neon_c16()
95 int32x4_t vaccCDEF = vaddw_s16(vinit_bias, vget_high_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neon_c16()
D7x-minmax-rndnu-neon-c16.c72 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16() local
77 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16()
81 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16()
85 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16()
89 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16()
91 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16()
95 int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16()
96 int32x4_t vaccCDEF = vaddw_s16(vinit_bias, vget_high_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16()
D7x-minmax-fp32-neonv8-c24.c73 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c24() local
80 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c24()
86 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c24()
92 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c24()
98 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c24()
102 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c24()
107 int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c24()
108 int32x4_t vaccCDEF = vaddw_s16(vinit_bias, vget_high_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c24()
/external/XNNPACK/src/qu8-gavgpool/gen/
D7p7x-minmax-fp32-neonv8-c16.c53 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() local
58 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16()
62 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16()
66 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16()
70 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16()
72 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16()
76 … = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_low_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16()
77 …= vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_high_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16()
105 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() local
110 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16()
[all …]
D7p7x-minmax-fp32-neon-c16.c52 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() local
57 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16()
61 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16()
65 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16()
69 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16()
71 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16()
75 … = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_low_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16()
76 …= vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_high_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16()
104 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() local
109 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16()
[all …]
D7p7x-minmax-rndnu-neon-c16.c52 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() local
57 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16()
61 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16()
65 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16()
69 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16()
71 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16()
75 … = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_low_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16()
76 …= vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_high_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16()
104 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() local
109 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16()
[all …]
D7p7x-minmax-fp32-neonv8-c24.c55 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() local
62 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24()
68 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24()
74 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24()
80 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24()
84 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24()
89 … = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_low_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24()
90 …= vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_high_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24()
150 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() local
157 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24()
[all …]
D7p7x-minmax-fp32-neon-c24.c54 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() local
61 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24()
67 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24()
73 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24()
79 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24()
83 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24()
88 … = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_low_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24()
89 …= vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_high_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24()
149 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() local
156 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24()
[all …]
D7p7x-minmax-rndnu-neon-c24.c54 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() local
61 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24()
67 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24()
73 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24()
79 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24()
83 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24()
88 … = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_low_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24()
89 …= vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_high_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24()
149 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() local
156 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24()
[all …]
D7p7x-minmax-fp32-neonv8-c32.c57 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32() local
66 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32()
74 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32()
82 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32()
90 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32()
96 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32()
102 … = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_low_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32()
103 …= vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_high_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32()
169 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32() local
178 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32()
[all …]
D7p7x-minmax-fp32-neon-c32.c56 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32() local
65 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32()
73 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32()
81 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32()
89 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32()
95 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32()
101 … = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_low_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32()
102 …= vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_high_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32()
168 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32() local
177 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32()
[all …]
D7p7x-minmax-rndnu-neon-c32.c56 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() local
65 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32()
73 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32()
81 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32()
89 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32()
95 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32()
101 … = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_low_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32()
102 …= vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_high_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32()
168 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() local
177 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32()
[all …]
D7x-minmax-rndnu-neon-c16.c72 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16() local
77 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16()
81 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16()
85 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16()
89 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16()
91 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16()
95 … = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_low_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16()
96 …= vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_high_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16()
D7x-minmax-fp32-neonv8-c16.c71 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16() local
76 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16()
80 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16()
84 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16()
88 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16()
90 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16()
94 … = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_low_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16()
95 …= vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_high_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16()
D7x-minmax-fp32-neon-c16.c71 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neon_c16() local
76 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neon_c16()
80 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neon_c16()
84 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neon_c16()
88 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neon_c16()
90 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neon_c16()
94 … = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_low_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neon_c16()
95 …= vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_high_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neon_c16()

12