/external/XNNPACK/src/qs8-gavgpool/gen/ |
D | 7p7x-minmax-fp32-neon-c16.c | 52 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() local 57 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() 61 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() 65 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() 69 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() 71 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() 75 const int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() 76 const int32x4_t vaccCDEF = vaddw_s16(vinit_bias, vget_high_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() 104 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() local 109 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() [all …]
|
D | 7p7x-minmax-rndnu-neon-c16.c | 52 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() local 57 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() 61 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() 65 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() 69 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() 71 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() 75 const int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() 76 const int32x4_t vaccCDEF = vaddw_s16(vinit_bias, vget_high_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() 104 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() local 109 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() [all …]
|
D | 7p7x-minmax-fp32-neonv8-c16.c | 53 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() local 58 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() 62 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() 66 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() 70 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() 72 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() 76 const int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() 77 const int32x4_t vaccCDEF = vaddw_s16(vinit_bias, vget_high_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() 105 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() local 110 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() [all …]
|
D | 7p7x-minmax-fp32-neon-c24.c | 54 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() local 61 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() 67 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() 73 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() 79 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() 83 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() 88 const int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() 89 const int32x4_t vaccCDEF = vaddw_s16(vinit_bias, vget_high_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() 149 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() local 156 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() [all …]
|
D | 7p7x-minmax-fp32-neonv8-c24.c | 55 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() local 62 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() 68 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() 74 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() 80 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() 84 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() 89 const int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() 90 const int32x4_t vaccCDEF = vaddw_s16(vinit_bias, vget_high_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() 150 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() local 157 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() [all …]
|
D | 7p7x-minmax-rndnu-neon-c24.c | 54 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() local 61 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() 67 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() 73 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() 79 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() 83 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() 88 const int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() 89 const int32x4_t vaccCDEF = vaddw_s16(vinit_bias, vget_high_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() 149 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() local 156 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() [all …]
|
D | 7p7x-minmax-rndnu-neon-c32.c | 56 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() local 65 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() 73 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() 81 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() 89 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() 95 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() 101 const int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() 102 const int32x4_t vaccCDEF = vaddw_s16(vinit_bias, vget_high_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() 168 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() local 177 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() [all …]
|
D | 7p7x-minmax-fp32-neonv8-c32.c | 57 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32() local 66 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32() 74 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32() 82 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32() 90 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32() 96 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32() 102 const int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32() 103 const int32x4_t vaccCDEF = vaddw_s16(vinit_bias, vget_high_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32() 169 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32() local 178 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32() [all …]
|
D | 7p7x-minmax-fp32-neon-c32.c | 56 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32() local 65 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32() 73 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32() 81 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32() 89 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32() 95 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32() 101 const int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32() 102 const int32x4_t vaccCDEF = vaddw_s16(vinit_bias, vget_high_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32() 168 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32() local 177 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32() [all …]
|
D | 7x-minmax-fp32-neonv8-c16.c | 71 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16() local 76 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16() 80 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16() 84 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16() 88 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16() 90 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16() 94 int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16() 95 int32x4_t vaccCDEF = vaddw_s16(vinit_bias, vget_high_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16()
|
D | 7x-minmax-fp32-neon-c16.c | 71 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neon_c16() local 76 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neon_c16() 80 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neon_c16() 84 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neon_c16() 88 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neon_c16() 90 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neon_c16() 94 int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neon_c16() 95 int32x4_t vaccCDEF = vaddw_s16(vinit_bias, vget_high_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neon_c16()
|
D | 7x-minmax-rndnu-neon-c16.c | 72 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16() local 77 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16() 81 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16() 85 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16() 89 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16() 91 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16() 95 int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16() 96 int32x4_t vaccCDEF = vaddw_s16(vinit_bias, vget_high_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16()
|
D | 7x-minmax-fp32-neonv8-c24.c | 73 int16x8_t vsum89ABCDEF = vaddl_s8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c24() local 80 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c24() 86 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c24() 92 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c24() 98 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c24() 102 vsum89ABCDEF = vaddw_s8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c24() 107 int32x4_t vacc89AB = vaddw_s16(vinit_bias, vget_low_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c24() 108 int32x4_t vaccCDEF = vaddw_s16(vinit_bias, vget_high_s16(vsum89ABCDEF)); in xnn_qs8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c24()
|
/external/XNNPACK/src/qu8-gavgpool/gen/ |
D | 7p7x-minmax-fp32-neonv8-c16.c | 53 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() local 58 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() 62 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() 66 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() 70 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() 72 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() 76 … = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_low_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() 77 …= vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_high_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() 105 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() local 110 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c16() [all …]
|
D | 7p7x-minmax-fp32-neon-c16.c | 52 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() local 57 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() 61 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() 65 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() 69 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() 71 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() 75 … = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_low_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() 76 …= vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_high_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() 104 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() local 109 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c16() [all …]
|
D | 7p7x-minmax-rndnu-neon-c16.c | 52 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() local 57 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() 61 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() 65 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() 69 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() 71 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() 75 … = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_low_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() 76 …= vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_high_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() 104 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() local 109 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c16() [all …]
|
D | 7p7x-minmax-fp32-neonv8-c24.c | 55 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() local 62 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() 68 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() 74 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() 80 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() 84 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() 89 … = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_low_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() 90 …= vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_high_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() 150 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() local 157 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c24() [all …]
|
D | 7p7x-minmax-fp32-neon-c24.c | 54 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() local 61 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() 67 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() 73 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() 79 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() 83 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() 88 … = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_low_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() 89 …= vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_high_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() 149 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() local 156 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c24() [all …]
|
D | 7p7x-minmax-rndnu-neon-c24.c | 54 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() local 61 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() 67 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() 73 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() 79 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() 83 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() 88 … = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_low_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() 89 …= vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_high_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() 149 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() local 156 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c24() [all …]
|
D | 7p7x-minmax-fp32-neonv8-c32.c | 57 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32() local 66 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32() 74 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32() 82 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32() 90 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32() 96 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32() 102 … = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_low_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32() 103 …= vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_high_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32() 169 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32() local 178 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neonv8_c32() [all …]
|
D | 7p7x-minmax-fp32-neon-c32.c | 56 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32() local 65 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32() 73 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32() 81 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32() 89 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32() 95 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32() 101 … = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_low_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32() 102 …= vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_high_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32() 168 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32() local 177 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7p7x__neon_c32() [all …]
|
D | 7p7x-minmax-rndnu-neon-c32.c | 56 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() local 65 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() 73 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() 81 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() 89 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() 95 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() 101 … = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_low_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() 102 …= vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_high_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() 168 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() local 177 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7p7x__neon_c32() [all …]
|
D | 7x-minmax-rndnu-neon-c16.c | 72 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16() local 77 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16() 81 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16() 85 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16() 89 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16() 91 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16() 95 … = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_low_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16() 96 …= vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_high_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_rndnu_ukernel_7x__neon_c16()
|
D | 7x-minmax-fp32-neonv8-c16.c | 71 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16() local 76 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16() 80 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16() 84 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16() 88 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16() 90 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16() 94 … = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_low_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16() 95 …= vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_high_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neonv8_c16()
|
D | 7x-minmax-fp32-neon-c16.c | 71 uint16x8_t vsum89ABCDEF = vaddl_u8(vi0x89ABCDEF, vi1x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neon_c16() local 76 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi2x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neon_c16() 80 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi3x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neon_c16() 84 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi4x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neon_c16() 88 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi5x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neon_c16() 90 vsum89ABCDEF = vaddw_u8(vsum89ABCDEF, vi6x89ABCDEF); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neon_c16() 94 … = vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_low_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neon_c16() 95 …= vreinterpretq_s32_u32(vaddw_u16(vreinterpretq_u32_s32(vinit_bias), vget_high_u16(vsum89ABCDEF))); in xnn_qu8_gavgpool_minmax_fp32_ukernel_7x__neon_c16()
|