/external/ruy/ruy/ |
D | kernel_avx512.cc | 122 _mm512_mullo_epi32(_mm512_set1_epi32(lhs_zero_point), 160 __m512i initial_accum_data = _mm512_set1_epi32(params.prod_zp_depth); 174 _mm512_mullo_epi32(_mm512_set1_epi32(rhs_zero_point), 183 initial_accum_data, _mm512_set1_epi32(rhs_sums_offsets[0])); 185 initial_accum_data, _mm512_set1_epi32(rhs_sums_offsets[1])); 187 initial_accum_data, _mm512_set1_epi32(rhs_sums_offsets[2])); 189 initial_accum_data, _mm512_set1_epi32(rhs_sums_offsets[3])); 191 initial_accum_data, _mm512_set1_epi32(rhs_sums_offsets[4])); 193 initial_accum_data, _mm512_set1_epi32(rhs_sums_offsets[5])); 195 initial_accum_data, _mm512_set1_epi32(rhs_sums_offsets[6])); [all …]
|
/external/tensorflow/third_party/eigen3/unsupported/Eigen/CXX11/src/FixedPoint/ |
D | TypeCastingAVX512.h | 148 _mm512_min_epi32(a, _mm512_set1_epi32(255)), _mm512_setzero_si512())); 150 _mm512_min_epi32(b, _mm512_set1_epi32(255)), _mm512_setzero_si512())); 152 _mm512_min_epi32(c, _mm512_set1_epi32(255)), _mm512_setzero_si512())); 154 _mm512_min_epi32(d, _mm512_set1_epi32(255)), _mm512_setzero_si512())); 178 _mm512_min_epi32(a, _mm512_set1_epi32(65535)), _mm512_setzero_si512())); 180 _mm512_max_epi32(_mm512_min_epi32(b, _mm512_set1_epi32(65535)),
|
/external/XNNPACK/src/math/ |
D | exp-avx512f-rr2-lut32-p2-perm2.c | 44 const __m512i vmin_exponent = _mm512_set1_epi32(0xC1000000); in xnn_math_f32_exp__avx512f_rr2_lut32_p2_perm2() 45 const __m512i vmax_exponent = _mm512_set1_epi32(0x3F800000); in xnn_math_f32_exp__avx512f_rr2_lut32_p2_perm2() 47 const __m512i vmantissa_mask = _mm512_set1_epi32(0x007FFFE0); in xnn_math_f32_exp__avx512f_rr2_lut32_p2_perm2()
|
D | exp-avx512f-rr2-lut16-p3-perm.c | 39 const __m512i vmin_exponent = _mm512_set1_epi32(0xC1000000); in xnn_math_f32_exp__avx512f_rr2_lut16_p3_perm() 40 const __m512i vmax_exponent = _mm512_set1_epi32(0x3F800000); in xnn_math_f32_exp__avx512f_rr2_lut16_p3_perm() 42 const __m512i vmantissa_mask = _mm512_set1_epi32(0x007FFFF0); in xnn_math_f32_exp__avx512f_rr2_lut16_p3_perm()
|
D | sigmoid-avx512f-rr1-lut64-p2-gather-scalef-div.c | 26 const __m512i vsign_mask = _mm512_set1_epi32(0x80000000); in xnn_math_f32_sigmoid__avx512f_rr1_lut64_p2_gather_scalef_div() 31 const __m512i vindex_mask = _mm512_set1_epi32(INT32_C(0x3F)); in xnn_math_f32_sigmoid__avx512f_rr1_lut64_p2_gather_scalef_div()
|
D | sigmoid-avx512f-rr2-lut64-p2-gather-scalef-div.c | 26 const __m512i vsign_mask = _mm512_set1_epi32(0x80000000); in xnn_math_f32_sigmoid__avx512f_rr2_lut64_p2_gather_scalef_div() 31 const __m512i vindex_mask = _mm512_set1_epi32(INT32_C(0x3F)); in xnn_math_f32_sigmoid__avx512f_rr2_lut64_p2_gather_scalef_div()
|
D | sigmoid-avx512f-rr1-lut64-p2-gather-scalef-nr1fma.c | 26 const __m512i vsign_mask = _mm512_set1_epi32(0x80000000); in xnn_math_f32_sigmoid__avx512f_rr1_lut64_p2_gather_scalef_nr1fma() 31 const __m512i vindex_mask = _mm512_set1_epi32(INT32_C(0x3F)); in xnn_math_f32_sigmoid__avx512f_rr1_lut64_p2_gather_scalef_nr1fma()
|
D | sigmoid-avx512f-rr1-lut64-p2-gather-scalef-nr1fma1adj.c | 26 const __m512i vsign_mask = _mm512_set1_epi32(0x80000000); in xnn_math_f32_sigmoid__avx512f_rr1_lut64_p2_gather_scalef_nr1fma1adj() 31 const __m512i vindex_mask = _mm512_set1_epi32(INT32_C(0x3F)); in xnn_math_f32_sigmoid__avx512f_rr1_lut64_p2_gather_scalef_nr1fma1adj()
|
D | sigmoid-avx512f-rr2-lut64-p2-gather-scalef-nr1fma.c | 26 const __m512i vsign_mask = _mm512_set1_epi32(0x80000000); in xnn_math_f32_sigmoid__avx512f_rr2_lut64_p2_gather_scalef_nr1fma() 31 const __m512i vindex_mask = _mm512_set1_epi32(INT32_C(0x3F)); in xnn_math_f32_sigmoid__avx512f_rr2_lut64_p2_gather_scalef_nr1fma()
|
D | sigmoid-avx512f-rr2-lut64-p2-gather-scalef-nr1fma1adj.c | 26 const __m512i vsign_mask = _mm512_set1_epi32(0x80000000); in xnn_math_f32_sigmoid__avx512f_rr2_lut64_p2_gather_scalef_nr1fma1adj() 31 const __m512i vindex_mask = _mm512_set1_epi32(INT32_C(0x3F)); in xnn_math_f32_sigmoid__avx512f_rr2_lut64_p2_gather_scalef_nr1fma1adj()
|
D | exp-avx512f-rr2-p5.c | 37 const __m512i vmin_exponent = _mm512_set1_epi32(0xC1000000); in xnn_math_f32_exp__avx512f_rr2_p5() 38 const __m512i vmax_exponent = _mm512_set1_epi32(0x3F800000); in xnn_math_f32_exp__avx512f_rr2_p5()
|
D | sigmoid-avx512f-rr1-lut16-p3-perm-scalef-div.c | 22 const __m512i vsign_mask = _mm512_set1_epi32(0x80000000); in xnn_math_f32_sigmoid__avx512f_rr1_lut16_p3_perm_scalef_div()
|
D | sigmoid-avx512f-rr1-lut32-p2-perm2-scalef-div.c | 22 const __m512i vsign_mask = _mm512_set1_epi32(0x80000000); in xnn_math_f32_sigmoid__avx512f_rr1_lut32_p2_perm2_scalef_div()
|
D | sigmoid-avx512f-rr1-p5-scalef-div.c | 22 const __m512i vsign_mask = _mm512_set1_epi32(0x80000000); in xnn_math_f32_sigmoid__avx512f_rr1_p5_scalef_div()
|
D | sigmoid-avx512f-rr2-lut16-p3-perm-scalef-div.c | 22 const __m512i vsign_mask = _mm512_set1_epi32(0x80000000); in xnn_math_f32_sigmoid__avx512f_rr2_lut16_p3_perm_scalef_div()
|
D | sigmoid-avx512f-rr1-p5-scalef-nr1fma.c | 22 const __m512i vsign_mask = _mm512_set1_epi32(0x80000000); in xnn_math_f32_sigmoid__avx512f_rr1_p5_scalef_nr1fma()
|
D | sigmoid-avx512f-rr2-lut32-p2-perm2-scalef-div.c | 22 const __m512i vsign_mask = _mm512_set1_epi32(0x80000000); in xnn_math_f32_sigmoid__avx512f_rr2_lut32_p2_perm2_scalef_div()
|
D | sigmoid-avx512f-rr1-lut32-p2-perm2-scalef-nr1fma.c | 22 const __m512i vsign_mask = _mm512_set1_epi32(0x80000000); in xnn_math_f32_sigmoid__avx512f_rr1_lut32_p2_perm2_scalef_nr1fma()
|
D | sigmoid-avx512f-rr2-p5-scalef-div.c | 22 const __m512i vsign_mask = _mm512_set1_epi32(0x80000000); in xnn_math_f32_sigmoid__avx512f_rr2_p5_scalef_div()
|
D | sigmoid-avx512f-rr1-lut16-p3-perm-scalef-nr1fma.c | 22 const __m512i vsign_mask = _mm512_set1_epi32(0x80000000); in xnn_math_f32_sigmoid__avx512f_rr1_lut16_p3_perm_scalef_nr1fma()
|
D | sigmoid-avx512f-rr2-p5-scalef-nr1fma.c | 22 const __m512i vsign_mask = _mm512_set1_epi32(0x80000000); in xnn_math_f32_sigmoid__avx512f_rr2_p5_scalef_nr1fma()
|
D | sigmoid-avx512f-rr1-lut32-p2-perm2-scalef-nr1fma1adj.c | 22 const __m512i vsign_mask = _mm512_set1_epi32(0x80000000); in xnn_math_f32_sigmoid__avx512f_rr1_lut32_p2_perm2_scalef_nr1fma1adj()
|
D | sigmoid-avx512f-rr1-lut16-p3-perm-scalef-nr1fma1adj.c | 22 const __m512i vsign_mask = _mm512_set1_epi32(0x80000000); in xnn_math_f32_sigmoid__avx512f_rr1_lut16_p3_perm_scalef_nr1fma1adj()
|
D | sigmoid-avx512f-rr1-p5-scalef-nr1fma1adj.c | 22 const __m512i vsign_mask = _mm512_set1_epi32(0x80000000); in xnn_math_f32_sigmoid__avx512f_rr1_p5_scalef_nr1fma1adj()
|
/external/skia/src/opts/ |
D | SkBlitRow_opts.h | 40 __m512i rb = _mm512_and_si512(_mm512_set1_epi32(0x00ff00ff), dst); in SkPMSrcOver_SKX() 47 ga = _mm512_andnot_si512(_mm512_set1_epi32(0x00ff00ff), ga); in SkPMSrcOver_SKX()
|