Home
last modified time | relevance | path

Searched refs:_mm_castsi128_ps (Results 1 – 25 of 32) sorted by relevance

12

/external/webrtc/webrtc/modules/audio_processing/aec/
Daec_rdft_sse2.c92 const __m128 a_00_32 = _mm_shuffle_ps(_mm_castsi128_ps(a_00), in cftmdl_128_SSE2()
93 _mm_castsi128_ps(a_32), in cftmdl_128_SSE2()
95 const __m128 a_08_40 = _mm_shuffle_ps(_mm_castsi128_ps(a_08), in cftmdl_128_SSE2()
96 _mm_castsi128_ps(a_40), in cftmdl_128_SSE2()
105 const __m128 a_16_48 = _mm_shuffle_ps(_mm_castsi128_ps(a_16), in cftmdl_128_SSE2()
106 _mm_castsi128_ps(a_48), in cftmdl_128_SSE2()
108 const __m128 a_24_56 = _mm_shuffle_ps(_mm_castsi128_ps(a_24), in cftmdl_128_SSE2()
109 _mm_castsi128_ps(a_56), in cftmdl_128_SSE2()
117 const __m128 x3i0_3r0_3i1_x3r1 = _mm_castsi128_ps(_mm_shuffle_epi32( in cftmdl_128_SSE2()
166 const __m128 a_00_32 = _mm_shuffle_ps(_mm_castsi128_ps(a_00), in cftmdl_128_SSE2()
[all …]
Daec_rdft.h20 static __inline __m128 _mm_castsi128_ps(__m128i a) { return *(__m128*)&a; } in _mm_castsi128_ps() function
Daec_core_sse2.c266 const __m128 n_1 = _mm_castsi128_ps(_mm_srli_epi32( in mm_pow_ps()
348 _mm_castsi128_ps(_mm_slli_epi32(two_n_exponent, float_exponent_shift)); in mm_pow_ps()
/external/tensorflow/tensorflow/core/kernels/
Dsparse_matmul_op.h197 return _mm_castsi128_ps(_mm_unpacklo_epi16(zero, tmp));
205 return _mm_castsi128_ps(_mm_unpacklo_epi16(zero, tmp));
214 return _mm_castsi128_ps(_mm_unpacklo_epi16(zero, tmp)); in pexpand_bf16_l()
223 return _mm_castsi128_ps(_mm_unpackhi_epi16(zero, tmp)); in pexpand_bf16_u()
349 _mm_castsi128_ps(_mm_unpacklo_epi16(zero, tmp)));
357 _mm_castsi128_ps(_mm_unpacklo_epi16(zero, tmp)));
367 _mm_castsi128_ps(_mm_unpacklo_epi16(zero, tmp)));
375 _mm_castsi128_ps(_mm_unpacklo_epi16(zero, tmp)));
393 __m256 res = _mm256_castps128_ps256(_mm_castsi128_ps(res_l)); in pexpand_bf16_l()
394 res = _mm256_insertf128_ps(res, _mm_castsi128_ps(res_h), 1); in pexpand_bf16_l()
[all …]
/external/eigen/Eigen/src/Core/arch/SSE/
DPacketMath.h65 (_mm_castsi128_ps(_mm_shuffle_epi32( _mm_castps_si128(v), ((s)<<6|(r)<<4|(q)<<2|(p)))))
77 …(_mm_castps_si128( (_mm_shuffle_ps( _mm_castsi128_ps(a), _mm_castsi128_ps(b), ((s)<<6|(r)<<4|(q)<<…
86 const Packet4f p4f_##NAME = _mm_castsi128_ps(pset1<Packet4i>(X))
208 …const Packet4f mask = _mm_castsi128_ps(_mm_setr_epi32(0x80000000,0x80000000,0x80000000,0x80000000)…
444 …const Packet4f mask = _mm_castsi128_ps(_mm_setr_epi32(0x7FFFFFFF,0x7FFFFFFF,0x7FFFFFFF,0x7FFFFFFF)…
496 vecs[1] = _mm_castsi128_ps(_mm_shuffle_epi32(_mm_castps_si128(vecs[0]), 0x55));
497 vecs[2] = _mm_castsi128_ps(_mm_shuffle_epi32(_mm_castps_si128(vecs[0]), 0xAA));
498 vecs[3] = _mm_castsi128_ps(_mm_shuffle_epi32(_mm_castps_si128(vecs[0]), 0xFF));
499 vecs[0] = _mm_castsi128_ps(_mm_shuffle_epi32(_mm_castps_si128(vecs[0]), 0x00));
686 …first = _mm_castsi128_ps(_mm_alignr_epi8(_mm_castps_si128(second), _mm_castps_si128(first), Offset…
[all …]
DComplex.h59 const __m128 mask = _mm_castsi128_ps(_mm_setr_epi32(0x80000000,0x80000000,0x80000000,0x80000000));
64 const __m128 mask = _mm_castsi128_ps(_mm_setr_epi32(0x00000000,0x80000000,0x00000000,0x80000000));
78 const __m128 mask = _mm_castsi128_ps(_mm_setr_epi32(0x80000000,0x00000000,0x80000000,0x00000000));
188 … const __m128 mask = _mm_castsi128_ps(_mm_setr_epi32(0x00000000,0x80000000,0x00000000,0x80000000));
206 … const __m128 mask = _mm_castsi128_ps(_mm_setr_epi32(0x00000000,0x80000000,0x00000000,0x80000000));
224 … const __m128 mask = _mm_castsi128_ps(_mm_setr_epi32(0x00000000,0x80000000,0x00000000,0x80000000));
255 …return Packet2cf(_mm_div_ps(res.v,_mm_add_ps(s,_mm_castsi128_ps(_mm_shuffle_epi32(_mm_castps_si128…
DMathFunctions.h169 return pmax(pmul(y, Packet4f(_mm_castsi128_ps(emm0))), _x);
315 Packet4f swap_sign_bit = _mm_castsi128_ps(emm0);
316 Packet4f poly_mask = _mm_castsi128_ps(emm2);
405 Packet4f sign_bit = _mm_castsi128_ps(emm0);
406 Packet4f poly_mask = _mm_castsi128_ps(emm2);
/external/libvpx/libvpx/vpx_dsp/x86/
Dloopfilter_avx2.c34 _mm_loadh_pi(_mm_castsi128_ps(q4p4), (__m64 *)(s + 4 * pitch))); in vpx_lpf_horizontal_16_avx2()
37 _mm_loadh_pi(_mm_castsi128_ps(q3p3), (__m64 *)(s + 3 * pitch))); in vpx_lpf_horizontal_16_avx2()
40 _mm_loadh_pi(_mm_castsi128_ps(q2p2), (__m64 *)(s + 2 * pitch))); in vpx_lpf_horizontal_16_avx2()
43 _mm_loadh_pi(_mm_castsi128_ps(q1p1), (__m64 *)(s + 1 * pitch))); in vpx_lpf_horizontal_16_avx2()
47 _mm_loadh_pi(_mm_castsi128_ps(q0p0), (__m64 *)(s - 0 * pitch))); in vpx_lpf_horizontal_16_avx2()
141 _mm_loadh_pi(_mm_castsi128_ps(q5p5), (__m64 *)(s + 5 * pitch))); in vpx_lpf_horizontal_16_avx2()
145 _mm_loadh_pi(_mm_castsi128_ps(q6p6), (__m64 *)(s + 6 * pitch))); in vpx_lpf_horizontal_16_avx2()
153 _mm_loadh_pi(_mm_castsi128_ps(q7p7), (__m64 *)(s + 7 * pitch))); in vpx_lpf_horizontal_16_avx2()
325 _mm_storeh_pi((__m64 *)(s + 6 * pitch), _mm_castsi128_ps(q6p6)); in vpx_lpf_horizontal_16_avx2()
331 _mm_storeh_pi((__m64 *)(s + 5 * pitch), _mm_castsi128_ps(q5p5)); in vpx_lpf_horizontal_16_avx2()
[all …]
Dmem_sse2.h45 _mm_loadh_pi(_mm_castsi128_ps(s), (const __m64 *)src)); in loadh_epi64()
103 _mm_storeh_pi((__m64 *)d, _mm_castsi128_ps(s)); in _mm_storeh_epi64()
Dloopfilter_sse2.c135 _mm_storeh_pi((__m64 *)(s - 2 * pitch), _mm_castsi128_ps(ps1ps0)); // *op1 in vpx_lpf_horizontal_4_sse2()
138 _mm_storeh_pi((__m64 *)(s + 1 * pitch), _mm_castsi128_ps(qs1qs0)); // *oq1 in vpx_lpf_horizontal_4_sse2()
246 _mm_loadh_pi(_mm_castsi128_ps(q4p4), (__m64 *)(s + 4 * pitch))); in vpx_lpf_horizontal_16_sse2()
249 _mm_loadh_pi(_mm_castsi128_ps(q3p3), (__m64 *)(s + 3 * pitch))); in vpx_lpf_horizontal_16_sse2()
252 _mm_loadh_pi(_mm_castsi128_ps(q2p2), (__m64 *)(s + 2 * pitch))); in vpx_lpf_horizontal_16_sse2()
255 _mm_loadh_pi(_mm_castsi128_ps(q1p1), (__m64 *)(s + 1 * pitch))); in vpx_lpf_horizontal_16_sse2()
259 _mm_loadh_pi(_mm_castsi128_ps(q0p0), (__m64 *)(s - 0 * pitch))); in vpx_lpf_horizontal_16_sse2()
346 _mm_loadh_pi(_mm_castsi128_ps(q5p5), (__m64 *)(s + 5 * pitch))); in vpx_lpf_horizontal_16_sse2()
350 _mm_loadh_pi(_mm_castsi128_ps(q6p6), (__m64 *)(s + 6 * pitch))); in vpx_lpf_horizontal_16_sse2()
355 _mm_loadh_pi(_mm_castsi128_ps(q7p7), (__m64 *)(s + 7 * pitch))); in vpx_lpf_horizontal_16_sse2()
[all …]
Davg_pred_sse2.c57 r = _mm_castps_si128(_mm_loadh_pi(_mm_castsi128_ps(r_0), in vpx_comp_avg_pred_sse2()
Dhighbd_inv_txfm_sse2.h304 _mm_loadh_pi(_mm_castsi128_ps(d), (const __m64 *)(dest + 1 * stride))); in recon_and_store_4x2()
307 _mm_storeh_pi((__m64 *)(dest + 1 * stride), _mm_castsi128_ps(d)); in recon_and_store_4x2()
/external/libaom/libaom/aom_dsp/x86/
Dmem_sse2.h23 _mm_loadh_pi(_mm_castsi128_ps(s), (const __m64 *)src)); in loadh_epi64()
Dmasked_variance_intrin_ssse3.h68 _mm_castsi128_ps(aA), (const __m64 *)(mask + mask_stride))); in comp_mask_pred_8_ssse3()
/external/libaom/libaom/aom_ports/
Demmintrin_compat.h45 _mm_castsi128_ps(__m128i __A) { in _mm_castsi128_ps() function
/external/libvpx/libvpx/vpx_ports/
Demmintrin_compat.h44 _mm_castsi128_ps(__m128i __A) { in _mm_castsi128_ps() function
/external/llvm/test/CodeGen/X86/
Dlea-opt-memop-check-1.ll12 declare <4 x float> @_mm_castsi128_ps(<2 x i64>) optsize
21 %call1 = tail call <4 x float> @_mm_castsi128_ps(<2 x i64> %tmp0)
/external/swiftshader/third_party/llvm-7.0/llvm/test/CodeGen/X86/
Dlea-opt-memop-check-1.ll12 declare <4 x float> @_mm_castsi128_ps(<2 x i64>) optsize
21 %call1 = tail call <4 x float> @_mm_castsi128_ps(<2 x i64> %tmp0)
/external/python/cpython3/Modules/_blake2/impl/
Dblake2s-round.h22 #define TOF(reg) _mm_castsi128_ps((reg))
Dblake2b-round.h22 #define TOF(reg) _mm_castsi128_ps((reg))
/external/libaom/libaom/aom_dsp/simd/
Dv128_intrinsics_x86.h222 _mm_castsi128_ps(b), _mm_castsi128_ps(a), _MM_SHUFFLE(3, 1, 3, 1))); in v128_unziphi_32()
227 _mm_castsi128_ps(b), _mm_castsi128_ps(a), _MM_SHUFFLE(2, 0, 2, 0))); in v128_unziplo_32()
/external/mesa3d/src/gallium/drivers/swr/rasterizer/core/
Drasterizer_impl.h274 int msk = _mm_movemask_ps(_mm_castsi128_ps(vA)); in adjustTopLeftRuleIntFix16()
278 int msk2 = _mm_movemask_ps(_mm_castsi128_ps(vCmp)); in adjustTopLeftRuleIntFix16()
279 msk2 &= _mm_movemask_ps(_mm_castsi128_ps(vB)); in adjustTopLeftRuleIntFix16()
Dformat_types.h696 #define TO_M128(a) _mm_castsi128_ps(a)
719 ret = _mm_castsi128_ps(_mm_cvtps_epi32(ret));
/external/compiler-rt/lib/tsan/rtl/
Dtsan_rtl.cc674 _mm_castsi128_ps(v0), _mm_castsi128_ps(v1), \
/external/epid-sdk/ext/ipp/sources/include/
Downdefs.h572 #define _pi2ps _mm_castsi128_ps

12