Home
last modified time | relevance | path

Searched refs:_mm_cvtepi32_ps (Results 1 – 25 of 42) sorted by relevance

12

/external/XNNPACK/src/qu8-requantization/
Dfp32-sse2.c48 const __m128 x_scaled = _mm_mul_ps(_mm_cvtepi32_ps(x), vscale); in xnn_qu8_requantize_fp32__sse2()
49 const __m128 y_scaled = _mm_mul_ps(_mm_cvtepi32_ps(y), vscale); in xnn_qu8_requantize_fp32__sse2()
50 const __m128 z_scaled = _mm_mul_ps(_mm_cvtepi32_ps(z), vscale); in xnn_qu8_requantize_fp32__sse2()
51 const __m128 w_scaled = _mm_mul_ps(_mm_cvtepi32_ps(w), vscale); in xnn_qu8_requantize_fp32__sse2()
/external/XNNPACK/src/qs8-requantization/
Dfp32-sse4.c48 const __m128 x_scaled = _mm_mul_ps(_mm_cvtepi32_ps(x), vscale); in xnn_qs8_requantize_fp32__sse4()
49 const __m128 y_scaled = _mm_mul_ps(_mm_cvtepi32_ps(y), vscale); in xnn_qs8_requantize_fp32__sse4()
50 const __m128 z_scaled = _mm_mul_ps(_mm_cvtepi32_ps(z), vscale); in xnn_qs8_requantize_fp32__sse4()
51 const __m128 w_scaled = _mm_mul_ps(_mm_cvtepi32_ps(w), vscale); in xnn_qs8_requantize_fp32__sse4()
Dfp32-sse2.c48 const __m128 x_scaled = _mm_mul_ps(_mm_cvtepi32_ps(x), vscale); in xnn_qs8_requantize_fp32__sse2()
49 const __m128 y_scaled = _mm_mul_ps(_mm_cvtepi32_ps(y), vscale); in xnn_qs8_requantize_fp32__sse2()
50 const __m128 z_scaled = _mm_mul_ps(_mm_cvtepi32_ps(z), vscale); in xnn_qs8_requantize_fp32__sse2()
51 const __m128 w_scaled = _mm_mul_ps(_mm_cvtepi32_ps(w), vscale); in xnn_qs8_requantize_fp32__sse2()
/external/XNNPACK/src/f32-vrnd/gen/
Dvrndz-sse2-x8.c40 const __m128 vrndx0123 = _mm_cvtepi32_ps(vintx0123); in xnn_f32_vrndz_ukernel__sse2_x8()
41 const __m128 vrndx4567 = _mm_cvtepi32_ps(vintx4567); in xnn_f32_vrndz_ukernel__sse2_x8()
56 const __m128 vrndx = _mm_cvtepi32_ps(vintx); in xnn_f32_vrndz_ukernel__sse2_x8()
66 const __m128 vrndx = _mm_cvtepi32_ps(vintx); in xnn_f32_vrndz_ukernel__sse2_x8()
Dvrndne-sse2-x8.c40 const __m128 vrndx0123 = _mm_cvtepi32_ps(vintx0123); in xnn_f32_vrndne_ukernel__sse2_x8()
41 const __m128 vrndx4567 = _mm_cvtepi32_ps(vintx4567); in xnn_f32_vrndne_ukernel__sse2_x8()
56 const __m128 vrndx = _mm_cvtepi32_ps(vintx); in xnn_f32_vrndne_ukernel__sse2_x8()
66 const __m128 vrndx = _mm_cvtepi32_ps(vintx); in xnn_f32_vrndne_ukernel__sse2_x8()
Dvrndd-sse2-x8.c41 const __m128 vprerndx0123 = _mm_cvtepi32_ps(vintx0123); in xnn_f32_vrndd_ukernel__sse2_x8()
42 const __m128 vprerndx4567 = _mm_cvtepi32_ps(vintx4567); in xnn_f32_vrndd_ukernel__sse2_x8()
60 const __m128 vprerndx = _mm_cvtepi32_ps(vintx); in xnn_f32_vrndd_ukernel__sse2_x8()
71 const __m128 vprerndx = _mm_cvtepi32_ps(vintx); in xnn_f32_vrndd_ukernel__sse2_x8()
Dvrndu-sse2-x8.c41 const __m128 vprerndx0123 = _mm_cvtepi32_ps(vintx0123); in xnn_f32_vrndu_ukernel__sse2_x8()
42 const __m128 vprerndx4567 = _mm_cvtepi32_ps(vintx4567); in xnn_f32_vrndu_ukernel__sse2_x8()
66 const __m128 vprerndx = _mm_cvtepi32_ps(vintx); in xnn_f32_vrndu_ukernel__sse2_x8()
79 const __m128 vprerndx = _mm_cvtepi32_ps(vintx); in xnn_f32_vrndu_ukernel__sse2_x8()
Dvrndz-sse2-x4.c37 const __m128 vrndx0123 = _mm_cvtepi32_ps(vintx0123); in xnn_f32_vrndz_ukernel__sse2_x4()
48 const __m128 vrndx = _mm_cvtepi32_ps(vintx); in xnn_f32_vrndz_ukernel__sse2_x4()
Dvrndne-sse2-x4.c37 const __m128 vrndx0123 = _mm_cvtepi32_ps(vintx0123); in xnn_f32_vrndne_ukernel__sse2_x4()
48 const __m128 vrndx = _mm_cvtepi32_ps(vintx); in xnn_f32_vrndne_ukernel__sse2_x4()
Dvrndd-sse2-x4.c38 const __m128 vprerndx0123 = _mm_cvtepi32_ps(vintx0123); in xnn_f32_vrndd_ukernel__sse2_x4()
51 const __m128 vprerndx = _mm_cvtepi32_ps(vintx); in xnn_f32_vrndd_ukernel__sse2_x4()
Dvrndu-sse2-x4.c38 const __m128 vprerndx0123 = _mm_cvtepi32_ps(vintx0123); in xnn_f32_vrndu_ukernel__sse2_x4()
55 const __m128 vprerndx = _mm_cvtepi32_ps(vintx); in xnn_f32_vrndu_ukernel__sse2_x4()
/external/XNNPACK/src/f32-vrnd/
Dvrndne-sse2.c.in41 const __m128 vrndx${ABC[N:N+4]} = _mm_cvtepi32_ps(vintx${ABC[N:N+4]});
58 const __m128 vrndx = _mm_cvtepi32_ps(vintx);
68 const __m128 vrndx = _mm_cvtepi32_ps(vintx);
Dvrndz-sse2.c.in41 const __m128 vrndx${ABC[N:N+4]} = _mm_cvtepi32_ps(vintx${ABC[N:N+4]});
58 const __m128 vrndx = _mm_cvtepi32_ps(vintx);
68 const __m128 vrndx = _mm_cvtepi32_ps(vintx);
Dvrndd-sse2.c.in42 const __m128 vprerndx${ABC[N:N+4]} = _mm_cvtepi32_ps(vintx${ABC[N:N+4]});
62 const __m128 vprerndx = _mm_cvtepi32_ps(vintx);
73 const __m128 vprerndx = _mm_cvtepi32_ps(vintx);
Dvrndu-sse2.c.in42 const __m128 vprerndx${ABC[N:N+4]} = _mm_cvtepi32_ps(vintx${ABC[N:N+4]});
68 const __m128 vprerndx = _mm_cvtepi32_ps(vintx);
81 const __m128 vprerndx = _mm_cvtepi32_ps(vintx);
/external/XNNPACK/src/math/
Droundne-sse2-cvt.c41 const __m128 vrndx = _mm_cvtepi32_ps(vintx); in xnn_math_f32_roundne__sse2_cvt()
Droundz-sse2-cvt.c41 const __m128 vrndx = _mm_cvtepi32_ps(vintx); in xnn_math_f32_roundz__sse2_cvt()
Droundd-sse2-cvt.c43 const __m128 vprerndx = _mm_cvtepi32_ps(vintx); in xnn_math_f32_roundd__sse2_cvt()
Droundu-sse2-cvt.c43 const __m128 vprerndx = _mm_cvtepi32_ps(vintx); in xnn_math_f32_roundu__sse2_cvt()
/external/eigen/Eigen/src/Core/arch/SSE/
DTypeCasting.h41 return _mm_cvtepi32_ps(a);
DMathFunctions.h66 Packet4f e = padd(Packet4f(_mm_cvtepi32_ps(emm0)), p4f_1);
142 tmp = _mm_cvtepi32_ps(emm0);
302 y = _mm_cvtepi32_ps(emm2);
394 y = _mm_cvtepi32_ps(emm2);
/external/tensorflow/tensorflow/lite/kernels/internal/optimized/
Dsse_tensor_utils.cc243 const __m128 float_val0 = _mm_cvtepi32_ps(scratch_val0); in SseMatrixBatchVectorMultiplyAccumulate()
244 const __m128 float_val1 = _mm_cvtepi32_ps(scratch_val1); in SseMatrixBatchVectorMultiplyAccumulate()
374 const __m128 dp_fx4 = _mm_cvtepi32_ps(dp_32x4); in SseSparseMatrix4VectorsMultiplyAccumulate()
/external/libopus/celt/x86/
Dvq_sse2.c120 y4 = _mm_cvtepi32_ps(iy4); in op_pvq_search_sse2()
/external/skia/include/private/
DSkNx_sse.h32 __m128 roundtrip = _mm_cvtepi32_ps(_mm_cvttps_epi32(v)); in emulate_mm_floor_ps()
691 return _mm_cvtepi32_ps(src.fVec);
747 return _mm_cvtepi32_ps(SkNx_cast<int32_t>(src).fVec);
752 return _mm_cvtepi32_ps(_32);
/external/skqp/include/private/
DSkNx_sse.h32 __m128 roundtrip = _mm_cvtepi32_ps(_mm_cvttps_epi32(v)); in emulate_mm_floor_ps()
695 return _mm_cvtepi32_ps(src.fVec);
751 return _mm_cvtepi32_ps(SkNx_cast<int32_t>(src).fVec);
756 return _mm_cvtepi32_ps(_32);

12