Home
last modified time | relevance | path

Searched refs:_mm_loadu_ps (Results 1 – 22 of 22) sorted by relevance

/external/libopus/celt/x86/
Dpitch_sse.c47 xsum1 = _mm_loadu_ps(sum); in xcorr_kernel_sse()
52 __m128 x0 = _mm_loadu_ps(x+j); in xcorr_kernel_sse()
53 __m128 yj = _mm_loadu_ps(y+j); in xcorr_kernel_sse()
54 __m128 y3 = _mm_loadu_ps(y+j+3); in xcorr_kernel_sse()
65 xsum1 = _mm_add_ps(xsum1,_mm_mul_ps(_mm_load1_ps(x+j),_mm_loadu_ps(y+j))); in xcorr_kernel_sse()
68 xsum2 = _mm_add_ps(xsum2,_mm_mul_ps(_mm_load1_ps(x+j),_mm_loadu_ps(y+j))); in xcorr_kernel_sse()
71 xsum1 = _mm_add_ps(xsum1,_mm_mul_ps(_mm_load1_ps(x+j),_mm_loadu_ps(y+j))); in xcorr_kernel_sse()
88 __m128 xi = _mm_loadu_ps(x+i); in dual_inner_prod_sse()
89 __m128 y1i = _mm_loadu_ps(y01+i); in dual_inner_prod_sse()
90 __m128 y2i = _mm_loadu_ps(y02+i); in dual_inner_prod_sse()
[all …]
Dvq_sse2.c71 x4 = _mm_loadu_ps(&X[j]); in op_pvq_search_sse2()
115 x4 = _mm_loadu_ps(&X[j]); in op_pvq_search_sse2()
169 x4 = _mm_loadu_ps(&X[j]); in op_pvq_search_sse2()
170 y4 = _mm_loadu_ps(&y[j]); in op_pvq_search_sse2()
209 s4 = _mm_castps_si128(_mm_loadu_ps(&signy[j])); in op_pvq_search_sse2()
/external/libaom/libaom/av1/encoder/x86/
Dml_sse3.c25 const __m128 inputs_h = _mm_loadu_ps(&inputs[4]); in nn_propagate_8to1()
26 const __m128 inputs_l = _mm_loadu_ps(inputs); in nn_propagate_8to1()
28 const __m128 weights_h = _mm_loadu_ps(&weights[4]); in nn_propagate_8to1()
29 const __m128 weights_l = _mm_loadu_ps(weights); in nn_propagate_8to1()
47 const __m128 inputs128 = _mm_loadu_ps(inputs); in nn_propagate_4to1()
49 const __m128 weights128 = _mm_loadu_ps(weights); in nn_propagate_4to1()
64 const __m128 inputs128 = _mm_loadu_ps(inputs); in nn_propagate_4to4()
68 const __m128 weight0 = _mm_loadu_ps(&weights[2 * i * num_inputs]); in nn_propagate_4to4()
70 const __m128 weight1 = _mm_loadu_ps(&weights[(2 * i + 1) * num_inputs]); in nn_propagate_4to4()
86 const __m128 inputs128 = _mm_loadu_ps(inputs); in nn_propagate_4to8()
[all …]
/external/speex/libspeexdsp/
Dresample_sse.h47 sum = _mm_add_ps(sum, _mm_mul_ps(_mm_loadu_ps(a+i), _mm_loadu_ps(b+i))); in inner_product_single()
48 sum = _mm_add_ps(sum, _mm_mul_ps(_mm_loadu_ps(a+i+4), _mm_loadu_ps(b+i+4))); in inner_product_single()
61 __m128 f = _mm_loadu_ps(frac); in interpolate_product_single()
64 sum = _mm_add_ps(sum, _mm_mul_ps(_mm_load1_ps(a+i), _mm_loadu_ps(b+i*oversample))); in interpolate_product_single()
65 sum = _mm_add_ps(sum, _mm_mul_ps(_mm_load1_ps(a+i+1), _mm_loadu_ps(b+(i+1)*oversample))); in interpolate_product_single()
86 t = _mm_mul_ps(_mm_loadu_ps(a+i), _mm_loadu_ps(b+i)); in inner_product_double()
90 t = _mm_mul_ps(_mm_loadu_ps(a+i+4), _mm_loadu_ps(b+i+4)); in inner_product_double()
106 __m128 f = _mm_loadu_ps(frac); in interpolate_product_double()
112 t = _mm_mul_ps(_mm_load1_ps(a+i), _mm_loadu_ps(b+i*oversample)); in interpolate_product_double()
116 t = _mm_mul_ps(_mm_load1_ps(a+i+1), _mm_loadu_ps(b+(i+1)*oversample)); in interpolate_product_double()
/external/webrtc/webrtc/modules/audio_processing/aec/
Daec_core_sse2.c51 const __m128 x_fft_buf_re = _mm_loadu_ps(&x_fft_buf[0][xPos + j]); in FilterFarSSE2()
52 const __m128 x_fft_buf_im = _mm_loadu_ps(&x_fft_buf[1][xPos + j]); in FilterFarSSE2()
53 const __m128 h_fft_buf_re = _mm_loadu_ps(&h_fft_buf[0][pos + j]); in FilterFarSSE2()
54 const __m128 h_fft_buf_im = _mm_loadu_ps(&h_fft_buf[1][pos + j]); in FilterFarSSE2()
55 const __m128 y_fft_re = _mm_loadu_ps(&y_fft[0][j]); in FilterFarSSE2()
56 const __m128 y_fft_im = _mm_loadu_ps(&y_fft[1][j]); in FilterFarSSE2()
97 const __m128 x_pow_local = _mm_loadu_ps(&x_pow[i]); in ScaleErrorSignalSSE2()
98 const __m128 ef_re_base = _mm_loadu_ps(&ef[0][i]); in ScaleErrorSignalSSE2()
99 const __m128 ef_im_base = _mm_loadu_ps(&ef[1][i]); in ScaleErrorSignalSSE2()
170 const __m128 x_fft_buf_re = _mm_loadu_ps(&x_fft_buf[0][xPos + j]); in FilterAdaptationSSE2()
[all …]
Daec_rdft_sse2.c23 __m128 a00v = _mm_loadu_ps(&a[j + 0]); in cft1st_128_SSE2()
24 __m128 a04v = _mm_loadu_ps(&a[j + 4]); in cft1st_128_SSE2()
25 __m128 a08v = _mm_loadu_ps(&a[j + 8]); in cft1st_128_SSE2()
26 __m128 a12v = _mm_loadu_ps(&a[j + 12]); in cft1st_128_SSE2()
253 const __m128 c_j1 = _mm_loadu_ps(&c[j1]); // 1, 2, 3, 4, in rftfsub_128_SSE2()
254 const __m128 c_k1 = _mm_loadu_ps(&c[29 - j1]); // 28, 29, 30, 31, in rftfsub_128_SSE2()
260 const __m128 a_j2_0 = _mm_loadu_ps(&a[0 + j2]); // 2, 3, 4, 5, in rftfsub_128_SSE2()
261 const __m128 a_j2_4 = _mm_loadu_ps(&a[4 + j2]); // 6, 7, 8, 9, in rftfsub_128_SSE2()
262 const __m128 a_k2_0 = _mm_loadu_ps(&a[122 - j2]); // 120, 121, 122, 123, in rftfsub_128_SSE2()
263 const __m128 a_k2_4 = _mm_loadu_ps(&a[126 - j2]); // 124, 125, 126, 127, in rftfsub_128_SSE2()
[all …]
/external/flac/libFLAC/
Dlpc_intrin_sse.c71 d0 = _mm_loadu_ps(data+i); in FLAC__lpc_compute_autocorrelation_intrin_sse_lag_4_new()
108 d0 = _mm_loadu_ps(data+i); in FLAC__lpc_compute_autocorrelation_intrin_sse_lag_8_new()
109 d1 = _mm_loadu_ps(data+i+4); in FLAC__lpc_compute_autocorrelation_intrin_sse_lag_8_new()
153 d0 = _mm_loadu_ps(data+i); in FLAC__lpc_compute_autocorrelation_intrin_sse_lag_12_new()
154 d1 = _mm_loadu_ps(data+i+4); in FLAC__lpc_compute_autocorrelation_intrin_sse_lag_12_new()
155 d2 = _mm_loadu_ps(data+i+8); in FLAC__lpc_compute_autocorrelation_intrin_sse_lag_12_new()
206 d0 = _mm_loadu_ps(data+i); in FLAC__lpc_compute_autocorrelation_intrin_sse_lag_16_new()
207 d1 = _mm_loadu_ps(data+i+4); in FLAC__lpc_compute_autocorrelation_intrin_sse_lag_16_new()
208 d2 = _mm_loadu_ps(data+i+8); in FLAC__lpc_compute_autocorrelation_intrin_sse_lag_16_new()
209 d3 = _mm_loadu_ps(data+i+12); in FLAC__lpc_compute_autocorrelation_intrin_sse_lag_16_new()
/external/clang/test/Sema/
Duninit-variables-vectors.c6 __m128 _mm_loadu_ps(const float *p);
14 X = _mm_loadu_ps(&input[0]); in test1()
/external/webrtc/webrtc/common_audio/resampler/
Dsinc_resampler_sse.cc31 m_input = _mm_loadu_ps(input_ptr + i); in Convolve_SSE()
/external/webrtc/webrtc/common_audio/
Dfir_filter_sse.cc63 m_in = _mm_loadu_ps(in_ptr + j); in Filter()
/external/skia/include/private/
DSkNx_sse.h136 AI static SkNx Load(const void* ptr) { return _mm_loadu_ps((const float*)ptr); } in Load()
147 __m128 v0 = _mm_loadu_ps(((float*)ptr) + 0), in Load4()
148 v1 = _mm_loadu_ps(((float*)ptr) + 4), in Load4()
149 v2 = _mm_loadu_ps(((float*)ptr) + 8), in Load4()
150 v3 = _mm_loadu_ps(((float*)ptr) + 12); in Load4()
/external/skqp/include/private/
DSkNx_sse.h136 AI static SkNx Load(const void* ptr) { return _mm_loadu_ps((const float*)ptr); } in Load()
147 __m128 v0 = _mm_loadu_ps(((float*)ptr) + 0), in Load4()
148 v1 = _mm_loadu_ps(((float*)ptr) + 4), in Load4()
149 v2 = _mm_loadu_ps(((float*)ptr) + 8), in Load4()
150 v3 = _mm_loadu_ps(((float*)ptr) + 12); in Load4()
/external/speex/
Dconfigure.ac72 return _mm_add_ps(_mm_loadu_ps(a), _mm_loadu_ps(b));
Dconfigure12512 return _mm_add_ps(_mm_loadu_ps(a), _mm_loadu_ps(b));
/external/skia/src/opts/
DSkRasterPipeline_opts.h454 case 0: _37 = _mm256_insertf128_ps(_37, _mm_loadu_ps(ptr+28), 1);
455 case 7: _26 = _mm256_insertf128_ps(_26, _mm_loadu_ps(ptr+24), 1);
456 case 6: _15 = _mm256_insertf128_ps(_15, _mm_loadu_ps(ptr+20), 1);
457 case 5: _04 = _mm256_insertf128_ps(_04, _mm_loadu_ps(ptr+16), 1);
458 case 4: _37 = _mm256_insertf128_ps(_37, _mm_loadu_ps(ptr+12), 0);
459 case 3: _26 = _mm256_insertf128_ps(_26, _mm_loadu_ps(ptr+ 8), 0);
460 case 2: _15 = _mm256_insertf128_ps(_15, _mm_loadu_ps(ptr+ 4), 0);
461 case 1: _04 = _mm256_insertf128_ps(_04, _mm_loadu_ps(ptr+ 0), 0);
637 if ( true ) { _0 = _mm_loadu_ps(ptr + 0); }
638 if (tail > 1) { _1 = _mm_loadu_ps(ptr + 4); }
[all …]
/external/skqp/src/opts/
DSkRasterPipeline_opts.h454 case 0: _37 = _mm256_insertf128_ps(_37, _mm_loadu_ps(ptr+28), 1);
455 case 7: _26 = _mm256_insertf128_ps(_26, _mm_loadu_ps(ptr+24), 1);
456 case 6: _15 = _mm256_insertf128_ps(_15, _mm_loadu_ps(ptr+20), 1);
457 case 5: _04 = _mm256_insertf128_ps(_04, _mm_loadu_ps(ptr+16), 1);
458 case 4: _37 = _mm256_insertf128_ps(_37, _mm_loadu_ps(ptr+12), 0);
459 case 3: _26 = _mm256_insertf128_ps(_26, _mm_loadu_ps(ptr+ 8), 0);
460 case 2: _15 = _mm256_insertf128_ps(_15, _mm_loadu_ps(ptr+ 4), 0);
461 case 1: _04 = _mm256_insertf128_ps(_04, _mm_loadu_ps(ptr+ 0), 0);
637 if ( true ) { _0 = _mm_loadu_ps(ptr + 0); }
638 if (tail > 1) { _1 = _mm_loadu_ps(ptr + 4); }
[all …]
/external/clang/test/CodeGen/
Dsse-builtins.c429 return _mm_loadu_ps(A); in test_mm_loadu_ps()
/external/eigen/Eigen/src/Core/arch/SSE/
DPacketMath.h320 return _mm_loadu_ps(from);
329 return _mm_loadu_ps(from);
/external/clang/lib/Headers/
Davxintrin.h2844 __m256 __v256 = _mm256_castps128_ps256(_mm_loadu_ps(__addr_lo)); in _mm256_loadu2_m128()
2845 return _mm256_insertf128_ps(__v256, _mm_loadu_ps(__addr_hi), 1); in _mm256_loadu2_m128()
Dxmmintrin.h1693 _mm_loadu_ps(const float *__p) in _mm_loadu_ps() function
/external/mesa3d/src/gallium/drivers/swr/rasterizer/common/
Dsimdlib_128_avx.inl425 return _mm_loadu_ps(p);
/external/neon_2_sse/
DNEON_2_SSE.h9272 return _mm_loadu_ps(ptr);