Home
last modified time | relevance | path

Searched refs:_mm_loadu_ps (Results 1 – 21 of 21) sorted by relevance

/external/libopus/celt/x86/
Dpitch_sse.c47 xsum1 = _mm_loadu_ps(sum); in xcorr_kernel_sse()
52 __m128 x0 = _mm_loadu_ps(x+j); in xcorr_kernel_sse()
53 __m128 yj = _mm_loadu_ps(y+j); in xcorr_kernel_sse()
54 __m128 y3 = _mm_loadu_ps(y+j+3); in xcorr_kernel_sse()
65 xsum1 = _mm_add_ps(xsum1,_mm_mul_ps(_mm_load1_ps(x+j),_mm_loadu_ps(y+j))); in xcorr_kernel_sse()
68 xsum2 = _mm_add_ps(xsum2,_mm_mul_ps(_mm_load1_ps(x+j),_mm_loadu_ps(y+j))); in xcorr_kernel_sse()
71 xsum1 = _mm_add_ps(xsum1,_mm_mul_ps(_mm_load1_ps(x+j),_mm_loadu_ps(y+j))); in xcorr_kernel_sse()
88 __m128 xi = _mm_loadu_ps(x+i); in dual_inner_prod_sse()
89 __m128 y1i = _mm_loadu_ps(y01+i); in dual_inner_prod_sse()
90 __m128 y2i = _mm_loadu_ps(y02+i); in dual_inner_prod_sse()
[all …]
Dvq_sse2.c71 x4 = _mm_loadu_ps(&X[j]); in op_pvq_search_sse2()
115 x4 = _mm_loadu_ps(&X[j]); in op_pvq_search_sse2()
169 x4 = _mm_loadu_ps(&X[j]); in op_pvq_search_sse2()
170 y4 = _mm_loadu_ps(&y[j]); in op_pvq_search_sse2()
209 s4 = _mm_castps_si128(_mm_loadu_ps(&signy[j])); in op_pvq_search_sse2()
/external/webrtc/webrtc/modules/audio_processing/aec/
Daec_core_sse2.c51 const __m128 x_fft_buf_re = _mm_loadu_ps(&x_fft_buf[0][xPos + j]); in FilterFarSSE2()
52 const __m128 x_fft_buf_im = _mm_loadu_ps(&x_fft_buf[1][xPos + j]); in FilterFarSSE2()
53 const __m128 h_fft_buf_re = _mm_loadu_ps(&h_fft_buf[0][pos + j]); in FilterFarSSE2()
54 const __m128 h_fft_buf_im = _mm_loadu_ps(&h_fft_buf[1][pos + j]); in FilterFarSSE2()
55 const __m128 y_fft_re = _mm_loadu_ps(&y_fft[0][j]); in FilterFarSSE2()
56 const __m128 y_fft_im = _mm_loadu_ps(&y_fft[1][j]); in FilterFarSSE2()
97 const __m128 x_pow_local = _mm_loadu_ps(&x_pow[i]); in ScaleErrorSignalSSE2()
98 const __m128 ef_re_base = _mm_loadu_ps(&ef[0][i]); in ScaleErrorSignalSSE2()
99 const __m128 ef_im_base = _mm_loadu_ps(&ef[1][i]); in ScaleErrorSignalSSE2()
170 const __m128 x_fft_buf_re = _mm_loadu_ps(&x_fft_buf[0][xPos + j]); in FilterAdaptationSSE2()
[all …]
Daec_rdft_sse2.c23 __m128 a00v = _mm_loadu_ps(&a[j + 0]); in cft1st_128_SSE2()
24 __m128 a04v = _mm_loadu_ps(&a[j + 4]); in cft1st_128_SSE2()
25 __m128 a08v = _mm_loadu_ps(&a[j + 8]); in cft1st_128_SSE2()
26 __m128 a12v = _mm_loadu_ps(&a[j + 12]); in cft1st_128_SSE2()
253 const __m128 c_j1 = _mm_loadu_ps(&c[j1]); // 1, 2, 3, 4, in rftfsub_128_SSE2()
254 const __m128 c_k1 = _mm_loadu_ps(&c[29 - j1]); // 28, 29, 30, 31, in rftfsub_128_SSE2()
260 const __m128 a_j2_0 = _mm_loadu_ps(&a[0 + j2]); // 2, 3, 4, 5, in rftfsub_128_SSE2()
261 const __m128 a_j2_4 = _mm_loadu_ps(&a[4 + j2]); // 6, 7, 8, 9, in rftfsub_128_SSE2()
262 const __m128 a_k2_0 = _mm_loadu_ps(&a[122 - j2]); // 120, 121, 122, 123, in rftfsub_128_SSE2()
263 const __m128 a_k2_4 = _mm_loadu_ps(&a[126 - j2]); // 124, 125, 126, 127, in rftfsub_128_SSE2()
[all …]
/external/speex/libspeex/
Dresample_sse.h47 sum = _mm_add_ps(sum, _mm_mul_ps(_mm_loadu_ps(a+i), _mm_loadu_ps(b+i))); in inner_product_single()
48 sum = _mm_add_ps(sum, _mm_mul_ps(_mm_loadu_ps(a+i+4), _mm_loadu_ps(b+i+4))); in inner_product_single()
61 __m128 f = _mm_loadu_ps(frac); in interpolate_product_single()
64 sum = _mm_add_ps(sum, _mm_mul_ps(_mm_load1_ps(a+i), _mm_loadu_ps(b+i*oversample))); in interpolate_product_single()
65 sum = _mm_add_ps(sum, _mm_mul_ps(_mm_load1_ps(a+i+1), _mm_loadu_ps(b+(i+1)*oversample))); in interpolate_product_single()
86 t = _mm_mul_ps(_mm_loadu_ps(a+i), _mm_loadu_ps(b+i)); in inner_product_double()
90 t = _mm_mul_ps(_mm_loadu_ps(a+i+4), _mm_loadu_ps(b+i+4)); in inner_product_double()
106 __m128 f = _mm_loadu_ps(frac); in interpolate_product_double()
112 t = _mm_mul_ps(_mm_load1_ps(a+i), _mm_loadu_ps(b+i*oversample)); in interpolate_product_double()
116 t = _mm_mul_ps(_mm_load1_ps(a+i+1), _mm_loadu_ps(b+(i+1)*oversample)); in interpolate_product_double()
Dfilters_sse.h46 mem[i] = _mm_loadu_ps(_mem+4*i); in filter_mem16_10()
47 num[i] = _mm_loadu_ps(_num+4*i); in filter_mem16_10()
48 den[i] = _mm_loadu_ps(_den+4*i); in filter_mem16_10()
99 mem[i] = _mm_loadu_ps(_mem+4*i); in filter_mem16_8()
100 num[i] = _mm_loadu_ps(_num+4*i); in filter_mem16_8()
101 den[i] = _mm_loadu_ps(_den+4*i); in filter_mem16_8()
153 mem[i] = _mm_loadu_ps(_mem+4*i); in iir_mem16_10()
154 den[i] = _mm_loadu_ps(_den+4*i); in iir_mem16_10()
202 mem[i] = _mm_loadu_ps(_mem+4*i); in iir_mem16_8()
203 den[i] = _mm_loadu_ps(_den+4*i); in iir_mem16_8()
[all …]
Dltp_sse.h45 sum = _mm_add_ps(sum, _mm_mul_ps(_mm_loadu_ps(a+0), _mm_loadu_ps(b+0))); in inner_prod()
46 sum = _mm_add_ps(sum, _mm_mul_ps(_mm_loadu_ps(a+4), _mm_loadu_ps(b+4))); in inner_prod()
68 x[i] = _mm_loadu_ps(_x+(i<<2)); in pitch_xcorr()
72 y[i] = _mm_loadu_ps(_y+(i<<2)+offset); in pitch_xcorr()
/external/flac/libFLAC/
Dlpc_intrin_sse.c71 d0 = _mm_loadu_ps(data+i); in FLAC__lpc_compute_autocorrelation_intrin_sse_lag_4_new()
108 d0 = _mm_loadu_ps(data+i); in FLAC__lpc_compute_autocorrelation_intrin_sse_lag_8_new()
109 d1 = _mm_loadu_ps(data+i+4); in FLAC__lpc_compute_autocorrelation_intrin_sse_lag_8_new()
153 d0 = _mm_loadu_ps(data+i); in FLAC__lpc_compute_autocorrelation_intrin_sse_lag_12_new()
154 d1 = _mm_loadu_ps(data+i+4); in FLAC__lpc_compute_autocorrelation_intrin_sse_lag_12_new()
155 d2 = _mm_loadu_ps(data+i+8); in FLAC__lpc_compute_autocorrelation_intrin_sse_lag_12_new()
206 d0 = _mm_loadu_ps(data+i); in FLAC__lpc_compute_autocorrelation_intrin_sse_lag_16_new()
207 d1 = _mm_loadu_ps(data+i+4); in FLAC__lpc_compute_autocorrelation_intrin_sse_lag_16_new()
208 d2 = _mm_loadu_ps(data+i+8); in FLAC__lpc_compute_autocorrelation_intrin_sse_lag_16_new()
209 d3 = _mm_loadu_ps(data+i+12); in FLAC__lpc_compute_autocorrelation_intrin_sse_lag_16_new()
/external/clang/test/Sema/
Duninit-variables-vectors.c6 __m128 _mm_loadu_ps(const float *p);
14 X = _mm_loadu_ps(&input[0]); in test1()
/external/webrtc/webrtc/common_audio/resampler/
Dsinc_resampler_sse.cc31 m_input = _mm_loadu_ps(input_ptr + i); in Convolve_SSE()
/external/webrtc/webrtc/common_audio/
Dfir_filter_sse.cc63 m_in = _mm_loadu_ps(in_ptr + j); in Filter()
/external/skqp/src/jumper/
DSkJumper_stages.cpp393 case 0: _37 = _mm256_insertf128_ps(_37, _mm_loadu_ps(ptr+28), 1); in load4()
394 case 7: _26 = _mm256_insertf128_ps(_26, _mm_loadu_ps(ptr+24), 1); in load4()
395 case 6: _15 = _mm256_insertf128_ps(_15, _mm_loadu_ps(ptr+20), 1); in load4()
396 case 5: _04 = _mm256_insertf128_ps(_04, _mm_loadu_ps(ptr+16), 1); in load4()
397 case 4: _37 = _mm256_insertf128_ps(_37, _mm_loadu_ps(ptr+12), 0); in load4()
398 case 3: _26 = _mm256_insertf128_ps(_26, _mm_loadu_ps(ptr+ 8), 0); in load4()
399 case 2: _15 = _mm256_insertf128_ps(_15, _mm_loadu_ps(ptr+ 4), 0); in load4()
400 case 1: _04 = _mm256_insertf128_ps(_04, _mm_loadu_ps(ptr+ 0), 0); in load4()
578 if ( true ) { _0 = _mm_loadu_ps(ptr + 0); } in load4()
579 if (tail > 1) { _1 = _mm_loadu_ps(ptr + 4); } in load4()
[all …]
/external/skia/src/jumper/
DSkJumper_stages.cpp393 case 0: _37 = _mm256_insertf128_ps(_37, _mm_loadu_ps(ptr+28), 1); in load4()
394 case 7: _26 = _mm256_insertf128_ps(_26, _mm_loadu_ps(ptr+24), 1); in load4()
395 case 6: _15 = _mm256_insertf128_ps(_15, _mm_loadu_ps(ptr+20), 1); in load4()
396 case 5: _04 = _mm256_insertf128_ps(_04, _mm_loadu_ps(ptr+16), 1); in load4()
397 case 4: _37 = _mm256_insertf128_ps(_37, _mm_loadu_ps(ptr+12), 0); in load4()
398 case 3: _26 = _mm256_insertf128_ps(_26, _mm_loadu_ps(ptr+ 8), 0); in load4()
399 case 2: _15 = _mm256_insertf128_ps(_15, _mm_loadu_ps(ptr+ 4), 0); in load4()
400 case 1: _04 = _mm256_insertf128_ps(_04, _mm_loadu_ps(ptr+ 0), 0); in load4()
578 if ( true ) { _0 = _mm_loadu_ps(ptr + 0); } in load4()
579 if (tail > 1) { _1 = _mm_loadu_ps(ptr + 4); } in load4()
[all …]
/external/skia/src/opts/
DSkNx_sse.h98 AI static SkNx Load(const void* ptr) { return _mm_loadu_ps((const float*)ptr); } in Load()
109 __m128 v0 = _mm_loadu_ps(((float*)ptr) + 0), in Load4()
110 v1 = _mm_loadu_ps(((float*)ptr) + 4), in Load4()
111 v2 = _mm_loadu_ps(((float*)ptr) + 8), in Load4()
112 v3 = _mm_loadu_ps(((float*)ptr) + 12); in Load4()
/external/skqp/src/opts/
DSkNx_sse.h91 AI static SkNx Load(const void* ptr) { return _mm_loadu_ps((const float*)ptr); } in Load()
102 __m128 v0 = _mm_loadu_ps(((float*)ptr) + 0), in Load4()
103 v1 = _mm_loadu_ps(((float*)ptr) + 4), in Load4()
104 v2 = _mm_loadu_ps(((float*)ptr) + 8), in Load4()
105 v3 = _mm_loadu_ps(((float*)ptr) + 12); in Load4()
/external/clang/test/CodeGen/
Dsse-builtins.c429 return _mm_loadu_ps(A); in test_mm_loadu_ps()
/external/eigen/Eigen/src/Core/arch/SSE/
DPacketMath.h320 return _mm_loadu_ps(from);
329 return _mm_loadu_ps(from);
/external/clang/lib/Headers/
Davxintrin.h2844 __m256 __v256 = _mm256_castps128_ps256(_mm_loadu_ps(__addr_lo)); in _mm256_loadu2_m128()
2845 return _mm256_insertf128_ps(__v256, _mm_loadu_ps(__addr_hi), 1); in _mm256_loadu2_m128()
Dxmmintrin.h1693 _mm_loadu_ps(const float *__p) in _mm_loadu_ps() function
/external/skia/site/dev/contrib/
Dsimd.md25 #define vld1q_f32 _mm_loadu_ps
/external/skqp/site/dev/contrib/
Dsimd.md25 #define vld1q_f32 _mm_loadu_ps