Home
last modified time | relevance | path

Searched refs:sum32 (Results 1 – 19 of 19) sorted by relevance

/external/libaom/libaom/aom_dsp/x86/
Dsse_sse4.c32 static INLINE void summary_32_sse4(const __m128i *sum32, __m128i *sum64) { in summary_32_sse4() argument
33 const __m128i sum0 = _mm_cvtepu32_epi64(*sum32); in summary_32_sse4()
34 const __m128i sum1 = _mm_cvtepu32_epi64(_mm_srli_si128(*sum32, 8)); in summary_32_sse4()
231 __m128i sum32 = _mm_setzero_si128(); in aom_highbd_sse_sse4_1() local
233 highbd_sse_w8_sse4_1(&sum32, a, b); in aom_highbd_sse_sse4_1()
234 highbd_sse_w8_sse4_1(&sum32, a + 8, b + 8); in aom_highbd_sse_sse4_1()
239 summary_32_sse4(&sum32, &sum); in aom_highbd_sse_sse4_1()
247 __m128i sum32 = _mm_setzero_si128(); in aom_highbd_sse_sse4_1() local
249 highbd_sse_w8_sse4_1(&sum32, a, b); in aom_highbd_sse_sse4_1()
250 highbd_sse_w8_sse4_1(&sum32, a + 8 * 1, b + 8 * 1); in aom_highbd_sse_sse4_1()
[all …]
Dsse_avx2.c49 static INLINE void summary_32_avx2(const __m256i *sum32, __m256i *sum) { in summary_32_avx2() argument
51 _mm256_cvtepu32_epi64(_mm256_castsi256_si128(*sum32)); in summary_32_avx2()
53 _mm256_cvtepu32_epi64(_mm256_extracti128_si256(*sum32, 1)); in summary_32_avx2()
290 __m256i sum32 = _mm256_setzero_si256(); in aom_highbd_sse_avx2() local
292 highbd_sse_w16_avx2(&sum32, a, b); in aom_highbd_sse_avx2()
293 highbd_sse_w16_avx2(&sum32, a + 16, b + 16); in aom_highbd_sse_avx2()
298 summary_32_avx2(&sum32, &sum); in aom_highbd_sse_avx2()
306 __m256i sum32 = _mm256_setzero_si256(); in aom_highbd_sse_avx2() local
308 highbd_sse_w16_avx2(&sum32, a, b); in aom_highbd_sse_avx2()
309 highbd_sse_w16_avx2(&sum32, a + 16 * 1, b + 16 * 1); in aom_highbd_sse_avx2()
[all …]
Dhighbd_intrapred_sse2.c824 uint32_t sum32 = _mm_cvtsi128_si32(sum); in aom_highbd_dc_predictor_4x8_sse2() local
825 sum32 >>= 16; in aom_highbd_dc_predictor_4x8_sse2()
826 sum32 += 6; in aom_highbd_dc_predictor_4x8_sse2()
827 sum32 /= 12; in aom_highbd_dc_predictor_4x8_sse2()
828 const __m128i row = _mm_set1_epi16((uint16_t)sum32); in aom_highbd_dc_predictor_4x8_sse2()
845 uint32_t sum32 = _mm_cvtsi128_si32(sum); in aom_highbd_dc_predictor_8x4_sse2() local
846 sum32 >>= 16; in aom_highbd_dc_predictor_8x4_sse2()
847 sum32 += 6; in aom_highbd_dc_predictor_8x4_sse2()
848 sum32 /= 12; in aom_highbd_dc_predictor_8x4_sse2()
849 const __m128i row = _mm_set1_epi16((uint16_t)sum32); in aom_highbd_dc_predictor_8x4_sse2()
[all …]
/external/webrtc/modules/audio_coding/codecs/isac/fix/source/
Dentropy_coding_mips.c30 int32_t r0, r1, r2, sum32; in WebRtcIsacfix_MatrixProduct1MIPS() local
90 [sum32] "=&r" (sum32), [r1] "=&r" (r1),[r2] "=&r" (r2) in WebRtcIsacfix_MatrixProduct1MIPS()
100 int32_t r0, r1, r2, sum32; in WebRtcIsacfix_MatrixProduct1MIPS() local
160 [sum32] "=&r" (sum32), [r1] "=&r" (r1),[r2] "=&r" (r2) in WebRtcIsacfix_MatrixProduct1MIPS()
186 int32_t r0, r1, r2, r3, r4, sum32, sum32_2; in WebRtcIsacfix_MatrixProduct2MIPS() local
241 [n] "=&r" (n), [sum32] "=&r" (sum32), [sum32_2] "=&r" (sum32_2), in WebRtcIsacfix_MatrixProduct2MIPS()
Dentropy_coding_neon.c176 int32_t sum32 = 0; in WebRtcIsacfix_MatrixProduct1Neon() local
180 sum32 += (WEBRTC_SPL_MUL_16_32_RSFT16(matrix0[matrix0_index], in WebRtcIsacfix_MatrixProduct1Neon()
185 matrix_product[matrix_prod_index] = sum32; in WebRtcIsacfix_MatrixProduct1Neon()
Dentropy_coding.c884 int32_t sum32 = 0; in WebRtcIsacfix_MatrixProduct1C() local
888 sum32 += WEBRTC_SPL_MUL_16_32_RSFT16( in WebRtcIsacfix_MatrixProduct1C()
893 matrix_product[matrix_prod_index] = sum32; in WebRtcIsacfix_MatrixProduct1C()
920 int32_t sum32 = 0, sum32_2 = 0; in WebRtcIsacfix_MatrixProduct2C() local
924 sum32 += (WEBRTC_SPL_MUL_16_32_RSFT16(matrix0[matrix0_index], in WebRtcIsacfix_MatrixProduct2C()
931 matrix_product[matrix_prod_index] = sum32 >> 3; in WebRtcIsacfix_MatrixProduct2C()
/external/libaom/libaom/av1/encoder/x86/
Dpickrst_sse4.c518 __m128i sum32 = _mm_setzero_si128(); in av1_lowbd_pixel_proj_error_sse4_1() local
538 sum32 = _mm_add_epi32(sum32, err0); in av1_lowbd_pixel_proj_error_sse4_1()
550 const __m128i sum64_0 = _mm_cvtepi32_epi64(sum32); in av1_lowbd_pixel_proj_error_sse4_1()
551 const __m128i sum64_1 = _mm_cvtepi32_epi64(_mm_srli_si128(sum32, 8)); in av1_lowbd_pixel_proj_error_sse4_1()
562 __m128i sum32 = _mm_setzero_si128(); in av1_lowbd_pixel_proj_error_sse4_1() local
577 sum32 = _mm_add_epi32(sum32, err0); in av1_lowbd_pixel_proj_error_sse4_1()
588 const __m128i sum64_0 = _mm_cvtepi32_epi64(sum32); in av1_lowbd_pixel_proj_error_sse4_1()
589 const __m128i sum64_1 = _mm_cvtepi32_epi64(_mm_srli_si128(sum32, 8)); in av1_lowbd_pixel_proj_error_sse4_1()
594 __m128i sum32 = _mm_setzero_si128(); in av1_lowbd_pixel_proj_error_sse4_1() local
607 sum32 = _mm_add_epi32(sum32, err0); in av1_lowbd_pixel_proj_error_sse4_1()
[all …]
Dpickrst_avx2.c515 __m256i sum32 = _mm256_setzero_si256(); in av1_lowbd_pixel_proj_error_avx2() local
541 sum32 = _mm256_add_epi32(sum32, err0); in av1_lowbd_pixel_proj_error_avx2()
554 _mm256_cvtepi32_epi64(_mm256_castsi256_si128(sum32)); in av1_lowbd_pixel_proj_error_avx2()
556 _mm256_cvtepi32_epi64(_mm256_extracti128_si256(sum32, 1)); in av1_lowbd_pixel_proj_error_avx2()
567 __m256i sum32 = _mm256_setzero_si256(); in av1_lowbd_pixel_proj_error_avx2() local
586 sum32 = _mm256_add_epi32(sum32, err0); in av1_lowbd_pixel_proj_error_avx2()
598 _mm256_cvtepi32_epi64(_mm256_castsi256_si128(sum32)); in av1_lowbd_pixel_proj_error_avx2()
600 _mm256_cvtepi32_epi64(_mm256_extracti128_si256(sum32, 1)); in av1_lowbd_pixel_proj_error_avx2()
605 __m256i sum32 = _mm256_setzero_si256(); in av1_lowbd_pixel_proj_error_avx2() local
612 sum32 = _mm256_add_epi32(sum32, err0); in av1_lowbd_pixel_proj_error_avx2()
[all …]
/external/llvm-project/llvm/test/CodeGen/Generic/
Dadd-with-overflow-24.ll10 %sum32 = sext i24 %sum to i32
15 …i8*, ...) @printf( i8* getelementptr ([4 x i8], [4 x i8]* @ok, i32 0, i32 0), i32 %sum32 ) nounwind
27 %sum32 = zext i24 %sum to i32
32 …i8*, ...) @printf( i8* getelementptr ([4 x i8], [4 x i8]* @ok, i32 0, i32 0), i32 %sum32 ) nounwind
Dadd-with-overflow-128.ll12 %sum32 = trunc i128 %sum to i32
17 …i8*, ...) @printf( i8* getelementptr ([4 x i8], [4 x i8]* @ok, i32 0, i32 0), i32 %sum32 ) nounwind
/external/llvm/test/CodeGen/Generic/
Dadd-with-overflow-24.ll10 %sum32 = sext i24 %sum to i32
15 …i8*, ...) @printf( i8* getelementptr ([4 x i8], [4 x i8]* @ok, i32 0, i32 0), i32 %sum32 ) nounwind
27 %sum32 = zext i24 %sum to i32
32 …i8*, ...) @printf( i8* getelementptr ([4 x i8], [4 x i8]* @ok, i32 0, i32 0), i32 %sum32 ) nounwind
Dadd-with-overflow-128.ll12 %sum32 = trunc i128 %sum to i32
17 …i8*, ...) @printf( i8* getelementptr ([4 x i8], [4 x i8]* @ok, i32 0, i32 0), i32 %sum32 ) nounwind
/external/flac/src/libFLAC/
Dlpc_intrin_vsx.c69 vector float sum32 = { 0.0f, 0.0f, 0.0f, 0.0f}; in FLAC__lpc_compute_autocorrelation_intrin_power8_vsx_lag_16() local
131 sum32 += d2 * d; in FLAC__lpc_compute_autocorrelation_intrin_power8_vsx_lag_16()
151 sum1 += vec_perm(sum31, sum32, (vector unsigned char)vperm3); in FLAC__lpc_compute_autocorrelation_intrin_power8_vsx_lag_16()
152 sum2 += vec_perm(sum32, sum33, (vector unsigned char)vperm3); in FLAC__lpc_compute_autocorrelation_intrin_power8_vsx_lag_16()
201 vector float sum32 = { 0.0f, 0.0f, 0.0f, 0.0f}; in FLAC__lpc_compute_autocorrelation_intrin_power8_vsx_lag_12() local
258 sum32 += d2 * d; in FLAC__lpc_compute_autocorrelation_intrin_power8_vsx_lag_12()
274 sum1 += vec_perm(sum31, sum32, (vector unsigned char)vperm3); in FLAC__lpc_compute_autocorrelation_intrin_power8_vsx_lag_12()
275 sum2 += vec_perm(sum32, sum30, (vector unsigned char)vperm3); in FLAC__lpc_compute_autocorrelation_intrin_power8_vsx_lag_12()
515 vector float sum32 = { 0.0f, 0.0f, 0.0f, 0.0f}; in FLAC__lpc_compute_autocorrelation_intrin_power9_vsx_lag_16() local
577 sum32 += d2 * d; in FLAC__lpc_compute_autocorrelation_intrin_power9_vsx_lag_16()
[all …]
/external/llvm-project/llvm/test/CodeGen/AArch64/
Darm64_32-pointer-extend.ll46 %sum32 = trunc i64 %sum to i32
47 %res = inttoptr i32 %sum32 to i8*
/external/llvm-project/llvm/test/CodeGen/X86/
Dcode_placement.ll83 %ctg2.sum32 = add i64 %tmp18, 20 ; <i64> [#uses=1]
84 %52 = getelementptr i8, i8* %rk26, i64 %ctg2.sum32 ; <i8*> [#uses=1]
Dlsr-loop-exit-cond.ll246 %ctg2.sum32 = add i64 %tmp18, 20 ; <i64> [#uses=1]
247 %52 = getelementptr i8, i8* %rk26, i64 %ctg2.sum32 ; <i8*> [#uses=1]
Dsad.ll855 %sum32 = add <32 x i32> %abs, %h32
856 …%h0 = shufflevector <32 x i32> %sum32, <32 x i32> undef, <32 x i32> <i32 8, i32 9, i32 10, i32 11,…
857 %sum0 = add <32 x i32> %sum32, %h0
964 %sum32 = add <64 x i32> %sum64, %h32
965 …%h0 = shufflevector <64 x i32> %sum32, <64 x i32> undef, <64 x i32> <i32 8, i32 9, i32 10, i32 11,…
966 %sum0 = add <64 x i32> %sum32, %h0
/external/llvm/test/CodeGen/X86/
Dcode_placement.ll80 %ctg2.sum32 = add i64 %tmp18, 20 ; <i64> [#uses=1]
81 %52 = getelementptr i8, i8* %rk26, i64 %ctg2.sum32 ; <i8*> [#uses=1]
Dlsr-loop-exit-cond.ll89 %ctg2.sum32 = add i64 %tmp18, 20 ; <i64> [#uses=1]
90 %52 = getelementptr i8, i8* %rk26, i64 %ctg2.sum32 ; <i8*> [#uses=1]