/external/libaom/libaom/aom_dsp/x86/ |
D | aom_subpixel_8t_intrin_avx2.c | 109 srcRegFilt32b1_1 = _mm256_maddubs_epi16(srcRegFilt32b1_1, firstFilters); in aom_filter_block1d4_h4_avx2() 197 srcRegFilt32b1_1 = _mm256_maddubs_epi16(srcRegFilt32b1_1, firstFilters); in aom_filter_block1d4_h8_avx2() 203 srcRegFilt32b2 = _mm256_maddubs_epi16(srcRegFilt32b2, secondFilters); in aom_filter_block1d4_h8_avx2() 305 srcRegFilt32b3 = _mm256_maddubs_epi16(srcRegFilt32b3, secondFilters); in aom_filter_block1d8_h4_avx2() 306 srcRegFilt32b2 = _mm256_maddubs_epi16(srcRegFilt32b2, thirdFilters); in aom_filter_block1d8_h4_avx2() 407 srcRegFilt32b1_1 = _mm256_maddubs_epi16(srcRegFilt32b1_1, firstFilters); in aom_filter_block1d8_h8_avx2() 408 srcRegFilt32b2 = _mm256_maddubs_epi16(srcRegFilt32b2, forthFilters); in aom_filter_block1d8_h8_avx2() 418 srcRegFilt32b3 = _mm256_maddubs_epi16(srcRegFilt32b3, secondFilters); in aom_filter_block1d8_h8_avx2() 419 srcRegFilt32b2 = _mm256_maddubs_epi16(srcRegFilt32b2, thirdFilters); in aom_filter_block1d8_h8_avx2() 531 srcRegFilt32b3 = _mm256_maddubs_epi16(srcRegFilt32b3, secondFilters); in aom_filter_block1d16_h4_avx2() [all …]
|
D | convolve_avx2.h | 319 const __m256i res_01 = _mm256_maddubs_epi16(s[0], coeffs[0]); in convolve_lowbd() 320 const __m256i res_23 = _mm256_maddubs_epi16(s[1], coeffs[1]); in convolve_lowbd() 321 const __m256i res_45 = _mm256_maddubs_epi16(s[2], coeffs[2]); in convolve_lowbd() 322 const __m256i res_67 = _mm256_maddubs_epi16(s[3], coeffs[3]); in convolve_lowbd() 333 const __m256i res_23 = _mm256_maddubs_epi16(s[0], coeffs[0]); in convolve_lowbd_4tap() 334 const __m256i res_45 = _mm256_maddubs_epi16(s[1], coeffs[1]); in convolve_lowbd_4tap()
|
D | masked_sad_intrin_avx2.c | 44 __m256i pred_l = _mm256_maddubs_epi16(data_l, mask_l); in masked_sad32xh_avx2() 49 __m256i pred_r = _mm256_maddubs_epi16(data_r, mask_r); in masked_sad32xh_avx2() 98 __m256i pred_l = _mm256_maddubs_epi16(data_l, mask_l); in masked_sad16xh_avx2() 103 __m256i pred_r = _mm256_maddubs_epi16(data_r, mask_r); in masked_sad16xh_avx2()
|
D | blend_a64_mask_avx2.c | 136 const __m256i m0_acbd = _mm256_maddubs_epi16(m0_ac, one_b); in lowbd_blend_a64_d16_mask_subw1_subh1_w16_avx2() 165 const __m256i m0_acbd = _mm256_maddubs_epi16(m0_ac, one_b); in lowbd_blend_a64_d16_mask_subw1_subh1_w32_avx2() 166 const __m256i m1_acbd = _mm256_maddubs_epi16(m1_ac, one_b); in lowbd_blend_a64_d16_mask_subw1_subh1_w32_avx2() 191 const __m256i m0_ac = _mm256_maddubs_epi16(m_i00, one_b); in lowbd_blend_a64_d16_mask_subw1_subh0_w16_avx2() 216 const __m256i m0_ac = _mm256_maddubs_epi16(m_i00, one_b); in lowbd_blend_a64_d16_mask_subw1_subh0_w32_avx2() 217 const __m256i m1_ac = _mm256_maddubs_epi16(m_i01, one_b); in lowbd_blend_a64_d16_mask_subw1_subh0_w32_avx2() 414 _mm256_maddubs_epi16(_mm256_unpacklo_epi8(v_s0_s_b, v_s1_s_b), in blend_16_u8_avx2() 431 _mm256_maddubs_epi16(_mm256_unpacklo_epi8(v_s0_b, v_s1_b), in blend_32_u8_avx2() 434 _mm256_maddubs_epi16(_mm256_unpackhi_epi8(v_s0_b, v_s1_b), in blend_32_u8_avx2() 1007 const __m256i adjacent = _mm256_maddubs_epi16(addrows, one_b); in highbd_blend_a64_d16_mask_subw1_subh1_w4_avx2() [all …]
|
D | variance_avx2.c | 38 const __m256i diff0 = _mm256_maddubs_epi16(src_ref0, adj_sub); in variance_kernel_avx2() 39 const __m256i diff1 = _mm256_maddubs_epi16(src_ref1, adj_sub); in variance_kernel_avx2() 356 const __m256i blendAL = _mm256_maddubs_epi16(ssAL, aaAL); in comp_mask_pred_line_avx2() 357 const __m256i blendAH = _mm256_maddubs_epi16(ssAH, aaAH); in comp_mask_pred_line_avx2()
|
D | variance_impl_avx2.c | 41 exp_src_lo = _mm256_maddubs_epi16(exp_src_lo, filter); \ 42 exp_src_hi = _mm256_maddubs_epi16(exp_src_hi, filter); \
|
/external/libvpx/libvpx/vpx_dsp/x86/ |
D | vpx_subpixel_8t_intrin_avx2.c | 386 tmp_0 = _mm256_maddubs_epi16(src_reg_shift_0, kernel_reg_23); in vpx_filter_block1d16_h4_avx2() 387 tmp_1 = _mm256_maddubs_epi16(src_reg_shift_2, kernel_reg_45); in vpx_filter_block1d16_h4_avx2() 397 tmp_0 = _mm256_maddubs_epi16(src_reg_shift_0, kernel_reg_23); in vpx_filter_block1d16_h4_avx2() 398 tmp_1 = _mm256_maddubs_epi16(src_reg_shift_2, kernel_reg_45); in vpx_filter_block1d16_h4_avx2() 423 tmp_0 = _mm256_maddubs_epi16(src_reg_shift_0, kernel_reg_23); in vpx_filter_block1d16_h4_avx2() 424 tmp_1 = _mm256_maddubs_epi16(src_reg_shift_2, kernel_reg_45); in vpx_filter_block1d16_h4_avx2() 508 res_reg_m1001_lo = _mm256_maddubs_epi16(src_reg_m1001_lo, kernel_reg_23); in vpx_filter_block1d16_v4_avx2() 509 res_reg_1223_lo = _mm256_maddubs_epi16(src_reg_1223_lo, kernel_reg_45); in vpx_filter_block1d16_v4_avx2() 513 res_reg_m1001_hi = _mm256_maddubs_epi16(src_reg_m1001_hi, kernel_reg_23); in vpx_filter_block1d16_v4_avx2() 514 res_reg_1223_hi = _mm256_maddubs_epi16(src_reg_1223_hi, kernel_reg_45); in vpx_filter_block1d16_v4_avx2() [all …]
|
D | convolve_avx2.h | 57 const __m256i x0 = _mm256_maddubs_epi16(s[0], f[0]); in convolve8_16_avx2() 58 const __m256i x1 = _mm256_maddubs_epi16(s[1], f[1]); in convolve8_16_avx2() 59 const __m256i x2 = _mm256_maddubs_epi16(s[2], f[2]); in convolve8_16_avx2() 60 const __m256i x3 = _mm256_maddubs_epi16(s[3], f[3]); in convolve8_16_avx2()
|
D | variance_avx2.c | 51 const __m256i diff0 = _mm256_maddubs_epi16(src_ref0, adj_sub); in variance_kernel_avx2() 52 const __m256i diff1 = _mm256_maddubs_epi16(src_ref1, adj_sub); in variance_kernel_avx2() 177 exp_src_lo = _mm256_maddubs_epi16(exp_src_lo, filter); \ 178 exp_src_hi = _mm256_maddubs_epi16(exp_src_hi, filter); \
|
/external/rust/crates/libz-sys/src/zlib-ng/arch/x86/ |
D | adler32_avx.c | 75 … __m256i v_short_sum1 = _mm256_maddubs_epi16(vbuf, dot1v); // multiply-add, resulting in 8 shorts. in adler32_avx2() 77 __m256i v_short_sum2 = _mm256_maddubs_epi16(vbuf, dot2v); in adler32_avx2()
|
/external/libgav1/libgav1/src/dsp/x86/ |
D | convolve_avx2.cc | 47 const __m256i v_madd_21 = _mm256_maddubs_epi16(src[0], taps[0]); // k2k1 in SumOnePassTaps() 48 const __m256i v_madd_43 = _mm256_maddubs_epi16(src[1], taps[1]); // k4k3 in SumOnePassTaps() 49 const __m256i v_madd_65 = _mm256_maddubs_epi16(src[2], taps[2]); // k6k5 in SumOnePassTaps() 54 const __m256i v_madd_10 = _mm256_maddubs_epi16(src[0], taps[0]); // k1k0 in SumOnePassTaps() 55 const __m256i v_madd_32 = _mm256_maddubs_epi16(src[1], taps[1]); // k3k2 in SumOnePassTaps() 56 const __m256i v_madd_54 = _mm256_maddubs_epi16(src[2], taps[2]); // k5k4 in SumOnePassTaps() 57 const __m256i v_madd_76 = _mm256_maddubs_epi16(src[3], taps[3]); // k7k6 in SumOnePassTaps() 63 sum = _mm256_maddubs_epi16(src[0], taps[0]); // k4k3 in SumOnePassTaps() 66 const __m256i v_madd_32 = _mm256_maddubs_epi16(src[0], taps[0]); // k3k2 in SumOnePassTaps() 67 const __m256i v_madd_54 = _mm256_maddubs_epi16(src[1], taps[1]); // k5k4 in SumOnePassTaps()
|
D | loop_restoration_avx2.cc | 70 madds[0] = _mm256_maddubs_epi16(s01, filter[0]); in WienerHorizontalTap7Kernel() 71 madds[1] = _mm256_maddubs_epi16(s23, filter[1]); in WienerHorizontalTap7Kernel() 72 madds[2] = _mm256_maddubs_epi16(s45, filter[2]); in WienerHorizontalTap7Kernel() 73 madds[3] = _mm256_maddubs_epi16(s67, filter[3]); in WienerHorizontalTap7Kernel() 88 madds[0] = _mm256_maddubs_epi16(s01, filter[0]); in WienerHorizontalTap5Kernel() 89 madds[1] = _mm256_maddubs_epi16(s23, filter[1]); in WienerHorizontalTap5Kernel() 90 madds[2] = _mm256_maddubs_epi16(s45, filter[2]); in WienerHorizontalTap5Kernel() 103 madds[0] = _mm256_maddubs_epi16(s01, filter[0]); in WienerHorizontalTap3Kernel() 104 madds[1] = _mm256_maddubs_epi16(s23, filter[1]); in WienerHorizontalTap3Kernel() 1453 _mm256_maddubs_epi16(ma, _mm256_set1_epi16(one_over_n_quarter)); in CalculateB5()
|
D | loop_restoration_10bit_avx2.cc | 1378 _mm256_maddubs_epi16(ma, _mm256_set1_epi16(one_over_n_quarter)); in CalculateB5()
|
/external/libaom/libaom/av1/common/x86/ |
D | cfl_avx2.c | 74 __m256i top_16x16 = _mm256_maddubs_epi16(top, twos); in cfl_luma_subsampling_420_lbd_avx2() 75 __m256i bot_16x16 = _mm256_maddubs_epi16(bot, twos); in cfl_luma_subsampling_420_lbd_avx2() 106 __m256i top_16x16 = _mm256_maddubs_epi16(top, fours); in cfl_luma_subsampling_422_lbd_avx2()
|
D | warp_plane_avx2.c | 87 const __m256i res_02 = _mm256_maddubs_epi16(src_0, coeff[0]); in filter_src_pixels_avx2() 88 const __m256i res_46 = _mm256_maddubs_epi16(src_1, coeff[1]); in filter_src_pixels_avx2() 89 const __m256i res_13 = _mm256_maddubs_epi16(src_2, coeff[2]); in filter_src_pixels_avx2() 90 const __m256i res_57 = _mm256_maddubs_epi16(src_3, coeff[3]); in filter_src_pixels_avx2()
|
/external/skia/src/opts/ |
D | SkBitmapProcState_opts.h | 94 __m256i lo = _mm256_maddubs_epi16(_mm256_unpacklo_epi8( l, r), in S32_alpha_D32_filter_DX() 96 __m256i hi = _mm256_maddubs_epi16(_mm256_unpackhi_epi8( l, r), in S32_alpha_D32_filter_DX()
|
/external/libaom/libaom/aom_dsp/simd/ |
D | v256_intrinsics_x86.h | 106 return _mm256_maddubs_epi16(a, _mm256_set1_epi8(1)); in v256_padd_u8() 521 return _mm256_maddubs_epi16(a, b); in v256_madd_us8()
|
/external/clang/test/CodeGen/ |
D | avx2-builtins.c | 673 return _mm256_maddubs_epi16(a, b); in test_mm256_maddubs_epi16()
|
/external/llvm-project/clang/test/CodeGen/X86/ |
D | avx2-builtins.c | 677 return _mm256_maddubs_epi16(a, b); in test_mm256_maddubs_epi16()
|
/external/llvm-project/clang/lib/Headers/ |
D | avx2intrin.h | 242 _mm256_maddubs_epi16(__m256i __a, __m256i __b) in _mm256_maddubs_epi16() function
|
D | avx512vlbwintrin.h | 1360 (__v16hi)_mm256_maddubs_epi16(__X, __Y), in _mm256_mask_maddubs_epi16() 1367 (__v16hi)_mm256_maddubs_epi16(__X, __Y), in _mm256_maskz_maddubs_epi16()
|
/external/clang/lib/Headers/ |
D | avx2intrin.h | 271 _mm256_maddubs_epi16(__m256i __a, __m256i __b) in _mm256_maddubs_epi16() function
|