/external/libaom/libaom/av1/common/x86/ |
D | highbd_convolve_2d_ssse3.c | 38 __m128i coeffs_x[4], coeffs_y[4], s[16]; in av1_highbd_convolve_2d_sr_ssse3() local 58 prepare_coeffs(filter_params_y, subpel_y_q4, coeffs_y); in av1_highbd_convolve_2d_sr_ssse3() 134 const __m128i res_a0 = convolve(s, coeffs_y); in av1_highbd_convolve_2d_sr_ssse3() 140 const __m128i res_a1 = convolve(s + 8, coeffs_y); in av1_highbd_convolve_2d_sr_ssse3() 147 const __m128i res_b0 = convolve(s + 4, coeffs_y); in av1_highbd_convolve_2d_sr_ssse3() 153 const __m128i res_b1 = convolve(s + 4 + 8, coeffs_y); in av1_highbd_convolve_2d_sr_ssse3()
|
D | highbd_wiener_convolve_ssse3.c | 116 const __m128i coeffs_y = in av1_highbd_wiener_convolve_add_src_ssse3() local 120 const __m128i tmp_0 = _mm_unpacklo_epi32(coeffs_y, coeffs_y); in av1_highbd_wiener_convolve_add_src_ssse3() 122 const __m128i tmp_1 = _mm_unpackhi_epi32(coeffs_y, coeffs_y); in av1_highbd_wiener_convolve_add_src_ssse3()
|
D | wiener_convolve_sse2.c | 114 const __m128i coeffs_y = in av1_wiener_convolve_add_src_sse2() local 118 const __m128i tmp_0 = _mm_unpacklo_epi32(coeffs_y, coeffs_y); in av1_wiener_convolve_add_src_sse2() 120 const __m128i tmp_1 = _mm_unpackhi_epi32(coeffs_y, coeffs_y); in av1_wiener_convolve_add_src_sse2()
|
D | wiener_convolve_avx2.c | 151 const __m128i coeffs_y = _mm_add_epi16(xx_loadu_128(filter_y), offset); in av1_wiener_convolve_add_src_avx2() local 154 const __m128i coeffs_0123 = _mm_unpacklo_epi32(coeffs_y, coeffs_y); in av1_wiener_convolve_add_src_avx2() 156 const __m128i coeffs_4567 = _mm_unpackhi_epi32(coeffs_y, coeffs_y); in av1_wiener_convolve_add_src_avx2()
|
D | jnt_convolve_ssse3.c | 127 const __m128i coeffs_y = _mm_loadu_si128((__m128i *)y_filter); in av1_dist_wtd_convolve_2d_ssse3() local 130 const __m128i tmp_0 = _mm_unpacklo_epi32(coeffs_y, coeffs_y); in av1_dist_wtd_convolve_2d_ssse3() 132 const __m128i tmp_1 = _mm_unpackhi_epi32(coeffs_y, coeffs_y); in av1_dist_wtd_convolve_2d_ssse3()
|
D | highbd_wiener_convolve_avx2.c | 145 const __m128i coeffs_y = _mm_add_epi16(xx_loadu_128(filter_y), offset); in av1_highbd_wiener_convolve_add_src_avx2() local 148 const __m128i coeffs_0123 = _mm_unpacklo_epi32(coeffs_y, coeffs_y); in av1_highbd_wiener_convolve_add_src_avx2() 150 const __m128i coeffs_4567 = _mm_unpackhi_epi32(coeffs_y, coeffs_y); in av1_highbd_wiener_convolve_add_src_avx2()
|
D | highbd_jnt_convolve_sse4.c | 57 __m128i s[16], coeffs_y[4]; in av1_highbd_dist_wtd_convolve_y_sse4_1() local 59 prepare_coeffs(filter_params_y, subpel_y_q4, coeffs_y); in av1_highbd_dist_wtd_convolve_y_sse4_1() 101 const __m128i res_a0 = convolve(s, coeffs_y); in av1_highbd_dist_wtd_convolve_y_sse4_1() 106 const __m128i res_a1 = convolve(s + 8, coeffs_y); in av1_highbd_dist_wtd_convolve_y_sse4_1() 165 const __m128i res_b0 = convolve(s + 4, coeffs_y); in av1_highbd_dist_wtd_convolve_y_sse4_1() 170 const __m128i res_b1 = convolve(s + 4 + 8, coeffs_y); in av1_highbd_dist_wtd_convolve_y_sse4_1()
|
D | convolve_sse2.c | 26 const __m128i coeffs_y = _mm_loadu_si128((__m128i *)y_filter); in prepare_coeffs() local 28 const __m128i tmp_0 = _mm_unpacklo_epi32(coeffs_y, coeffs_y); in prepare_coeffs() 30 const __m128i tmp_1 = _mm_unpackhi_epi32(coeffs_y, coeffs_y); in prepare_coeffs()
|
D | highbd_convolve_2d_avx2.c | 42 __m256i s[8], coeffs_y[4], coeffs_x[4]; in av1_highbd_convolve_2d_sr_avx2() local 62 prepare_coeffs(filter_params_y, subpel_y_q4, coeffs_y); in av1_highbd_convolve_2d_sr_avx2() 134 const __m256i res_a = convolve(s, coeffs_y); in av1_highbd_convolve_2d_sr_avx2() 142 const __m256i res_b = convolve(s + 4, coeffs_y); in av1_highbd_convolve_2d_sr_avx2()
|
D | highbd_convolve_2d_sse4.c | 279 const __m128i coeffs_y = _mm_loadu_si128((__m128i *)y_filter); in av1_highbd_dist_wtd_convolve_2d_sse4_1() local 282 const __m128i tmp_0 = _mm_unpacklo_epi32(coeffs_y, coeffs_y); in av1_highbd_dist_wtd_convolve_2d_sse4_1() 284 const __m128i tmp_1 = _mm_unpackhi_epi32(coeffs_y, coeffs_y); in av1_highbd_dist_wtd_convolve_2d_sse4_1()
|
D | convolve_2d_sse2.c | 115 const __m128i coeffs_y = _mm_loadu_si128((__m128i *)y_filter); in av1_convolve_2d_sr_sse2() local 118 const __m128i tmp_0 = _mm_unpacklo_epi32(coeffs_y, coeffs_y); in av1_convolve_2d_sr_sse2() 120 const __m128i tmp_1 = _mm_unpackhi_epi32(coeffs_y, coeffs_y); in av1_convolve_2d_sr_sse2()
|
D | highbd_jnt_convolve_avx2.c | 250 __m256i s[8], coeffs_y[4], coeffs_x[4]; in av1_highbd_dist_wtd_convolve_2d_avx2() local 281 prepare_coeffs(filter_params_y, subpel_y_q4, coeffs_y); in av1_highbd_dist_wtd_convolve_2d_avx2() 353 const __m256i res_a = convolve(s, coeffs_y); in av1_highbd_dist_wtd_convolve_2d_avx2() 401 const __m256i res_b = convolve(s + 4, coeffs_y); in av1_highbd_dist_wtd_convolve_2d_avx2() 651 __m256i s[8], coeffs_y[4]; in av1_highbd_dist_wtd_convolve_y_avx2() local 675 prepare_coeffs(filter_params_y, subpel_y_q4, coeffs_y); in av1_highbd_dist_wtd_convolve_y_avx2() 747 const __m256i res_a = convolve(s, coeffs_y); in av1_highbd_dist_wtd_convolve_y_avx2() 795 const __m256i res_b = convolve(s + 4, coeffs_y); in av1_highbd_dist_wtd_convolve_y_avx2()
|
D | jnt_convolve_sse2.c | 511 const __m128i coeffs_y = _mm_loadu_si128((__m128i *)y_filter); in av1_dist_wtd_convolve_2d_sse2() local 514 const __m128i tmp_0 = _mm_unpacklo_epi32(coeffs_y, coeffs_y); in av1_dist_wtd_convolve_2d_sse2() 516 const __m128i tmp_1 = _mm_unpackhi_epi32(coeffs_y, coeffs_y); in av1_dist_wtd_convolve_2d_sse2()
|
D | jnt_convolve_avx2.c | 631 __m256i filt[4], coeffs_x[4], coeffs_y[4]; in av1_dist_wtd_convolve_2d_avx2() local 637 prepare_coeffs(filter_params_y, subpel_y_q4, coeffs_y); in av1_dist_wtd_convolve_2d_avx2() 644 if (!(_mm256_extract_epi32(_mm256_or_si256(coeffs_y[0], coeffs_y[3]), 0))) in av1_dist_wtd_convolve_2d_avx2() 709 const __m256i res_a = convolve_4tap(s, coeffs_y + 1); in av1_dist_wtd_convolve_2d_avx2() 714 const __m256i res_b = convolve_4tap(s + 3, coeffs_y + 1); in av1_dist_wtd_convolve_2d_avx2()
|
/external/libaom/libaom/aom_dsp/x86/ |
D | highbd_convolve_ssse3.c | 37 __m128i s[16], coeffs_y[4]; in av1_highbd_convolve_y_sr_ssse3() local 47 prepare_coeffs(filter_params_y, subpel_y_q4, coeffs_y); in av1_highbd_convolve_y_sr_ssse3() 89 const __m128i res_a0 = convolve(s, coeffs_y); in av1_highbd_convolve_y_sr_ssse3() 93 const __m128i res_a1 = convolve(s + 8, coeffs_y); in av1_highbd_convolve_y_sr_ssse3() 98 const __m128i res_b0 = convolve(s + 4, coeffs_y); in av1_highbd_convolve_y_sr_ssse3() 102 const __m128i res_b1 = convolve(s + 4 + 8, coeffs_y); in av1_highbd_convolve_y_sr_ssse3()
|
D | convolve_avx2.h | 170 const __m256i res_a = convolve(s, coeffs_y); \ 175 const __m256i res_b = convolve(s + 4, coeffs_y); \
|
D | highbd_convolve_avx2.c | 131 __m256i s[8], coeffs_y[4]; in av1_highbd_convolve_y_sr_avx2() local 141 prepare_coeffs(filter_params_y, subpel_y_q4, coeffs_y); in av1_highbd_convolve_y_sr_avx2() 213 const __m256i res_a = convolve(s, coeffs_y); in av1_highbd_convolve_y_sr_avx2() 219 const __m256i res_b = convolve(s + 4, coeffs_y); in av1_highbd_convolve_y_sr_avx2()
|