/external/libaom/libaom/av1/common/x86/ |
D | wiener_convolve_sse2.c | 82 __m128i res_even = _mm_add_epi32(_mm_add_epi32(res_0, res_4), in av1_wiener_convolve_add_src_sse2() local 84 res_even = _mm_srai_epi32(_mm_add_epi32(res_even, round_const), in av1_wiener_convolve_add_src_sse2() 103 __m128i res = _mm_packs_epi32(res_even, res_odd); in av1_wiener_convolve_add_src_sse2() 157 const __m128i res_even = _mm_add_epi32(_mm_add_epi32(res_0, res_2), in av1_wiener_convolve_add_src_sse2() local 183 const __m128i res_lo = _mm_unpacklo_epi32(res_even, res_odd); in av1_wiener_convolve_add_src_sse2() 184 const __m128i res_hi = _mm_unpackhi_epi32(res_even, res_odd); in av1_wiener_convolve_add_src_sse2()
|
D | highbd_wiener_convolve_ssse3.c | 84 __m128i res_even = _mm_add_epi32(_mm_add_epi32(res_0, res_4), in av1_highbd_wiener_convolve_add_src_ssse3() local 86 res_even = _mm_srai_epi32(_mm_add_epi32(res_even, round_const), in av1_highbd_wiener_convolve_add_src_ssse3() 107 __m128i res = _mm_packs_epi32(res_even, res_odd); in av1_highbd_wiener_convolve_add_src_ssse3() 159 const __m128i res_even = _mm_add_epi32(_mm_add_epi32(res_0, res_2), in av1_highbd_wiener_convolve_add_src_ssse3() local 185 const __m128i res_lo = _mm_unpacklo_epi32(res_even, res_odd); in av1_highbd_wiener_convolve_add_src_ssse3() 186 const __m128i res_hi = _mm_unpackhi_epi32(res_even, res_odd); in av1_highbd_wiener_convolve_add_src_ssse3()
|
D | jnt_convolve_ssse3.c | 96 __m128i res_even = _mm_add_epi32(_mm_add_epi32(res_0, res_4), in av1_dist_wtd_convolve_2d_ssse3() local 98 res_even = in av1_dist_wtd_convolve_2d_ssse3() 99 _mm_sra_epi32(_mm_add_epi32(res_even, round_const), round_shift); in av1_dist_wtd_convolve_2d_ssse3() 117 __m128i res = _mm_packs_epi32(res_even, res_odd); in av1_dist_wtd_convolve_2d_ssse3() 170 const __m128i res_even = _mm_add_epi32(_mm_add_epi32(res_0, res_2), in av1_dist_wtd_convolve_2d_ssse3() local 196 const __m128i res_lo = _mm_unpacklo_epi32(res_even, res_odd); in av1_dist_wtd_convolve_2d_ssse3() 197 const __m128i res_hi = _mm_unpackhi_epi32(res_even, res_odd); in av1_dist_wtd_convolve_2d_ssse3()
|
D | highbd_convolve_2d_ssse3.c | 75 __m128i res_even = convolve(s, coeffs_x); in av1_highbd_convolve_2d_sr_ssse3() local 76 res_even = _mm_sra_epi32(_mm_add_epi32(res_even, round_const_x), in av1_highbd_convolve_2d_sr_ssse3() 89 __m128i res_even1 = _mm_packs_epi32(res_even, res_even); in av1_highbd_convolve_2d_sr_ssse3()
|
D | highbd_wiener_convolve_avx2.c | 118 const __m256i res_even = _mm256_srai_epi32( in av1_highbd_wiener_convolve_add_src_avx2() local 130 const __m256i res = _mm256_packs_epi32(res_even, res_odd); in av1_highbd_wiener_convolve_add_src_avx2() 201 const __m256i res_even = _mm256_add_epi32( in av1_highbd_wiener_convolve_add_src_avx2() local 225 const __m256i res_lo = _mm256_unpacklo_epi32(res_even, res_odd); in av1_highbd_wiener_convolve_add_src_avx2() 226 const __m256i res_hi = _mm256_unpackhi_epi32(res_even, res_odd); in av1_highbd_wiener_convolve_add_src_avx2()
|
D | highbd_jnt_convolve_sse4.c | 318 __m128i res_even = convolve(s, coeffs_x); in av1_highbd_dist_wtd_convolve_x_sse4_1() local 319 res_even = in av1_highbd_dist_wtd_convolve_x_sse4_1() 320 _mm_sra_epi32(_mm_add_epi32(res_even, round_const_x), round_shift_x); in av1_highbd_dist_wtd_convolve_x_sse4_1() 332 res_even = _mm_sll_epi32(res_even, round_shift_bits); in av1_highbd_dist_wtd_convolve_x_sse4_1() 335 __m128i res1 = _mm_unpacklo_epi32(res_even, res_odd); in av1_highbd_dist_wtd_convolve_x_sse4_1() 356 __m128i res2 = _mm_unpackhi_epi32(res_even, res_odd); in av1_highbd_dist_wtd_convolve_x_sse4_1()
|
D | highbd_convolve_2d_sse4.c | 248 __m128i res_even = _mm_add_epi32(_mm_add_epi32(res_0, res_4), in av1_highbd_dist_wtd_convolve_2d_sse4_1() local 250 res_even = in av1_highbd_dist_wtd_convolve_2d_sse4_1() 251 _mm_sra_epi32(_mm_add_epi32(res_even, round_const), round_shift); in av1_highbd_dist_wtd_convolve_2d_sse4_1() 269 __m128i res = _mm_packs_epi32(res_even, res_odd); in av1_highbd_dist_wtd_convolve_2d_sse4_1() 322 const __m128i res_even = _mm_add_epi32(_mm_add_epi32(res_0, res_2), in av1_highbd_dist_wtd_convolve_2d_sse4_1() local 348 const __m128i res_lo = _mm_unpacklo_epi32(res_even, res_odd); in av1_highbd_dist_wtd_convolve_2d_sse4_1() 349 const __m128i res_hi = _mm_unpackhi_epi32(res_even, res_odd); in av1_highbd_dist_wtd_convolve_2d_sse4_1()
|
D | jnt_convolve_sse2.c | 109 const __m128i res_even = convolve_lo_x(s, coeffs); in av1_dist_wtd_convolve_x_sse2() local 119 const __m128i res_lo = _mm_unpacklo_epi32(res_even, res_odd); in av1_dist_wtd_convolve_x_sse2() 120 const __m128i res_hi = _mm_unpackhi_epi32(res_even, res_odd); in av1_dist_wtd_convolve_x_sse2() 472 __m128i res_even = _mm_add_epi32(_mm_add_epi32(res_0, res_4), in av1_dist_wtd_convolve_2d_sse2() local 474 res_even = in av1_dist_wtd_convolve_2d_sse2() 475 _mm_sra_epi32(_mm_add_epi32(res_even, round_const), round_shift); in av1_dist_wtd_convolve_2d_sse2() 501 __m128i res = _mm_packs_epi32(res_even, res_odd); in av1_dist_wtd_convolve_2d_sse2() 554 const __m128i res_even = _mm_add_epi32(_mm_add_epi32(res_0, res_2), in av1_dist_wtd_convolve_2d_sse2() local 580 const __m128i res_lo = _mm_unpacklo_epi32(res_even, res_odd); in av1_dist_wtd_convolve_2d_sse2() 581 const __m128i res_hi = _mm_unpackhi_epi32(res_even, res_odd); in av1_dist_wtd_convolve_2d_sse2()
|
D | convolve_2d_sse2.c | 84 __m128i res_even = _mm_add_epi32(_mm_add_epi32(res_0, res_4), in av1_convolve_2d_sr_sse2() local 86 res_even = in av1_convolve_2d_sr_sse2() 87 _mm_sra_epi32(_mm_add_epi32(res_even, round_const), round_shift); in av1_convolve_2d_sr_sse2() 105 __m128i res = _mm_packs_epi32(res_even, res_odd); in av1_convolve_2d_sr_sse2() 162 const __m128i res_even = _mm_add_epi32(_mm_add_epi32(res_0, res_2), in av1_convolve_2d_sr_sse2() local 188 const __m128i res_lo = _mm_unpacklo_epi32(res_even, res_odd); in av1_convolve_2d_sr_sse2() 189 const __m128i res_hi = _mm_unpackhi_epi32(res_even, res_odd); in av1_convolve_2d_sr_sse2()
|
D | highbd_convolve_2d_avx2.c | 84 __m256i res_even = convolve(s, coeffs_x); in av1_highbd_convolve_2d_sr_avx2() local 85 res_even = _mm256_sra_epi32(_mm256_add_epi32(res_even, round_const_x), in av1_highbd_convolve_2d_sr_avx2() 98 __m256i res_even1 = _mm256_packs_epi32(res_even, res_even); in av1_highbd_convolve_2d_sr_avx2()
|
D | highbd_jnt_convolve_avx2.c | 303 __m256i res_even = convolve(s, coeffs_x); in av1_highbd_dist_wtd_convolve_2d_avx2() local 304 res_even = _mm256_sra_epi32(_mm256_add_epi32(res_even, round_const_x), in av1_highbd_dist_wtd_convolve_2d_avx2() 317 __m256i res_even1 = _mm256_packs_epi32(res_even, res_even); in av1_highbd_dist_wtd_convolve_2d_avx2() 526 __m256i res_even = convolve(s, coeffs_x); in av1_highbd_dist_wtd_convolve_x_avx2() local 527 res_even = _mm256_sra_epi32(_mm256_add_epi32(res_even, round_const_x), in av1_highbd_dist_wtd_convolve_x_avx2() 540 res_even = _mm256_sll_epi32(res_even, round_shift_bits); in av1_highbd_dist_wtd_convolve_x_avx2() 543 __m256i res1 = _mm256_unpacklo_epi32(res_even, res_odd); in av1_highbd_dist_wtd_convolve_x_avx2() 585 __m256i res2 = _mm256_unpackhi_epi32(res_even, res_odd); in av1_highbd_dist_wtd_convolve_x_avx2()
|
D | highbd_warp_plane_sse4.c | 132 __m128i res_even = in highbd_filter_src_pixels() local 134 res_even = _mm_sra_epi32(_mm_add_epi32(res_even, round_const), in highbd_filter_src_pixels() 154 tmp[k + 7] = _mm_packs_epi32(res_even, res_odd); in highbd_filter_src_pixels() 492 const __m128i res_even = _mm_add_epi32(_mm_add_epi32(res_0, res_2), in av1_highbd_warp_affine_sse4_1() local 533 __m128i res_lo = _mm_unpacklo_epi32(res_even, res_odd); in av1_highbd_warp_affine_sse4_1() 534 __m128i res_hi = _mm_unpackhi_epi32(res_even, res_odd); in av1_highbd_warp_affine_sse4_1()
|
D | convolve_sse2.c | 309 const __m128i res_even = convolve_lo_x(s, coeffs); in av1_convolve_x_sr_sse2() local 319 const __m128i res_lo = _mm_unpacklo_epi32(res_even, res_odd); in av1_convolve_x_sr_sse2() 320 const __m128i res_hi = _mm_unpackhi_epi32(res_even, res_odd); in av1_convolve_x_sr_sse2()
|
D | warp_plane_sse4.c | 276 const __m128i res_even = _mm_add_epi16(res_02, res_46); in filter_src_pixels() local 279 _mm_add_epi16(_mm_add_epi16(res_even, res_odd), round_const); in filter_src_pixels() 559 const __m128i res_even = in filter_src_pixels_vertical() local 577 *res_lo = _mm_unpacklo_epi32(res_even, res_odd); in filter_src_pixels_vertical() 578 *res_hi = _mm_unpackhi_epi32(res_even, res_odd); in filter_src_pixels_vertical()
|
D | warp_plane_avx2.c | 92 const __m256i res_even = _mm256_add_epi16(res_02, res_46); in filter_src_pixels_avx2() local 95 _mm256_add_epi16(_mm256_add_epi16(res_even, res_odd), *round_const); in filter_src_pixels_avx2() 640 const __m256i res_even = _mm256_add_epi32(_mm256_add_epi32(res_0, res_2), in filter_src_pixels_vertical_avx2() local 654 *res_lo = _mm256_unpacklo_epi32(res_even, res_odd); in filter_src_pixels_vertical_avx2() 655 *res_hi = _mm256_unpackhi_epi32(res_even, res_odd); in filter_src_pixels_vertical_avx2()
|
/external/libaom/libaom/aom_dsp/x86/ |
D | highbd_convolve_ssse3.c | 215 __m128i res_even = convolve(s, coeffs_x); in av1_highbd_convolve_x_sr_ssse3() local 216 res_even = _mm_sra_epi32(_mm_add_epi32(res_even, round_const_x), in av1_highbd_convolve_x_sr_ssse3() 229 res_even = _mm_sra_epi32(_mm_add_epi32(res_even, round_const_bits), in av1_highbd_convolve_x_sr_ssse3() 234 __m128i res_even1 = _mm_packs_epi32(res_even, res_even); in av1_highbd_convolve_x_sr_ssse3()
|
D | highbd_convolve_avx2.c | 315 __m256i res_even = convolve(s, coeffs_x); in av1_highbd_convolve_x_sr_avx2() local 316 res_even = _mm256_sra_epi32(_mm256_add_epi32(res_even, round_const_x), in av1_highbd_convolve_x_sr_avx2() 329 res_even = _mm256_sra_epi32(_mm256_add_epi32(res_even, round_const_bits), in av1_highbd_convolve_x_sr_avx2() 334 __m256i res_even1 = _mm256_packs_epi32(res_even, res_even); in av1_highbd_convolve_x_sr_avx2() 675 __m256i res_even = convolve_4tap(s, ff); in aom_highbd_filter_block1d8_h4_avx2() local 676 res_even = _mm256_srai_epi32(_mm256_add_epi32(res_even, rounding), in aom_highbd_filter_block1d8_h4_avx2() 687 __m256i res = _mm256_packs_epi32(res_even, res_odd); in aom_highbd_filter_block1d8_h4_avx2()
|
/external/libaom/libaom/av1/common/arm/ |
D | warp_plane_neon.c | 315 int32x4_t res_even, res_odd, im_res_0, im_res_1; in vertical_filter_neon() local 409 res_even = vaddq_s32(im_res_0, im_res_1); in vertical_filter_neon() 465 c0 = vtrnq_s32(res_even, res_odd); in vertical_filter_neon()
|