Home
last modified time | relevance | path

Searched refs:sum_low (Results 1 – 3 of 3) sorted by relevance

/external/libgav1/libgav1/src/dsp/x86/
Dwarp_sse4.cc107 __m128i sum_low = _mm_set1_epi32(kOffsetRemoval); in WriteVerticalFilter() local
108 __m128i sum_high = sum_low; in WriteVerticalFilter()
123 sum_low = _mm_add_epi32(sum_low, product_low); in WriteVerticalFilter()
126 sum_low = RightShiftWithRounding_S32(sum_low, kRoundBitsVertical); in WriteVerticalFilter()
129 const __m128i sum = _mm_packs_epi32(sum_low, sum_high); in WriteVerticalFilter()
132 const __m128i sum = _mm_packus_epi32(sum_low, sum_high); in WriteVerticalFilter()
143 __m128i sum_low = _mm_setzero_si128(); in WriteVerticalFilter() local
154 sum_low = _mm_add_epi32(sum_low, product_low); in WriteVerticalFilter()
157 sum_low = RightShiftWithRounding_S32(sum_low, kRoundBitsVertical); in WriteVerticalFilter()
160 const __m128i sum = _mm_packs_epi32(sum_low, sum_high); in WriteVerticalFilter()
[all …]
/external/libgav1/libgav1/src/dsp/arm/
Dwarp_neon.cc302 int32x4_t sum_low = vdupq_n_s32(0); in Warp_NEON() local
303 int32x4_t sum_high = sum_low; in Warp_NEON()
306 sum_low = in Warp_NEON()
307 vmlal_n_s16(sum_low, vget_low_s16(filter[k]), intermediate); in Warp_NEON()
312 vcombine_s16(vrshrn_n_s32(sum_low, kRoundBitsVertical), in Warp_NEON()
404 int32x4_t sum_low = vdupq_n_s32(-kOffsetRemoval); in Warp_NEON() local
405 int32x4_t sum_high = sum_low; in Warp_NEON()
408 sum_low = vmlal_s16(sum_low, vget_low_s16(filter[k]), in Warp_NEON()
414 vcombine_s16(vrshrn_n_s32(sum_low, kRoundBitsVertical), in Warp_NEON()
/external/libvpx/libvpx/vpx_dsp/arm/
Ddeblock_neon.c289 static uint8x8_t combine_mask(const int16x4_t sum_low, const int16x4_t sum_high, in combine_mask() argument
293 const uint16x4_t mask16_low = calculate_mask(sum_low, sumsq_low, f, fifteen); in combine_mask()
321 int16x4_t sum_low, sum_high; in vpx_mbpost_proc_across_ip_neon() local
359 sum_low = vdup_lane_s16(sum_high, 3); in vpx_mbpost_proc_across_ip_neon()
362 accumulate_sum_sumsq(vget_low_s16(x), xy_low, &sum_low, &sumsq_low); in vpx_mbpost_proc_across_ip_neon()
366 sum_high = vdup_lane_s16(sum_low, 3); in vpx_mbpost_proc_across_ip_neon()
371 mask = combine_mask(sum_low, sum_high, sumsq_low, sumsq_high, f); in vpx_mbpost_proc_across_ip_neon()
373 output = filter_pixels(vcombine_s16(sum_low, sum_high), s); in vpx_mbpost_proc_across_ip_neon()