/external/libaom/libaom/aom_dsp/x86/ |
D | aom_subpixel_8t_intrin_sse2.c | 48 __m128i ss_1_1 = _mm_unpacklo_epi8(ss_2, _mm_setzero_si128()); in aom_filter_block1d16_h4_sse2() 49 __m128i ss_2_1 = _mm_unpacklo_epi8(ss_4, _mm_setzero_si128()); in aom_filter_block1d16_h4_sse2() 56 __m128i ss_1_2 = _mm_unpacklo_epi8(ss_1, _mm_setzero_si128()); in aom_filter_block1d16_h4_sse2() 57 __m128i ss_2_2 = _mm_unpacklo_epi8(ss_3, _mm_setzero_si128()); in aom_filter_block1d16_h4_sse2() 72 ss_1_1 = _mm_unpacklo_epi8(ss_2, _mm_setzero_si128()); in aom_filter_block1d16_h4_sse2() 73 ss_2_1 = _mm_unpacklo_epi8(ss_4, _mm_setzero_si128()); in aom_filter_block1d16_h4_sse2() 80 ss_1_2 = _mm_unpacklo_epi8(ss_1, _mm_setzero_si128()); in aom_filter_block1d16_h4_sse2() 81 ss_2_2 = _mm_unpacklo_epi8(ss_3, _mm_setzero_si128()); in aom_filter_block1d16_h4_sse2() 143 srcReg23_lo = _mm_unpacklo_epi8(srcReg2, srcReg3); in aom_filter_block1d16_v4_sse2() 145 __m128i resReg23_lo_1 = _mm_unpacklo_epi8(srcReg23_lo, _mm_setzero_si128()); in aom_filter_block1d16_v4_sse2() [all …]
|
D | avg_intrin_sse2.c | 24 s0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(s)), u0); in aom_minmax_8x8_sse2() 25 d0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(d)), u0); in aom_minmax_8x8_sse2() 30 s0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(s + p)), u0); in aom_minmax_8x8_sse2() 31 d0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(d + dp)), u0); in aom_minmax_8x8_sse2() 38 s0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(s + 2 * p)), u0); in aom_minmax_8x8_sse2() 39 d0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(d + 2 * dp)), u0); in aom_minmax_8x8_sse2() 46 s0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(s + 3 * p)), u0); in aom_minmax_8x8_sse2() 47 d0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(d + 3 * dp)), u0); in aom_minmax_8x8_sse2() 54 s0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(s + 4 * p)), u0); in aom_minmax_8x8_sse2() 55 d0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(d + 4 * dp)), u0); in aom_minmax_8x8_sse2() [all …]
|
D | lpf_common_sse2.h | 233 w0 = _mm_unpacklo_epi8( in transpose4x8_8x4_low_sse2() 235 w1 = _mm_unpacklo_epi8( in transpose4x8_8x4_low_sse2() 271 w0 = _mm_unpacklo_epi8( in transpose4x8_8x4_sse2() 273 w1 = _mm_unpacklo_epi8( in transpose4x8_8x4_sse2() 320 w0 = _mm_unpacklo_epi8( in transpose8x8_low_sse2() 323 w1 = _mm_unpacklo_epi8( in transpose8x8_low_sse2() 326 w2 = _mm_unpacklo_epi8( in transpose8x8_low_sse2() 329 w3 = _mm_unpacklo_epi8( in transpose8x8_low_sse2() 353 w0 = _mm_unpacklo_epi8( in transpose8x8_sse2() 358 w1 = _mm_unpacklo_epi8( in transpose8x8_sse2() [all …]
|
D | convolve_sse2.h | 51 ss[0] = _mm_unpacklo_epi8(s[0], _mm_setzero_si128()); in convolve_lo_x() 52 ss[1] = _mm_unpacklo_epi8(s[1], _mm_setzero_si128()); in convolve_lo_x() 53 ss[2] = _mm_unpacklo_epi8(s[2], _mm_setzero_si128()); in convolve_lo_x() 54 ss[3] = _mm_unpacklo_epi8(s[3], _mm_setzero_si128()); in convolve_lo_x() 61 ss[0] = _mm_unpacklo_epi8(s[0], _mm_setzero_si128()); in convolve_lo_y() 62 ss[1] = _mm_unpacklo_epi8(s[2], _mm_setzero_si128()); in convolve_lo_y() 63 ss[2] = _mm_unpacklo_epi8(s[4], _mm_setzero_si128()); in convolve_lo_y() 64 ss[3] = _mm_unpacklo_epi8(s[6], _mm_setzero_si128()); in convolve_lo_y()
|
D | intrapred_ssse3.c | 49 const __m128i t16 = _mm_unpacklo_epi8(t, zero); in aom_paeth_predictor_4x4_ssse3() 70 const __m128i t16 = _mm_unpacklo_epi8(t, zero); in aom_paeth_predictor_4x8_ssse3() 91 const __m128i t16 = _mm_unpacklo_epi8(t, zero); in aom_paeth_predictor_4x16_ssse3() 111 const __m128i t16 = _mm_unpacklo_epi8(t, zero); in aom_paeth_predictor_8x4_ssse3() 132 const __m128i t16 = _mm_unpacklo_epi8(t, zero); in aom_paeth_predictor_8x8_ssse3() 153 const __m128i t16 = _mm_unpacklo_epi8(t, zero); in aom_paeth_predictor_8x16_ssse3() 173 const __m128i t16 = _mm_unpacklo_epi8(t, zero); in aom_paeth_predictor_8x32_ssse3() 205 const __m128i top0 = _mm_unpacklo_epi8(t, zero); in aom_paeth_predictor_16x4_ssse3() 226 const __m128i top0 = _mm_unpacklo_epi8(t, zero); in aom_paeth_predictor_16x8_ssse3() 249 const __m128i top0 = _mm_unpacklo_epi8(t, zero); in aom_paeth_predictor_16x16_ssse3() [all …]
|
D | masked_variance_intrin_ssse3.h | 37 const __m128i ssAL = _mm_unpacklo_epi8(sA0, sA1); in comp_mask_pred_16_ssse3() 38 const __m128i aaAL = _mm_unpacklo_epi8(aA, maA); in comp_mask_pred_16_ssse3() 70 const __m128i ssA = _mm_unpacklo_epi8(sA0, sA1); in comp_mask_pred_8_ssse3() 71 const __m128i ssB = _mm_unpacklo_epi8(sB0, sB1); in comp_mask_pred_8_ssse3() 74 const __m128i aaA = _mm_unpacklo_epi8(a, ma); in comp_mask_pred_8_ssse3()
|
/external/libaom/libaom/av1/common/x86/ |
D | convolve_sse2.c | 51 ss[0] = _mm_unpacklo_epi8(s[0], _mm_setzero_si128()); in convolve_lo_x() 52 ss[1] = _mm_unpacklo_epi8(s[1], _mm_setzero_si128()); in convolve_lo_x() 53 ss[2] = _mm_unpacklo_epi8(s[2], _mm_setzero_si128()); in convolve_lo_x() 54 ss[3] = _mm_unpacklo_epi8(s[3], _mm_setzero_si128()); in convolve_lo_x() 61 ss[0] = _mm_unpacklo_epi8(s[0], _mm_setzero_si128()); in convolve_lo_y() 62 ss[1] = _mm_unpacklo_epi8(s[2], _mm_setzero_si128()); in convolve_lo_y() 63 ss[2] = _mm_unpacklo_epi8(s[4], _mm_setzero_si128()); in convolve_lo_y() 64 ss[3] = _mm_unpacklo_epi8(s[6], _mm_setzero_si128()); in convolve_lo_y() 104 s[0] = _mm_unpacklo_epi8( in av1_convolve_y_sr_sse2() 107 s[1] = _mm_unpacklo_epi8( in av1_convolve_y_sr_sse2() [all …]
|
D | jnt_convolve_sse2.c | 60 s[0] = _mm_unpacklo_epi8(data, _mm_srli_si128(data, 1)); in av1_dist_wtd_convolve_x_sse2() 62 _mm_unpacklo_epi8(_mm_srli_si128(data, 2), _mm_srli_si128(data, 3)); in av1_dist_wtd_convolve_x_sse2() 64 _mm_unpacklo_epi8(_mm_srli_si128(data, 4), _mm_srli_si128(data, 5)); in av1_dist_wtd_convolve_x_sse2() 66 _mm_unpacklo_epi8(_mm_srli_si128(data, 6), _mm_srli_si128(data, 7)); in av1_dist_wtd_convolve_x_sse2() 190 s[0] = _mm_unpacklo_epi8( in av1_dist_wtd_convolve_y_sse2() 193 s[1] = _mm_unpacklo_epi8( in av1_dist_wtd_convolve_y_sse2() 196 s[2] = _mm_unpacklo_epi8( in av1_dist_wtd_convolve_y_sse2() 199 s[3] = _mm_unpacklo_epi8( in av1_dist_wtd_convolve_y_sse2() 202 s[4] = _mm_unpacklo_epi8( in av1_dist_wtd_convolve_y_sse2() 205 s[5] = _mm_unpacklo_epi8( in av1_dist_wtd_convolve_y_sse2() [all …]
|
D | wiener_convolve_sse2.c | 73 const __m128i src_0 = _mm_unpacklo_epi8(data, zero); in av1_wiener_convolve_add_src_sse2() 75 const __m128i src_2 = _mm_unpacklo_epi8(_mm_srli_si128(data, 2), zero); in av1_wiener_convolve_add_src_sse2() 77 const __m128i src_4 = _mm_unpacklo_epi8(_mm_srli_si128(data, 4), zero); in av1_wiener_convolve_add_src_sse2() 79 const __m128i src_6 = _mm_unpacklo_epi8(_mm_srli_si128(data, 6), zero); in av1_wiener_convolve_add_src_sse2() 88 const __m128i src_1 = _mm_unpacklo_epi8(_mm_srli_si128(data, 1), zero); in av1_wiener_convolve_add_src_sse2() 90 const __m128i src_3 = _mm_unpacklo_epi8(_mm_srli_si128(data, 3), zero); in av1_wiener_convolve_add_src_sse2() 92 const __m128i src_5 = _mm_unpacklo_epi8(_mm_srli_si128(data, 5), zero); in av1_wiener_convolve_add_src_sse2() 94 const __m128i src_7 = _mm_unpacklo_epi8(_mm_srli_si128(data, 7), zero); in av1_wiener_convolve_add_src_sse2()
|
/external/libavc/common/x86/ |
D | ih264_deblk_luma_ssse3.c | 122 temp1 = _mm_unpacklo_epi8(line1, line2); in ih264_deblk_luma_vert_bs4_ssse3() 123 temp2 = _mm_unpacklo_epi8(line3, line4); in ih264_deblk_luma_vert_bs4_ssse3() 124 temp3 = _mm_unpacklo_epi8(line5, line6); in ih264_deblk_luma_vert_bs4_ssse3() 125 temp4 = _mm_unpacklo_epi8(line7, line8); in ih264_deblk_luma_vert_bs4_ssse3() 146 temp1 = _mm_unpacklo_epi8(line1, line2); in ih264_deblk_luma_vert_bs4_ssse3() 147 temp2 = _mm_unpacklo_epi8(line3, line4); in ih264_deblk_luma_vert_bs4_ssse3() 148 temp3 = _mm_unpacklo_epi8(line5, line6); in ih264_deblk_luma_vert_bs4_ssse3() 149 temp4 = _mm_unpacklo_epi8(line7, line8); in ih264_deblk_luma_vert_bs4_ssse3() 175 temp2 = _mm_unpacklo_epi8(temp1, zero); in ih264_deblk_luma_vert_bs4_ssse3() 188 temp2 = _mm_unpacklo_epi8(temp1, zero); in ih264_deblk_luma_vert_bs4_ssse3() [all …]
|
D | ih264_iquant_itrans_recon_dc_ssse3.c | 137 pred_r0 = _mm_unpacklo_epi8(predload_r, zero_8x16b); //p00 p01 p02 p03 0 0 0 0 -- all 16 bits in ih264_iquant_itrans_recon_4x4_dc_ssse3() 139 pred_r1 = _mm_unpacklo_epi8(predload_r, zero_8x16b); //p10 p11 p12 p13 0 0 0 0 -- all 16 bits in ih264_iquant_itrans_recon_4x4_dc_ssse3() 141 pred_r2 = _mm_unpacklo_epi8(predload_r, zero_8x16b); //p20 p21 p22 p23 0 0 0 0 -- all 16 bits in ih264_iquant_itrans_recon_4x4_dc_ssse3() 143 pred_r3 = _mm_unpacklo_epi8(predload_r, zero_8x16b); //p30 p31 p32 p33 0 0 0 0 -- all 16 bits in ih264_iquant_itrans_recon_4x4_dc_ssse3() 259 pred_r0 = _mm_unpacklo_epi8(predload_r, zero_8x16b); //p0 p1 p2 p3 p4 p5 p6 p7 -- all 16 bits in ih264_iquant_itrans_recon_8x8_dc_ssse3() 262 pred_r1 = _mm_unpacklo_epi8(predload_r, zero_8x16b); //p0 p1 p2 p3 p4 p5 p6 p7 -- all 16 bits in ih264_iquant_itrans_recon_8x8_dc_ssse3() 266 pred_r2 = _mm_unpacklo_epi8(predload_r, zero_8x16b); //p0 p1 p2 p3 p4 p5 p6 p7 -- all 16 bits in ih264_iquant_itrans_recon_8x8_dc_ssse3() 270 pred_r3 = _mm_unpacklo_epi8(predload_r, zero_8x16b); //p0 p1 p2 p3 p4 p5 p6 p7 -- all 16 bits in ih264_iquant_itrans_recon_8x8_dc_ssse3() 274 pred_r4 = _mm_unpacklo_epi8(predload_r, zero_8x16b); //p0 p1 p2 p3 p4 p5 p6 p7 -- all 16 bits in ih264_iquant_itrans_recon_8x8_dc_ssse3() 278 pred_r5 = _mm_unpacklo_epi8(predload_r, zero_8x16b); //p0 p1 p2 p3 p4 p5 p6 p7 -- all 16 bits in ih264_iquant_itrans_recon_8x8_dc_ssse3() [all …]
|
D | ih264_inter_pred_filters_ssse3.c | 258 …src_r0_16x8b = _mm_unpacklo_epi8(src_r0_16x8b, src_r0_sht_16x8b); //a0 a1 a1 a2 a2 a3 a3 a4 … in ih264_inter_pred_luma_horz_ssse3() 259 …src_r1_16x8b = _mm_unpacklo_epi8(src_r1_16x8b, src_r1_sht_16x8b); //b0 b1 b1 b2 b2 b3 b3 b4 … in ih264_inter_pred_luma_horz_ssse3() 323 …src_r0_t1_16x8b = _mm_unpacklo_epi8(src_r0_16x8b, src_r0_sht_16x8b); //a0 a1 a1 a2 a2 a3 a3 a4 a4… in ih264_inter_pred_luma_horz_ssse3() 324 …src_r1_t1_16x8b = _mm_unpacklo_epi8(src_r1_16x8b, src_r1_sht_16x8b); //b0 b1 b1 b2 b2 b3 b3 b4 b4… in ih264_inter_pred_luma_horz_ssse3() 337 …src_r0_t1_16x8b = _mm_unpacklo_epi8(src_r0_16x8b, src_r0_sht_16x8b); //a2 a3 a3 a4 a4 a5 a5 a6 a6… in ih264_inter_pred_luma_horz_ssse3() 338 …src_r1_t1_16x8b = _mm_unpacklo_epi8(src_r1_16x8b, src_r1_sht_16x8b); //b2 b3 b3 b4 b4 b5 b5 b6 b6… in ih264_inter_pred_luma_horz_ssse3() 351 …src_r0_t1_16x8b = _mm_unpacklo_epi8(src_r0_16x8b, src_r0_sht_16x8b); //a4 a5 a5 a6 a6 a7 a7 a8 a8… in ih264_inter_pred_luma_horz_ssse3() 352 …src_r1_t1_16x8b = _mm_unpacklo_epi8(src_r1_16x8b, src_r1_sht_16x8b); //b4 b5 b5 b6 b6 b7 b7 b8 b8… in ih264_inter_pred_luma_horz_ssse3() 400 …src_r0_t1_16x8b = _mm_unpacklo_epi8(src_r0_16x8b, src_r0_sht_16x8b); //a0 a1 a1 a2 a2 a3 a3 a4 a4… in ih264_inter_pred_luma_horz_ssse3() 401 …src_r1_t1_16x8b = _mm_unpacklo_epi8(src_r1_16x8b, src_r1_sht_16x8b); //b0 b1 b1 b2 b2 b3 b3 b4 b4… in ih264_inter_pred_luma_horz_ssse3() [all …]
|
D | ih264_luma_intra_pred_filters_ssse3.c | 340 top_8x16b = _mm_unpacklo_epi8(top_16x8b, zero_vector); //t0 t1 t2 t3 t4 t5 t6 t7 in ih264_intra_pred_luma_4x4_mode_diag_dl_ssse3() 428 top_left_8x16b = _mm_unpacklo_epi8(top_left_16x8b, zero_vector); in ih264_intra_pred_luma_4x4_mode_diag_dr_ssse3() 429 top_left_sh_8x16b = _mm_unpacklo_epi8(top_left_sh_16x8b, zero_vector); in ih264_intra_pred_luma_4x4_mode_diag_dr_ssse3() 514 w121_a1_8x16b = _mm_unpacklo_epi8(val_16x8b, zero_vector); //l2 l1 l0 tl t0 t1 t2 t3 in ih264_intra_pred_luma_4x4_mode_vert_r_ssse3() 610 w121_a1_8x16b = _mm_unpacklo_epi8(val_16x8b, zero_vector); //l3 l2 l1 l0 tl t0 t1 t2 in ih264_intra_pred_luma_4x4_mode_horz_d_ssse3() 624 row4_16x8b = _mm_unpacklo_epi8(w11_16x8b, w121_16x8b); in ih264_intra_pred_luma_4x4_mode_horz_d_ssse3() 704 w121_a1_8x16b = _mm_unpacklo_epi8(val_16x8b, zero_vector); //t0 t1 t2 t3 t4 t5... in ih264_intra_pred_luma_4x4_mode_vert_l_ssse3() 798 w121_a1_8x16b = _mm_unpacklo_epi8(val_16x8b, zero_vector); //l0 l1 l2 l3 l3 l3... in ih264_intra_pred_luma_4x4_mode_horz_u_ssse3() 816 row1_16x8b = _mm_unpacklo_epi8(w11_16x8b, w121_16x8b); in ih264_intra_pred_luma_4x4_mode_horz_u_ssse3() 1105 a0_8x16 = _mm_unpacklo_epi8(top_16x8, zero); in ih264_intra_pred_luma_8x8_mode_diag_dl_ssse3() [all …]
|
/external/libhevc/common/x86/ |
D | ihevc_inter_pred_filters_ssse3_intr.c | 335 … src_temp3_16x8b = _mm_unpacklo_epi8(src_temp1_16x8b, src_temp2_16x8b); /* row = 0 */ in ihevc_inter_pred_luma_horz_ssse3() 341 … src_temp4_16x8b = _mm_unpacklo_epi8(src_temp1_16x8b, src_temp2_16x8b); /* row = 0 */ in ihevc_inter_pred_luma_horz_ssse3() 347 … src_temp5_16x8b = _mm_unpacklo_epi8(src_temp1_16x8b, src_temp2_16x8b); /* row = 0 */ in ihevc_inter_pred_luma_horz_ssse3() 353 … src_temp6_16x8b = _mm_unpacklo_epi8(src_temp1_16x8b, src_temp2_16x8b); /* row = 0 */ in ihevc_inter_pred_luma_horz_ssse3() 368 … src_temp13_16x8b = _mm_unpacklo_epi8(src_temp11_16x8b, src_temp12_16x8b); /* row = 1 */ in ihevc_inter_pred_luma_horz_ssse3() 374 … src_temp14_16x8b = _mm_unpacklo_epi8(src_temp11_16x8b, src_temp12_16x8b); /* row = 1 */ in ihevc_inter_pred_luma_horz_ssse3() 380 … src_temp15_16x8b = _mm_unpacklo_epi8(src_temp11_16x8b, src_temp12_16x8b); /* row = 1 */ in ihevc_inter_pred_luma_horz_ssse3() 386 … src_temp16_16x8b = _mm_unpacklo_epi8(src_temp11_16x8b, src_temp12_16x8b); /* row = 1 */ in ihevc_inter_pred_luma_horz_ssse3() 424 … src_temp3_16x8b = _mm_unpacklo_epi8(src_temp1_16x8b, src_temp2_16x8b); /* row = 0 */ in ihevc_inter_pred_luma_horz_ssse3() 430 … src_temp4_16x8b = _mm_unpacklo_epi8(src_temp1_16x8b, src_temp2_16x8b); /* row = 0 */ in ihevc_inter_pred_luma_horz_ssse3() [all …]
|
D | ihevc_chroma_intra_pred_filters_ssse3_intr.c | 232 src_temp_8x16b = _mm_unpacklo_epi8(src_temp_8x16b, zero_8x16b); in ihevc_intra_pred_chroma_planar_ssse3() 349 src_temp5 = _mm_unpacklo_epi8(src_temp3, m_zero); in ihevc_intra_pred_chroma_dc_ssse3() 350 src_temp6 = _mm_unpacklo_epi8(src_temp4, m_zero); in ihevc_intra_pred_chroma_dc_ssse3() 351 src_temp9 = _mm_unpacklo_epi8(src_temp7, m_zero); in ihevc_intra_pred_chroma_dc_ssse3() 352 src_temp10 = _mm_unpacklo_epi8(src_temp8, m_zero); in ihevc_intra_pred_chroma_dc_ssse3() 359 src_temp3 = _mm_unpacklo_epi8(src_temp3, m_zero); in ihevc_intra_pred_chroma_dc_ssse3() 360 src_temp4 = _mm_unpacklo_epi8(src_temp4, m_zero); in ihevc_intra_pred_chroma_dc_ssse3() 361 src_temp7 = _mm_unpacklo_epi8(src_temp7, m_zero); in ihevc_intra_pred_chroma_dc_ssse3() 362 src_temp8 = _mm_unpacklo_epi8(src_temp8, m_zero); in ihevc_intra_pred_chroma_dc_ssse3() 391 src_temp5 = _mm_unpacklo_epi8(src_temp3, m_zero); in ihevc_intra_pred_chroma_dc_ssse3() [all …]
|
D | ihevc_deblk_ssse3_intr.c | 164 temp_coef0_8x16b = _mm_unpacklo_epi8(temp_coef0_8x16b, temp_coef1_8x16b); in ihevc_deblk_luma_vert_ssse3() 503 src_row0_8x16b = _mm_unpacklo_epi8(src_row0_8x16b, tmp2_const_8x16b); in ihevc_deblk_luma_vert_ssse3() 504 src_row1_8x16b = _mm_unpacklo_epi8(src_row1_8x16b, tmp2_const_8x16b); in ihevc_deblk_luma_vert_ssse3() 505 src_row2_8x16b = _mm_unpacklo_epi8(src_row2_8x16b, tmp2_const_8x16b); in ihevc_deblk_luma_vert_ssse3() 506 src_row3_8x16b = _mm_unpacklo_epi8(src_row3_8x16b, tmp2_const_8x16b); in ihevc_deblk_luma_vert_ssse3() 594 src_tmp_p_0_8x16b = _mm_unpacklo_epi8(src_p1_8x16b, src_p0_8x16b); in ihevc_deblk_luma_horz_ssse3() 595 src_tmp_p_1_8x16b = _mm_unpacklo_epi8(tmp_pq_str0_8x16b, src_p2_8x16b); in ihevc_deblk_luma_horz_ssse3() 597 src_tmp_q_0_8x16b = _mm_unpacklo_epi8(src_q0_8x16b, src_q1_8x16b); in ihevc_deblk_luma_horz_ssse3() 598 src_tmp_q_1_8x16b = _mm_unpacklo_epi8(src_q2_8x16b, tmp_pq_str1_8x16b); in ihevc_deblk_luma_horz_ssse3() 624 temp_coef0_8x16b = _mm_unpacklo_epi8(temp_coef0_8x16b, temp_coef1_8x16b); in ihevc_deblk_luma_horz_ssse3() [all …]
|
/external/libhevc/decoder/x86/ |
D | ihevcd_it_rec_dc_sse42_intr.c | 105 m_temp_reg_4 = _mm_unpacklo_epi8(m_temp_reg_4, zero_8x16b); in ihevcd_itrans_recon_dc_luma_sse42() 106 m_temp_reg_5 = _mm_unpacklo_epi8(m_temp_reg_5, zero_8x16b); in ihevcd_itrans_recon_dc_luma_sse42() 146 m_temp_reg_4 = _mm_unpacklo_epi8(m_temp_reg_0, zero_8x16b); in ihevcd_itrans_recon_dc_luma_sse42() 147 m_temp_reg_5 = _mm_unpacklo_epi8(m_temp_reg_1, zero_8x16b); in ihevcd_itrans_recon_dc_luma_sse42() 148 m_temp_reg_6 = _mm_unpacklo_epi8(m_temp_reg_2, zero_8x16b); in ihevcd_itrans_recon_dc_luma_sse42() 149 m_temp_reg_7 = _mm_unpacklo_epi8(m_temp_reg_3, zero_8x16b); in ihevcd_itrans_recon_dc_luma_sse42() 257 m_temp_reg_4 = _mm_unpacklo_epi8(m_temp_reg_14, zero_8x16b); in ihevcd_itrans_recon_dc_chroma_sse42() 258 m_temp_reg_5 = _mm_unpacklo_epi8(m_temp_reg_15, zero_8x16b); in ihevcd_itrans_recon_dc_chroma_sse42() 276 m_temp_reg_9 = _mm_unpacklo_epi8(m_temp_reg_8, m_temp_reg_0); in ihevcd_itrans_recon_dc_chroma_sse42() 278 m_temp_reg_10 = _mm_unpacklo_epi8(m_temp_reg_8, m_temp_reg_1); in ihevcd_itrans_recon_dc_chroma_sse42() [all …]
|
D | ihevcd_it_rec_dc_ssse3_intr.c | 106 m_temp_reg_4 = _mm_unpacklo_epi8(m_temp_reg_4, zero_8x16b); in ihevcd_itrans_recon_dc_luma_ssse3() 107 m_temp_reg_5 = _mm_unpacklo_epi8(m_temp_reg_5, zero_8x16b); in ihevcd_itrans_recon_dc_luma_ssse3() 147 m_temp_reg_4 = _mm_unpacklo_epi8(m_temp_reg_0, zero_8x16b); in ihevcd_itrans_recon_dc_luma_ssse3() 148 m_temp_reg_5 = _mm_unpacklo_epi8(m_temp_reg_1, zero_8x16b); in ihevcd_itrans_recon_dc_luma_ssse3() 149 m_temp_reg_6 = _mm_unpacklo_epi8(m_temp_reg_2, zero_8x16b); in ihevcd_itrans_recon_dc_luma_ssse3() 150 m_temp_reg_7 = _mm_unpacklo_epi8(m_temp_reg_3, zero_8x16b); in ihevcd_itrans_recon_dc_luma_ssse3() 257 m_temp_reg_4 = _mm_unpacklo_epi8(m_temp_reg_14, zero_8x16b); in ihevcd_itrans_recon_dc_chroma_ssse3() 258 m_temp_reg_5 = _mm_unpacklo_epi8(m_temp_reg_15, zero_8x16b); in ihevcd_itrans_recon_dc_chroma_ssse3() 276 m_temp_reg_9 = _mm_unpacklo_epi8(m_temp_reg_8, m_temp_reg_0); in ihevcd_itrans_recon_dc_chroma_ssse3() 278 m_temp_reg_10 = _mm_unpacklo_epi8(m_temp_reg_8, m_temp_reg_1); in ihevcd_itrans_recon_dc_chroma_ssse3() [all …]
|
/external/libvpx/libvpx/vpx_dsp/x86/ |
D | avg_intrin_sse2.c | 23 s0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(s)), u0); in vpx_minmax_8x8_sse2() 24 d0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(d)), u0); in vpx_minmax_8x8_sse2() 29 s0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(s + p)), u0); in vpx_minmax_8x8_sse2() 30 d0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(d + dp)), u0); in vpx_minmax_8x8_sse2() 37 s0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(s + 2 * p)), u0); in vpx_minmax_8x8_sse2() 38 d0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(d + 2 * dp)), u0); in vpx_minmax_8x8_sse2() 45 s0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(s + 3 * p)), u0); in vpx_minmax_8x8_sse2() 46 d0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(d + 3 * dp)), u0); in vpx_minmax_8x8_sse2() 53 s0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(s + 4 * p)), u0); in vpx_minmax_8x8_sse2() 54 d0 = _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)(d + 4 * dp)), u0); in vpx_minmax_8x8_sse2() [all …]
|
D | vpx_subpixel_4t_intrin_sse2.c | 161 src_reg_m10_lo = _mm_unpacklo_epi8(src_reg_m1, src_reg_0); in vpx_filter_block1d16_v4_sse2() 163 src_reg_m10_lo_1 = _mm_unpacklo_epi8(src_reg_m10_lo, _mm_setzero_si128()); in vpx_filter_block1d16_v4_sse2() 165 src_reg_m10_hi_1 = _mm_unpacklo_epi8(src_reg_m10_hi, _mm_setzero_si128()); in vpx_filter_block1d16_v4_sse2() 170 src_reg_01_lo = _mm_unpacklo_epi8(src_reg_0, src_reg_1); in vpx_filter_block1d16_v4_sse2() 172 src_reg_01_lo_1 = _mm_unpacklo_epi8(src_reg_01_lo, _mm_setzero_si128()); in vpx_filter_block1d16_v4_sse2() 174 src_reg_01_hi_1 = _mm_unpacklo_epi8(src_reg_01_hi, _mm_setzero_si128()); in vpx_filter_block1d16_v4_sse2() 180 src_reg_12_lo = _mm_unpacklo_epi8(src_reg_1, src_reg_2); in vpx_filter_block1d16_v4_sse2() 185 src_reg_23_lo = _mm_unpacklo_epi8(src_reg_2, src_reg_3); in vpx_filter_block1d16_v4_sse2() 195 src_reg_12_lo_1 = _mm_unpacklo_epi8(src_reg_12_lo, _mm_setzero_si128()); in vpx_filter_block1d16_v4_sse2() 200 src_reg_23_lo_1 = _mm_unpacklo_epi8(src_reg_23_lo, _mm_setzero_si128()); in vpx_filter_block1d16_v4_sse2() [all …]
|
D | loopfilter_sse2.c | 33 _mm_unpacklo_epi8(_mm_max_epu8(flat, _mm_srli_si128(flat, 8)), zero); \ 84 filter2filter1 = _mm_unpacklo_epi8(filter2filter1, filter2filter1); \ 91 filter = _mm_unpacklo_epi8(filter, filter); \ 114 _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)thresh), zero); in vpx_lpf_horizontal_4_sse2() 148 _mm_unpacklo_epi8(_mm_loadl_epi64((const __m128i *)thresh), zero); in vpx_lpf_vertical_4_sse2() 155 q1q0 = _mm_unpacklo_epi8(_mm_loadl_epi64((__m128i *)(s + 0 * pitch - 4)), in vpx_lpf_vertical_4_sse2() 159 x1 = _mm_unpacklo_epi8(_mm_loadl_epi64((__m128i *)(s + 2 * pitch - 4)), in vpx_lpf_vertical_4_sse2() 163 x2 = _mm_unpacklo_epi8(_mm_loadl_epi64((__m128i *)(s + 4 * pitch - 4)), in vpx_lpf_vertical_4_sse2() 167 x3 = _mm_unpacklo_epi8(_mm_loadl_epi64((__m128i *)(s + 6 * pitch - 4)), in vpx_lpf_vertical_4_sse2() 208 ps1ps0 = _mm_unpacklo_epi8(ps1ps0, qs1qs0); in vpx_lpf_vertical_4_sse2() [all …]
|
/external/webp/src/dsp/ |
D | lossless_sse2.c | 31 const __m128i C0 = _mm_unpacklo_epi8(_mm_cvtsi32_si128(c0), zero); in ClampedAddSubtractFull_SSE2() 32 const __m128i C1 = _mm_unpacklo_epi8(_mm_cvtsi32_si128(c1), zero); in ClampedAddSubtractFull_SSE2() 33 const __m128i C2 = _mm_unpacklo_epi8(_mm_cvtsi32_si128(c2), zero); in ClampedAddSubtractFull_SSE2() 45 const __m128i C0 = _mm_unpacklo_epi8(_mm_cvtsi32_si128(c0), zero); in ClampedAddSubtractHalf_SSE2() 46 const __m128i C1 = _mm_unpacklo_epi8(_mm_cvtsi32_si128(c1), zero); in ClampedAddSubtractHalf_SSE2() 47 const __m128i B0 = _mm_unpacklo_epi8(_mm_cvtsi32_si128(c2), zero); in ClampedAddSubtractHalf_SSE2() 72 const __m128i pa = _mm_unpacklo_epi8(AC, zero); // |a - c| in Select_SSE2() 73 const __m128i pb = _mm_unpacklo_epi8(BC, zero); // |b - c| in Select_SSE2() 107 const __m128i A0 = _mm_unpacklo_epi8(_mm_cvtsi32_si128(a0), zero); in Average2_uint32_16_SSE2() 108 const __m128i A1 = _mm_unpacklo_epi8(_mm_cvtsi32_si128(a1), zero); in Average2_uint32_16_SSE2() [all …]
|
D | common_sse2.h | 167 const __m128i A0 = _mm_unpacklo_epi8(*in0, *in1); in VP8L32bToPlanar_SSE2() 169 const __m128i A2 = _mm_unpacklo_epi8(*in2, *in3); in VP8L32bToPlanar_SSE2() 171 const __m128i B0 = _mm_unpacklo_epi8(A0, A1); in VP8L32bToPlanar_SSE2() 173 const __m128i B2 = _mm_unpacklo_epi8(A2, A3); in VP8L32bToPlanar_SSE2() 177 const __m128i C0 = _mm_unpacklo_epi8(B0, B1); in VP8L32bToPlanar_SSE2() 179 const __m128i C2 = _mm_unpacklo_epi8(B2, B3); in VP8L32bToPlanar_SSE2()
|
/external/libavc/encoder/x86/ |
D | ih264e_half_pel_ssse3.c | 138 …src_r0_t1_16x8b = _mm_unpacklo_epi8(src_r0_16x8b, src_r0_sht_16x8b); //a0 a1 a1 a2 a2 a3 a3 a4… in ih264e_sixtapfilter_horz_ssse3() 139 …src_r1_t1_16x8b = _mm_unpacklo_epi8(src_r1_16x8b, src_r1_sht_16x8b); //b0 b1 b1 b2 b2 b3 b3 b4… in ih264e_sixtapfilter_horz_ssse3() 152 …src_r0_t1_16x8b = _mm_unpacklo_epi8(src_r0_16x8b, src_r0_sht_16x8b); //a2 a3 a3 a4 a4 a5 a5 a6… in ih264e_sixtapfilter_horz_ssse3() 153 …src_r1_t1_16x8b = _mm_unpacklo_epi8(src_r1_16x8b, src_r1_sht_16x8b); //b2 b3 b3 b4 b4 b5 b5 b6… in ih264e_sixtapfilter_horz_ssse3() 166 …src_r0_t1_16x8b = _mm_unpacklo_epi8(src_r0_16x8b, src_r0_sht_16x8b); //a4 a5 a5 a6 a6 a7 a7 a8… in ih264e_sixtapfilter_horz_ssse3() 167 …src_r1_t1_16x8b = _mm_unpacklo_epi8(src_r1_16x8b, src_r1_sht_16x8b); //b4 b5 b5 b6 b6 b7 b7 b8… in ih264e_sixtapfilter_horz_ssse3() 308 src_r0r1_16x8b = _mm_unpacklo_epi8(src1_r0_16x8b, src1_r1_16x8b); in ih264e_sixtap_filter_2dvh_vert_ssse3() 309 src_r2r3_16x8b = _mm_unpacklo_epi8(src1_r2_16x8b, src1_r3_16x8b); in ih264e_sixtap_filter_2dvh_vert_ssse3() 310 src_r4r5_16x8b = _mm_unpacklo_epi8(src1_r4_16x8b, src1_r5_16x8b); in ih264e_sixtap_filter_2dvh_vert_ssse3() 334 src_r0r1_16x8b = _mm_unpacklo_epi8(src2_r0_16x8b, src2_r1_16x8b); in ih264e_sixtap_filter_2dvh_vert_ssse3() [all …]
|
/external/libmpeg2/common/x86/ |
D | ideint_spatial_filter_ssse3.c | 125 row1_m1 = _mm_unpacklo_epi8(row1_m1, zero); in ideint_spatial_filter_ssse3() 126 row1_0 = _mm_unpacklo_epi8(row1_0, zero); in ideint_spatial_filter_ssse3() 127 row1_p1 = _mm_unpacklo_epi8(row1_p1, zero); in ideint_spatial_filter_ssse3() 140 row2_m1 = _mm_unpacklo_epi8(row2_m1, zero); in ideint_spatial_filter_ssse3() 141 row2_0 = _mm_unpacklo_epi8(row2_0, zero); in ideint_spatial_filter_ssse3() 142 row2_p1 = _mm_unpacklo_epi8(row2_p1, zero); in ideint_spatial_filter_ssse3()
|