1 /******************************************************************************
2  *
3  * Copyright (C) 2015 The Android Open Source Project
4  *
5  * Licensed under the Apache License, Version 2.0 (the "License");
6  * you may not use this file except in compliance with the License.
7  * You may obtain a copy of the License at:
8  *
9  * http://www.apache.org/licenses/LICENSE-2.0
10  *
11  * Unless required by applicable law or agreed to in writing, software
12  * distributed under the License is distributed on an "AS IS" BASIS,
13  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14  * See the License for the specific language governing permissions and
15  * limitations under the License.
16  *
17  *****************************************************************************
18  * Originally developed and contributed by Ittiam Systems Pvt. Ltd, Bangalore
19 */
20 
21 /*!
22  **************************************************************************
23  * \file ih264d_thread_compute_bs.c
24  *
25  * \brief
26  *    Contains routines that for multi-thread decoder
27  *
28  * Detailed_description
29  *
30  * \date
31  *    20/02/2012
32  *
33  * \author  ZR
34  **************************************************************************
35  */
36 #include "ih264d_error_handler.h"
37 #include "ih264d_debug.h"
38 #include <string.h>
39 #include "ih264d_defs.h"
40 #include "ih264d_debug.h"
41 #include "ih264d_tables.h"
42 #include "ih264d_structs.h"
43 #include "ih264d_defs.h"
44 #include "ih264d_mb_utils.h"
45 
46 #include "ih264d_thread_compute_bs.h"
47 #include "ithread.h"
48 #include "ih264d_deblocking.h"
49 #include "ih264d_process_pslice.h"
50 #include "ih264d_process_intra_mb.h"
51 #include "ih264d_mb_utils.h"
52 #include "ih264d_tables.h"
53 #include "ih264d_format_conv.h"
54 #include "ih264d_defs.h"
55 UWORD16 ih264d_update_csbp_8x8(UWORD16 u2_luma_csbp);
56 void ih264d_fill_bs2_horz_vert(UWORD32 *pu4_bs, /* Base pointer of BS table */
57                                WORD32 u4_left_mb_csbp, /* csbp of left mb */
58                                WORD32 u4_top_mb_csbp, /* csbp of top mb */
59                                WORD32 u4_cur_mb_csbp, /* csbp of current mb */
60                                const UWORD32 *pu4_packed_bs2, const UWORD16 *pu2_4x4_v2h_reorder);
61 void ih264d_copy_intra_pred_line(dec_struct_t *ps_dec,
62                                  dec_mb_info_t *ps_cur_mb_info,
63                                  UWORD32 nmb_index);
64 
65 #define BS_MB_GROUP 4
66 #define DEBLK_MB_GROUP 1
67 #define FORMAT_CONV_MB_GROUP 4
68 
69 /*****************************************************************************/
70 /*                                                                           */
71 /*  Function Name : ih264d_compute_bs_non_mbaff_thread                                           */
72 /*                                                                           */
73 /*  Description   : This function computes the pointers of left,top & current*/
74 /*                : Nnz, MvPred & deblk_mb_t and supplies to FillBs function for*/
75 /*                : Boundary Strength Calculation .this function is used     */
76 /*                : BS being calculated in separate thread                   */
77 /*  Inputs        : pointer to decoder context,cur_mb_info,u4_mb_num            */
78 /*  Processing    :                                                          */
79 /*                                                                           */
80 /*  Outputs       : Produces the Boundary Strength for Current Mb            */
81 /*  Returns       : None                                                     */
82 /*                                                                           */
83 /*  Revision History:                                                        */
84 /*                                                                           */
85 /*         DD MM YYYY   Author(s)       Changes (Describe the changes made)  */
86 /*                      ITTIAM                                               */
87 /*****************************************************************************/
88 
ih264d_compute_bs_non_mbaff_thread(dec_struct_t * ps_dec,dec_mb_info_t * ps_cur_mb_info,UWORD32 u4_mb_num)89 void ih264d_compute_bs_non_mbaff_thread(dec_struct_t * ps_dec,
90                                         dec_mb_info_t * ps_cur_mb_info,
91                                         UWORD32 u4_mb_num)
92 {
93     /* Mvpred and Nnz for top and Courrent */
94     mv_pred_t *ps_cur_mv_pred, *ps_top_mv_pred = NULL, *ps_left_mv_pred;
95     /* deblk_mb_t Params */
96     deblk_mb_t *ps_cur_mb_params; /*< Parameters of current MacroBlock */
97     deblkmb_neighbour_t *ps_deblk_top_mb;
98 
99     /* Reference Index to POC mapping*/
100     void ** apv_map_ref_idx_to_poc;
101     UWORD32 u4_leftmbtype;
102 
103     UWORD16 u2_left_csbp, u2_top_csbp, u2_cur_csbp;
104 
105     /* Set of flags */
106     UWORD32 u4_cur_mb_intra, u1_top_mb_typ, u4_cur_mb_fld;
107     UWORD32 u1_cur_mb_type;
108     UWORD32 * pu4_bs_table;
109 
110     /* Neighbour availability */
111     /* Initialization */
112     const UWORD32 u2_mbx = ps_cur_mb_info->u2_mbx;
113     const UWORD32 u2_mby = ps_cur_mb_info->u2_mby;
114     const UWORD32 u1_pingpong = u2_mbx & 0x01;
115 
116     PROFILE_DISABLE_BOUNDARY_STRENGTH()
117     ps_deblk_top_mb = ps_dec->ps_deblk_top_mb + u2_mbx;
118 
119     /* Pointer assignment for Current DeblkMB, Current Mv Pred  */
120     ps_cur_mb_params = ps_dec->ps_deblk_pic + u4_mb_num;
121     ps_cur_mv_pred = ps_dec->s_cur_pic.ps_mv + (u4_mb_num << 4);
122 
123     apv_map_ref_idx_to_poc =
124                     (void **)ps_dec->ps_computebs_cur_slice->ppv_map_ref_idx_to_poc
125                                     + 1;
126     u1_cur_mb_type = ps_cur_mb_params->u1_mb_type;
127     u1_top_mb_typ = ps_deblk_top_mb->u1_mb_type;
128     ps_deblk_top_mb->u1_mb_type = u1_cur_mb_type;
129 
130     {
131         ps_cur_mb_params->u1_topmb_qp = ps_deblk_top_mb->u1_mb_qp;
132         ps_deblk_top_mb->u1_mb_qp = ps_cur_mb_params->u1_mb_qp;
133 
134         ps_cur_mb_params->u1_left_mb_qp = ps_dec->deblk_left_mb[1].u1_mb_qp;
135         ps_dec->deblk_left_mb[1].u1_mb_qp = ps_cur_mb_params->u1_mb_qp;
136 
137     }
138 
139     /* if no deblocking required for current Mb then continue */
140     /* Check next Mbs   in Mb group                           */
141     if(ps_cur_mb_params->u1_deblocking_mode & MB_DISABLE_FILTERING)
142     {
143         void ** pu4_map_ref_idx_to_poc_l1 = apv_map_ref_idx_to_poc +
144         POC_LIST_L0_TO_L1_DIFF;
145         {
146             /* Store Parameter for Top MvPred refernce frame Address */
147 
148             void ** ppv_top_mv_pred_addr = ps_cur_mb_info->ps_curmb->u4_pic_addrress;
149             WORD8 * p1_refTop0 = (ps_cur_mv_pred + 12)->i1_ref_frame;
150             WORD8 * p1_refTop1 = (ps_cur_mv_pred + 14)->i1_ref_frame;
151 
152             /* Store Left addresses for Next Mb   */
153             void ** ppv_left_mv_pred_addr =
154                             ps_dec->ps_left_mvpred_addr[!u1_pingpong][1].u4_add;
155             WORD8 * p1_refleft0 = (ps_cur_mv_pred + 3)->i1_ref_frame;
156 
157 
158             ppv_top_mv_pred_addr[0] = apv_map_ref_idx_to_poc[p1_refTop0[0]];
159             ppv_top_mv_pred_addr[1] = pu4_map_ref_idx_to_poc_l1[p1_refTop0[1]];
160 
161             ppv_left_mv_pred_addr[2] = apv_map_ref_idx_to_poc[p1_refTop1[0]];
162             ppv_top_mv_pred_addr[2] = apv_map_ref_idx_to_poc[p1_refTop1[0]];
163             ppv_left_mv_pred_addr[3] = pu4_map_ref_idx_to_poc_l1[p1_refTop1[1]];
164             ppv_top_mv_pred_addr[3] = pu4_map_ref_idx_to_poc_l1[p1_refTop1[1]];
165 
166             ppv_left_mv_pred_addr[0] = apv_map_ref_idx_to_poc[p1_refleft0[0]];
167             ppv_left_mv_pred_addr[1] = pu4_map_ref_idx_to_poc_l1[p1_refleft0[1]];
168             //}
169             /* Storing the leftMbtype for next Mb */
170             ps_dec->deblk_left_mb[1].u1_mb_type = ps_cur_mb_params->u1_mb_type;
171         }
172 
173         return;
174     }
175 
176     /* Flag for extra left Edge */
177     ps_cur_mb_params->u1_single_call = 1;
178 
179     /* Update the Left deblk_mb_t and Left MvPred Parameters           */
180     if(!u2_mbx)
181     {
182         u4_leftmbtype = 0;
183 
184         /* Initialize the ps_left_mv_pred with Junk but Valid Location */
185         /* to avoid invalid memory access                           */
186         /* this is read only pointer                                */
187         ps_left_mv_pred = ps_cur_mv_pred + 3;
188     }
189     else
190     {
191         u4_leftmbtype = ps_dec->deblk_left_mb[1].u1_mb_type;
192 
193         /* Come to Left Most Edge of the MB */
194         ps_left_mv_pred = ps_cur_mv_pred - (1 << 4) + 3;
195     }
196 
197     if(!u2_mby)
198         u1_top_mb_typ = 0;
199 
200     /* MvPred Pointer Calculation */
201     /* CHANGED CODE */
202     ps_top_mv_pred = ps_cur_mv_pred - (ps_dec->u2_frm_wd_in_mbs << 4) + 12;
203 
204     u4_cur_mb_intra = u1_cur_mb_type & D_INTRA_MB;
205     u4_cur_mb_fld = !!(u1_cur_mb_type & D_FLD_MB);
206     /* Compute BS function */
207     pu4_bs_table = ps_cur_mb_params->u4_bs_table;
208 
209     u2_cur_csbp = ps_cur_mb_info->ps_curmb->u2_luma_csbp;
210     u2_left_csbp = ps_cur_mb_info->ps_left_mb->u2_luma_csbp;
211     u2_top_csbp = ps_cur_mb_info->ps_top_mb->u2_luma_csbp;
212 
213     /* Compute BS function */
214     if(ps_dec->ps_cur_sps->u1_profile_idc == HIGH_PROFILE_IDC)
215     {
216         if(ps_cur_mb_info->u1_tran_form8x8 == 1)
217         {
218             u2_cur_csbp = ih264d_update_csbp_8x8(
219                             ps_cur_mb_info->ps_curmb->u2_luma_csbp);
220         }
221 
222         if(ps_cur_mb_info->ps_left_mb->u1_tran_form8x8 == 1)
223         {
224             u2_left_csbp = ih264d_update_csbp_8x8(
225                             ps_cur_mb_info->ps_left_mb->u2_luma_csbp);
226         }
227 
228         if(ps_cur_mb_info->ps_top_mb->u1_tran_form8x8 == 1)
229         {
230             u2_top_csbp = ih264d_update_csbp_8x8(
231                             ps_cur_mb_info->ps_top_mb->u2_luma_csbp);
232         }
233     }
234     if(u4_cur_mb_intra)
235     {
236 
237         pu4_bs_table[4] = 0x04040404;
238         pu4_bs_table[0] = u4_cur_mb_fld ? 0x03030303 : 0x04040404;
239         pu4_bs_table[1] = 0x03030303;
240         pu4_bs_table[2] = 0x03030303;
241         pu4_bs_table[3] = 0x03030303;
242         pu4_bs_table[5] = 0x03030303;
243         pu4_bs_table[6] = 0x03030303;
244         pu4_bs_table[7] = 0x03030303;
245     }
246     else
247     {
248         UWORD32 u4_is_non16x16 = !!(u1_cur_mb_type & D_PRED_NON_16x16);
249         UWORD32 u4_is_b =
250                         (ps_dec->ps_computebs_cur_slice->slice_type == B_SLICE);
251 
252 
253 
254 
255 
256 
257         ih264d_fill_bs2_horz_vert(pu4_bs_table, u2_left_csbp, u2_top_csbp,
258                                   u2_cur_csbp, gau4_ih264d_packed_bs2,
259                                   gau2_ih264d_4x4_v2h_reorder);
260 
261         if(u4_leftmbtype & D_INTRA_MB)
262             pu4_bs_table[4] = 0x04040404;
263 
264         if(u1_top_mb_typ & D_INTRA_MB)
265             pu4_bs_table[0] = u4_cur_mb_fld ? 0x03030303 : 0x04040404;
266 
267         ps_dec->pf_fill_bs1[u4_is_b][u4_is_non16x16](
268                         ps_cur_mv_pred, ps_top_mv_pred, apv_map_ref_idx_to_poc,
269                         pu4_bs_table, ps_left_mv_pred,
270                         &(ps_dec->ps_left_mvpred_addr[u1_pingpong][1]),
271                         ps_cur_mb_info->ps_top_mb->u4_pic_addrress,
272                         (4 >> u4_cur_mb_fld));
273     }
274 
275     {
276         void ** pu4_map_ref_idx_to_poc_l1 = apv_map_ref_idx_to_poc +
277         POC_LIST_L0_TO_L1_DIFF;
278         {
279             /* Store Parameter for Top MvPred refernce frame Address */
280 
281             void ** ppv_top_mv_pred_addr = ps_cur_mb_info->ps_curmb->u4_pic_addrress;
282             WORD8 * p1_refTop0 = (ps_cur_mv_pred + 12)->i1_ref_frame;
283             WORD8 * p1_refTop1 = (ps_cur_mv_pred + 14)->i1_ref_frame;
284 
285             /* Store Left addresses for Next Mb   */
286             void ** ppv_left_mv_pred_addr =
287                             ps_dec->ps_left_mvpred_addr[!u1_pingpong][1].u4_add;
288             WORD8 * p1_refleft0 = (ps_cur_mv_pred + 3)->i1_ref_frame;
289 
290             ppv_top_mv_pred_addr[0] = apv_map_ref_idx_to_poc[p1_refTop0[0]];
291             ppv_top_mv_pred_addr[1] = pu4_map_ref_idx_to_poc_l1[p1_refTop0[1]];
292 
293             ppv_left_mv_pred_addr[2] = apv_map_ref_idx_to_poc[p1_refTop1[0]];
294             ppv_top_mv_pred_addr[2] = apv_map_ref_idx_to_poc[p1_refTop1[0]];
295             ppv_left_mv_pred_addr[3] = pu4_map_ref_idx_to_poc_l1[p1_refTop1[1]];
296             ppv_top_mv_pred_addr[3] = pu4_map_ref_idx_to_poc_l1[p1_refTop1[1]];
297 
298             ppv_left_mv_pred_addr[0] = apv_map_ref_idx_to_poc[p1_refleft0[0]];
299             ppv_left_mv_pred_addr[1] = pu4_map_ref_idx_to_poc_l1[p1_refleft0[1]];
300 
301             /* Storing the leftMbtype for next Mb */
302             ps_dec->deblk_left_mb[1].u1_mb_type = ps_cur_mb_params->u1_mb_type;
303 
304         }
305     }
306 
307     /* For transform 8x8 disable deblocking of the intrernal edges of a 8x8 block */
308     if(ps_cur_mb_info->u1_tran_form8x8)
309     {
310         pu4_bs_table[1] = 0;
311         pu4_bs_table[3] = 0;
312         pu4_bs_table[5] = 0;
313         pu4_bs_table[7] = 0;
314     }
315 }
316 
317 
ih264d_check_mb_map_deblk(dec_struct_t * ps_dec,UWORD32 deblk_mb_grp,tfr_ctxt_t * ps_tfr_cxt,UWORD32 u4_check_mb_map)318 void ih264d_check_mb_map_deblk(dec_struct_t *ps_dec,
319                                     UWORD32 deblk_mb_grp,
320                                     tfr_ctxt_t *ps_tfr_cxt,
321                                     UWORD32 u4_check_mb_map)
322 {
323     UWORD32 i = 0;
324     UWORD32 u4_mb_num;
325     UWORD32 u4_cond;
326     volatile UWORD8 *mb_map = ps_dec->pu1_recon_mb_map;
327     const WORD32 i4_cb_qp_idx_ofst =
328                     ps_dec->ps_cur_pps->i1_chroma_qp_index_offset;
329     const WORD32 i4_cr_qp_idx_ofst =
330                     ps_dec->ps_cur_pps->i1_second_chroma_qp_index_offset;
331 
332     UWORD32 u4_wd_y, u4_wd_uv;
333     UWORD8 u1_field_pic_flag = ps_dec->ps_cur_slice->u1_field_pic_flag;
334 
335 
336     u4_wd_y = ps_dec->u2_frm_wd_y << u1_field_pic_flag;
337     u4_wd_uv = ps_dec->u2_frm_wd_uv << u1_field_pic_flag;
338 
339 
340     for(i = 0; i < deblk_mb_grp; i++)
341     {
342         WORD32 nop_cnt = 8*128;
343         while(u4_check_mb_map == 1)
344         {
345             u4_mb_num = ps_dec->u4_cur_deblk_mb_num;
346             /*we wait for the right mb because of intra pred data dependency*/
347             u4_mb_num = MIN(u4_mb_num + 1, (ps_dec->u4_deblk_mb_y + 1) * ps_dec->u2_frm_wd_in_mbs - 1);
348             CHECK_MB_MAP_BYTE(u4_mb_num, mb_map, u4_cond);
349 
350             if(u4_cond)
351             {
352                 break;
353             }
354             else
355             {
356                 if(nop_cnt > 0)
357                 {
358                     nop_cnt -= 128;
359                     NOP(128);
360                 }
361                 else
362                 {
363                     nop_cnt = 8*128;
364                     ithread_yield();
365                 }
366             }
367         }
368 
369         ih264d_deblock_mb_nonmbaff(ps_dec, ps_tfr_cxt,
370                                    i4_cb_qp_idx_ofst, i4_cr_qp_idx_ofst,
371                                     u4_wd_y, u4_wd_uv);
372 
373 
374     }
375 
376 
377 }
ih264d_recon_deblk_slice(dec_struct_t * ps_dec,tfr_ctxt_t * ps_tfr_cxt)378 void ih264d_recon_deblk_slice(dec_struct_t *ps_dec, tfr_ctxt_t *ps_tfr_cxt)
379 {
380     dec_mb_info_t *p_cur_mb;
381     UWORD32 u4_max_addr;
382     WORD32 i;
383     UWORD32 u1_mb_aff;
384     UWORD16 u2_slice_num;
385     UWORD32 u4_mb_num;
386     UWORD16 u2_first_mb_in_slice;
387     UWORD32 i2_pic_wdin_mbs;
388     UWORD8 u1_num_mbsleft, u1_end_of_row;
389     UWORD8 u1_mbaff;
390     UWORD16 i16_mb_x, i16_mb_y;
391     WORD32 j;
392     dec_mb_info_t * ps_cur_mb_info;
393     UWORD32 u1_slice_type, u1_B;
394     WORD32 u1_skip_th;
395     UWORD32 u1_ipcm_th;
396     WORD32 ret;
397     tfr_ctxt_t *ps_trns_addr;
398     UWORD32 u4_frame_stride;
399     UWORD32 x_offset, y_offset;
400     UWORD32 u4_slice_end;
401     pad_mgr_t *ps_pad_mgr ;
402 
403     /*check for mb map of first mb in slice to ensure slice header is parsed*/
404     while(1)
405     {
406         UWORD32 u4_mb_num = ps_dec->cur_recon_mb_num;
407         UWORD32 u4_cond = 0;
408         WORD32 nop_cnt = 8*128;
409 
410         CHECK_MB_MAP_BYTE(u4_mb_num, ps_dec->pu1_recon_mb_map, u4_cond);
411         if(u4_cond)
412         {
413             break;
414         }
415         else
416         {
417             if(nop_cnt > 0)
418             {
419                 nop_cnt -= 128;
420                 NOP(128);
421             }
422             else
423             {
424                 if(ps_dec->u4_output_present &&
425                    (ps_dec->u4_fmt_conv_cur_row < ps_dec->s_disp_frame_info.u4_y_ht))
426                 {
427                     ps_dec->u4_fmt_conv_num_rows =
428                                     MIN(FMT_CONV_NUM_ROWS,
429                                         (ps_dec->s_disp_frame_info.u4_y_ht
430                                                         - ps_dec->u4_fmt_conv_cur_row));
431                     ih264d_format_convert(ps_dec, &(ps_dec->s_disp_op),
432                                           ps_dec->u4_fmt_conv_cur_row,
433                                           ps_dec->u4_fmt_conv_num_rows);
434                     ps_dec->u4_fmt_conv_cur_row += ps_dec->u4_fmt_conv_num_rows;
435                 }
436                 else
437                 {
438                     nop_cnt = 8*128;
439                     ithread_yield();
440                 }
441             }
442             DEBUG_THREADS_PRINTF("waiting for mb mapcur_dec_mb_num = %d,ps_dec->u2_cur_mb_addr  = %d\n",u2_cur_dec_mb_num,
443                             ps_dec->u2_cur_mb_addr);
444 
445         }
446     }
447 
448     u4_max_addr = ps_dec->ps_cur_sps->u2_max_mb_addr;
449     u1_mb_aff = ps_dec->ps_cur_slice->u1_mbaff_frame_flag;
450     u2_first_mb_in_slice = ps_dec->ps_computebs_cur_slice->u4_first_mb_in_slice;
451     i2_pic_wdin_mbs = ps_dec->u2_frm_wd_in_mbs;
452     u1_mbaff = ps_dec->ps_cur_slice->u1_mbaff_frame_flag;
453     ps_pad_mgr = &ps_dec->s_pad_mgr;
454 
455     if(u2_first_mb_in_slice == 0)
456     ih264d_init_deblk_tfr_ctxt(ps_dec, ps_pad_mgr, ps_tfr_cxt,
457                                ps_dec->u2_frm_wd_in_mbs, 0);
458 
459 
460     i16_mb_x = MOD(u2_first_mb_in_slice, i2_pic_wdin_mbs);
461     i16_mb_y = DIV(u2_first_mb_in_slice, i2_pic_wdin_mbs);
462     i16_mb_y <<= u1_mbaff;
463     ps_dec->i2_recon_thread_mb_y = i16_mb_y;
464     u4_frame_stride = ps_dec->u2_frm_wd_y
465                     << ps_dec->ps_cur_slice->u1_field_pic_flag;
466 
467     x_offset = i16_mb_x << 4;
468     y_offset = (i16_mb_y * u4_frame_stride) << 4;
469     ps_trns_addr = &ps_dec->s_tran_iprecon;
470 
471     ps_trns_addr->pu1_dest_y = ps_dec->s_cur_pic.pu1_buf1 + x_offset + y_offset;
472 
473     u4_frame_stride = ps_dec->u2_frm_wd_uv
474                     << ps_dec->ps_cur_slice->u1_field_pic_flag;
475     x_offset >>= 1;
476     y_offset = (i16_mb_y * u4_frame_stride) << 3;
477 
478     x_offset *= YUV420SP_FACTOR;
479 
480     ps_trns_addr->pu1_dest_u = ps_dec->s_cur_pic.pu1_buf2 + x_offset + y_offset;
481     ps_trns_addr->pu1_dest_v = ps_dec->s_cur_pic.pu1_buf3 + x_offset + y_offset;
482 
483     ps_trns_addr->pu1_mb_y = ps_trns_addr->pu1_dest_y;
484     ps_trns_addr->pu1_mb_u = ps_trns_addr->pu1_dest_u;
485     ps_trns_addr->pu1_mb_v = ps_trns_addr->pu1_dest_v;
486 
487     ps_dec->cur_recon_mb_num = u2_first_mb_in_slice << u1_mbaff;
488 
489     u4_slice_end = 0;
490     ps_dec->u4_bs_cur_slice_num_mbs = 0;
491     ps_dec->u4_cur_bs_mb_num =
492                     (ps_dec->ps_computebs_cur_slice->u4_first_mb_in_slice)
493                                     << u1_mb_aff;
494 
495     if(ps_dec->i1_recon_in_thread3_flag)
496     {
497         ps_dec->pv_proc_tu_coeff_data =
498                 (void *) ps_dec->ps_computebs_cur_slice->pv_tu_coeff_data_start;
499     }
500 
501     u1_slice_type = ps_dec->ps_computebs_cur_slice->slice_type;
502 
503     u1_B = (u1_slice_type == B_SLICE);
504 
505     u1_skip_th = ((u1_slice_type != I_SLICE) ?
506                                     (u1_B ? B_8x8 : PRED_8x8R0) : -1);
507 
508     u1_ipcm_th = ((u1_slice_type != I_SLICE) ? (u1_B ? 23 : 5) : 0);
509 
510 
511 
512     while(u4_slice_end != 1)
513     {
514         WORD32 recon_mb_grp,bs_mb_grp;
515         WORD32 nop_cnt = 8*128;
516         u1_num_mbsleft = ((i2_pic_wdin_mbs - i16_mb_x) << u1_mbaff);
517         if(u1_num_mbsleft <= ps_dec->u1_recon_mb_grp)
518         {
519             recon_mb_grp = u1_num_mbsleft;
520             u1_end_of_row = 1;
521             i16_mb_x = 0;
522         }
523         else
524         {
525             recon_mb_grp = ps_dec->u1_recon_mb_grp;
526             u1_end_of_row = 0;
527             i16_mb_x += (recon_mb_grp >> u1_mbaff);
528         }
529 
530 
531         while(1)
532         {
533             UWORD32 u4_cond = 0;
534             UWORD32 u4_mb_num = ps_dec->cur_recon_mb_num + recon_mb_grp - 1;
535 
536             /*
537              * Wait for one extra mb of MC, because some chroma IQ-IT functions
538              * sometimes loads the pixels of the right mb and stores with the loaded
539              * values.
540              */
541             u4_mb_num = MIN(u4_mb_num + 1, (ps_dec->i2_recon_thread_mb_y + 1) * i2_pic_wdin_mbs - 1);
542 
543             CHECK_MB_MAP_BYTE(u4_mb_num, ps_dec->pu1_recon_mb_map, u4_cond);
544             if(u4_cond)
545             {
546                 break;
547             }
548             else
549             {
550                 if(nop_cnt > 0)
551                 {
552                     nop_cnt -= 128;
553                     NOP(128);
554                 }
555                 else
556                 {
557                     if(ps_dec->u4_output_present &&
558                        (ps_dec->u4_fmt_conv_cur_row < ps_dec->s_disp_frame_info.u4_y_ht))
559                     {
560                         ps_dec->u4_fmt_conv_num_rows =
561                                         MIN(FMT_CONV_NUM_ROWS,
562                                             (ps_dec->s_disp_frame_info.u4_y_ht
563                                                             - ps_dec->u4_fmt_conv_cur_row));
564                         ih264d_format_convert(ps_dec, &(ps_dec->s_disp_op),
565                                               ps_dec->u4_fmt_conv_cur_row,
566                                               ps_dec->u4_fmt_conv_num_rows);
567                         ps_dec->u4_fmt_conv_cur_row += ps_dec->u4_fmt_conv_num_rows;
568                     }
569                     else
570                     {
571                         nop_cnt = 8*128;
572                         ithread_yield();
573                     }
574                 }
575             }
576         }
577 
578         for(j = 0; j < recon_mb_grp; j++)
579         {
580             GET_SLICE_NUM_MAP(ps_dec->pu2_slice_num_map, ps_dec->cur_recon_mb_num,
581                               u2_slice_num);
582 
583             if(u2_slice_num != ps_dec->u2_cur_slice_num_bs)
584             {
585                 u4_slice_end = 1;
586                 break;
587             }
588             if(ps_dec->i1_recon_in_thread3_flag)
589             {
590                 ps_cur_mb_info = &ps_dec->ps_frm_mb_info[ps_dec->cur_recon_mb_num];
591 
592                 if(ps_cur_mb_info->u1_mb_type <= u1_skip_th)
593                 {
594                     ih264d_process_inter_mb(ps_dec, ps_cur_mb_info, j);
595                 }
596                 else if(ps_cur_mb_info->u1_mb_type != MB_SKIP)
597                 {
598                     if((u1_ipcm_th + 25) != ps_cur_mb_info->u1_mb_type)
599                     {
600                         ps_cur_mb_info->u1_mb_type -= (u1_skip_th + 1);
601                         ih264d_process_intra_mb(ps_dec, ps_cur_mb_info, j);
602                     }
603                 }
604 
605                 ih264d_copy_intra_pred_line(ps_dec, ps_cur_mb_info, j);
606             }
607             ps_dec->cur_recon_mb_num++;
608         }
609 
610         if(j != recon_mb_grp)
611         {
612             u1_end_of_row = 0;
613         }
614 
615         {
616             tfr_ctxt_t *ps_trns_addr = &ps_dec->s_tran_iprecon;
617             UWORD16 u2_mb_y;
618 
619             ps_trns_addr->pu1_dest_y += ps_trns_addr->u4_inc_y[u1_end_of_row];
620             ps_trns_addr->pu1_dest_u += ps_trns_addr->u4_inc_uv[u1_end_of_row];
621             ps_trns_addr->pu1_dest_v += ps_trns_addr->u4_inc_uv[u1_end_of_row];
622 
623             if(u1_end_of_row)
624             {
625                 ps_dec->i2_recon_thread_mb_y += (1 << u1_mbaff);
626                 u2_mb_y = ps_dec->i2_recon_thread_mb_y;
627                 y_offset = (u2_mb_y * u4_frame_stride) << 4;
628                 ps_trns_addr->pu1_dest_y = ps_dec->s_cur_pic.pu1_buf1 + y_offset;
629 
630                 u4_frame_stride = ps_dec->u2_frm_wd_uv
631                                 << ps_dec->ps_cur_slice->u1_field_pic_flag;
632                 y_offset = (u2_mb_y * u4_frame_stride) << 3;
633                 ps_trns_addr->pu1_dest_u = ps_dec->s_cur_pic.pu1_buf2 + y_offset;
634                 ps_trns_addr->pu1_dest_v = ps_dec->s_cur_pic.pu1_buf3 + y_offset;
635 
636                 ps_trns_addr->pu1_mb_y = ps_trns_addr->pu1_dest_y;
637                 ps_trns_addr->pu1_mb_u = ps_trns_addr->pu1_dest_u;
638                 ps_trns_addr->pu1_mb_v = ps_trns_addr->pu1_dest_v;
639 
640             }
641         }
642 
643         bs_mb_grp = j;
644         /* Compute BS for NMB group*/
645         for(i = 0; i < bs_mb_grp; i++)
646         {
647             p_cur_mb = &ps_dec->ps_frm_mb_info[ps_dec->u4_cur_bs_mb_num];
648 
649             DEBUG_THREADS_PRINTF("ps_dec->u4_cur_bs_mb_num = %d\n",ps_dec->u4_cur_bs_mb_num);
650             ih264d_compute_bs_non_mbaff_thread(ps_dec, p_cur_mb,
651                                                ps_dec->u4_cur_bs_mb_num);
652             ps_dec->u4_cur_bs_mb_num++;
653             ps_dec->u4_bs_cur_slice_num_mbs++;
654 
655         }
656 
657         if(ps_dec->u4_cur_bs_mb_num > u4_max_addr)
658         {
659             u4_slice_end = 1;
660         }
661 
662         /*deblock MB group*/
663         {
664             UWORD32 u4_num_mbs;
665 
666             if(ps_dec->u4_cur_bs_mb_num > ps_dec->u4_cur_deblk_mb_num)
667             {
668                 if(u1_end_of_row)
669                 {
670                     u4_num_mbs = ps_dec->u4_cur_bs_mb_num
671                                     - ps_dec->u4_cur_deblk_mb_num;
672                 }
673                 else
674                 {
675                     u4_num_mbs = ps_dec->u4_cur_bs_mb_num
676                                     - ps_dec->u4_cur_deblk_mb_num - 1;
677                 }
678             }
679             else
680                 u4_num_mbs = 0;
681 
682             ih264d_check_mb_map_deblk(ps_dec, u4_num_mbs, ps_tfr_cxt,0);
683         }
684 
685     }
686 }
687 
ih264d_recon_deblk_thread(dec_struct_t * ps_dec)688 void ih264d_recon_deblk_thread(dec_struct_t *ps_dec)
689 {
690     tfr_ctxt_t s_tfr_ctxt;
691     tfr_ctxt_t *ps_tfr_cxt = &s_tfr_ctxt; // = &ps_dec->s_tran_addrecon;
692 
693 
694     UWORD32 yield_cnt = 0;
695 
696     ithread_set_name("ih264d_recon_deblk_thread");
697 
698     while(1)
699     {
700 
701         DEBUG_THREADS_PRINTF(" Entering compute bs slice\n");
702         ih264d_recon_deblk_slice(ps_dec, ps_tfr_cxt);
703 
704         DEBUG_THREADS_PRINTF(" Exit  compute bs slice \n");
705 
706         if(ps_dec->cur_recon_mb_num > ps_dec->ps_cur_sps->u2_max_mb_addr)
707         {
708                 break;
709         }
710         else
711         {
712             ps_dec->ps_computebs_cur_slice++;
713             ps_dec->u2_cur_slice_num_bs++;
714         }
715         DEBUG_THREADS_PRINTF("CBS thread:Got next slice/end of frame signal \n ");
716 
717     }
718 
719     if(ps_dec->u4_output_present &&
720        (3 == ps_dec->u4_num_cores) &&
721        (ps_dec->u4_fmt_conv_cur_row < ps_dec->s_disp_frame_info.u4_y_ht))
722     {
723         ps_dec->u4_fmt_conv_num_rows =
724                         (ps_dec->s_disp_frame_info.u4_y_ht
725                                         - ps_dec->u4_fmt_conv_cur_row);
726         ih264d_format_convert(ps_dec, &(ps_dec->s_disp_op),
727                               ps_dec->u4_fmt_conv_cur_row,
728                               ps_dec->u4_fmt_conv_num_rows);
729         ps_dec->u4_fmt_conv_cur_row += ps_dec->u4_fmt_conv_num_rows;
730 
731     }
732 
733 
734 
735 }
736 
737 
738