• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /******************************************************************************
2 *
3 * Copyright (C) 2012 Ittiam Systems Pvt Ltd, Bangalore
4 *
5 * Licensed under the Apache License, Version 2.0 (the "License");
6 * you may not use this file except in compliance with the License.
7 * You may obtain a copy of the License at:
8 *
9 * http://www.apache.org/licenses/LICENSE-2.0
10 *
11 * Unless required by applicable law or agreed to in writing, software
12 * distributed under the License is distributed on an "AS IS" BASIS,
13 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14 * See the License for the specific language governing permissions and
15 * limitations under the License.
16 *
17 ******************************************************************************/
18 /**
19  *******************************************************************************
20  * @file
21  *  ihevcd_parse_slice.c
22  *
23  * @brief
24  *  Contains functions for parsing slice data
25  *
26  * @author
27  *  Harish
28  *
29  * @par List of Functions:
30  *
31  * @remarks
32  *  None
33  *
34  *******************************************************************************
35  */
36 /*****************************************************************************/
37 /* File Includes                                                             */
38 /*****************************************************************************/
39 #include <stdio.h>
40 #include <stddef.h>
41 #include <stdlib.h>
42 #include <string.h>
43 #include <assert.h>
44 
45 #include "ihevc_typedefs.h"
46 #include "iv.h"
47 #include "ivd.h"
48 #include "ihevcd_cxa.h"
49 #include "ithread.h"
50 
51 #include "ihevc_defs.h"
52 #include "ihevc_debug.h"
53 #include "ihevc_structs.h"
54 #include "ihevc_macros.h"
55 #include "ihevc_mem_fns.h"
56 #include "ihevc_platform_macros.h"
57 
58 #include "ihevc_common_tables.h"
59 #include "ihevc_error.h"
60 #include "ihevc_cabac_tables.h"
61 
62 #include "ihevcd_trace.h"
63 #include "ihevcd_defs.h"
64 #include "ihevcd_function_selector.h"
65 #include "ihevcd_structs.h"
66 #include "ihevcd_error.h"
67 #include "ihevcd_nal.h"
68 #include "ihevcd_bitstream.h"
69 #include "ihevcd_utils.h"
70 #include "ihevcd_parse_slice.h"
71 #include "ihevcd_parse_residual.h"
72 #include "ihevcd_cabac.h"
73 #include "ihevcd_job_queue.h"
74 #include "ihevcd_intra_pred_mode_prediction.h"
75 #include "ihevcd_common_tables.h"
76 #include "ihevcd_process_slice.h"
77 #include "ihevcd_debug.h"
78 #include "ihevcd_get_mv.h"
79 #include "ihevcd_boundary_strength.h"
80 #include "ihevcd_ilf_padding.h"
81 #include "ihevcd_statistics.h"
82 /* Bit stream offset threshold */
83 #define BITSTRM_OFF_THRS 8
84 
85 #define MIN_CU_QP_DELTA_ABS(x) (-26 + ((x) * 6) / 2)
86 #define MAX_CU_QP_DELTA_ABS(x) (25 + ((x) * 6) / 2)
87 
88 /**
89  * Table used to decode part_mode if AMP is enabled and current CU is not min CU
90  */
91 const UWORD8 gau1_part_mode_amp[] = { PART_nLx2N, PART_nRx2N, PART_Nx2N, 0xFF, PART_2NxnU, PART_2NxnD, PART_2NxN, 0xFF };
92 
93 const UWORD32 gau4_ct_depth_mask[] = { 0x0, 0x55555555, 0xAAAAAAAA, 0xFFFFFFFF };
94 
95 
96 
97 /**
98  *******************************************************************************
99  *
100  * @brief
101  *  Parses Transform tree syntax
102  *
103  * @par Description:
104  *  Parses Transform tree syntax as per Section:7.3.9.8
105  *
106  * @param[in] ps_codec
107  *  Pointer to codec context
108  *
109  * @returns  Status
110  *
111  * @remarks
112  *
113  *
114  *******************************************************************************
115  */
116 
ihevcd_parse_transform_tree(codec_t * ps_codec,WORD32 x0,WORD32 y0,WORD32 cu_x_base,WORD32 cu_y_base,WORD32 log2_trafo_size,WORD32 trafo_depth,WORD32 blk_idx,WORD32 intra_pred_mode)117 WORD32 ihevcd_parse_transform_tree(codec_t *ps_codec,
118                                    WORD32 x0, WORD32 y0,
119                                    WORD32 cu_x_base, WORD32 cu_y_base,
120                                    WORD32 log2_trafo_size,
121                                    WORD32 trafo_depth,
122                                    WORD32 blk_idx,
123                                    WORD32 intra_pred_mode)
124 {
125     IHEVCD_ERROR_T ret = (IHEVCD_ERROR_T)IHEVCD_SUCCESS;
126     sps_t *ps_sps;
127     pps_t *ps_pps;
128     WORD32 value;
129     WORD32 x1, y1;
130     WORD32 max_trafo_depth;
131 
132     bitstrm_t *ps_bitstrm = &ps_codec->s_parse.s_bitstrm;
133     WORD32 intra_split_flag;
134     WORD32 split_transform_flag;
135     WORD32 ctxt_idx;
136     cab_ctxt_t *ps_cabac = &ps_codec->s_parse.s_cabac;
137 
138     max_trafo_depth = ps_codec->s_parse.s_cu.i4_max_trafo_depth;
139     ps_sps = ps_codec->s_parse.ps_sps;
140     ps_pps = ps_codec->s_parse.ps_pps;
141     intra_split_flag = ps_codec->s_parse.s_cu.i4_intra_split_flag;
142 
143     {
144         split_transform_flag = 0;
145         if((log2_trafo_size <= ps_sps->i1_log2_max_transform_block_size) &&
146                         (log2_trafo_size > ps_sps->i1_log2_min_transform_block_size) &&
147                         (trafo_depth < max_trafo_depth) &&
148                         !(intra_split_flag && (trafo_depth == 0)))
149         {
150             /* encode the split transform flag, context derived as per Table9-37 */
151             ctxt_idx = IHEVC_CAB_SPLIT_TFM + (5 - log2_trafo_size);
152 
153             TRACE_CABAC_CTXT("split_transform_flag", ps_cabac->u4_range, ctxt_idx);
154             split_transform_flag = ihevcd_cabac_decode_bin(ps_cabac, ps_bitstrm, ctxt_idx);
155             AEV_TRACE("split_transform_flag", split_transform_flag,
156                       ps_cabac->u4_range);
157 
158         }
159         else
160         {
161             WORD32 inter_split_flag = 0;
162 
163             if((0 == ps_sps->i1_max_transform_hierarchy_depth_inter) &&
164                             (PRED_MODE_INTER == ps_codec->s_parse.s_cu.i4_pred_mode) &&
165                             (PART_2Nx2N != ps_codec->s_parse.s_cu.i4_part_mode) &&
166                             (0 == trafo_depth))
167             {
168                 inter_split_flag = 1;
169             }
170 
171             if((log2_trafo_size > ps_sps->i1_log2_max_transform_block_size) ||
172                             ((1 == intra_split_flag) && (0 == trafo_depth)) ||
173                             (1 == inter_split_flag))
174             {
175                 split_transform_flag = 1;
176             }
177         }
178 
179         if(0 == trafo_depth)
180         {
181             ps_codec->s_parse.s_cu.ai1_cbf_cr[trafo_depth] = 0;
182             ps_codec->s_parse.s_cu.ai1_cbf_cb[trafo_depth] = 0;
183         }
184         else
185         {
186             ps_codec->s_parse.s_cu.ai1_cbf_cb[trafo_depth] = ps_codec->s_parse.s_cu.ai1_cbf_cb[trafo_depth - 1];
187             ps_codec->s_parse.s_cu.ai1_cbf_cr[trafo_depth] = ps_codec->s_parse.s_cu.ai1_cbf_cr[trafo_depth - 1];
188         }
189         if(trafo_depth == 0 || log2_trafo_size > 2)
190         {
191             ctxt_idx = IHEVC_CAB_CBCR_IDX + trafo_depth;
192             /* CBF for Cb/Cr is sent only if the parent CBF for Cb/Cr is non-zero */
193             if((trafo_depth == 0) || ps_codec->s_parse.s_cu.ai1_cbf_cb[trafo_depth - 1])
194             {
195                 TRACE_CABAC_CTXT("cbf_cb", ps_cabac->u4_range, ctxt_idx);
196                 value = ihevcd_cabac_decode_bin(ps_cabac, ps_bitstrm, ctxt_idx);
197                 AEV_TRACE("cbf_cb", value, ps_cabac->u4_range);
198                 ps_codec->s_parse.s_cu.ai1_cbf_cb[trafo_depth] = value;
199             }
200 
201             if((trafo_depth == 0) || ps_codec->s_parse.s_cu.ai1_cbf_cr[trafo_depth - 1])
202             {
203                 TRACE_CABAC_CTXT("cbf_cr", ps_cabac->u4_range, ctxt_idx);
204                 value = ihevcd_cabac_decode_bin(ps_cabac, ps_bitstrm, ctxt_idx);
205                 AEV_TRACE("cbf_cr", value, ps_cabac->u4_range);
206                 ps_codec->s_parse.s_cu.ai1_cbf_cr[trafo_depth] = value;
207             }
208         }
209         if(split_transform_flag)
210         {
211             WORD32 intra_pred_mode_tmp;
212             x1 = x0 + ((1 << log2_trafo_size) >> 1);
213             y1 = y0 + ((1 << log2_trafo_size) >> 1);
214 
215             /* For transform depth of zero, intra pred mode as decoded at CU */
216             /* level is sent to the transform tree nodes */
217             /* When depth is non-zero intra pred mode of parent node is sent */
218             /* This takes care of passing correct mode to all the child nodes */
219             intra_pred_mode_tmp = trafo_depth ? intra_pred_mode : ps_codec->s_parse.s_cu.ai4_intra_luma_pred_mode[0];
220             ret = ihevcd_parse_transform_tree(ps_codec, x0, y0, x0, y0, log2_trafo_size - 1, trafo_depth + 1, 0, intra_pred_mode_tmp);
221             RETURN_IF((IHEVCD_ERROR_T)IHEVCD_SUCCESS != ret, ret);
222 
223             intra_pred_mode_tmp = trafo_depth ? intra_pred_mode : ps_codec->s_parse.s_cu.ai4_intra_luma_pred_mode[1];
224             ret = ihevcd_parse_transform_tree(ps_codec, x1, y0, x0, y0, log2_trafo_size - 1, trafo_depth + 1, 1, intra_pred_mode_tmp);
225             RETURN_IF((IHEVCD_ERROR_T)IHEVCD_SUCCESS != ret, ret);
226 
227             intra_pred_mode_tmp = trafo_depth ? intra_pred_mode : ps_codec->s_parse.s_cu.ai4_intra_luma_pred_mode[2];
228             ret = ihevcd_parse_transform_tree(ps_codec, x0, y1, x0, y0, log2_trafo_size - 1, trafo_depth + 1, 2, intra_pred_mode_tmp);
229             RETURN_IF((IHEVCD_ERROR_T)IHEVCD_SUCCESS != ret, ret);
230 
231             intra_pred_mode_tmp = trafo_depth ? intra_pred_mode : ps_codec->s_parse.s_cu.ai4_intra_luma_pred_mode[3];
232             ret = ihevcd_parse_transform_tree(ps_codec, x1, y1, x0, y0, log2_trafo_size - 1, trafo_depth + 1, 3, intra_pred_mode_tmp);
233             RETURN_IF((IHEVCD_ERROR_T)IHEVCD_SUCCESS != ret, ret);
234 
235         }
236         else
237         {
238             WORD32 ctb_x_base;
239             WORD32 ctb_y_base;
240             WORD32 cu_qp_delta_abs;
241 
242 
243 
244             tu_t *ps_tu = ps_codec->s_parse.ps_tu;
245             cu_qp_delta_abs = 0;
246             ctb_x_base = ps_codec->s_parse.i4_ctb_x << ps_sps->i1_log2_ctb_size;
247             ctb_y_base = ps_codec->s_parse.i4_ctb_y << ps_sps->i1_log2_ctb_size;
248 
249             if((ps_codec->s_parse.s_cu.i4_pred_mode == PRED_MODE_INTRA) ||
250                             (trafo_depth != 0) ||
251                             (ps_codec->s_parse.s_cu.ai1_cbf_cb[trafo_depth]) ||
252                             (ps_codec->s_parse.s_cu.ai1_cbf_cr[trafo_depth]))
253             {
254                 ctxt_idx = IHEVC_CAB_CBF_LUMA_IDX;
255                 ctxt_idx += (trafo_depth == 0) ? 1 : 0;
256 
257                 TRACE_CABAC_CTXT("cbf_luma", ps_cabac->u4_range, ctxt_idx);
258                 value = ihevcd_cabac_decode_bin(ps_cabac, ps_bitstrm, ctxt_idx);
259                 AEV_TRACE("cbf_luma", value, ps_cabac->u4_range);
260 
261                 ps_codec->s_parse.s_cu.i1_cbf_luma = value;
262             }
263             else
264             {
265                 ps_codec->s_parse.s_cu.i1_cbf_luma = 1;
266             }
267 
268             /* Initialize ps_tu to default values */
269             /* If required change this to WORD32 packed write */
270             ps_tu->b1_cb_cbf = 0;
271             ps_tu->b1_cr_cbf = 0;
272             ps_tu->b1_y_cbf = 0;
273             ps_tu->b4_pos_x = ((x0 - ctb_x_base) >> 2);
274             ps_tu->b4_pos_y = ((y0 - ctb_y_base) >> 2);
275             ps_tu->b1_transquant_bypass = ps_codec->s_parse.s_cu.i4_cu_transquant_bypass;
276             ps_tu->b3_size = (log2_trafo_size - 2);
277             ps_tu->b7_qp = ps_codec->s_parse.u4_qp;
278 
279             ps_tu->b6_luma_intra_mode = intra_pred_mode;
280             ps_tu->b3_chroma_intra_mode_idx = ps_codec->s_parse.s_cu.i4_intra_chroma_pred_mode_idx;
281 
282             /* Section:7.3.12  Transform unit syntax inlined here */
283             if(ps_codec->s_parse.s_cu.i1_cbf_luma ||
284                             ps_codec->s_parse.s_cu.ai1_cbf_cb[trafo_depth] ||
285                             ps_codec->s_parse.s_cu.ai1_cbf_cr[trafo_depth])
286             {
287                 WORD32 intra_pred_mode_chroma;
288                 if(ps_pps->i1_cu_qp_delta_enabled_flag && !ps_codec->s_parse.i4_is_cu_qp_delta_coded)
289                 {
290 
291 
292                     WORD32 c_max        = TU_MAX_QP_DELTA_ABS;
293                     WORD32 ctxt_inc     = IHEVC_CAB_QP_DELTA_ABS;
294                     WORD32 ctxt_inc_max = CTXT_MAX_QP_DELTA_ABS;
295 
296                     TRACE_CABAC_CTXT("cu_qp_delta_abs", ps_cabac->u4_range, ctxt_inc);
297                     /* qp_delta_abs is coded as combination of tunary and eg0 code  */
298                     /* See Table 9-32 and Table 9-37 for details on cu_qp_delta_abs */
299                     cu_qp_delta_abs = ihevcd_cabac_decode_bins_tunary(ps_cabac,
300                                                                       ps_bitstrm,
301                                                                       c_max,
302                                                                       ctxt_inc,
303                                                                       0,
304                                                                       ctxt_inc_max);
305                     if(cu_qp_delta_abs >= c_max)
306                     {
307                         value = ihevcd_cabac_decode_bypass_bins_egk(ps_cabac, ps_bitstrm, 0);
308                         cu_qp_delta_abs += value;
309                     }
310                     AEV_TRACE("cu_qp_delta_abs", cu_qp_delta_abs, ps_cabac->u4_range);
311 
312                     ps_codec->s_parse.i4_is_cu_qp_delta_coded = 1;
313 
314 
315                     if(cu_qp_delta_abs)
316                     {
317                         value = ihevcd_cabac_decode_bypass_bin(ps_cabac, ps_bitstrm);
318                         AEV_TRACE("cu_qp_delta_sign", value, ps_cabac->u4_range);
319 
320                         if(value)
321                             cu_qp_delta_abs = -cu_qp_delta_abs;
322 
323                     }
324 
325                     if (cu_qp_delta_abs < MIN_CU_QP_DELTA_ABS(ps_sps->i1_bit_depth_luma_minus8)
326                                     || cu_qp_delta_abs > MAX_CU_QP_DELTA_ABS(ps_sps->i1_bit_depth_luma_minus8))
327                     {
328                         return IHEVCD_INVALID_PARAMETER;
329                     }
330 
331                     ps_codec->s_parse.s_cu.i4_cu_qp_delta = cu_qp_delta_abs;
332 
333                 }
334 
335                 if(ps_codec->s_parse.s_cu.i1_cbf_luma)
336                 {
337                     ps_tu->b1_y_cbf = 1;
338                     ihevcd_parse_residual_coding(ps_codec, x0, y0, log2_trafo_size, 0, intra_pred_mode);
339                 }
340 
341                 if(4 == ps_codec->s_parse.s_cu.i4_intra_chroma_pred_mode_idx)
342                     intra_pred_mode_chroma = ps_codec->s_parse.s_cu.ai4_intra_luma_pred_mode[0];
343                 else
344                 {
345                     intra_pred_mode_chroma = gau1_intra_pred_chroma_modes[ps_codec->s_parse.s_cu.i4_intra_chroma_pred_mode_idx];
346 
347                     if(intra_pred_mode_chroma ==
348                                     ps_codec->s_parse.s_cu.ai4_intra_luma_pred_mode[0])
349                     {
350                         intra_pred_mode_chroma = INTRA_ANGULAR(34);
351                     }
352 
353                 }
354                 if(log2_trafo_size > 2)
355                 {
356                     if(ps_codec->s_parse.s_cu.ai1_cbf_cb[trafo_depth])
357                     {
358                         ps_tu->b1_cb_cbf = 1;
359                         ihevcd_parse_residual_coding(ps_codec, x0, y0, log2_trafo_size - 1, 1, intra_pred_mode_chroma);
360                     }
361 
362                     if(ps_codec->s_parse.s_cu.ai1_cbf_cr[trafo_depth])
363                     {
364                         ps_tu->b1_cr_cbf = 1;
365                         ihevcd_parse_residual_coding(ps_codec, x0, y0, log2_trafo_size - 1, 2, intra_pred_mode_chroma);
366                     }
367                 }
368                 else if(blk_idx == 3)
369                 {
370                     if(ps_codec->s_parse.s_cu.ai1_cbf_cb[trafo_depth])
371                     {
372                         ps_tu->b1_cb_cbf = 1;
373                         ihevcd_parse_residual_coding(ps_codec, cu_x_base, cu_y_base, log2_trafo_size, 1, intra_pred_mode_chroma);
374                     }
375 
376                     if(ps_codec->s_parse.s_cu.ai1_cbf_cr[trafo_depth])
377                     {
378                         ps_tu->b1_cr_cbf = 1;
379                         ihevcd_parse_residual_coding(ps_codec, cu_x_base, cu_y_base, log2_trafo_size, 2, intra_pred_mode_chroma);
380                     }
381                 }
382                 else
383                 {
384                     //ps_tu->b1_chroma_present = 0;
385                     ps_tu->b3_chroma_intra_mode_idx = INTRA_PRED_CHROMA_IDX_NONE;
386                 }
387             }
388             else
389             {
390                 if((3 != blk_idx) && (2 == log2_trafo_size))
391                 {
392                     ps_tu->b3_chroma_intra_mode_idx = INTRA_PRED_CHROMA_IDX_NONE;
393                 }
394             }
395 
396             /* Set the first TU in CU flag */
397             {
398                 if((ps_codec->s_parse.s_cu.i4_pos_x << 3) == (ps_tu->b4_pos_x << 2) &&
399                                 (ps_codec->s_parse.s_cu.i4_pos_y << 3) == (ps_tu->b4_pos_y << 2))
400                 {
401                     ps_tu->b1_first_tu_in_cu = 1;
402                 }
403                 else
404                 {
405                     ps_tu->b1_first_tu_in_cu = 0;
406                 }
407             }
408             ps_codec->s_parse.ps_tu++;
409             ps_codec->s_parse.s_cu.i4_tu_cnt++;
410             ps_codec->s_parse.i4_pic_tu_idx++;
411         }
412     }
413     return ret;
414 }
415 /**
416  *******************************************************************************
417  *
418  * @brief
419  *  Parses Motion vector difference
420  *
421  * @par Description:
422  *  Parses Motion vector difference as per Section:7.3.9.9
423  *
424  * @param[in] ps_codec
425  *  Pointer to codec context
426  *
427  * @returns  Error from IHEVCD_ERROR_T
428  *
429  * @remarks
430  *
431  *
432  *******************************************************************************
433  */
ihevcd_parse_mvd(codec_t * ps_codec,mv_t * ps_mv)434 IHEVCD_ERROR_T ihevcd_parse_mvd(codec_t *ps_codec, mv_t *ps_mv)
435 {
436     IHEVCD_ERROR_T ret = (IHEVCD_ERROR_T)IHEVCD_SUCCESS;
437     WORD32 value;
438     WORD32 abs_mvd;
439     bitstrm_t *ps_bitstrm = &ps_codec->s_parse.s_bitstrm;
440     WORD32 abs_mvd_greater0_flag[2];
441     WORD32 abs_mvd_greater1_flag[2];
442     WORD32 ctxt_idx;
443     cab_ctxt_t *ps_cabac = &ps_codec->s_parse.s_cabac;
444 
445 
446     ctxt_idx  = IHEVC_CAB_MVD_GRT0;
447     /* encode absmvd_x > 0 */
448     TRACE_CABAC_CTXT("abs_mvd_greater0_flag[0]", ps_cabac->u4_range, ctxt_idx);
449     abs_mvd_greater0_flag[0] = ihevcd_cabac_decode_bin(ps_cabac, ps_bitstrm, ctxt_idx);
450     AEV_TRACE("abs_mvd_greater0_flag[0]", abs_mvd_greater0_flag[0], ps_cabac->u4_range);
451 
452     /* encode absmvd_y > 0 */
453     TRACE_CABAC_CTXT("abs_mvd_greater0_flag[1]", ps_cabac->u4_range, ctxt_idx);
454     abs_mvd_greater0_flag[1] = ihevcd_cabac_decode_bin(ps_cabac, ps_bitstrm, ctxt_idx);
455     AEV_TRACE("abs_mvd_greater0_flag[1]", abs_mvd_greater0_flag[1], ps_cabac->u4_range);
456 
457     ctxt_idx  = IHEVC_CAB_MVD_GRT1;
458     abs_mvd_greater1_flag[0] = 0;
459     abs_mvd_greater1_flag[1] = 0;
460 
461     if(abs_mvd_greater0_flag[0])
462     {
463         TRACE_CABAC_CTXT("abs_mvd_greater1_flag[0]", ps_cabac->u4_range, ctxt_idx);
464         abs_mvd_greater1_flag[0] = ihevcd_cabac_decode_bin(ps_cabac, ps_bitstrm, ctxt_idx);
465         AEV_TRACE("abs_mvd_greater1_flag[0]", abs_mvd_greater1_flag[0], ps_cabac->u4_range);
466     }
467     if(abs_mvd_greater0_flag[1])
468     {
469         TRACE_CABAC_CTXT("abs_mvd_greater1_flag[1]", ps_cabac->u4_range, ctxt_idx);
470         abs_mvd_greater1_flag[1] = ihevcd_cabac_decode_bin(ps_cabac, ps_bitstrm, ctxt_idx);
471         AEV_TRACE("abs_mvd_greater1_flag[1]", abs_mvd_greater1_flag[1], ps_cabac->u4_range);
472     }
473     abs_mvd = 0;
474     if(abs_mvd_greater0_flag[0])
475     {
476         abs_mvd = 1;
477         if(abs_mvd_greater1_flag[0])
478         {
479             value = ihevcd_cabac_decode_bypass_bins_egk(ps_cabac, ps_bitstrm, 1);
480             AEV_TRACE("abs_mvd_minus2[0]", value, ps_cabac->u4_range);
481             abs_mvd = value + 2;
482         }
483         value = ihevcd_cabac_decode_bypass_bin(ps_cabac, ps_bitstrm);
484         AEV_TRACE("mvd_sign_flag[0]", value, ps_cabac->u4_range);
485         if(value)
486         {
487             abs_mvd = -abs_mvd;
488         }
489 
490     }
491     ps_mv->i2_mvx = abs_mvd;
492     abs_mvd = 0;
493     if(abs_mvd_greater0_flag[1])
494     {
495         abs_mvd = 1;
496         if(abs_mvd_greater1_flag[1])
497         {
498             value = ihevcd_cabac_decode_bypass_bins_egk(ps_cabac, ps_bitstrm, 1);
499             AEV_TRACE("abs_mvd_minus2[1]", value, ps_cabac->u4_range);
500             abs_mvd = value + 2;
501 
502         }
503         value = ihevcd_cabac_decode_bypass_bin(ps_cabac, ps_bitstrm);
504         AEV_TRACE("mvd_sign_flag[1]", value, ps_cabac->u4_range);
505 
506         if(value)
507         {
508             abs_mvd = -abs_mvd;
509         }
510     }
511     ps_mv->i2_mvy = abs_mvd;
512 
513     return ret;
514 }
515 
516 /**
517  *******************************************************************************
518  *
519  * @brief
520  *  Parses PCM sample
521  *
522  *
523  * @par Description:
524  *  Parses PCM sample as per Section:7.3.9.7 Pcm sample syntax
525  *
526  * @param[in] ps_codec
527  *  Pointer to codec context
528  *
529  * @returns  Error from IHEVCD_ERROR_T
530  *
531  * @remarks
532  *
533  *
534  *******************************************************************************
535  */
536 
ihevcd_parse_pcm_sample(codec_t * ps_codec,WORD32 x0,WORD32 y0,WORD32 log2_cb_size)537 IHEVCD_ERROR_T  ihevcd_parse_pcm_sample(codec_t *ps_codec,
538                                         WORD32 x0,
539                                         WORD32 y0,
540                                         WORD32 log2_cb_size)
541 {
542     IHEVCD_ERROR_T ret = (IHEVCD_ERROR_T)IHEVCD_SUCCESS;
543     cab_ctxt_t *ps_cabac = &ps_codec->s_parse.s_cabac;
544     sps_t *ps_sps;
545 
546     WORD32 value;
547     WORD32 i;
548 
549     WORD32 num_bits;
550     UWORD32 u4_sig_coeff_map;
551     bitstrm_t *ps_bitstrm = &ps_codec->s_parse.s_bitstrm;
552     tu_t *ps_tu = ps_codec->s_parse.ps_tu;
553     tu_sblk_coeff_data_t *ps_tu_sblk_coeff_data;
554     UWORD8 *pu1_coeff_data;
555     ps_sps = ps_codec->s_parse.ps_sps;
556 
557     UNUSED(value);
558     UNUSED(ps_tu);
559     UNUSED(ps_cabac);
560     UNUSED(x0);
561     UNUSED(y0);
562 
563     {
564         WORD8 *pi1_scan_idx;
565         WORD8 *pi1_buf = (WORD8 *)ps_codec->s_parse.pv_tu_coeff_data;
566         WORD8 *pi1_num_coded_subblks;
567 
568         /* First WORD8 gives number of coded subblocks */
569         pi1_num_coded_subblks = pi1_buf++;
570 
571         /* Set number of coded subblocks in the current TU to zero */
572         /* For PCM there will be only one subblock which is the same size as CU */
573         *pi1_num_coded_subblks = 1;
574 
575         /* Second WORD8 gives (scan idx << 1) | trans_skip */
576         pi1_scan_idx = pi1_buf++;
577         *pi1_scan_idx = (0 << 1) | 1;
578 
579         /* Store the incremented pointer in pv_tu_coeff_data */
580         ps_codec->s_parse.pv_tu_coeff_data = pi1_buf;
581 
582     }
583 
584     u4_sig_coeff_map = 0xFFFFFFFF;
585     ps_tu_sblk_coeff_data = (tu_sblk_coeff_data_t *)ps_codec->s_parse.pv_tu_coeff_data;
586     ps_tu_sblk_coeff_data->u2_sig_coeff_map = u4_sig_coeff_map;
587     ps_tu_sblk_coeff_data->u2_subblk_pos = 0;
588 
589     pu1_coeff_data = (UWORD8 *)&ps_tu_sblk_coeff_data->ai2_level[0];
590 
591     num_bits = ps_sps->i1_pcm_sample_bit_depth_luma;
592 
593     for(i = 0; i < 1 << (log2_cb_size << 1); i++)
594     {
595         TRACE_CABAC_CTXT("pcm_sample_luma", ps_cabac->u4_range, 0);
596         BITS_PARSE("pcm_sample_luma", value, ps_bitstrm, num_bits);
597 
598         //ps_pcmsample_t->i1_pcm_sample_luma[i] = value;
599         *pu1_coeff_data++ = value << (BIT_DEPTH_LUMA - num_bits);
600     }
601 
602     num_bits = ps_sps->i1_pcm_sample_bit_depth_chroma;
603 
604     for(i = 0; i < (1 << (log2_cb_size << 1)) >> 1; i++)
605     {
606         TRACE_CABAC_CTXT("pcm_sample_chroma", ps_cabac->u4_range, 0);
607         BITS_PARSE("pcm_sample_chroma", value, ps_bitstrm, num_bits);
608 
609         // ps_pcmsample_t->i1_pcm_sample_chroma[i] = value;
610         *pu1_coeff_data++ = value << (BIT_DEPTH_CHROMA - num_bits);
611     }
612 
613     ps_codec->s_parse.pv_tu_coeff_data = pu1_coeff_data;
614 
615     return ret;
616 }
617 /**
618  *******************************************************************************
619  *
620  * @brief
621  *  Parses Prediction unit
622  *
623  * @par Description:
624  *  Parses Prediction unit as per Section:7.3.9.6
625  *
626  * @param[in] ps_codec
627  *  Pointer to codec context
628  *
629  * @returns  Error from IHEVCD_ERROR_T
630  *
631  * @remarks
632  *
633  *
634  *******************************************************************************
635  */
636 
ihevcd_parse_pu_mvp(codec_t * ps_codec,pu_t * ps_pu)637 IHEVCD_ERROR_T  ihevcd_parse_pu_mvp(codec_t *ps_codec, pu_t *ps_pu)
638 {
639     IHEVCD_ERROR_T ret = (IHEVCD_ERROR_T)IHEVCD_SUCCESS;
640     WORD32 value;
641     slice_header_t *ps_slice_hdr;
642     bitstrm_t *ps_bitstrm = &ps_codec->s_parse.s_bitstrm;
643     cab_ctxt_t *ps_cabac = &ps_codec->s_parse.s_cabac;
644     WORD32 inter_pred_idc;
645 
646     ps_slice_hdr = ps_codec->s_parse.ps_slice_hdr;
647 
648     if(ps_slice_hdr->i1_slice_type == BSLICE)
649     {
650         WORD32 pu_w_plus_pu_h;
651         WORD32 ctxt_idx;
652         /* required to check if w+h==12 case */
653         pu_w_plus_pu_h = ((ps_pu->b4_wd + 1) << 2) + ((ps_pu->b4_ht + 1) << 2);
654         if(12 == pu_w_plus_pu_h)
655         {
656             ctxt_idx = IHEVC_CAB_INTER_PRED_IDC + 4;
657             TRACE_CABAC_CTXT("inter_pred_idc", ps_cabac->u4_range, ctxt_idx);
658             inter_pred_idc = ihevcd_cabac_decode_bin(ps_cabac, ps_bitstrm,
659                                                      ctxt_idx);
660         }
661         else
662         {
663             /* larger PUs can be encoded as bi_pred/l0/l1 inter_pred_idc */
664             WORD32 is_bipred;
665 
666             ctxt_idx = IHEVC_CAB_INTER_PRED_IDC + ps_codec->s_parse.i4_ct_depth;
667             TRACE_CABAC_CTXT("inter_pred_idc", ps_cabac->u4_range, ctxt_idx);
668             is_bipred = ihevcd_cabac_decode_bin(ps_cabac, ps_bitstrm, ctxt_idx);
669             inter_pred_idc = PRED_BI;
670             if(!is_bipred)
671             {
672                 ctxt_idx = IHEVC_CAB_INTER_PRED_IDC + 4;
673                 inter_pred_idc = ihevcd_cabac_decode_bin(ps_cabac, ps_bitstrm,
674                                                          ctxt_idx);
675             }
676         }
677 
678         AEV_TRACE("inter_pred_idc", inter_pred_idc, ps_cabac->u4_range);
679     }
680     else
681         inter_pred_idc = PRED_L0;
682     ps_pu->mv.i1_l0_ref_idx = 0;
683     ps_pu->mv.i1_l1_ref_idx = 0;
684     /* Decode MVD for L0 for PRED_L0 or PRED_BI */
685     if(inter_pred_idc != PRED_L1)
686     {
687         WORD32 active_refs = ps_slice_hdr->i1_num_ref_idx_l0_active;
688         WORD32 ref_idx = 0;
689         WORD32 ctxt_idx;
690 
691         if(active_refs > 1)
692         {
693             ctxt_idx = IHEVC_CAB_INTER_REF_IDX;
694             /* encode the context modelled first bin */
695             TRACE_CABAC_CTXT("ref_idx", ps_cabac->u4_range, ctxt_idx);
696             ref_idx = ihevcd_cabac_decode_bin(ps_cabac, ps_bitstrm, ctxt_idx);
697 
698             if((active_refs > 2) && ref_idx)
699             {
700                 WORD32 value;
701                 /* encode the context modelled second bin */
702                 ctxt_idx++;
703                 value = ihevcd_cabac_decode_bin(ps_cabac, ps_bitstrm, ctxt_idx);
704                 ref_idx += value;
705                 if((active_refs > 3) && value)
706                 {
707                     /* encode remaining bypass bins */
708                     ref_idx = ihevcd_cabac_decode_bypass_bins_tunary(ps_cabac,
709                                                                      ps_bitstrm,
710                                                                      (active_refs - 3)
711                     );
712                     ref_idx += 2;
713                 }
714             }
715             AEV_TRACE("ref_idx", ref_idx, ps_cabac->u4_range);
716         }
717 
718         ref_idx = CLIP3(ref_idx, 0, MAX_DPB_SIZE - 1);
719         ps_pu->mv.i1_l0_ref_idx = ref_idx;
720 
721         ihevcd_parse_mvd(ps_codec, &ps_pu->mv.s_l0_mv);
722 
723         ctxt_idx = IHEVC_CAB_MVP_L0L1;
724         value = ihevcd_cabac_decode_bin(ps_cabac,
725                                         ps_bitstrm,
726                                         ctxt_idx);
727 
728         AEV_TRACE("mvp_l0/l1_flag", value, ps_cabac->u4_range);
729 
730         ps_pu->b1_l0_mvp_idx = value;
731 
732     }
733     /* Decode MVD for L1 for PRED_L1 or PRED_BI */
734     if(inter_pred_idc != PRED_L0)
735     {
736         WORD32 active_refs = ps_slice_hdr->i1_num_ref_idx_l1_active;
737         WORD32 ref_idx = 0;
738         WORD32 ctxt_idx;
739 
740         if(active_refs > 1)
741         {
742 
743             ctxt_idx = IHEVC_CAB_INTER_REF_IDX;
744             TRACE_CABAC_CTXT("ref_idx", ps_cabac->u4_range, ctxt_idx);
745             /* encode the context modelled first bin */
746             ref_idx = ihevcd_cabac_decode_bin(ps_cabac, ps_bitstrm, ctxt_idx);
747 
748             if((active_refs > 2) && ref_idx)
749             {
750                 WORD32 value;
751                 /* encode the context modelled second bin */
752                 ctxt_idx++;
753                 value = ihevcd_cabac_decode_bin(ps_cabac, ps_bitstrm, ctxt_idx);
754                 ref_idx += value;
755                 if((active_refs > 3) && value)
756                 {
757                     /* encode remaining bypass bins */
758                     ref_idx = ihevcd_cabac_decode_bypass_bins_tunary(ps_cabac,
759                                                                      ps_bitstrm,
760                                                                      (active_refs - 3)
761                     );
762                     ref_idx += 2;
763                 }
764             }
765 
766             AEV_TRACE("ref_idx", ref_idx, ps_cabac->u4_range);
767         }
768 
769         ref_idx = CLIP3(ref_idx, 0, MAX_DPB_SIZE - 1);
770         ps_pu->mv.i1_l1_ref_idx = ref_idx;
771 
772         if(ps_slice_hdr->i1_mvd_l1_zero_flag && inter_pred_idc == PRED_BI)
773         {
774             ps_pu->mv.s_l1_mv.i2_mvx = 0;
775             ps_pu->mv.s_l1_mv.i2_mvy = 0;
776         }
777         else
778         {
779             ihevcd_parse_mvd(ps_codec, &ps_pu->mv.s_l1_mv);
780         }
781 
782         ctxt_idx = IHEVC_CAB_MVP_L0L1;
783         value = ihevcd_cabac_decode_bin(ps_cabac,
784                                         ps_bitstrm,
785                                         ctxt_idx);
786 
787         AEV_TRACE("mvp_l0/l1_flag", value, ps_cabac->u4_range);
788         ps_pu->b1_l1_mvp_idx = value;
789 
790     }
791 
792     ps_pu->b2_pred_mode = inter_pred_idc;
793     return ret;
794 }
795 /**
796  *******************************************************************************
797  *
798  * @brief
799  *  Parses Prediction unit
800  *
801  * @par Description:
802  *  Parses Prediction unit as per Section:7.3.9.6
803  *
804  * @param[in] ps_codec
805  *  Pointer to codec context
806  *
807  * @returns  Error from IHEVCD_ERROR_T
808  *
809  * @remarks
810  *
811  *
812  *******************************************************************************
813  */
814 
ihevcd_parse_prediction_unit(codec_t * ps_codec,WORD32 x0,WORD32 y0,WORD32 wd,WORD32 ht)815 IHEVCD_ERROR_T  ihevcd_parse_prediction_unit(codec_t *ps_codec,
816                                              WORD32 x0,
817                                              WORD32 y0,
818                                              WORD32 wd,
819                                              WORD32 ht)
820 {
821     IHEVCD_ERROR_T ret = (IHEVCD_ERROR_T)IHEVCD_SUCCESS;
822     slice_header_t *ps_slice_hdr;
823     sps_t *ps_sps;
824     bitstrm_t *ps_bitstrm = &ps_codec->s_parse.s_bitstrm;
825     WORD32 ctb_x_base;
826     WORD32 ctb_y_base;
827 
828     pu_t *ps_pu = ps_codec->s_parse.ps_pu;
829     cab_ctxt_t *ps_cabac = &ps_codec->s_parse.s_cabac;
830 
831     ps_slice_hdr = ps_codec->s_parse.ps_slice_hdr;
832 
833     /* Set PU structure to default values */
834     memset(ps_pu, 0, sizeof(pu_t));
835 
836     ps_sps = ps_codec->s_parse.ps_sps;
837     ctb_x_base = ps_codec->s_parse.i4_ctb_x << ps_sps->i1_log2_ctb_size;
838     ctb_y_base = ps_codec->s_parse.i4_ctb_y << ps_sps->i1_log2_ctb_size;
839 
840     ps_pu->b4_pos_x = (x0 - ctb_x_base) >> 2;
841     ps_pu->b4_pos_y = (y0 - ctb_y_base) >> 2;
842     ps_pu->b4_wd = (wd >> 2) - 1;
843     ps_pu->b4_ht = (ht >> 2) - 1;
844 
845     ps_pu->b1_intra_flag = 0;
846     ps_pu->b3_part_mode = ps_codec->s_parse.s_cu.i4_part_mode;
847 
848     if(PRED_MODE_SKIP == ps_codec->s_parse.s_cu.i4_pred_mode)
849     {
850         WORD32 merge_idx = 0;
851         if(ps_slice_hdr->i1_max_num_merge_cand > 1)
852         {
853             WORD32 ctxt_idx = IHEVC_CAB_MERGE_IDX_EXT;
854             WORD32 bin;
855 
856             TRACE_CABAC_CTXT("merge_idx", ps_cabac->u4_range, ctxt_idx);
857             bin = ihevcd_cabac_decode_bin(ps_cabac, ps_bitstrm, ctxt_idx);
858             if(bin)
859             {
860                 if(ps_slice_hdr->i1_max_num_merge_cand > 2)
861                 {
862                     merge_idx = ihevcd_cabac_decode_bypass_bins_tunary(
863                                     ps_cabac, ps_bitstrm,
864                                     (ps_slice_hdr->i1_max_num_merge_cand - 2));
865                 }
866                 merge_idx++;
867             }
868             AEV_TRACE("merge_idx", merge_idx, ps_cabac->u4_range);
869         }
870         ps_pu->b1_merge_flag = 1;
871         ps_pu->b3_merge_idx = merge_idx;
872 
873     }
874     else
875     {
876         /* MODE_INTER */
877         WORD32 merge_flag;
878         WORD32 ctxt_idx = IHEVC_CAB_MERGE_FLAG_EXT;
879         TRACE_CABAC_CTXT("merge_flag", ps_cabac->u4_range, ctxt_idx);
880         merge_flag = ihevcd_cabac_decode_bin(ps_cabac, ps_bitstrm, ctxt_idx);
881         AEV_TRACE("merge_flag", merge_flag, ps_cabac->u4_range);
882 
883         ps_pu->b1_merge_flag = merge_flag;
884 
885         if(merge_flag)
886         {
887             WORD32 merge_idx = 0;
888             if(ps_slice_hdr->i1_max_num_merge_cand > 1)
889             {
890                 WORD32 ctxt_idx = IHEVC_CAB_MERGE_IDX_EXT;
891                 WORD32 bin;
892                 TRACE_CABAC_CTXT("merge_idx", ps_cabac->u4_range, ctxt_idx);
893                 bin = ihevcd_cabac_decode_bin(ps_cabac, ps_bitstrm, ctxt_idx);
894                 if(bin)
895                 {
896                     if(ps_slice_hdr->i1_max_num_merge_cand > 2)
897                     {
898                         merge_idx = ihevcd_cabac_decode_bypass_bins_tunary(
899                                         ps_cabac, ps_bitstrm,
900                                         (ps_slice_hdr->i1_max_num_merge_cand - 2));
901                     }
902                     merge_idx++;
903                 }
904                 AEV_TRACE("merge_idx", merge_idx, ps_cabac->u4_range);
905             }
906 
907             ps_pu->b3_merge_idx = merge_idx;
908         }
909         else
910         {
911             ihevcd_parse_pu_mvp(ps_codec, ps_pu);
912         }
913 
914     }
915     STATS_UPDATE_PU_SIZE(ps_pu);
916     /* Increment PU pointer */
917     ps_codec->s_parse.ps_pu++;
918     ps_codec->s_parse.i4_pic_pu_idx++;
919     return ret;
920 }
921 
922 
ihevcd_parse_part_mode_amp(cab_ctxt_t * ps_cabac,bitstrm_t * ps_bitstrm)923 WORD32 ihevcd_parse_part_mode_amp(cab_ctxt_t *ps_cabac, bitstrm_t *ps_bitstrm)
924 {
925     WORD32 ctxt_idx = IHEVC_CAB_PART_MODE;
926     WORD32 part_mode_idx;
927     WORD32 part_mode;
928     WORD32 bin;
929 
930     part_mode = 0;
931     TRACE_CABAC_CTXT("part_mode", ps_cabac->u4_range, ctxt_idx);
932     bin = ihevcd_cabac_decode_bin(ps_cabac, ps_bitstrm, ctxt_idx++);
933 
934     if(!bin)
935     {
936         bin = ihevcd_cabac_decode_bin(ps_cabac, ps_bitstrm, ctxt_idx++);
937         part_mode_idx = bin;
938         part_mode_idx <<= 1;
939 
940         /* Following takes of handling context increment for 3rd bin in part_mode */
941         /* When AMP is enabled and the current is not min CB */
942         /* Context for 3rd bin is 3 and not 2 */
943         ctxt_idx += 1;
944 
945         bin = ihevcd_cabac_decode_bin(ps_cabac, ps_bitstrm, ctxt_idx);
946         part_mode_idx |= bin;
947 
948         part_mode_idx <<= 1;
949         if(!bin)
950         {
951 
952             bin = ihevcd_cabac_decode_bypass_bin(ps_cabac, ps_bitstrm);
953             part_mode_idx |= bin;
954         }
955         part_mode = gau1_part_mode_amp[part_mode_idx];
956     }
957     return part_mode;
958 }
ihevcd_parse_coding_unit_intra(codec_t * ps_codec,WORD32 x0,WORD32 y0,WORD32 log2_cb_size)959 IHEVCD_ERROR_T ihevcd_parse_coding_unit_intra(codec_t *ps_codec,
960                                               WORD32 x0,
961                                               WORD32 y0,
962                                               WORD32 log2_cb_size)
963 {
964     IHEVCD_ERROR_T ret = (IHEVCD_ERROR_T)IHEVCD_SUCCESS;
965     sps_t *ps_sps;
966     cab_ctxt_t *ps_cabac = &ps_codec->s_parse.s_cabac;
967     bitstrm_t *ps_bitstrm = &ps_codec->s_parse.s_bitstrm;
968     WORD32 pcm_flag;
969     WORD32 value;
970     WORD32 cb_size = 1 << log2_cb_size;
971     WORD32 part_mode =  ps_codec->s_parse.s_cu.i4_part_mode;
972     tu_t *ps_tu = ps_codec->s_parse.ps_tu;
973     pu_t *ps_pu = ps_codec->s_parse.ps_pu;
974     WORD32 ctb_x_base;
975     WORD32 ctb_y_base;
976     ps_sps = ps_codec->s_parse.ps_sps;
977     ctb_x_base = ps_codec->s_parse.i4_ctb_x << ps_sps->i1_log2_ctb_size;
978     ctb_y_base = ps_codec->s_parse.i4_ctb_y << ps_sps->i1_log2_ctb_size;
979 
980     memset(ps_pu, 0, sizeof(pu_t));
981     ps_pu->b1_intra_flag = 1;
982     ps_pu->b4_wd = (cb_size >> 2) - 1;
983     ps_pu->b4_ht = (cb_size >> 2) - 1;
984     ps_pu->b4_pos_x = (x0 - ctb_x_base) >> 2;
985     ps_pu->b4_pos_y = (y0 - ctb_y_base) >> 2;
986 
987     pcm_flag = 0;
988     if((PART_2Nx2N == part_mode) && (ps_sps->i1_pcm_enabled_flag)
989                     && (log2_cb_size
990                                     >= ps_sps->i1_log2_min_pcm_coding_block_size)
991                     && (log2_cb_size
992                                     <= (ps_sps->i1_log2_min_pcm_coding_block_size + ps_sps->i1_log2_diff_max_min_pcm_coding_block_size)))
993     {
994         TRACE_CABAC_CTXT("pcm_flag", ps_cabac->u4_range, 0);
995         pcm_flag = ihevcd_cabac_decode_terminate(ps_cabac, ps_bitstrm);
996         AEV_TRACE("pcm_flag", pcm_flag, ps_cabac->u4_range);
997     }
998 
999     ps_codec->s_parse.i4_cu_pcm_flag = pcm_flag;
1000     if(pcm_flag)
1001     {
1002         UWORD8 *pu1_luma_intra_pred_mode_top, *pu1_luma_intra_pred_mode_left;
1003         WORD32 i,  num_pred_blocks;
1004 
1005         if(ps_codec->s_parse.s_bitstrm.u4_bit_ofst % 8)
1006         {
1007             TRACE_CABAC_CTXT("pcm_alignment_zero_bit", ps_cabac->u4_range, 0);
1008             ihevcd_bits_flush_to_byte_boundary(&ps_codec->s_parse.s_bitstrm);
1009             AEV_TRACE("pcm_alignment_zero_bit", 0, ps_cabac->u4_range);
1010         }
1011 
1012         ihevcd_parse_pcm_sample(ps_codec, x0, y0, log2_cb_size);
1013 
1014         ihevcd_cabac_reset(&ps_codec->s_parse.s_cabac,
1015                            &ps_codec->s_parse.s_bitstrm);
1016 
1017         ps_tu = ps_codec->s_parse.ps_tu;
1018         ps_tu->b1_cb_cbf = 1;
1019         ps_tu->b1_cr_cbf = 1;
1020         ps_tu->b1_y_cbf = 1;
1021         ps_tu->b4_pos_x = ((x0 - ctb_x_base) >> 2);
1022         ps_tu->b4_pos_y = ((y0 - ctb_y_base) >> 2);
1023         ps_tu->b1_transquant_bypass = 1;
1024         ps_tu->b3_size = (log2_cb_size - 2);
1025         ps_tu->b7_qp = ps_codec->s_parse.u4_qp;
1026         ps_tu->b3_chroma_intra_mode_idx = INTRA_PRED_CHROMA_IDX_NONE;
1027         ps_tu->b6_luma_intra_mode   = INTRA_PRED_NONE;
1028 
1029         /* Set the first TU in CU flag */
1030         {
1031             if((ps_codec->s_parse.s_cu.i4_pos_x << 3) == (ps_tu->b4_pos_x << 2) &&
1032                             (ps_codec->s_parse.s_cu.i4_pos_y << 3) == (ps_tu->b4_pos_y << 2))
1033             {
1034                 ps_tu->b1_first_tu_in_cu = 1;
1035             }
1036             else
1037             {
1038                 ps_tu->b1_first_tu_in_cu = 0;
1039             }
1040         }
1041 
1042         /* Update the intra pred mode for PCM to INTRA_DC(default mode) */
1043         pu1_luma_intra_pred_mode_top = ps_codec->s_parse.pu1_luma_intra_pred_mode_top
1044                         + (ps_codec->s_parse.s_cu.i4_pos_x * 2);
1045 
1046         pu1_luma_intra_pred_mode_left = ps_codec->s_parse.pu1_luma_intra_pred_mode_left
1047                         + (ps_codec->s_parse.s_cu.i4_pos_y * 2);
1048 
1049         num_pred_blocks = 1; /* Because PCM part mode will be 2Nx2N */
1050 
1051         ps_codec->s_func_selector.ihevc_memset_fptr(pu1_luma_intra_pred_mode_left, INTRA_DC, (cb_size / num_pred_blocks) / MIN_PU_SIZE);
1052         ps_codec->s_func_selector.ihevc_memset_fptr(pu1_luma_intra_pred_mode_top, INTRA_DC, (cb_size / num_pred_blocks) / MIN_PU_SIZE);
1053 
1054 
1055         /* Set no_loop_filter appropriately */
1056         if(1 == ps_sps->i1_pcm_loop_filter_disable_flag)
1057         {
1058             UWORD8 *pu1_pic_no_loop_filter_flag;
1059             WORD32 numbytes_row;
1060             UWORD32 u4_mask;
1061 
1062             pu1_pic_no_loop_filter_flag = ps_codec->s_parse.pu1_pic_no_loop_filter_flag;
1063             numbytes_row =  (ps_sps->i2_pic_width_in_luma_samples + 63) / 64;
1064             pu1_pic_no_loop_filter_flag += (y0 / 8) * numbytes_row;
1065             pu1_pic_no_loop_filter_flag += (x0 / 64);
1066             /* Generate (cb_size / 8) number of 1s */
1067             /* i.e (log2_cb_size - 2) number of 1s */
1068             u4_mask = LSB_ONES((cb_size >> 3));
1069             for(i = 0; i < (cb_size / 8); i++)
1070             {
1071                 *pu1_pic_no_loop_filter_flag |= (u4_mask << (((x0) / 8) % 8));
1072                 pu1_pic_no_loop_filter_flag += numbytes_row;
1073             }
1074         }
1075         /* Increment ps_tu and tu_idx */
1076         ps_codec->s_parse.ps_tu++;
1077         ps_codec->s_parse.s_cu.i4_tu_cnt++;
1078         ps_codec->s_parse.i4_pic_tu_idx++;
1079 
1080     }
1081     else
1082     {
1083         WORD32 cnt = 0;
1084         WORD32 i;
1085         WORD32 part_cnt;
1086 
1087         part_cnt = (part_mode == PART_NxN) ? 4 : 1;
1088 
1089         for(i = 0; i < part_cnt; i++)
1090         {
1091             TRACE_CABAC_CTXT("prev_intra_pred_luma_flag", ps_cabac->u4_range, IHEVC_CAB_INTRA_LUMA_PRED_FLAG);
1092             value = ihevcd_cabac_decode_bin(ps_cabac,
1093                                             ps_bitstrm,
1094                                             IHEVC_CAB_INTRA_LUMA_PRED_FLAG);
1095 
1096             ps_codec->s_parse.s_cu.ai4_prev_intra_luma_pred_flag[i] =
1097                             value;
1098             AEV_TRACE("prev_intra_pred_luma_flag", value, ps_cabac->u4_range);
1099         }
1100 
1101         for(i = 0; i < part_cnt; i++)
1102         {
1103             if(ps_codec->s_parse.s_cu.ai4_prev_intra_luma_pred_flag[cnt])
1104             {
1105                 value = ihevcd_cabac_decode_bypass_bins_tunary(ps_cabac, ps_bitstrm, 2);
1106                 AEV_TRACE("mpm_idx", value, ps_cabac->u4_range);
1107                 ps_codec->s_parse.s_cu.ai4_mpm_idx[cnt] = value;
1108             }
1109             else
1110             {
1111                 value = ihevcd_cabac_decode_bypass_bins(ps_cabac, ps_bitstrm, 5);
1112                 AEV_TRACE("rem_intra_luma_pred_mode", value,
1113                           ps_cabac->u4_range);
1114                 ps_codec->s_parse.s_cu.ai4_rem_intra_luma_pred_mode[cnt] =
1115                                 value;
1116             }
1117             cnt++;
1118         }
1119         TRACE_CABAC_CTXT("intra_chroma_pred_mode", ps_cabac->u4_range, IHEVC_CAB_CHROMA_PRED_MODE);
1120         value = ihevcd_cabac_decode_bin(ps_cabac,
1121                                         ps_bitstrm,
1122                                         IHEVC_CAB_CHROMA_PRED_MODE);
1123         ps_codec->s_parse.s_cu.i4_intra_chroma_pred_mode_idx = 4;
1124         if(value)
1125         {
1126             ps_codec->s_parse.s_cu.i4_intra_chroma_pred_mode_idx =
1127                             ihevcd_cabac_decode_bypass_bins(ps_cabac,
1128                                                             ps_bitstrm, 2);
1129         }
1130         AEV_TRACE("intra_chroma_pred_mode",
1131                   ps_codec->s_parse.s_cu.i4_intra_chroma_pred_mode_idx,
1132                   ps_cabac->u4_range);
1133 
1134 
1135         ihevcd_intra_pred_mode_prediction(ps_codec, log2_cb_size, x0, y0);
1136     }
1137     STATS_UPDATE_PU_SIZE(ps_pu);
1138     /* Increment PU pointer */
1139     ps_codec->s_parse.ps_pu++;
1140     ps_codec->s_parse.i4_pic_pu_idx++;
1141 
1142     return ret;
1143 }
1144 /**
1145  *******************************************************************************
1146  *
1147  * @brief
1148  *  Parses coding unit
1149  *
1150  * @par Description:
1151  *  Parses coding unit as per Section:7.3.9.5
1152  *
1153  * @param[in] ps_codec
1154  *  Pointer to codec context
1155  *
1156  * @returns  Error from IHEVCD_ERROR_T
1157  *
1158  * @remarks
1159  *
1160  *
1161  *******************************************************************************
1162  */
1163 
ihevcd_parse_coding_unit(codec_t * ps_codec,WORD32 x0,WORD32 y0,WORD32 log2_cb_size)1164 IHEVCD_ERROR_T  ihevcd_parse_coding_unit(codec_t *ps_codec,
1165                                          WORD32 x0,
1166                                          WORD32 y0,
1167                                          WORD32 log2_cb_size)
1168 {
1169     IHEVCD_ERROR_T ret = (IHEVCD_ERROR_T)IHEVCD_SUCCESS;
1170     sps_t *ps_sps;
1171     pps_t *ps_pps;
1172     WORD32 cb_size;
1173     slice_header_t *ps_slice_hdr;
1174     WORD32 skip_flag;
1175     WORD32 pcm_flag;
1176     UWORD32 *pu4_skip_top = ps_codec->s_parse.pu4_skip_cu_top;
1177     UWORD32 u4_skip_left = ps_codec->s_parse.u4_skip_cu_left;
1178     bitstrm_t *ps_bitstrm = &ps_codec->s_parse.s_bitstrm;
1179     tu_t *ps_tu = ps_codec->s_parse.ps_tu;
1180 
1181     WORD32 cu_pos_x;
1182     WORD32 cu_pos_y;
1183     cab_ctxt_t *ps_cabac = &ps_codec->s_parse.s_cabac;
1184 
1185     ASSERT(0 == (x0 % 8));
1186     ASSERT(0 == (y0 % 8));
1187 
1188     ps_codec->s_parse.s_cu.i4_tu_cnt = 0;
1189     ps_sps = ps_codec->s_parse.ps_sps;
1190     ps_pps = ps_codec->s_parse.ps_pps;
1191 
1192     cu_pos_x = ps_codec->s_parse.s_cu.i4_pos_x;
1193     cu_pos_y = ps_codec->s_parse.s_cu.i4_pos_y;
1194 
1195 
1196 
1197     ps_slice_hdr = ps_codec->s_parse.ps_slice_hdr;
1198 
1199 
1200     cb_size = 1 << log2_cb_size;
1201 
1202     ps_codec->s_parse.s_cu.i4_cu_transquant_bypass = 0;
1203 
1204     if(ps_pps->i1_transquant_bypass_enable_flag)
1205     {
1206         TRACE_CABAC_CTXT("cu_transquant_bypass_flag", ps_cabac->u4_range, IHEVC_CAB_CU_TQ_BYPASS_FLAG);
1207         ps_codec->s_parse.s_cu.i4_cu_transquant_bypass =
1208                         ihevcd_cabac_decode_bin(ps_cabac, ps_bitstrm,
1209                                                 IHEVC_CAB_CU_TQ_BYPASS_FLAG);
1210         /* Update transquant_bypass in ps_tu */
1211 
1212         AEV_TRACE("cu_transquant_bypass_flag", ps_codec->s_parse.s_cu.i4_cu_transquant_bypass,
1213                   ps_cabac->u4_range);
1214 
1215         if(ps_codec->s_parse.s_cu.i4_cu_transquant_bypass)
1216         {
1217             UWORD8 *pu1_pic_no_loop_filter_flag = ps_codec->s_parse.pu1_pic_no_loop_filter_flag;
1218             UWORD32 u4_mask;
1219             WORD32 i;
1220             WORD32 numbytes_row;
1221             numbytes_row =  (ps_sps->i2_pic_width_in_luma_samples + 63) / 64;
1222             pu1_pic_no_loop_filter_flag += (y0 / 8) * numbytes_row;
1223             pu1_pic_no_loop_filter_flag += (x0 / 64);
1224 
1225             /* Generate (cb_size / 8) number of 1s */
1226             /* i.e (log2_cb_size - 2) number of 1s */
1227             u4_mask = LSB_ONES((cb_size >> 3));
1228             for(i = 0; i < (cb_size / 8); i++)
1229             {
1230                 *pu1_pic_no_loop_filter_flag |= (u4_mask << (((x0) / 8) % 8));
1231                 pu1_pic_no_loop_filter_flag += numbytes_row;
1232             }
1233         }
1234     }
1235 
1236     {
1237         UWORD32 u4_skip_top = 0;
1238         UWORD32 u4_mask;
1239         UWORD32 u4_top_mask, u4_left_mask;
1240         UWORD32 u4_min_cu_x = x0 / 8;
1241         UWORD32 u4_min_cu_y = y0 / 8;
1242 
1243         pu4_skip_top += (u4_min_cu_x / 32);
1244 
1245 
1246         if(ps_slice_hdr->i1_slice_type != ISLICE)
1247         {
1248             WORD32 ctx_idx_inc;
1249             ctx_idx_inc = 0;
1250 
1251             if((0 != cu_pos_y) ||
1252                             ((0 != ps_codec->s_parse.i4_ctb_slice_y) &&
1253                                             (0 != ps_codec->s_parse.i4_ctb_tile_y)))
1254             {
1255                 u4_skip_top = *pu4_skip_top;
1256                 u4_skip_top >>= (u4_min_cu_x % 32);
1257                 if(u4_skip_top & 1)
1258                     ctx_idx_inc++;
1259             }
1260 
1261             /*****************************************************************/
1262             /* If cu_pos_x is non-zero then left is available                */
1263             /* If cu_pos_x is zero then ensure both the following are true   */
1264             /*    Current CTB is not the first CTB in a tile row             */
1265             /*    Current CTB is not the first CTB in a slice                */
1266             /*****************************************************************/
1267             if((0 != cu_pos_x) ||
1268                             (((0 != ps_codec->s_parse.i4_ctb_slice_x) || (0 != ps_codec->s_parse.i4_ctb_slice_y)) &&
1269                                             (0 != ps_codec->s_parse.i4_ctb_tile_x)))
1270             {
1271                 u4_skip_left >>= (u4_min_cu_y % 32);
1272                 if(u4_skip_left & 1)
1273                     ctx_idx_inc++;
1274             }
1275             TRACE_CABAC_CTXT("cu_skip_flag", ps_cabac->u4_range, (IHEVC_CAB_SKIP_FLAG + ctx_idx_inc));
1276             skip_flag = ihevcd_cabac_decode_bin(ps_cabac,
1277                                                 ps_bitstrm,
1278                                                 (IHEVC_CAB_SKIP_FLAG + ctx_idx_inc));
1279 
1280             AEV_TRACE("cu_skip_flag", skip_flag, ps_cabac->u4_range);
1281         }
1282         else
1283             skip_flag = 0;
1284 
1285         /* Update top skip_flag */
1286         u4_skip_top = *pu4_skip_top;
1287         /* Since Max cb_size is 64, maximum of 8 bits will be set or reset */
1288         /* Also since Coding block will be within 64x64 grid, only 8bits within a WORD32
1289          * need to be updated. These 8 bits will not cross 8 bit boundaries
1290          */
1291         u4_mask = LSB_ONES(cb_size / 8);
1292         u4_top_mask = u4_mask << (u4_min_cu_x % 32);
1293 
1294 
1295         if(skip_flag)
1296         {
1297             u4_skip_top |= u4_top_mask;
1298         }
1299         else
1300         {
1301             u4_skip_top &= ~u4_top_mask;
1302         }
1303         *pu4_skip_top = u4_skip_top;
1304 
1305         /* Update left skip_flag */
1306         u4_skip_left = ps_codec->s_parse.u4_skip_cu_left;
1307         u4_mask = LSB_ONES(cb_size / 8);
1308         u4_left_mask = u4_mask << (u4_min_cu_y % 32);
1309 
1310         if(skip_flag)
1311         {
1312             u4_skip_left |= u4_left_mask;
1313         }
1314         else
1315         {
1316             u4_skip_left &= ~u4_left_mask;
1317         }
1318         ps_codec->s_parse.u4_skip_cu_left = u4_skip_left;
1319     }
1320     ps_codec->s_parse.i4_cu_pcm_flag = 0;
1321 
1322     if(skip_flag)
1323     {
1324         WORD32 ctb_x_base;
1325         WORD32 ctb_y_base;
1326 
1327         ctb_x_base = ps_codec->s_parse.i4_ctb_x << ps_sps->i1_log2_ctb_size;
1328         ctb_y_base = ps_codec->s_parse.i4_ctb_y << ps_sps->i1_log2_ctb_size;
1329 
1330         ps_tu->b1_cb_cbf = 0;
1331         ps_tu->b1_cr_cbf = 0;
1332         ps_tu->b1_y_cbf = 0;
1333         ps_tu->b4_pos_x = ((x0 - ctb_x_base) >> 2);
1334         ps_tu->b4_pos_y = ((y0 - ctb_y_base) >> 2);
1335         ps_tu->b1_transquant_bypass = 0;
1336         ps_tu->b3_size = (log2_cb_size - 2);
1337         ps_tu->b7_qp = ps_codec->s_parse.u4_qp;
1338         ps_tu->b3_chroma_intra_mode_idx = INTRA_PRED_CHROMA_IDX_NONE;
1339         ps_tu->b6_luma_intra_mode   = INTRA_PRED_NONE;
1340 
1341         /* Set the first TU in CU flag */
1342         {
1343             if((ps_codec->s_parse.s_cu.i4_pos_x << 3) == (ps_tu->b4_pos_x << 2) &&
1344                             (ps_codec->s_parse.s_cu.i4_pos_y << 3) == (ps_tu->b4_pos_y << 2))
1345             {
1346                 ps_tu->b1_first_tu_in_cu = 1;
1347             }
1348             else
1349             {
1350                 ps_tu->b1_first_tu_in_cu = 0;
1351             }
1352         }
1353 
1354         ps_codec->s_parse.ps_tu++;
1355         ps_codec->s_parse.s_cu.i4_tu_cnt++;
1356         ps_codec->s_parse.i4_pic_tu_idx++;
1357 
1358         ps_codec->s_parse.s_cu.i4_pred_mode = PRED_MODE_SKIP;
1359         ps_codec->s_parse.s_cu.i4_part_mode = PART_2Nx2N;
1360         {
1361             pu_t *ps_pu = ps_codec->s_parse.ps_pu;
1362             ps_pu->b2_part_idx = 0;
1363             ihevcd_parse_prediction_unit(ps_codec, x0, y0, cb_size, cb_size);
1364             STATS_UPDATE_PU_SKIP_SIZE(ps_pu);
1365         }
1366     }
1367     else
1368     {
1369         WORD32 pred_mode;
1370         WORD32 part_mode;
1371         WORD32 intra_split_flag;
1372         WORD32 is_mincb;
1373         cb_size = (1 << log2_cb_size);
1374         is_mincb = (cb_size == (1 << ps_sps->i1_log2_min_coding_block_size));
1375         pcm_flag = 0;
1376         if(ps_slice_hdr->i1_slice_type != ISLICE)
1377         {
1378             TRACE_CABAC_CTXT("pred_mode_flag", ps_cabac->u4_range, IHEVC_CAB_PRED_MODE);
1379             pred_mode = ihevcd_cabac_decode_bin(ps_cabac,
1380                                                 ps_bitstrm,
1381                                                 IHEVC_CAB_PRED_MODE);
1382 
1383             AEV_TRACE("pred_mode_flag", pred_mode, ps_cabac->u4_range);
1384         }
1385         else
1386         {
1387             pred_mode = PRED_MODE_INTRA;
1388         }
1389 
1390         /* If current CU is intra then set corresponging bit in picture level intra map */
1391         if(PRED_MODE_INTRA == pred_mode)
1392         {
1393             UWORD8 *pu1_pic_intra_flag = ps_codec->s_parse.pu1_pic_intra_flag;
1394             UWORD32 u4_mask;
1395             WORD32 i;
1396             WORD32 numbytes_row;
1397             numbytes_row =  (ps_sps->i2_pic_width_in_luma_samples + 63) / 64;
1398             pu1_pic_intra_flag += (y0 / 8) * numbytes_row;
1399             pu1_pic_intra_flag += (x0 / 64);
1400 
1401             /* Generate (cb_size / 8) number of 1s */
1402             /* i.e (log2_cb_size - 2) number of 1s */
1403             u4_mask = LSB_ONES((cb_size >> 3));
1404             for(i = 0; i < (cb_size / 8); i++)
1405             {
1406                 *pu1_pic_intra_flag |= (u4_mask << (((x0) / 8) % 8));
1407                 pu1_pic_intra_flag += numbytes_row;
1408             }
1409         }
1410 
1411         ps_codec->s_parse.s_cu.i4_pred_mode = pred_mode;
1412         intra_split_flag = 0;
1413         if((PRED_MODE_INTRA != pred_mode) ||
1414                         is_mincb)
1415         {
1416             UWORD32 bin;
1417             if(PRED_MODE_INTRA == pred_mode)
1418             {
1419                 TRACE_CABAC_CTXT("part_mode", ps_cabac->u4_range, IHEVC_CAB_PART_MODE);
1420                 bin = ihevcd_cabac_decode_bin(ps_cabac, ps_bitstrm, IHEVC_CAB_PART_MODE);
1421                 part_mode = (bin) ? PART_2Nx2N : PART_NxN;
1422             }
1423             else
1424             {
1425                 WORD32 amp_enabled = ps_sps->i1_amp_enabled_flag;
1426 
1427                 UWORD32 u4_max_bin_cnt = 0;
1428 
1429 
1430 
1431                 if(amp_enabled && !is_mincb)
1432                 {
1433                     part_mode = ihevcd_parse_part_mode_amp(ps_cabac, ps_bitstrm);
1434                 }
1435                 else
1436                 {
1437                     WORD32 ctxt_inc = IHEVC_CAB_PART_MODE;
1438 
1439                     u4_max_bin_cnt = 2;
1440                     if((is_mincb) && (cb_size > 8))
1441                     {
1442                         u4_max_bin_cnt++;
1443                     }
1444 
1445                     part_mode = -1;
1446                     TRACE_CABAC_CTXT("part_mode", ps_cabac->u4_range, IHEVC_CAB_PART_MODE);
1447                     do
1448                     {
1449                         bin = ihevcd_cabac_decode_bin(ps_cabac, ps_bitstrm,
1450                                                       ctxt_inc++);
1451                         part_mode++;
1452                     }while(--u4_max_bin_cnt && !bin);
1453 
1454                     /* If the last bin was zero, then increment part mode by 1 */
1455                     if(!bin)
1456                         part_mode++;
1457                 }
1458 
1459 
1460             }
1461 
1462             AEV_TRACE("part_mode", part_mode, ps_cabac->u4_range);
1463 
1464         }
1465         else
1466         {
1467             part_mode = 0;
1468             intra_split_flag = 0;
1469         }
1470         ps_codec->s_parse.s_cu.i4_part_mode = part_mode;
1471 
1472         if((PRED_MODE_INTRA == ps_codec->s_parse.s_cu.i4_pred_mode) &&
1473                         (PART_NxN == ps_codec->s_parse.s_cu.i4_part_mode))
1474         {
1475             intra_split_flag = 1;
1476         }
1477         ps_codec->s_parse.s_cu.i4_part_mode = part_mode;
1478         ps_codec->s_parse.s_cu.i4_intra_split_flag = intra_split_flag;
1479         if(pred_mode == PRED_MODE_INTRA)
1480         {
1481             ps_codec->s_parse.i4_cu_pcm_flag = 0;
1482             ihevcd_parse_coding_unit_intra(ps_codec, x0, y0, log2_cb_size);
1483             pcm_flag = ps_codec->s_parse.i4_cu_pcm_flag;
1484 
1485         }
1486         else
1487         {
1488             if(part_mode == PART_2Nx2N)
1489             {
1490                 pu_t *ps_pu = ps_codec->s_parse.ps_pu;
1491                 ihevcd_parse_prediction_unit(ps_codec, x0, y0, cb_size, cb_size);
1492                 ps_pu->b2_part_idx = 0;
1493             }
1494             else if(part_mode == PART_2NxN)
1495             {
1496                 pu_t *ps_pu = ps_codec->s_parse.ps_pu;
1497 
1498                 ihevcd_parse_prediction_unit(ps_codec, x0, y0, cb_size, cb_size / 2);
1499                 ps_pu->b2_part_idx = 0;
1500 
1501                 ps_pu = ps_codec->s_parse.ps_pu;
1502                 ihevcd_parse_prediction_unit(ps_codec, x0, y0 + (cb_size / 2), cb_size, cb_size / 2);
1503 
1504                 ps_pu->b2_part_idx = 1;
1505             }
1506             else if(part_mode == PART_Nx2N)
1507             {
1508                 pu_t *ps_pu = ps_codec->s_parse.ps_pu;
1509                 ihevcd_parse_prediction_unit(ps_codec, x0, y0, cb_size / 2, cb_size);
1510                 ps_pu->b2_part_idx = 0;
1511                 ps_pu = ps_codec->s_parse.ps_pu;
1512                 ihevcd_parse_prediction_unit(ps_codec, x0 + (cb_size / 2), y0, cb_size / 2, cb_size);
1513 
1514                 ps_pu->b2_part_idx = 1;
1515             }
1516             else if(part_mode == PART_2NxnU)
1517             {
1518                 pu_t *ps_pu = ps_codec->s_parse.ps_pu;
1519                 ihevcd_parse_prediction_unit(ps_codec, x0, y0, cb_size, cb_size / 4);
1520                 ps_pu->b2_part_idx = 0;
1521                 ps_pu = ps_codec->s_parse.ps_pu;
1522                 ihevcd_parse_prediction_unit(ps_codec, x0, y0 + (cb_size / 4), cb_size, cb_size * 3 / 4);
1523 
1524                 ps_pu->b2_part_idx = 1;
1525             }
1526             else if(part_mode == PART_2NxnD)
1527             {
1528                 pu_t *ps_pu = ps_codec->s_parse.ps_pu;
1529                 ihevcd_parse_prediction_unit(ps_codec, x0, y0, cb_size, cb_size * 3 / 4);
1530                 ps_pu->b2_part_idx = 0;
1531                 ps_pu = ps_codec->s_parse.ps_pu;
1532                 ihevcd_parse_prediction_unit(ps_codec, x0, y0 + (cb_size * 3 / 4), cb_size, cb_size / 4);
1533 
1534                 ps_pu->b2_part_idx = 1;
1535             }
1536             else if(part_mode == PART_nLx2N)
1537             {
1538                 pu_t *ps_pu = ps_codec->s_parse.ps_pu;
1539                 ihevcd_parse_prediction_unit(ps_codec, x0, y0, cb_size / 4, cb_size);
1540                 ps_pu->b2_part_idx = 0;
1541                 ps_pu = ps_codec->s_parse.ps_pu;
1542                 ihevcd_parse_prediction_unit(ps_codec, x0 + (cb_size / 4), y0, cb_size * 3 / 4, cb_size);
1543 
1544                 ps_pu->b2_part_idx = 1;
1545             }
1546             else if(part_mode == PART_nRx2N)
1547             {
1548                 pu_t *ps_pu = ps_codec->s_parse.ps_pu;
1549                 ihevcd_parse_prediction_unit(ps_codec, x0, y0, cb_size * 3 / 4, cb_size);
1550                 ps_pu->b2_part_idx = 0;
1551                 ps_pu = ps_codec->s_parse.ps_pu;
1552                 ihevcd_parse_prediction_unit(ps_codec, x0 + (cb_size * 3 / 4), y0, cb_size / 4, cb_size);
1553                 ps_pu->b2_part_idx = 1;
1554             }
1555             else
1556             { /* PART_NxN */
1557                 pu_t *ps_pu = ps_codec->s_parse.ps_pu;
1558 
1559                 ihevcd_parse_prediction_unit(ps_codec, x0, y0, cb_size / 2, cb_size / 2);
1560                 ps_pu->b2_part_idx = 0;
1561                 ps_pu = ps_codec->s_parse.ps_pu;
1562                 ihevcd_parse_prediction_unit(ps_codec, x0 + (cb_size / 2), y0, cb_size / 2, cb_size / 2);
1563 
1564                 ps_pu->b2_part_idx = 1;
1565                 ps_pu = ps_codec->s_parse.ps_pu;
1566                 ihevcd_parse_prediction_unit(ps_codec, x0, y0 + (cb_size / 2), cb_size / 2, cb_size / 2);
1567 
1568                 ps_pu->b2_part_idx = 2;
1569                 ps_pu = ps_codec->s_parse.ps_pu;
1570                 ihevcd_parse_prediction_unit(ps_codec, x0 + (cb_size / 2), y0 + (cb_size / 2), cb_size / 2, cb_size / 2);
1571 
1572                 ps_pu->b2_part_idx = 3;
1573             }
1574         }
1575 
1576         if(!pcm_flag)
1577         {
1578             WORD32 no_residual_syntax_flag = 0;
1579             pu_t *ps_pu;
1580             /* Since ps_pu is incremented for each PU parsed, decrement by 1 to
1581              *  access last decoded PU
1582              */
1583             ps_pu = ps_codec->s_parse.ps_pu - 1;
1584             if((PRED_MODE_INTRA != pred_mode) &&
1585                             (!((part_mode == PART_2Nx2N) && ps_pu->b1_merge_flag)))
1586             {
1587 
1588                 TRACE_CABAC_CTXT("rqt_root_cbf", ps_cabac->u4_range, IHEVC_CAB_NORES_IDX);
1589                 no_residual_syntax_flag = ihevcd_cabac_decode_bin(ps_cabac,
1590                                                                   ps_bitstrm,
1591                                                                   IHEVC_CAB_NORES_IDX);
1592 
1593                 AEV_TRACE("rqt_root_cbf", no_residual_syntax_flag,
1594                           ps_cabac->u4_range);
1595                 /* TODO: HACK FOR COMPLIANCE WITH HM REFERENCE DECODER */
1596                 /*********************************************************/
1597                 /* currently the HM decoder expects qtroot cbf instead of */
1598                 /* no_residue_flag which has opposite meaning             */
1599                 /* This will be fixed once the software / spec is fixed   */
1600                 /*********************************************************/
1601                 no_residual_syntax_flag = 1 - no_residual_syntax_flag;
1602             }
1603 
1604             if(!no_residual_syntax_flag)
1605             {
1606 
1607                 ps_codec->s_parse.s_cu.i4_max_trafo_depth = (pred_mode == PRED_MODE_INTRA) ?
1608                                 (ps_sps->i1_max_transform_hierarchy_depth_intra + intra_split_flag) :
1609                                 (ps_sps->i1_max_transform_hierarchy_depth_inter);
1610                 ret = ihevcd_parse_transform_tree(ps_codec, x0, y0, x0, y0,
1611                                                   log2_cb_size, 0, 0,
1612                                                   ps_codec->s_parse.s_cu.ai4_intra_luma_pred_mode[0]);
1613                 RETURN_IF((IHEVCD_ERROR_T)IHEVCD_SUCCESS != ret, ret);
1614             }
1615             else
1616             {
1617                 WORD32 ctb_x_base;
1618                 WORD32 ctb_y_base;
1619 
1620                 ctb_x_base = ps_codec->s_parse.i4_ctb_x << ps_sps->i1_log2_ctb_size;
1621                 ctb_y_base = ps_codec->s_parse.i4_ctb_y << ps_sps->i1_log2_ctb_size;
1622 
1623                 ps_tu = ps_codec->s_parse.ps_tu;
1624                 ps_tu->b1_cb_cbf = 0;
1625                 ps_tu->b1_cr_cbf = 0;
1626                 ps_tu->b1_y_cbf = 0;
1627                 ps_tu->b4_pos_x = ((x0 - ctb_x_base) >> 2);
1628                 ps_tu->b4_pos_y = ((y0 - ctb_y_base) >> 2);
1629                 ps_tu->b1_transquant_bypass = 0;
1630                 ps_tu->b3_size = (log2_cb_size - 2);
1631                 ps_tu->b7_qp = ps_codec->s_parse.u4_qp;
1632                 ps_tu->b3_chroma_intra_mode_idx = INTRA_PRED_CHROMA_IDX_NONE;
1633                 ps_tu->b6_luma_intra_mode   = ps_codec->s_parse.s_cu.ai4_intra_luma_pred_mode[0];
1634 
1635                 /* Set the first TU in CU flag */
1636                 {
1637                     if((ps_codec->s_parse.s_cu.i4_pos_x << 3) == (ps_tu->b4_pos_x << 2) &&
1638                                     (ps_codec->s_parse.s_cu.i4_pos_y << 3) == (ps_tu->b4_pos_y << 2))
1639                     {
1640                         ps_tu->b1_first_tu_in_cu = 1;
1641                     }
1642                     else
1643                     {
1644                         ps_tu->b1_first_tu_in_cu = 0;
1645                     }
1646                 }
1647                 ps_codec->s_parse.ps_tu++;
1648                 ps_codec->s_parse.s_cu.i4_tu_cnt++;
1649                 ps_codec->s_parse.i4_pic_tu_idx++;
1650 
1651             }
1652         }
1653 
1654     }
1655 
1656 
1657 
1658 
1659     return ret;
1660 }
1661 
1662 
1663 
1664 
1665 /**
1666  *******************************************************************************
1667  *
1668  * @brief
1669  *  Parses Coding Quad Tree
1670  *
1671  * @par Description:
1672  *  Parses Coding Quad Tree as per Section:7.3.9.4
1673  *
1674  * @param[in] ps_codec
1675  *  Pointer to codec context
1676  *
1677  * @returns  Error from IHEVCD_ERROR_T
1678  *
1679  * @remarks
1680  *
1681  *
1682  *******************************************************************************
1683  */
ihevcd_parse_coding_quadtree(codec_t * ps_codec,WORD32 x0,WORD32 y0,WORD32 log2_cb_size,WORD32 ct_depth)1684 IHEVCD_ERROR_T ihevcd_parse_coding_quadtree(codec_t *ps_codec,
1685                                             WORD32 x0,
1686                                             WORD32 y0,
1687                                             WORD32 log2_cb_size,
1688                                             WORD32 ct_depth)
1689 {
1690     IHEVCD_ERROR_T ret = (IHEVCD_ERROR_T)IHEVCD_SUCCESS;
1691     sps_t *ps_sps;
1692     pps_t *ps_pps;
1693     WORD32 split_cu_flag;
1694     WORD32 x1, y1;
1695     WORD32 cu_pos_x;
1696     WORD32 cu_pos_y;
1697     bitstrm_t *ps_bitstrm = &ps_codec->s_parse.s_bitstrm;
1698     cab_ctxt_t *ps_cabac = &ps_codec->s_parse.s_cabac;
1699     WORD32 cb_size = 1 << log2_cb_size;
1700     ps_sps = ps_codec->s_parse.ps_sps;
1701     ps_pps = ps_codec->s_parse.ps_pps;
1702 
1703     /* Compute CU position with respect to current CTB in (8x8) units */
1704     cu_pos_x = (x0 - (ps_codec->s_parse.i4_ctb_x << ps_sps->i1_log2_ctb_size)) >> 3;
1705     cu_pos_y = (y0 - (ps_codec->s_parse.i4_ctb_y << ps_sps->i1_log2_ctb_size)) >> 3;
1706 
1707     ps_codec->s_parse.s_cu.i4_pos_x = cu_pos_x;
1708     ps_codec->s_parse.s_cu.i4_pos_y = cu_pos_y;
1709 
1710     ps_codec->s_parse.s_cu.i4_log2_cb_size = log2_cb_size;
1711 
1712     ps_codec->s_parse.i4_ct_depth = ct_depth;
1713     {
1714         UWORD32 *pu4_ct_depth_top = ps_codec->s_parse.pu4_ct_depth_top;
1715         UWORD32 u4_ct_depth_left = ps_codec->s_parse.u4_ct_depth_left;
1716         UWORD32 u4_ct_depth_top = 0;
1717         UWORD32 u4_mask;
1718         UWORD32 u4_top_mask, u4_left_mask;
1719         WORD32  ctxt_idx;
1720         UWORD32 u4_min_cu_x = x0 / 8;
1721         UWORD32 u4_min_cu_y = y0 / 8;
1722 
1723         pu4_ct_depth_top += (u4_min_cu_x / 16);
1724 
1725 
1726 
1727 
1728         if(((x0 + (1 << log2_cb_size)) <= ps_sps->i2_pic_width_in_luma_samples) &&
1729                         ((y0 + (1 << log2_cb_size)) <= ps_sps->i2_pic_height_in_luma_samples) &&
1730                         (log2_cb_size > ps_sps->i1_log2_min_coding_block_size))
1731         {
1732 
1733             ctxt_idx = IHEVC_CAB_SPLIT_CU_FLAG;
1734             /* Split cu context increment is decided based on left and top Coding tree
1735              * depth which is stored at frame level
1736              */
1737             /* Check if the CTB is in first row in the current slice or tile */
1738             if((0 != cu_pos_y) ||
1739                             ((0 != ps_codec->s_parse.i4_ctb_slice_y) &&
1740                                             (0 != ps_codec->s_parse.i4_ctb_tile_y)))
1741             {
1742                 u4_ct_depth_top = *pu4_ct_depth_top;
1743                 u4_ct_depth_top >>= ((u4_min_cu_x % 16) * 2);
1744                 u4_ct_depth_top &= 3;
1745 
1746                 if((WORD32)u4_ct_depth_top > ct_depth)
1747                     ctxt_idx++;
1748             }
1749 
1750             /* Check if the CTB is in first column in the current slice or tile */
1751             /*****************************************************************/
1752             /* If cu_pos_x is non-zero then left is available                */
1753             /* If cu_pos_x is zero then ensure both the following are true   */
1754             /*    Current CTB is not the first CTB in a tile row             */
1755             /*    Current CTB is not the first CTB in a slice                */
1756             /*****************************************************************/
1757             if((0 != cu_pos_x) ||
1758                             (((0 != ps_codec->s_parse.i4_ctb_slice_x) || (0 != ps_codec->s_parse.i4_ctb_slice_y)) &&
1759                                             (0 != ps_codec->s_parse.i4_ctb_tile_x)))
1760             {
1761                 u4_ct_depth_left >>= ((u4_min_cu_y % 16) * 2);
1762                 u4_ct_depth_left &= 3;
1763                 if((WORD32)u4_ct_depth_left > ct_depth)
1764                     ctxt_idx++;
1765             }
1766             TRACE_CABAC_CTXT("split_cu_flag", ps_cabac->u4_range, ctxt_idx);
1767             split_cu_flag = ihevcd_cabac_decode_bin(ps_cabac, ps_bitstrm, ctxt_idx);
1768             AEV_TRACE("split_cu_flag", split_cu_flag, ps_cabac->u4_range);
1769         }
1770         else
1771         {
1772             if(log2_cb_size > ps_sps->i1_log2_min_coding_block_size)
1773                 split_cu_flag = 1;
1774             else
1775                 split_cu_flag = 0;
1776         }
1777 
1778         if(0 == split_cu_flag)
1779         {
1780             /* Update top ct_depth */
1781             u4_ct_depth_top = *pu4_ct_depth_top;
1782             /* Since Max cb_size is 64, maximum of 8 bits will be set or reset */
1783             /* Also since Coding block will be within 64x64 grid, only 8bits within a WORD32
1784              * need to be updated. These 8 bits will not cross 8 bit boundaries
1785              */
1786             u4_mask = DUP_LSB_11(cb_size / 8);
1787 
1788             u4_top_mask = u4_mask << ((u4_min_cu_x % 16) * 2);
1789             u4_ct_depth_top &= ~u4_top_mask;
1790 
1791             if(ct_depth)
1792             {
1793                 u4_top_mask = gau4_ct_depth_mask[ct_depth] & u4_mask;
1794 
1795                 u4_top_mask = u4_top_mask << ((u4_min_cu_x % 16) * 2);
1796                 u4_ct_depth_top |= u4_top_mask;
1797             }
1798 
1799             *pu4_ct_depth_top = u4_ct_depth_top;
1800 
1801             /* Update left ct_depth */
1802             u4_ct_depth_left = ps_codec->s_parse.u4_ct_depth_left;
1803 
1804             u4_left_mask = u4_mask << ((u4_min_cu_y % 16) * 2);
1805 
1806             u4_ct_depth_left &= ~u4_left_mask;
1807             if(ct_depth)
1808             {
1809                 u4_left_mask = gau4_ct_depth_mask[ct_depth] & u4_mask;
1810 
1811                 u4_left_mask = u4_left_mask << ((u4_min_cu_y % 16) * 2);
1812                 u4_ct_depth_left |= u4_left_mask;
1813             }
1814 
1815             ps_codec->s_parse.u4_ct_depth_left = u4_ct_depth_left;
1816         }
1817     }
1818     if((ps_pps->i1_cu_qp_delta_enabled_flag) &&
1819                     (log2_cb_size >= ps_pps->i1_log2_min_cu_qp_delta_size))
1820     {
1821         ps_codec->s_parse.i4_is_cu_qp_delta_coded = 0;
1822         ps_codec->s_parse.i4_cu_qp_delta = 0;
1823     }
1824     if(split_cu_flag)
1825     {
1826         x1 = x0 + ((1 << log2_cb_size) >> 1);
1827         y1 = y0 + ((1 << log2_cb_size) >> 1);
1828 
1829         ret = ihevcd_parse_coding_quadtree(ps_codec, x0, y0, log2_cb_size - 1, ct_depth + 1);
1830         RETURN_IF((IHEVCD_ERROR_T)IHEVCD_SUCCESS != ret, ret);
1831 
1832         /* At frame boundaries coding quadtree nodes are sent only if they fall within the frame */
1833         if(x1 < ps_sps->i2_pic_width_in_luma_samples)
1834         {
1835             ret = ihevcd_parse_coding_quadtree(ps_codec, x1, y0, log2_cb_size - 1, ct_depth + 1);
1836             RETURN_IF((IHEVCD_ERROR_T)IHEVCD_SUCCESS != ret, ret);
1837         }
1838 
1839         if(y1 < ps_sps->i2_pic_height_in_luma_samples)
1840         {
1841             ret = ihevcd_parse_coding_quadtree(ps_codec, x0, y1, log2_cb_size - 1, ct_depth + 1);
1842             RETURN_IF((IHEVCD_ERROR_T)IHEVCD_SUCCESS != ret, ret);
1843         }
1844 
1845         if((x1 < ps_sps->i2_pic_width_in_luma_samples) &&
1846                         (y1 < ps_sps->i2_pic_height_in_luma_samples))
1847         {
1848             ret = ihevcd_parse_coding_quadtree(ps_codec, x1, y1, log2_cb_size - 1, ct_depth + 1);
1849             RETURN_IF((IHEVCD_ERROR_T)IHEVCD_SUCCESS != ret, ret);
1850         }
1851     }
1852     else
1853     {
1854         /* Set current group QP if current CU is aligned with the group */
1855         {
1856             WORD32 cu_pos_x = ps_codec->s_parse.s_cu.i4_pos_x << 3;
1857             WORD32 cu_pos_y = ps_codec->s_parse.s_cu.i4_pos_y << 3;
1858 
1859             WORD32 qpg_x = (cu_pos_x - (cu_pos_x & ((1 << ps_pps->i1_log2_min_cu_qp_delta_size) - 1)));
1860             WORD32 qpg_y = (cu_pos_y - (cu_pos_y & ((1 << ps_pps->i1_log2_min_cu_qp_delta_size) - 1)));
1861 
1862             if((cu_pos_x == qpg_x) &&
1863                             (cu_pos_y == qpg_y))
1864             {
1865                 ps_codec->s_parse.u4_qpg = ps_codec->s_parse.u4_qp;
1866 
1867                 ps_codec->s_parse.s_cu.i4_cu_qp_delta = 0;
1868 
1869             }
1870         }
1871 
1872         ret = ihevcd_parse_coding_unit(ps_codec, x0, y0, log2_cb_size);
1873         RETURN_IF((IHEVCD_ERROR_T)IHEVCD_SUCCESS != ret, ret);
1874 
1875         if(ps_pps->i1_cu_qp_delta_enabled_flag)
1876         {
1877             WORD32 qp_pred, qp_left, qp_top;
1878             WORD32 cu_pos_x;
1879             WORD32 cu_pos_y;
1880             WORD32 qpg_x;
1881             WORD32 qpg_y;
1882             WORD32 i, j;
1883             WORD32 qp;
1884             WORD32 cur_cu_offset;
1885             tu_t *ps_tu = ps_codec->s_parse.ps_tu;
1886             WORD32 cb_size = 1 << ps_codec->s_parse.s_cu.i4_log2_cb_size;
1887 
1888             cu_pos_x = ps_codec->s_parse.s_cu.i4_pos_x << 3;
1889             cu_pos_y = ps_codec->s_parse.s_cu.i4_pos_y << 3;
1890 
1891             qpg_x = (cu_pos_x - (cu_pos_x & ((1 << ps_pps->i1_log2_min_cu_qp_delta_size) - 1))) >> 3;
1892             qpg_y = (cu_pos_y - (cu_pos_y & ((1 << ps_pps->i1_log2_min_cu_qp_delta_size) - 1))) >> 3;
1893 
1894             /*previous coded Qp*/
1895             qp_left = ps_codec->s_parse.u4_qpg;
1896             qp_top = ps_codec->s_parse.u4_qpg;
1897 
1898             if(qpg_x > 0)
1899             {
1900                 qp_left = ps_codec->s_parse.ai1_8x8_cu_qp[qpg_x - 1 + (qpg_y * 8)];
1901             }
1902             if(qpg_y > 0)
1903             {
1904                 qp_top = ps_codec->s_parse.ai1_8x8_cu_qp[qpg_x + ((qpg_y - 1) * 8)];
1905             }
1906 
1907             qp_pred = (qp_left + qp_top + 1) >> 1;
1908             /* Since qp_pred + ps_codec->s_parse.s_cu.i4_cu_qp_delta can be negative,
1909             52 is added before taking modulo 52 */
1910             qp = (qp_pred + ps_codec->s_parse.s_cu.i4_cu_qp_delta + 52) % 52;
1911 
1912             cur_cu_offset = (cu_pos_x >> 3) + cu_pos_y;
1913             for(i = 0; i < (cb_size >> 3); i++)
1914             {
1915                 for(j = 0; j < (cb_size >> 3); j++)
1916                 {
1917                     ps_codec->s_parse.ai1_8x8_cu_qp[cur_cu_offset + (i * 8) + j] = qp;
1918                 }
1919             }
1920 
1921             ps_codec->s_parse.u4_qp = qp;
1922             ps_codec->s_parse.s_cu.i4_qp = qp;
1923 
1924 
1925             /* When change in QP is signaled, update the QP in TUs that are already parsed in the CU */
1926             {
1927                 tu_t *ps_tu_tmp;
1928                 ps_tu_tmp = ps_tu - ps_codec->s_parse.s_cu.i4_tu_cnt;
1929                 ps_tu->b7_qp = ps_codec->s_parse.u4_qp;
1930                 while(ps_tu_tmp != ps_tu)
1931                 {
1932                     ps_tu_tmp->b7_qp = ps_codec->s_parse.u4_qp;
1933 
1934                     ps_tu_tmp++;
1935                 }
1936             }
1937             if(ps_codec->s_parse.s_cu.i4_cu_qp_delta)
1938             {
1939                 WORD32 ctb_indx;
1940                 ctb_indx = ps_codec->s_parse.i4_ctb_x + ps_sps->i2_pic_wd_in_ctb * ps_codec->s_parse.i4_ctb_y;
1941                 ps_codec->s_parse.s_bs_ctxt.pu1_pic_qp_const_in_ctb[ctb_indx >> 3] &= (~(1 << (ctb_indx & 7)));
1942             }
1943 
1944         }
1945 
1946     }
1947 
1948 
1949 
1950 
1951     return ret;
1952 }
1953 
1954 
1955 /**
1956  *******************************************************************************
1957  *
1958  * @brief
1959  *  Parses SAO (Sample adaptive offset syntax)
1960  *
1961  * @par Description:
1962  *  Parses SAO (Sample adaptive offset syntax) as per  Section:7.3.9.3
1963  *
1964  * @param[in] ps_codec
1965  *  Pointer to codec context
1966  *
1967  * @returns  Error from IHEVCD_ERROR_T
1968  *
1969  * @remarks
1970  *
1971  *
1972  *******************************************************************************
1973  */
ihevcd_parse_sao(codec_t * ps_codec)1974 IHEVCD_ERROR_T  ihevcd_parse_sao(codec_t *ps_codec)
1975 {
1976     IHEVCD_ERROR_T ret = (IHEVCD_ERROR_T)IHEVCD_SUCCESS;
1977     sps_t *ps_sps;
1978     sao_t *ps_sao;
1979     WORD32 rx;
1980     WORD32 ry;
1981     WORD32 value;
1982     bitstrm_t *ps_bitstrm = &ps_codec->s_parse.s_bitstrm;
1983     WORD32 sao_merge_left_flag;
1984     WORD32 sao_merge_up_flag;
1985     slice_header_t *ps_slice_hdr;
1986     cab_ctxt_t *ps_cabac = &ps_codec->s_parse.s_cabac;
1987     WORD32 ctxt_idx;
1988 
1989     ps_slice_hdr = ps_codec->s_parse.ps_slice_hdr_base;
1990     ps_slice_hdr += (ps_codec->s_parse.i4_cur_slice_idx & (MAX_SLICE_HDR_CNT - 1));
1991 
1992     ps_sps = (ps_codec->s_parse.ps_sps);
1993     rx = ps_codec->s_parse.i4_ctb_x;
1994     ry = ps_codec->s_parse.i4_ctb_y;
1995 
1996     ps_sao = ps_codec->s_parse.ps_pic_sao + rx + ry * ps_sps->i2_pic_wd_in_ctb;
1997 
1998     /* Default values */
1999     ps_sao->b3_y_type_idx = 0;
2000     ps_sao->b3_cb_type_idx = 0;
2001     ps_sao->b3_cr_type_idx = 0;
2002 
2003     UNUSED(value);
2004     ctxt_idx = IHEVC_CAB_SAO_MERGE;
2005     sao_merge_left_flag = 0;
2006     sao_merge_up_flag = 0;
2007     if(rx > 0)
2008     {
2009         /*TODO:Implemented only for slice. condition for tile is not tested*/
2010         if(((0 != ps_codec->s_parse.i4_ctb_slice_x) || (0 != ps_codec->s_parse.i4_ctb_slice_y)) &&
2011                         (0 != ps_codec->s_parse.i4_ctb_tile_x))
2012         {
2013 
2014             TRACE_CABAC_CTXT("sao_merge_flag", ps_cabac->u4_range, ctxt_idx);
2015             sao_merge_left_flag = ihevcd_cabac_decode_bin(ps_cabac,
2016                                                           ps_bitstrm,
2017                                                           ctxt_idx);
2018             AEV_TRACE("sao_merge_flag", sao_merge_left_flag, ps_cabac->u4_range);
2019         }
2020 
2021     }
2022     if(ry > 0 && !sao_merge_left_flag)
2023     {
2024         if((ps_codec->s_parse.i4_ctb_slice_y > 0) && (ps_codec->s_parse.i4_ctb_tile_y > 0))
2025         {
2026             TRACE_CABAC_CTXT("sao_merge_flag", ps_cabac->u4_range, ctxt_idx);
2027             sao_merge_up_flag = ihevcd_cabac_decode_bin(ps_cabac,
2028                                                         ps_bitstrm,
2029                                                         ctxt_idx);
2030             AEV_TRACE("sao_merge_flag", sao_merge_up_flag, ps_cabac->u4_range);
2031         }
2032     }
2033     ctxt_idx = IHEVC_CAB_SAO_TYPE;
2034 
2035     if(sao_merge_left_flag)
2036     {
2037         *ps_sao = *(ps_sao - 1);
2038     }
2039     else if(sao_merge_up_flag)
2040     {
2041         *ps_sao = *(ps_sao - ps_sps->i2_pic_wd_in_ctb);
2042     }
2043     else // if(!sao_merge_up_flag && !sao_merge_left_flag)
2044     {
2045         WORD32 c_idx;
2046         WORD32 sao_type_idx = 0;
2047         for(c_idx = 0; c_idx < 3; c_idx++)
2048         {
2049             if((ps_slice_hdr->i1_slice_sao_luma_flag && c_idx == 0) || (ps_slice_hdr->i1_slice_sao_chroma_flag && c_idx > 0))
2050             {
2051 
2052 
2053                 /* sao_type_idx will be same for c_idx == 1 and c_idx == 2 - hence not initialized to zero for c_idx == 2*/
2054 
2055                 if(c_idx == 0)
2056                 {
2057                     sao_type_idx = 0;
2058                     TRACE_CABAC_CTXT("sao_type_idx", ps_cabac->u4_range, ctxt_idx);
2059                     sao_type_idx = ihevcd_cabac_decode_bin(ps_cabac, ps_bitstrm, ctxt_idx);
2060 
2061                     if(sao_type_idx)
2062                     {
2063                         sao_type_idx += ihevcd_cabac_decode_bypass_bin(ps_cabac, ps_bitstrm);
2064                     }
2065                     AEV_TRACE("sao_type_idx", sao_type_idx,  ps_cabac->u4_range);
2066 
2067                     ps_sao->b3_y_type_idx = sao_type_idx;
2068                 }
2069                 if(c_idx == 1)
2070                 {
2071                     sao_type_idx = 0;
2072                     TRACE_CABAC_CTXT("sao_type_idx", ps_cabac->u4_range, ctxt_idx);
2073                     sao_type_idx = ihevcd_cabac_decode_bin(ps_cabac, ps_bitstrm, ctxt_idx);
2074                     if(sao_type_idx)
2075                     {
2076                         sao_type_idx += ihevcd_cabac_decode_bypass_bin(ps_cabac, ps_bitstrm);
2077                     }
2078 
2079                     AEV_TRACE("sao_type_idx", sao_type_idx,  ps_cabac->u4_range);
2080 
2081                     ps_sao->b3_cb_type_idx = sao_type_idx;
2082                     ps_sao->b3_cr_type_idx = sao_type_idx;
2083                 }
2084 
2085                 if(sao_type_idx != 0)
2086                 {
2087                     WORD32 i;
2088                     WORD32 sao_offset[4];
2089                     WORD32 sao_band_position = 0;
2090                     WORD32 c_max =  (1 << (MIN(BIT_DEPTH, 10) - 5)) - 1;
2091                     for(i = 0; i < 4; i++)
2092                     {
2093                         sao_offset[i] = ihevcd_cabac_decode_bypass_bins_tunary(ps_cabac, ps_bitstrm, c_max);
2094                         AEV_TRACE("sao_offset_abs", sao_offset[i], ps_cabac->u4_range);
2095 
2096                         if((2 == sao_type_idx) && (i > 1))
2097                         {
2098                             sao_offset[i] = -sao_offset[i];
2099                         }
2100                     }
2101 
2102                     if(sao_type_idx == 1)
2103                     {
2104                         for(i = 0; i < 4; i++)
2105                         {
2106                             if(sao_offset[i] != 0)
2107                             {
2108                                 value = ihevcd_cabac_decode_bypass_bin(ps_cabac, ps_bitstrm);
2109                                 AEV_TRACE("sao_offset_sign", value, ps_cabac->u4_range);
2110 
2111                                 if(value)
2112                                 {
2113                                     sao_offset[i] = -sao_offset[i];
2114                                 }
2115                             }
2116                         }
2117                         value = ihevcd_cabac_decode_bypass_bins(ps_cabac, ps_bitstrm, 5);
2118                         AEV_TRACE("sao_band_position", value, ps_cabac->u4_range);
2119 
2120                         sao_band_position = value;
2121                     }
2122                     else
2123                     {
2124                         if(c_idx == 0)
2125                         {
2126                             value = ihevcd_cabac_decode_bypass_bins(ps_cabac, ps_bitstrm, 2);
2127                             AEV_TRACE("sao_eo_class", value, ps_cabac->u4_range);
2128 
2129                             ps_sao->b3_y_type_idx += value;
2130                         }
2131 
2132                         if(c_idx == 1)
2133                         {
2134                             value = ihevcd_cabac_decode_bypass_bins(ps_cabac, ps_bitstrm, 2);
2135                             AEV_TRACE("sao_eo_class", value, ps_cabac->u4_range);
2136 
2137                             ps_sao->b3_cb_type_idx += value;
2138                             ps_sao->b3_cr_type_idx += value;
2139                         }
2140                     }
2141 
2142                     if(0 == c_idx)
2143                     {
2144                         ps_sao->b4_y_offset_1 = sao_offset[0];
2145                         ps_sao->b4_y_offset_2 = sao_offset[1];
2146                         ps_sao->b4_y_offset_3 = sao_offset[2];
2147                         ps_sao->b4_y_offset_4 = sao_offset[3];
2148 
2149                         ps_sao->b5_y_band_pos = sao_band_position;
2150                     }
2151                     else if(1 == c_idx)
2152                     {
2153                         ps_sao->b4_cb_offset_1 = sao_offset[0];
2154                         ps_sao->b4_cb_offset_2 = sao_offset[1];
2155                         ps_sao->b4_cb_offset_3 = sao_offset[2];
2156                         ps_sao->b4_cb_offset_4 = sao_offset[3];
2157 
2158                         ps_sao->b5_cb_band_pos = sao_band_position;
2159                     }
2160                     else // 2 == c_idx
2161                     {
2162                         ps_sao->b4_cr_offset_1 = sao_offset[0];
2163                         ps_sao->b4_cr_offset_2 = sao_offset[1];
2164                         ps_sao->b4_cr_offset_3 = sao_offset[2];
2165                         ps_sao->b4_cr_offset_4 = sao_offset[3];
2166 
2167                         ps_sao->b5_cr_band_pos = sao_band_position;
2168                     }
2169                 }
2170             }
2171         }
2172     }
2173 
2174     return ret;
2175 }
2176 /**
2177  *******************************************************************************
2178  *
2179  * @brief
2180  *  Set ctb skip
2181  *
2182  * @par Description:
2183  *  During error, sets tu and pu params of a ctb as skip.
2184  *
2185  * @param[in] ps_codec
2186  *  Pointer to codec context
2187  *
2188  * @returns  None
2189  *
2190  * @remarks
2191  *
2192  *
2193  *******************************************************************************
2194  */
ihevcd_set_ctb_skip(codec_t * ps_codec)2195 void ihevcd_set_ctb_skip(codec_t *ps_codec)
2196 {
2197     tu_t *ps_tu;
2198     pu_t *ps_pu;
2199     sps_t *ps_sps = ps_codec->s_parse.ps_sps;
2200     WORD32 ctb_size = 1 << ps_sps->i1_log2_ctb_size;
2201     WORD32 ctb_skip_wd, ctb_skip_ht;
2202     WORD32 rows_remaining, cols_remaining;
2203     WORD32 tu_abs_x, tu_abs_y;
2204     WORD32 numbytes_row =  (ps_sps->i2_pic_width_in_luma_samples + 63) / 64;
2205     UWORD8 *pu1_pic_intra_flag;
2206     UWORD32 u4_mask;
2207     WORD32 pu_x,pu_y;
2208 
2209     /* Set pu wd and ht based on whether the ctb is complete or not */
2210     rows_remaining = ps_sps->i2_pic_height_in_luma_samples
2211                     - (ps_codec->s_parse.i4_ctb_y << ps_sps->i1_log2_ctb_size);
2212     ctb_skip_ht = MIN(ctb_size, rows_remaining);
2213 
2214     cols_remaining = ps_sps->i2_pic_width_in_luma_samples
2215                     - (ps_codec->s_parse.i4_ctb_x << ps_sps->i1_log2_ctb_size);
2216     ctb_skip_wd = MIN(ctb_size, cols_remaining);
2217 
2218     ps_codec->s_parse.s_cu.i4_pred_mode = PRED_MODE_SKIP;
2219     ps_codec->s_parse.s_cu.i4_part_mode = PART_2Nx2N;
2220 
2221     for (pu_y = 0; pu_y < ctb_skip_ht ; pu_y += MIN_CU_SIZE)
2222     {
2223         for (pu_x = 0; pu_x < ctb_skip_wd ; pu_x += MIN_CU_SIZE)
2224         {
2225             ps_tu = ps_codec->s_parse.ps_tu;
2226             ps_tu->b1_cb_cbf = 0;
2227             ps_tu->b1_cr_cbf = 0;
2228             ps_tu->b1_y_cbf = 0;
2229             ps_tu->b4_pos_x = pu_x >> 2;
2230             ps_tu->b4_pos_y = pu_y >> 2;
2231             ps_tu->b1_transquant_bypass = 0;
2232             ps_tu->b3_size = 1;
2233             ps_tu->b7_qp = ps_codec->s_parse.u4_qp;
2234             ps_tu->b3_chroma_intra_mode_idx = INTRA_PRED_CHROMA_IDX_NONE;
2235             ps_tu->b6_luma_intra_mode   = INTRA_PRED_NONE;
2236             ps_tu->b1_first_tu_in_cu = 1;
2237 
2238             ps_codec->s_parse.ps_tu++;
2239             ps_codec->s_parse.s_cu.i4_tu_cnt++;
2240             ps_codec->s_parse.i4_pic_tu_idx++;
2241 
2242             tu_abs_x = (ps_codec->s_parse.i4_ctb_x << ps_sps->i1_log2_ctb_size) + pu_x;
2243             tu_abs_y = (ps_codec->s_parse.i4_ctb_y << ps_sps->i1_log2_ctb_size) + pu_y;
2244             pu1_pic_intra_flag = ps_codec->s_parse.pu1_pic_intra_flag;
2245             pu1_pic_intra_flag += (tu_abs_y >> 3) * numbytes_row;
2246             pu1_pic_intra_flag += (tu_abs_x >> 6);
2247             u4_mask = (LSB_ONES((MIN_CU_SIZE >> 3)) << (((tu_abs_x) / 8) % 8));
2248             u4_mask = ~u4_mask;
2249             *pu1_pic_intra_flag &= u4_mask;
2250 
2251             ps_pu = ps_codec->s_parse.ps_pu;
2252             ps_pu->b2_part_idx = 0;
2253             ps_pu->b4_pos_x = pu_x >> 2;
2254             ps_pu->b4_pos_y = pu_y >> 2;
2255             ps_pu->b4_wd = 1;
2256             ps_pu->b4_ht = 1;
2257             ps_pu->b1_intra_flag = 0;
2258             ps_pu->b3_part_mode = ps_codec->s_parse.s_cu.i4_part_mode;
2259             ps_pu->b1_merge_flag = 1;
2260             ps_pu->b3_merge_idx = 0;
2261 
2262             ps_codec->s_parse.ps_pu++;
2263             ps_codec->s_parse.i4_pic_pu_idx++;
2264         }
2265     }
2266 }
2267 
2268 /**
2269  *******************************************************************************
2270  *
2271  * @brief
2272  *  Parses Slice data syntax
2273  *
2274  * @par Description:
2275  *  Parses Slice data syntax as per Section:7.3.9.1
2276  *
2277  * @param[in] ps_codec
2278  *  Pointer to codec context
2279  *
2280  * @returns  Error from IHEVCD_ERROR_T
2281  *
2282  * @remarks
2283  *
2284  *
2285  *******************************************************************************
2286  */
ihevcd_parse_slice_data(codec_t * ps_codec)2287 IHEVCD_ERROR_T ihevcd_parse_slice_data(codec_t *ps_codec)
2288 {
2289 
2290     IHEVCD_ERROR_T ret = (IHEVCD_ERROR_T)IHEVCD_SUCCESS;
2291     WORD32 end_of_slice_flag = 0;
2292     sps_t *ps_sps;
2293     pps_t *ps_pps;
2294     slice_header_t *ps_slice_hdr;
2295     WORD32 end_of_pic;
2296     tile_t *ps_tile, *ps_tile_prev;
2297     WORD32 i;
2298     WORD32 ctb_addr;
2299     WORD32 tile_idx;
2300     WORD32 cabac_init_idc;
2301     WORD32 ctb_size;
2302     WORD32 num_ctb_in_row;
2303     WORD32 num_min4x4_in_ctb;
2304     WORD32 slice_qp;
2305     WORD32 slice_start_ctb_idx;
2306     WORD32 tile_start_ctb_idx;
2307 
2308 
2309     ps_slice_hdr = ps_codec->s_parse.ps_slice_hdr_base;
2310     ps_pps = ps_codec->s_parse.ps_pps_base;
2311     ps_sps = ps_codec->s_parse.ps_sps_base;
2312 
2313     /* Get current slice header, pps and sps */
2314     ps_slice_hdr += (ps_codec->s_parse.i4_cur_slice_idx & (MAX_SLICE_HDR_CNT - 1));
2315     ps_pps  += ps_slice_hdr->i1_pps_id;
2316     ps_sps  += ps_pps->i1_sps_id;
2317 
2318     if(0 != ps_codec->s_parse.i4_cur_slice_idx)
2319     {
2320         if(!ps_slice_hdr->i1_dependent_slice_flag)
2321         {
2322             ps_codec->s_parse.i4_cur_independent_slice_idx =
2323                     ps_codec->s_parse.i4_cur_slice_idx & (MAX_SLICE_HDR_CNT - 1);
2324         }
2325     }
2326 
2327 
2328     ctb_size = 1 << ps_sps->i1_log2_ctb_size;
2329     num_min4x4_in_ctb = (ctb_size / 4) * (ctb_size / 4);
2330     num_ctb_in_row = ps_sps->i2_pic_wd_in_ctb;
2331 
2332     /* Update the parse context */
2333     if(0 == ps_codec->i4_slice_error)
2334     {
2335         ps_codec->s_parse.i4_ctb_x = ps_slice_hdr->i2_ctb_x;
2336         ps_codec->s_parse.i4_ctb_y = ps_slice_hdr->i2_ctb_y;
2337     }
2338     ps_codec->s_parse.ps_pps = ps_pps;
2339     ps_codec->s_parse.ps_sps = ps_sps;
2340     ps_codec->s_parse.ps_slice_hdr = ps_slice_hdr;
2341 
2342     /* Derive Tile positions for the current CTB */
2343     /* Change this to lookup if required */
2344     ihevcd_get_tile_pos(ps_pps, ps_sps, ps_codec->s_parse.i4_ctb_x,
2345                         ps_codec->s_parse.i4_ctb_y,
2346                         &ps_codec->s_parse.i4_ctb_tile_x,
2347                         &ps_codec->s_parse.i4_ctb_tile_y,
2348                         &tile_idx);
2349     ps_codec->s_parse.ps_tile = ps_pps->ps_tile + tile_idx;
2350     ps_codec->s_parse.i4_cur_tile_idx = tile_idx;
2351     ps_tile = ps_codec->s_parse.ps_tile;
2352     if(tile_idx)
2353         ps_tile_prev = ps_tile - 1;
2354     else
2355         ps_tile_prev = ps_tile;
2356 
2357     /* If the present slice is dependent, then store the previous
2358      * independent slices' ctb x and y values for decoding process */
2359     if(0 == ps_codec->i4_slice_error)
2360     {
2361         if(1 == ps_slice_hdr->i1_dependent_slice_flag)
2362         {
2363             /*If slice is present at the start of a new tile*/
2364             if((0 == ps_codec->s_parse.i4_ctb_tile_x) && (0 == ps_codec->s_parse.i4_ctb_tile_y))
2365             {
2366                 ps_codec->s_parse.i4_ctb_slice_x = 0;
2367                 ps_codec->s_parse.i4_ctb_slice_y = 0;
2368             }
2369         }
2370 
2371         if(!ps_slice_hdr->i1_dependent_slice_flag)
2372         {
2373             ps_codec->s_parse.i4_ctb_slice_x = 0;
2374             ps_codec->s_parse.i4_ctb_slice_y = 0;
2375         }
2376     }
2377 
2378     /* Frame level initializations */
2379     if((0 == ps_codec->s_parse.i4_ctb_y) &&
2380                     (0 == ps_codec->s_parse.i4_ctb_x))
2381     {
2382         ret = ihevcd_parse_pic_init(ps_codec);
2383         RETURN_IF((ret != (IHEVCD_ERROR_T)IHEVCD_SUCCESS), ret);
2384 
2385         ps_codec->s_parse.pu4_pic_tu_idx[0] = 0;
2386         ps_codec->s_parse.pu4_pic_pu_idx[0] = 0;
2387         ps_codec->s_parse.i4_cur_independent_slice_idx = 0;
2388         ps_codec->s_parse.i4_ctb_tile_x = 0;
2389         ps_codec->s_parse.i4_ctb_tile_y = 0;
2390     }
2391 
2392     {
2393         /* Updating the poc list of current slice to ps_mv_buf */
2394         mv_buf_t *ps_mv_buf = ps_codec->s_parse.ps_cur_mv_buf;
2395 
2396         if(ps_slice_hdr->i1_num_ref_idx_l1_active != 0)
2397         {
2398             for(i = 0; i < ps_slice_hdr->i1_num_ref_idx_l1_active; i++)
2399             {
2400                 ps_mv_buf->ai4_l1_collocated_poc[(ps_codec->s_parse.i4_cur_slice_idx & (MAX_SLICE_HDR_CNT - 1))][i] = ((pic_buf_t *)ps_slice_hdr->as_ref_pic_list1[i].pv_pic_buf)->i4_abs_poc;
2401                 ps_mv_buf->ai1_l1_collocated_poc_lt[(ps_codec->s_parse.i4_cur_slice_idx & (MAX_SLICE_HDR_CNT - 1))][i] = ((pic_buf_t *)ps_slice_hdr->as_ref_pic_list1[i].pv_pic_buf)->u1_used_as_ref;
2402             }
2403         }
2404 
2405         if(ps_slice_hdr->i1_num_ref_idx_l0_active != 0)
2406         {
2407             for(i = 0; i < ps_slice_hdr->i1_num_ref_idx_l0_active; i++)
2408             {
2409                 ps_mv_buf->ai4_l0_collocated_poc[(ps_codec->s_parse.i4_cur_slice_idx & (MAX_SLICE_HDR_CNT - 1))][i] = ((pic_buf_t *)ps_slice_hdr->as_ref_pic_list0[i].pv_pic_buf)->i4_abs_poc;
2410                 ps_mv_buf->ai1_l0_collocated_poc_lt[(ps_codec->s_parse.i4_cur_slice_idx & (MAX_SLICE_HDR_CNT - 1))][i] = ((pic_buf_t *)ps_slice_hdr->as_ref_pic_list0[i].pv_pic_buf)->u1_used_as_ref;
2411             }
2412         }
2413     }
2414 
2415     /*Initialize the low delay flag at the beginning of every slice*/
2416     if((0 == ps_codec->s_parse.i4_ctb_slice_x) || (0 == ps_codec->s_parse.i4_ctb_slice_y))
2417     {
2418         /* Lowdelay flag */
2419         WORD32 cur_poc, ref_list_poc, flag = 1;
2420         cur_poc = ps_slice_hdr->i4_abs_pic_order_cnt;
2421         for(i = 0; i < ps_slice_hdr->i1_num_ref_idx_l0_active; i++)
2422         {
2423             ref_list_poc = ((mv_buf_t *)ps_slice_hdr->as_ref_pic_list0[i].pv_mv_buf)->i4_abs_poc;
2424             if(ref_list_poc > cur_poc)
2425             {
2426                 flag = 0;
2427                 break;
2428             }
2429         }
2430         if(flag && (ps_slice_hdr->i1_slice_type == BSLICE))
2431         {
2432             for(i = 0; i < ps_slice_hdr->i1_num_ref_idx_l1_active; i++)
2433             {
2434                 ref_list_poc = ((mv_buf_t *)ps_slice_hdr->as_ref_pic_list1[i].pv_mv_buf)->i4_abs_poc;
2435                 if(ref_list_poc > cur_poc)
2436                 {
2437                     flag = 0;
2438                     break;
2439                 }
2440             }
2441         }
2442         ps_slice_hdr->i1_low_delay_flag = flag;
2443     }
2444 
2445     /* initialize the cabac init idc based on slice type */
2446     if(ps_slice_hdr->i1_slice_type == ISLICE)
2447     {
2448         cabac_init_idc = 0;
2449     }
2450     else if(ps_slice_hdr->i1_slice_type == PSLICE)
2451     {
2452         cabac_init_idc = ps_slice_hdr->i1_cabac_init_flag ? 2 : 1;
2453     }
2454     else
2455     {
2456         cabac_init_idc = ps_slice_hdr->i1_cabac_init_flag ? 1 : 2;
2457     }
2458 
2459     slice_qp = ps_slice_hdr->i1_slice_qp_delta + ps_pps->i1_pic_init_qp;
2460     slice_qp = CLIP3(slice_qp, 0, 51);
2461 
2462     /*Update QP value for every indepndent slice or for every dependent slice that begins at the start of a new tile*/
2463     if((0 == ps_slice_hdr->i1_dependent_slice_flag) ||
2464                     ((1 == ps_slice_hdr->i1_dependent_slice_flag) && ((0 == ps_codec->s_parse.i4_ctb_tile_x) && (0 == ps_codec->s_parse.i4_ctb_tile_y))))
2465     {
2466         ps_codec->s_parse.u4_qp = slice_qp;
2467     }
2468 
2469     /*Cabac init at the beginning of a slice*/
2470     //If the slice is a dependent slice, not present at the start of a tile
2471     if(0 == ps_codec->i4_slice_error)
2472     {
2473         if((1 == ps_slice_hdr->i1_dependent_slice_flag) && (!((ps_codec->s_parse.i4_ctb_tile_x == 0) && (ps_codec->s_parse.i4_ctb_tile_y == 0))))
2474         {
2475             if((0 == ps_pps->i1_entropy_coding_sync_enabled_flag) || (ps_pps->i1_entropy_coding_sync_enabled_flag && (0 != ps_codec->s_parse.i4_ctb_x)))
2476             {
2477                 ihevcd_cabac_reset(&ps_codec->s_parse.s_cabac,
2478                                    &ps_codec->s_parse.s_bitstrm);
2479             }
2480         }
2481         else if((0 == ps_pps->i1_entropy_coding_sync_enabled_flag) || (ps_pps->i1_entropy_coding_sync_enabled_flag && (0 != ps_codec->s_parse.i4_ctb_x)))
2482         {
2483             ret = ihevcd_cabac_init(&ps_codec->s_parse.s_cabac,
2484                                     &ps_codec->s_parse.s_bitstrm,
2485                                     slice_qp,
2486                                     cabac_init_idc,
2487                                     &gau1_ihevc_cab_ctxts[cabac_init_idc][slice_qp][0]);
2488             if(ret != (IHEVCD_ERROR_T)IHEVCD_SUCCESS)
2489             {
2490                 ps_codec->i4_slice_error = 1;
2491                 end_of_slice_flag = 1;
2492                 ret = (IHEVCD_ERROR_T)IHEVCD_SUCCESS;
2493             }
2494         }
2495     }
2496 
2497 
2498     do
2499     {
2500 
2501         {
2502             WORD32 cur_ctb_idx = ps_codec->s_parse.i4_ctb_x
2503                             + ps_codec->s_parse.i4_ctb_y * (ps_sps->i2_pic_wd_in_ctb);
2504             if(1 == ps_codec->i4_num_cores && 0 == cur_ctb_idx % RESET_TU_BUF_NCTB)
2505             {
2506                 ps_codec->s_parse.ps_tu = ps_codec->s_parse.ps_pic_tu;
2507                 ps_codec->s_parse.i4_pic_tu_idx = 0;
2508             }
2509         }
2510 
2511         end_of_pic = 0;
2512         /* Section:7.3.7 Coding tree unit syntax */
2513         /* coding_tree_unit() inlined here */
2514         /* If number of cores is greater than 1, then add job to the queue */
2515         //TODO: Dual core implementation might need a different algo for better load balancing
2516         /* At the start of ctb row parsing in a tile, queue a job for processing the current tile row */
2517         ps_codec->s_parse.i4_ctb_num_pcm_blks = 0;
2518 
2519 
2520         /*At the beginning of each tile-which is not the beginning of a slice, cabac context must be initialized.
2521          * Hence, check for the tile beginning here */
2522         if(((0 == ps_codec->s_parse.i4_ctb_tile_x) && (0 == ps_codec->s_parse.i4_ctb_tile_y))
2523                         && (!((ps_tile->u1_pos_x == 0) && (ps_tile->u1_pos_y == 0)))
2524                         && (!((0 == ps_codec->s_parse.i4_ctb_slice_x) && (0 == ps_codec->s_parse.i4_ctb_slice_y))))
2525         {
2526             slice_qp = ps_slice_hdr->i1_slice_qp_delta + ps_pps->i1_pic_init_qp;
2527             slice_qp = CLIP3(slice_qp, 0, 51);
2528             ps_codec->s_parse.u4_qp = slice_qp;
2529 
2530             ihevcd_get_tile_pos(ps_pps, ps_sps, ps_codec->s_parse.i4_ctb_x,
2531                                 ps_codec->s_parse.i4_ctb_y,
2532                                 &ps_codec->s_parse.i4_ctb_tile_x,
2533                                 &ps_codec->s_parse.i4_ctb_tile_y,
2534                                 &tile_idx);
2535 
2536             ps_codec->s_parse.ps_tile = ps_pps->ps_tile + tile_idx;
2537             ps_codec->s_parse.i4_cur_tile_idx = tile_idx;
2538             ps_tile_prev = ps_tile - 1;
2539 
2540             tile_start_ctb_idx = ps_tile->u1_pos_x
2541                             + ps_tile->u1_pos_y * (ps_sps->i2_pic_wd_in_ctb);
2542 
2543             slice_start_ctb_idx =  ps_slice_hdr->i2_ctb_x
2544                             + ps_slice_hdr->i2_ctb_y * (ps_sps->i2_pic_wd_in_ctb);
2545 
2546             /*For slices that span across multiple tiles*/
2547             if(slice_start_ctb_idx < tile_start_ctb_idx)
2548             {       /* 2 Cases
2549              * 1 - slice spans across frame-width- but does not start from 1st column
2550              * 2 - Slice spans across multiple tiles anywhere is a frame
2551              */
2552                 ps_codec->s_parse.i4_ctb_slice_y = ps_tile->u1_pos_y - ps_slice_hdr->i2_ctb_y;
2553                 if(!(((ps_slice_hdr->i2_ctb_x + ps_tile_prev->u2_wd) % ps_sps->i2_pic_wd_in_ctb) == ps_tile->u1_pos_x)) //Case 2
2554                 {
2555                     if(ps_slice_hdr->i2_ctb_y <= ps_tile->u1_pos_y)
2556                     {
2557                         //Check if ctb x is before or after
2558                         if(ps_slice_hdr->i2_ctb_x > ps_tile->u1_pos_x)
2559                         {
2560                             ps_codec->s_parse.i4_ctb_slice_y -= 1;
2561                         }
2562                     }
2563                 }
2564                 /*ps_codec->s_parse.i4_ctb_slice_y = ps_tile->u1_pos_y - ps_slice_hdr->i2_ctb_y;
2565                 if (ps_slice_hdr->i2_ctb_y <= ps_tile->u1_pos_y)
2566                 {
2567                     //Check if ctb x is before or after
2568                     if (ps_slice_hdr->i2_ctb_x > ps_tile->u1_pos_x )
2569                     {
2570                         ps_codec->s_parse.i4_ctb_slice_y -= 1 ;
2571                     }
2572                 }*/
2573             }
2574 
2575             /* Cabac init is done unconditionally at the start of the tile irrespective
2576              * of whether it is a dependent or an independent slice */
2577             if(0 == ps_codec->i4_slice_error)
2578             {
2579                 ret = ihevcd_cabac_init(&ps_codec->s_parse.s_cabac,
2580                                         &ps_codec->s_parse.s_bitstrm,
2581                                         slice_qp,
2582                                         cabac_init_idc,
2583                                         &gau1_ihevc_cab_ctxts[cabac_init_idc][slice_qp][0]);
2584                 if(ret != (IHEVCD_ERROR_T)IHEVCD_SUCCESS)
2585                 {
2586                     ps_codec->i4_slice_error = 1;
2587                     end_of_slice_flag = 1;
2588                     ret = (IHEVCD_ERROR_T)IHEVCD_SUCCESS;
2589                 }
2590 
2591             }
2592         }
2593         /* If number of cores is greater than 1, then add job to the queue */
2594         //TODO: Dual core implementation might need a different algo for better load balancing
2595         /* At the start of ctb row parsing in a tile, queue a job for processing the current tile row */
2596 
2597         if(0 == ps_codec->s_parse.i4_ctb_tile_x)
2598         {
2599 
2600             if(1 < ps_codec->i4_num_cores)
2601             {
2602                 proc_job_t s_job;
2603                 IHEVCD_ERROR_T ret;
2604                 s_job.i4_cmd    = CMD_PROCESS;
2605                 s_job.i2_ctb_cnt = (WORD16)ps_tile->u2_wd;
2606                 s_job.i2_ctb_x = (WORD16)ps_codec->s_parse.i4_ctb_x;
2607                 s_job.i2_ctb_y = (WORD16)ps_codec->s_parse.i4_ctb_y;
2608                 s_job.i2_slice_idx = (WORD16)ps_codec->s_parse.i4_cur_slice_idx;
2609                 s_job.i4_tu_coeff_data_ofst = (UWORD8 *)ps_codec->s_parse.pv_tu_coeff_data -
2610                                 (UWORD8 *)ps_codec->s_parse.pv_pic_tu_coeff_data;
2611                 ret = ihevcd_jobq_queue((jobq_t *)ps_codec->s_parse.pv_proc_jobq, &s_job, sizeof(proc_job_t), 1);
2612 
2613                 if(ret != (IHEVCD_ERROR_T)IHEVCD_SUCCESS)
2614                     return ret;
2615             }
2616             else
2617             {
2618                 process_ctxt_t *ps_proc = &ps_codec->as_process[0];
2619                 WORD32 tu_coeff_data_ofst = (UWORD8 *)ps_codec->s_parse.pv_tu_coeff_data -
2620                                 (UWORD8 *)ps_codec->s_parse.pv_pic_tu_coeff_data;
2621 
2622                 /* If the codec is running in single core mode,
2623                  * initialize zeroth process context
2624                  * TODO: Dual core mode might need a different implementation instead of jobq
2625                  */
2626 
2627                 ps_proc->i4_ctb_cnt = ps_tile->u2_wd;
2628                 ps_proc->i4_ctb_x   = ps_codec->s_parse.i4_ctb_x;
2629                 ps_proc->i4_ctb_y   = ps_codec->s_parse.i4_ctb_y;
2630                 ps_proc->i4_cur_slice_idx = ps_codec->s_parse.i4_cur_slice_idx;
2631 
2632                 ihevcd_init_proc_ctxt(ps_proc, tu_coeff_data_ofst);
2633             }
2634         }
2635 
2636 
2637         /* Restore cabac context model from top right CTB if entropy sync is enabled */
2638         if(ps_pps->i1_entropy_coding_sync_enabled_flag)
2639         {
2640             /*TODO Handle single CTB and top-right belonging to a different slice */
2641             if(0 == ps_codec->s_parse.i4_ctb_x && 0 == ps_codec->i4_slice_error)
2642             {
2643                 //WORD32 size = sizeof(ps_codec->s_parse.s_cabac.au1_ctxt_models);
2644                 WORD32 default_ctxt = 0;
2645 
2646                 if((0 == ps_codec->s_parse.i4_ctb_slice_y) && (!ps_slice_hdr->i1_dependent_slice_flag))
2647                     default_ctxt = 1;
2648                 if(1 == ps_sps->i2_pic_wd_in_ctb)
2649                     default_ctxt = 1;
2650 
2651                 ps_codec->s_parse.u4_qp = slice_qp;
2652                 if(default_ctxt)
2653                 {
2654                     //memcpy(&ps_codec->s_parse.s_cabac.au1_ctxt_models, &gau1_ihevc_cab_ctxts[cabac_init_idc][slice_qp][0], size);
2655                     ret = ihevcd_cabac_init(&ps_codec->s_parse.s_cabac,
2656                                             &ps_codec->s_parse.s_bitstrm,
2657                                             slice_qp,
2658                                             cabac_init_idc,
2659                                             &gau1_ihevc_cab_ctxts[cabac_init_idc][slice_qp][0]);
2660 
2661                     if(ret != (IHEVCD_ERROR_T)IHEVCD_SUCCESS)
2662                     {
2663                         ps_codec->i4_slice_error = 1;
2664                         end_of_slice_flag = 1;
2665                         ret = (IHEVCD_ERROR_T)IHEVCD_SUCCESS;
2666                     }
2667                 }
2668                 else
2669                 {
2670                     //memcpy(&ps_codec->s_parse.s_cabac.au1_ctxt_models, &ps_codec->s_parse.s_cabac.au1_ctxt_models_sync, size);
2671                     ret = ihevcd_cabac_init(&ps_codec->s_parse.s_cabac,
2672                                             &ps_codec->s_parse.s_bitstrm,
2673                                             slice_qp,
2674                                             cabac_init_idc,
2675                                             (const UWORD8 *)&ps_codec->s_parse.s_cabac.au1_ctxt_models_sync);
2676 
2677                     if(ret != (IHEVCD_ERROR_T)IHEVCD_SUCCESS)
2678                     {
2679                         ps_codec->i4_slice_error = 1;
2680                         end_of_slice_flag = 1;
2681                         ret = (IHEVCD_ERROR_T)IHEVCD_SUCCESS;
2682                     }
2683                 }
2684             }
2685         }
2686 
2687 
2688 
2689         if(0 == ps_codec->i4_slice_error)
2690         {
2691             if(ps_slice_hdr->i1_slice_sao_luma_flag || ps_slice_hdr->i1_slice_sao_chroma_flag)
2692                 ihevcd_parse_sao(ps_codec);
2693         }
2694         else
2695         {
2696             sao_t *ps_sao = ps_codec->s_parse.ps_pic_sao +
2697                             ps_codec->s_parse.i4_ctb_x +
2698                             ps_codec->s_parse.i4_ctb_y * ps_sps->i2_pic_wd_in_ctb;
2699 
2700             /* Default values */
2701             ps_sao->b3_y_type_idx = 0;
2702             ps_sao->b3_cb_type_idx = 0;
2703             ps_sao->b3_cr_type_idx = 0;
2704         }
2705 
2706         //AEV_TRACE("CTB x", ps_codec->s_parse.i4_ctb_x, 0);
2707         //AEV_TRACE("CTB y", ps_codec->s_parse.i4_ctb_y, 0);
2708 
2709         {
2710             WORD32 ctb_indx;
2711             ctb_indx = ps_codec->s_parse.i4_ctb_x + ps_sps->i2_pic_wd_in_ctb * ps_codec->s_parse.i4_ctb_y;
2712             ps_codec->s_parse.s_bs_ctxt.pu1_pic_qp_const_in_ctb[ctb_indx >> 3] |= (1 << (ctb_indx & 7));
2713             {
2714                 UWORD16 *pu1_slice_idx = ps_codec->s_parse.pu1_slice_idx;
2715                 pu1_slice_idx[ctb_indx] = ps_codec->s_parse.i4_cur_independent_slice_idx;
2716             }
2717         }
2718 
2719         if(0 == ps_codec->i4_slice_error)
2720         {
2721             tu_t *ps_tu = ps_codec->s_parse.ps_tu;
2722             WORD32 i4_tu_cnt = ps_codec->s_parse.s_cu.i4_tu_cnt;
2723             WORD32 i4_pic_tu_idx = ps_codec->s_parse.i4_pic_tu_idx;
2724 
2725             pu_t *ps_pu = ps_codec->s_parse.ps_pu;
2726             WORD32 i4_pic_pu_idx = ps_codec->s_parse.i4_pic_pu_idx;
2727 
2728             UWORD8 *pu1_tu_coeff_data = (UWORD8 *)ps_codec->s_parse.pv_tu_coeff_data;
2729 
2730             ret = ihevcd_parse_coding_quadtree(ps_codec,
2731                                                (ps_codec->s_parse.i4_ctb_x << ps_sps->i1_log2_ctb_size),
2732                                                (ps_codec->s_parse.i4_ctb_y << ps_sps->i1_log2_ctb_size),
2733                                                ps_sps->i1_log2_ctb_size,
2734                                                0);
2735             /* Check for error */
2736             if (ret != (IHEVCD_ERROR_T)IHEVCD_SUCCESS)
2737             {
2738                 /* Reset tu and pu parameters, and signal current ctb as skip */
2739                 WORD32 tu_coeff_data_reset_size;
2740 
2741                 ps_codec->s_parse.ps_tu = ps_tu;
2742                 ps_codec->s_parse.s_cu.i4_tu_cnt = i4_tu_cnt;
2743                 ps_codec->s_parse.i4_pic_tu_idx = i4_pic_tu_idx;
2744 
2745                 ps_codec->s_parse.ps_pu = ps_pu;
2746                 ps_codec->s_parse.i4_pic_pu_idx = i4_pic_pu_idx;
2747 
2748                 tu_coeff_data_reset_size = (UWORD8 *)ps_codec->s_parse.pv_tu_coeff_data - pu1_tu_coeff_data;
2749                 memset(pu1_tu_coeff_data, 0, tu_coeff_data_reset_size);
2750                 ps_codec->s_parse.pv_tu_coeff_data = (void *)pu1_tu_coeff_data;
2751 
2752                 ihevcd_set_ctb_skip(ps_codec);
2753 
2754                 /* Set slice error to suppress further parsing and
2755                  * signal end of slice.
2756                  */
2757                 ps_codec->i4_slice_error = 1;
2758                 end_of_slice_flag = 1;
2759                 ret = (IHEVCD_ERROR_T)IHEVCD_SUCCESS;
2760             }
2761         }
2762         else
2763         {
2764             ihevcd_set_ctb_skip(ps_codec);
2765         }
2766 
2767         if(0 == ps_codec->i4_slice_error)
2768             end_of_slice_flag = ihevcd_cabac_decode_terminate(&ps_codec->s_parse.s_cabac, &ps_codec->s_parse.s_bitstrm);
2769 
2770         AEV_TRACE("end_of_slice_flag", end_of_slice_flag, ps_codec->s_parse.s_cabac.u4_range);
2771 
2772 
2773         /* In case of tiles or entropy sync, terminate cabac and copy cabac context backed up at the end of top-right CTB */
2774         if(ps_pps->i1_tiles_enabled_flag || ps_pps->i1_entropy_coding_sync_enabled_flag)
2775         {
2776             WORD32 end_of_tile = 0;
2777             WORD32 end_of_tile_row = 0;
2778 
2779             /* Take a back up of cabac context models if entropy sync is enabled */
2780             if(ps_pps->i1_entropy_coding_sync_enabled_flag || ps_pps->i1_tiles_enabled_flag)
2781             {
2782                 if(1 == ps_codec->s_parse.i4_ctb_x)
2783                 {
2784                     WORD32 size = sizeof(ps_codec->s_parse.s_cabac.au1_ctxt_models);
2785                     memcpy(&ps_codec->s_parse.s_cabac.au1_ctxt_models_sync, &ps_codec->s_parse.s_cabac.au1_ctxt_models, size);
2786                 }
2787             }
2788 
2789             /* Since tiles and entropy sync are not enabled simultaneously, the following will not result in any problems */
2790             if((ps_codec->s_parse.i4_ctb_tile_x + 1) == (ps_tile->u2_wd))
2791             {
2792                 end_of_tile_row = 1;
2793                 if((ps_codec->s_parse.i4_ctb_tile_y + 1) == ps_tile->u2_ht)
2794                     end_of_tile = 1;
2795             }
2796             if((0 == end_of_slice_flag) && (0 == ps_codec->i4_slice_error) &&
2797                             ((ps_pps->i1_tiles_enabled_flag && end_of_tile) ||
2798                                             (ps_pps->i1_entropy_coding_sync_enabled_flag && end_of_tile_row)))
2799             {
2800                 WORD32 end_of_sub_stream_one_bit;
2801                 end_of_sub_stream_one_bit = ihevcd_cabac_decode_terminate(&ps_codec->s_parse.s_cabac, &ps_codec->s_parse.s_bitstrm);
2802                 AEV_TRACE("end_of_sub_stream_one_bit", end_of_sub_stream_one_bit, ps_codec->s_parse.s_cabac.u4_range);
2803 
2804                 /* TODO: Remove the check for offset when HM is updated to include a byte unconditionally even for aligned location */
2805                 /* For Ittiam streams this check should not be there, for HM9.1 streams this should be there */
2806                 if(ps_codec->s_parse.s_bitstrm.u4_bit_ofst % 8)
2807                     ihevcd_bits_flush_to_byte_boundary(&ps_codec->s_parse.s_bitstrm);
2808 
2809                 UNUSED(end_of_sub_stream_one_bit);
2810             }
2811         }
2812         {
2813             WORD32 ctb_indx;
2814 
2815             ctb_addr = ps_codec->s_parse.i4_ctb_y * num_ctb_in_row + ps_codec->s_parse.i4_ctb_x;
2816 
2817             ctb_indx = ++ctb_addr;
2818 
2819             /* Store pu_idx for next CTB in frame level pu_idx array */
2820 
2821             //In case of multiple tiles, if end-of-tile row is reached
2822             if((ps_tile->u2_wd == (ps_codec->s_parse.i4_ctb_tile_x + 1)) && (ps_tile->u2_wd != ps_sps->i2_pic_wd_in_ctb))
2823             {
2824                 ctb_indx = (ps_sps->i2_pic_wd_in_ctb * (ps_codec->s_parse.i4_ctb_tile_y + 1 + ps_tile->u1_pos_y)) + ps_tile->u1_pos_x; //idx is the beginning of next row in current tile.
2825                 if(ps_tile->u2_ht == (ps_codec->s_parse.i4_ctb_tile_y + 1))
2826                 {
2827                     //If the current ctb is the last tile's last ctb
2828                     if((ps_tile->u2_wd + ps_tile->u1_pos_x == ps_sps->i2_pic_wd_in_ctb) && ((ps_tile->u2_ht + ps_tile->u1_pos_y == ps_sps->i2_pic_ht_in_ctb)))
2829                     {
2830                         ctb_indx = ctb_addr; //Next continuous ctb address
2831                     }
2832                     else //Not last tile's end , but a tile end
2833                     {
2834                         tile_t *ps_next_tile = ps_codec->s_parse.ps_tile + 1;
2835                         ctb_indx = ps_next_tile->u1_pos_x + (ps_next_tile->u1_pos_y * ps_sps->i2_pic_wd_in_ctb); //idx is the beginning of first row in next tile.
2836                     }
2837                 }
2838             }
2839 
2840             ps_codec->s_parse.pu4_pic_pu_idx[ctb_indx] = ps_codec->s_parse.i4_pic_pu_idx;
2841             ps_codec->s_parse.i4_next_pu_ctb_cnt = ctb_indx;
2842 
2843             ps_codec->s_parse.pu1_pu_map += num_min4x4_in_ctb;
2844 
2845             /* Store tu_idx for next CTB in frame level tu_idx array */
2846             if(1 == ps_codec->i4_num_cores)
2847             {
2848                 ctb_indx = (0 == ctb_addr % RESET_TU_BUF_NCTB) ?
2849                                 RESET_TU_BUF_NCTB : ctb_addr % RESET_TU_BUF_NCTB;
2850 
2851                 //In case of multiple tiles, if end-of-tile row is reached
2852                 if((ps_tile->u2_wd == (ps_codec->s_parse.i4_ctb_tile_x + 1)) && (ps_tile->u2_wd != ps_sps->i2_pic_wd_in_ctb))
2853                 {
2854                     ctb_indx = (ps_sps->i2_pic_wd_in_ctb * (ps_codec->s_parse.i4_ctb_tile_y + 1 + ps_tile->u1_pos_y)) + ps_tile->u1_pos_x; //idx is the beginning of next row in current tile.
2855                     if(ps_tile->u2_ht == (ps_codec->s_parse.i4_ctb_tile_y + 1))
2856                     {
2857                         //If the current ctb is the last tile's last ctb
2858                         if((ps_tile->u2_wd + ps_tile->u1_pos_x == ps_sps->i2_pic_wd_in_ctb) && ((ps_tile->u2_ht + ps_tile->u1_pos_y == ps_sps->i2_pic_ht_in_ctb)))
2859                         {
2860                             ctb_indx = (0 == ctb_addr % RESET_TU_BUF_NCTB) ?
2861                                             RESET_TU_BUF_NCTB : ctb_addr % RESET_TU_BUF_NCTB;
2862                         }
2863                         else  //Not last tile's end , but a tile end
2864                         {
2865                             tile_t *ps_next_tile = ps_codec->s_parse.ps_tile + 1;
2866                             ctb_indx =  ps_next_tile->u1_pos_x + (ps_next_tile->u1_pos_y * ps_sps->i2_pic_wd_in_ctb); //idx is the beginning of first row in next tile.
2867                         }
2868                     }
2869                 }
2870                 ps_codec->s_parse.i4_next_tu_ctb_cnt = ctb_indx;
2871                 ps_codec->s_parse.pu4_pic_tu_idx[ctb_indx] = ps_codec->s_parse.i4_pic_tu_idx;
2872             }
2873             else
2874             {
2875                 ctb_indx = ctb_addr;
2876                 if((ps_tile->u2_wd == (ps_codec->s_parse.i4_ctb_tile_x + 1)) && (ps_tile->u2_wd != ps_sps->i2_pic_wd_in_ctb))
2877                 {
2878                     ctb_indx = (ps_sps->i2_pic_wd_in_ctb * (ps_codec->s_parse.i4_ctb_tile_y + 1 + ps_tile->u1_pos_y)) + ps_tile->u1_pos_x; //idx is the beginning of next row in current tile.
2879                     if(ps_tile->u2_ht == (ps_codec->s_parse.i4_ctb_tile_y + 1))
2880                     {
2881                         //If the current ctb is the last tile's last ctb
2882                         if((ps_tile->u2_wd + ps_tile->u1_pos_x == ps_sps->i2_pic_wd_in_ctb) && ((ps_tile->u2_ht + ps_tile->u1_pos_y == ps_sps->i2_pic_ht_in_ctb)))
2883                         {
2884                             ctb_indx = ctb_addr;
2885                         }
2886                         else  //Not last tile's end , but a tile end
2887                         {
2888                             tile_t *ps_next_tile = ps_codec->s_parse.ps_tile + 1;
2889                             ctb_indx =  ps_next_tile->u1_pos_x + (ps_next_tile->u1_pos_y * ps_sps->i2_pic_wd_in_ctb); //idx is the beginning of first row in next tile.
2890                         }
2891                     }
2892                 }
2893                 ps_codec->s_parse.i4_next_tu_ctb_cnt = ctb_indx;
2894                 ps_codec->s_parse.pu4_pic_tu_idx[ctb_indx] = ps_codec->s_parse.i4_pic_tu_idx;
2895             }
2896             ps_codec->s_parse.pu1_tu_map += num_min4x4_in_ctb;
2897         }
2898 
2899         /* QP array population has to be done if deblocking is enabled in the picture
2900          * but some of the slices in the pic have it disabled */
2901         if((0 != ps_codec->i4_disable_deblk_pic) &&
2902                 (1 == ps_slice_hdr->i1_slice_disable_deblocking_filter_flag))
2903         {
2904             bs_ctxt_t *ps_bs_ctxt = &ps_codec->s_parse.s_bs_ctxt;
2905             WORD32 log2_ctb_size = ps_sps->i1_log2_ctb_size;
2906             UWORD8 *pu1_qp;
2907             WORD32 qp_strd;
2908             WORD32 u4_qp_const_in_ctb;
2909             WORD32 cur_ctb_idx;
2910             WORD32 next_ctb_idx;
2911             WORD32 cur_tu_idx;
2912             WORD32 i4_ctb_tu_cnt;
2913             tu_t *ps_tu;
2914 
2915             cur_ctb_idx = ps_codec->s_parse.i4_ctb_x + ps_sps->i2_pic_wd_in_ctb * ps_codec->s_parse.i4_ctb_y;
2916             /* ctb_size/8 elements per CTB */
2917             qp_strd = ps_sps->i2_pic_wd_in_ctb << (log2_ctb_size - 3);
2918             pu1_qp = ps_bs_ctxt->pu1_pic_qp + ((ps_codec->s_parse.i4_ctb_x + ps_codec->s_parse.i4_ctb_y * qp_strd) << (log2_ctb_size - 3));
2919 
2920             u4_qp_const_in_ctb = ps_bs_ctxt->pu1_pic_qp_const_in_ctb[cur_ctb_idx >> 3] & (1 << (cur_ctb_idx & 7));
2921 
2922             next_ctb_idx = ps_codec->s_parse.i4_next_tu_ctb_cnt;
2923             if(1 == ps_codec->i4_num_cores)
2924             {
2925                 i4_ctb_tu_cnt = ps_codec->s_parse.pu4_pic_tu_idx[next_ctb_idx] -
2926                                 ps_codec->s_parse.pu4_pic_tu_idx[cur_ctb_idx % RESET_TU_BUF_NCTB];
2927 
2928                 cur_tu_idx = ps_codec->s_parse.pu4_pic_tu_idx[cur_ctb_idx % RESET_TU_BUF_NCTB];
2929             }
2930             else
2931             {
2932                 i4_ctb_tu_cnt = ps_codec->s_parse.pu4_pic_tu_idx[next_ctb_idx] -
2933                                 ps_codec->s_parse.pu4_pic_tu_idx[cur_ctb_idx];
2934 
2935                 cur_tu_idx = ps_codec->s_parse.pu4_pic_tu_idx[cur_ctb_idx];
2936             }
2937 
2938             ps_tu = &ps_codec->s_parse.ps_pic_tu[cur_tu_idx];
2939 
2940             if(u4_qp_const_in_ctb)
2941             {
2942                 pu1_qp[0] = ps_tu->b7_qp;
2943             }
2944             else
2945             {
2946                 for(i = 0; i < i4_ctb_tu_cnt; i++, ps_tu++)
2947                 {
2948                     WORD32 start_pos_x;
2949                     WORD32 start_pos_y;
2950                     WORD32 tu_size;
2951 
2952                     /* start_pos_x and start_pos_y are in units of min TU size (4x4) */
2953                     start_pos_x = ps_tu->b4_pos_x;
2954                     start_pos_y = ps_tu->b4_pos_y;
2955 
2956                     tu_size = 1 << (ps_tu->b3_size + 2);
2957                     tu_size >>= 2; /* TU size divided by 4 */
2958 
2959                     if(0 == (start_pos_x & 1) && 0 == (start_pos_y & 1))
2960                     {
2961                         WORD32 row, col;
2962                         for(row = start_pos_y; row < start_pos_y + tu_size; row += 2)
2963                         {
2964                             for(col = start_pos_x; col < start_pos_x + tu_size; col += 2)
2965                             {
2966                                 pu1_qp[(row >> 1) * qp_strd + (col >> 1)] = ps_tu->b7_qp;
2967                             }
2968                         }
2969                     }
2970                 }
2971             }
2972         }
2973 
2974         if(ps_codec->i4_num_cores <= MV_PRED_NUM_CORES_THRESHOLD)
2975         {
2976             /*************************************************/
2977             /****************   MV pred **********************/
2978             /*************************************************/
2979             WORD8 u1_top_ctb_avail = 1;
2980             WORD8 u1_left_ctb_avail = 1;
2981             WORD8 u1_top_lt_ctb_avail = 1;
2982             WORD8 u1_top_rt_ctb_avail = 1;
2983             WORD16 i2_wd_in_ctb;
2984 
2985             tile_start_ctb_idx = ps_tile->u1_pos_x
2986                             + ps_tile->u1_pos_y * (ps_sps->i2_pic_wd_in_ctb);
2987 
2988             slice_start_ctb_idx =  ps_slice_hdr->i2_ctb_x
2989                             + ps_slice_hdr->i2_ctb_y * (ps_sps->i2_pic_wd_in_ctb);
2990 
2991             if((slice_start_ctb_idx < tile_start_ctb_idx))
2992             {
2993                 //Slices span across multiple tiles.
2994                 i2_wd_in_ctb = ps_sps->i2_pic_wd_in_ctb;
2995             }
2996             else
2997             {
2998                 i2_wd_in_ctb = ps_tile->u2_wd;
2999             }
3000             /* slice and tile boundaries */
3001             if((0 == ps_codec->s_parse.i4_ctb_y) || (0 == ps_codec->s_parse.i4_ctb_tile_y))
3002             {
3003                 u1_top_ctb_avail = 0;
3004                 u1_top_lt_ctb_avail = 0;
3005                 u1_top_rt_ctb_avail = 0;
3006             }
3007 
3008             if((0 == ps_codec->s_parse.i4_ctb_x) || (0 == ps_codec->s_parse.i4_ctb_tile_x))
3009             {
3010                 u1_left_ctb_avail = 0;
3011                 u1_top_lt_ctb_avail = 0;
3012                 if((0 == ps_codec->s_parse.i4_ctb_slice_y) || (0 == ps_codec->s_parse.i4_ctb_tile_y))
3013                 {
3014                     u1_top_ctb_avail = 0;
3015                     if((i2_wd_in_ctb - 1) != ps_codec->s_parse.i4_ctb_slice_x) //TODO: For tile, not implemented
3016                     {
3017                         u1_top_rt_ctb_avail = 0;
3018                     }
3019                 }
3020             }
3021             /*For slices not beginning at start of a ctb row*/
3022             else if(ps_codec->s_parse.i4_ctb_x > 0)
3023             {
3024                 if((0 == ps_codec->s_parse.i4_ctb_slice_y) || (0 == ps_codec->s_parse.i4_ctb_tile_y))
3025                 {
3026                     u1_top_ctb_avail = 0;
3027                     u1_top_lt_ctb_avail = 0;
3028                     if(0 == ps_codec->s_parse.i4_ctb_slice_x)
3029                     {
3030                         u1_left_ctb_avail = 0;
3031                     }
3032                     if((i2_wd_in_ctb - 1) != ps_codec->s_parse.i4_ctb_slice_x)
3033                     {
3034                         u1_top_rt_ctb_avail = 0;
3035                     }
3036                 }
3037                 else if((1 == ps_codec->s_parse.i4_ctb_slice_y) && (0 == ps_codec->s_parse.i4_ctb_slice_x))
3038                 {
3039                     u1_top_lt_ctb_avail = 0;
3040                 }
3041             }
3042 
3043             if(((ps_sps->i2_pic_wd_in_ctb - 1) == ps_codec->s_parse.i4_ctb_x) || ((ps_tile->u2_wd - 1) == ps_codec->s_parse.i4_ctb_tile_x))
3044             {
3045                 u1_top_rt_ctb_avail = 0;
3046             }
3047 
3048             if(PSLICE == ps_slice_hdr->i1_slice_type
3049                             || BSLICE == ps_slice_hdr->i1_slice_type)
3050             {
3051                 mv_ctxt_t s_mv_ctxt;
3052                 process_ctxt_t *ps_proc;
3053                 UWORD32 *pu4_ctb_top_pu_idx;
3054                 UWORD32 *pu4_ctb_left_pu_idx;
3055                 UWORD32 *pu4_ctb_top_left_pu_idx;
3056                 WORD32 i4_ctb_pu_cnt;
3057                 WORD32 cur_ctb_idx;
3058                 WORD32 next_ctb_idx;
3059                 WORD32 cur_pu_idx;
3060                 ps_proc = &ps_codec->as_process[(ps_codec->i4_num_cores == 1) ? 1 : (ps_codec->i4_num_cores - 1)];
3061                 cur_ctb_idx = ps_codec->s_parse.i4_ctb_x
3062                                 + ps_codec->s_parse.i4_ctb_y * (ps_sps->i2_pic_wd_in_ctb);
3063                 next_ctb_idx = ps_codec->s_parse.i4_next_pu_ctb_cnt;
3064                 i4_ctb_pu_cnt = ps_codec->s_parse.pu4_pic_pu_idx[next_ctb_idx]
3065                                 - ps_codec->s_parse.pu4_pic_pu_idx[cur_ctb_idx];
3066 
3067                 cur_pu_idx = ps_codec->s_parse.pu4_pic_pu_idx[cur_ctb_idx];
3068 
3069                 pu4_ctb_top_pu_idx = ps_proc->pu4_pic_pu_idx_top
3070                                 + (ps_codec->s_parse.i4_ctb_x * ctb_size / MIN_PU_SIZE);
3071                 pu4_ctb_left_pu_idx = ps_proc->pu4_pic_pu_idx_left;
3072                 pu4_ctb_top_left_pu_idx = &ps_proc->u4_ctb_top_left_pu_idx;
3073 
3074                 /* Initializing s_mv_ctxt */
3075                 {
3076                     s_mv_ctxt.ps_pps = ps_pps;
3077                     s_mv_ctxt.ps_sps = ps_sps;
3078                     s_mv_ctxt.ps_slice_hdr = ps_slice_hdr;
3079                     s_mv_ctxt.i4_ctb_x = ps_codec->s_parse.i4_ctb_x;
3080                     s_mv_ctxt.i4_ctb_y = ps_codec->s_parse.i4_ctb_y;
3081                     s_mv_ctxt.ps_pu = &ps_codec->s_parse.ps_pic_pu[cur_pu_idx];
3082                     s_mv_ctxt.ps_pic_pu = ps_codec->s_parse.ps_pic_pu;
3083                     s_mv_ctxt.ps_tile = ps_tile;
3084                     s_mv_ctxt.pu4_pic_pu_idx_map = ps_proc->pu4_pic_pu_idx_map;
3085                     s_mv_ctxt.pu4_pic_pu_idx = ps_codec->s_parse.pu4_pic_pu_idx;
3086                     s_mv_ctxt.pu1_pic_pu_map = ps_codec->s_parse.pu1_pic_pu_map;
3087                     s_mv_ctxt.i4_ctb_pu_cnt = i4_ctb_pu_cnt;
3088                     s_mv_ctxt.i4_ctb_start_pu_idx = cur_pu_idx;
3089                     s_mv_ctxt.u1_top_ctb_avail = u1_top_ctb_avail;
3090                     s_mv_ctxt.u1_top_rt_ctb_avail = u1_top_rt_ctb_avail;
3091                     s_mv_ctxt.u1_top_lt_ctb_avail = u1_top_lt_ctb_avail;
3092                     s_mv_ctxt.u1_left_ctb_avail = u1_left_ctb_avail;
3093                 }
3094 
3095                 ihevcd_get_mv_ctb(&s_mv_ctxt, pu4_ctb_top_pu_idx,
3096                                   pu4_ctb_left_pu_idx, pu4_ctb_top_left_pu_idx);
3097 
3098             }
3099             else
3100             {
3101                 WORD32 num_minpu_in_ctb = (ctb_size / MIN_PU_SIZE) * (ctb_size / MIN_PU_SIZE);
3102                 UWORD8 *pu1_pic_pu_map_ctb = ps_codec->s_parse.pu1_pic_pu_map +
3103                                 (ps_codec->s_parse.i4_ctb_x + ps_codec->s_parse.i4_ctb_y * ps_sps->i2_pic_wd_in_ctb) * num_minpu_in_ctb;
3104                 process_ctxt_t *ps_proc = &ps_codec->as_process[(ps_codec->i4_num_cores == 1) ? 1 : (ps_codec->i4_num_cores - 1)];
3105                 WORD32 row, col;
3106                 WORD32 pu_cnt;
3107                 WORD32 num_pu_per_ctb;
3108                 WORD32 cur_ctb_idx;
3109                 WORD32 next_ctb_idx;
3110                 WORD32 ctb_start_pu_idx;
3111                 UWORD32 *pu4_nbr_pu_idx = ps_proc->pu4_pic_pu_idx_map;
3112                 WORD32 nbr_pu_idx_strd = MAX_CTB_SIZE / MIN_PU_SIZE + 2;
3113                 pu_t *ps_pu;
3114                 WORD32 ctb_size_in_min_pu = (ctb_size / MIN_PU_SIZE);
3115 
3116                 /* Neighbor PU idx update inside CTB */
3117                 /* 1byte per 4x4. Indicates the PU idx that 4x4 block belongs to */
3118 
3119                 cur_ctb_idx = ps_codec->s_parse.i4_ctb_x
3120                                 + ps_codec->s_parse.i4_ctb_y * (ps_sps->i2_pic_wd_in_ctb);
3121                 next_ctb_idx = ps_codec->s_parse.i4_next_pu_ctb_cnt;
3122                 num_pu_per_ctb = ps_codec->s_parse.pu4_pic_pu_idx[next_ctb_idx]
3123                                 - ps_codec->s_parse.pu4_pic_pu_idx[cur_ctb_idx];
3124                 ctb_start_pu_idx = ps_codec->s_parse.pu4_pic_pu_idx[cur_ctb_idx];
3125                 ps_pu = &ps_codec->s_parse.ps_pic_pu[ctb_start_pu_idx];
3126 
3127                 for(pu_cnt = 0; pu_cnt < num_pu_per_ctb; pu_cnt++, ps_pu++)
3128                 {
3129                     UWORD32 cur_pu_idx;
3130                     WORD32 pu_ht = (ps_pu->b4_ht + 1) << 2;
3131                     WORD32 pu_wd = (ps_pu->b4_wd + 1) << 2;
3132 
3133                     cur_pu_idx = ctb_start_pu_idx + pu_cnt;
3134 
3135                     for(row = 0; row < pu_ht / MIN_PU_SIZE; row++)
3136                         for(col = 0; col < pu_wd / MIN_PU_SIZE; col++)
3137                             pu4_nbr_pu_idx[(1 + ps_pu->b4_pos_x + col)
3138                                             + (1 + ps_pu->b4_pos_y + row)
3139                                             * nbr_pu_idx_strd] =
3140                                             cur_pu_idx;
3141                 }
3142 
3143                 /* Updating Top and Left pointers */
3144                 {
3145                     WORD32 rows_remaining = ps_sps->i2_pic_height_in_luma_samples
3146                                     - (ps_codec->s_parse.i4_ctb_y << ps_sps->i1_log2_ctb_size);
3147                     WORD32 ctb_size_left = MIN(ctb_size, rows_remaining);
3148 
3149                     /* Top Left */
3150                     /* saving top left before updating top ptr, as updating top ptr will overwrite the top left for the next ctb */
3151                     ps_proc->u4_ctb_top_left_pu_idx = ps_proc->pu4_pic_pu_idx_top[(ps_codec->s_parse.i4_ctb_x * ctb_size / MIN_PU_SIZE) + ctb_size / MIN_PU_SIZE - 1];
3152                     for(i = 0; i < ctb_size / MIN_PU_SIZE; i++)
3153                     {
3154                         /* Left */
3155                         /* Last column of au4_nbr_pu_idx */
3156                         ps_proc->pu4_pic_pu_idx_left[i] = pu4_nbr_pu_idx[(ctb_size / MIN_PU_SIZE)
3157                                         + (i + 1) * nbr_pu_idx_strd];
3158                         /* Top */
3159                         /* Last row of au4_nbr_pu_idx */
3160                         ps_proc->pu4_pic_pu_idx_top[(ps_codec->s_parse.i4_ctb_x * ctb_size / MIN_PU_SIZE) + i] =
3161                                         pu4_nbr_pu_idx[(ctb_size_left / MIN_PU_SIZE) * nbr_pu_idx_strd + i + 1];
3162 
3163                     }
3164                 }
3165 
3166                 /* Updating the CTB level PU idx (Used for collocated MV pred)*/
3167                 {
3168                     WORD32 ctb_row, ctb_col, index_pic_map, index_nbr_map;
3169                     WORD32 first_pu_of_ctb;
3170                     first_pu_of_ctb = pu4_nbr_pu_idx[1 + nbr_pu_idx_strd];
3171                     UWORD32 cur_ctb_ht_in_min_pu = MIN(((ps_sps->i2_pic_height_in_luma_samples
3172                             - (ps_codec->s_parse.i4_ctb_y << ps_sps->i1_log2_ctb_size)) / MIN_PU_SIZE), ctb_size_in_min_pu);
3173                     UWORD32 cur_ctb_wd_in_min_pu = MIN(((ps_sps->i2_pic_width_in_luma_samples
3174                                 - (ps_codec->s_parse.i4_ctb_x << ps_sps->i1_log2_ctb_size)) / MIN_PU_SIZE), ctb_size_in_min_pu);
3175 
3176                     index_pic_map = 0 * ctb_size_in_min_pu + 0;
3177                     index_nbr_map = (0 + 1) * nbr_pu_idx_strd + (0 + 1);
3178 
3179                     for(ctb_row = 0; ctb_row < cur_ctb_ht_in_min_pu; ctb_row++)
3180                     {
3181                         for(ctb_col = 0; ctb_col < cur_ctb_wd_in_min_pu; ctb_col++)
3182                         {
3183                             pu1_pic_pu_map_ctb[index_pic_map + ctb_col] = pu4_nbr_pu_idx[index_nbr_map + ctb_col]
3184                                             - first_pu_of_ctb;
3185                         }
3186                         index_pic_map += ctb_size_in_min_pu;
3187                         index_nbr_map += nbr_pu_idx_strd;
3188                     }
3189                 }
3190             }
3191 
3192             /*************************************************/
3193             /******************  BS, QP  *********************/
3194             /*************************************************/
3195             /* Check if deblock is disabled for the current slice or if it is disabled for the current picture
3196              * because of disable deblock api
3197              */
3198             if(0 == ps_codec->i4_disable_deblk_pic)
3199             {
3200                 /* Boundary strength calculation is done irrespective of whether deblocking is disabled
3201                  * in the slice or not, to handle deblocking slice boundaries */
3202                 if((0 == ps_codec->i4_slice_error))
3203                 {
3204                     WORD32 i4_ctb_tu_cnt;
3205                     WORD32 cur_ctb_idx, next_ctb_idx;
3206                     WORD32 cur_pu_idx;
3207                     WORD32 cur_tu_idx;
3208                     process_ctxt_t *ps_proc;
3209 
3210                     ps_proc = &ps_codec->as_process[(ps_codec->i4_num_cores == 1) ? 1 : (ps_codec->i4_num_cores - 1)];
3211                     cur_ctb_idx = ps_codec->s_parse.i4_ctb_x
3212                                     + ps_codec->s_parse.i4_ctb_y * (ps_sps->i2_pic_wd_in_ctb);
3213 
3214                     cur_pu_idx = ps_codec->s_parse.pu4_pic_pu_idx[cur_ctb_idx];
3215                     next_ctb_idx = ps_codec->s_parse.i4_next_tu_ctb_cnt;
3216                     if(1 == ps_codec->i4_num_cores)
3217                     {
3218                         i4_ctb_tu_cnt = ps_codec->s_parse.pu4_pic_tu_idx[next_ctb_idx] -
3219                                         ps_codec->s_parse.pu4_pic_tu_idx[cur_ctb_idx % RESET_TU_BUF_NCTB];
3220 
3221                         cur_tu_idx = ps_codec->s_parse.pu4_pic_tu_idx[cur_ctb_idx % RESET_TU_BUF_NCTB];
3222                     }
3223                     else
3224                     {
3225                         i4_ctb_tu_cnt = ps_codec->s_parse.pu4_pic_tu_idx[next_ctb_idx] -
3226                                         ps_codec->s_parse.pu4_pic_tu_idx[cur_ctb_idx];
3227 
3228                         cur_tu_idx = ps_codec->s_parse.pu4_pic_tu_idx[cur_ctb_idx];
3229                     }
3230 
3231                     ps_codec->s_parse.s_bs_ctxt.ps_pps = ps_codec->s_parse.ps_pps;
3232                     ps_codec->s_parse.s_bs_ctxt.ps_sps = ps_codec->s_parse.ps_sps;
3233                     ps_codec->s_parse.s_bs_ctxt.ps_codec = ps_codec;
3234                     ps_codec->s_parse.s_bs_ctxt.i4_ctb_tu_cnt = i4_ctb_tu_cnt;
3235                     ps_codec->s_parse.s_bs_ctxt.i4_ctb_x = ps_codec->s_parse.i4_ctb_x;
3236                     ps_codec->s_parse.s_bs_ctxt.i4_ctb_y = ps_codec->s_parse.i4_ctb_y;
3237                     ps_codec->s_parse.s_bs_ctxt.i4_ctb_tile_x = ps_codec->s_parse.i4_ctb_tile_x;
3238                     ps_codec->s_parse.s_bs_ctxt.i4_ctb_tile_y = ps_codec->s_parse.i4_ctb_tile_y;
3239                     ps_codec->s_parse.s_bs_ctxt.i4_ctb_slice_x = ps_codec->s_parse.i4_ctb_slice_x;
3240                     ps_codec->s_parse.s_bs_ctxt.i4_ctb_slice_y = ps_codec->s_parse.i4_ctb_slice_y;
3241                     ps_codec->s_parse.s_bs_ctxt.ps_tu = &ps_codec->s_parse.ps_pic_tu[cur_tu_idx];
3242                     ps_codec->s_parse.s_bs_ctxt.ps_pu = &ps_codec->s_parse.ps_pic_pu[cur_pu_idx];
3243                     ps_codec->s_parse.s_bs_ctxt.pu4_pic_pu_idx_map = ps_proc->pu4_pic_pu_idx_map;
3244                     ps_codec->s_parse.s_bs_ctxt.i4_next_pu_ctb_cnt = ps_codec->s_parse.i4_next_pu_ctb_cnt;
3245                     ps_codec->s_parse.s_bs_ctxt.i4_next_tu_ctb_cnt = ps_codec->s_parse.i4_next_tu_ctb_cnt;
3246                     ps_codec->s_parse.s_bs_ctxt.pu1_slice_idx = ps_codec->s_parse.pu1_slice_idx;
3247                     ps_codec->s_parse.s_bs_ctxt.ps_slice_hdr = ps_codec->s_parse.ps_slice_hdr;
3248                     ps_codec->s_parse.s_bs_ctxt.ps_tile = ps_codec->s_parse.ps_tile;
3249 
3250                     if(ISLICE == ps_slice_hdr->i1_slice_type)
3251                     {
3252                         ihevcd_ctb_boundary_strength_islice(&ps_codec->s_parse.s_bs_ctxt);
3253                     }
3254                     else
3255                     {
3256                         ihevcd_ctb_boundary_strength_pbslice(&ps_codec->s_parse.s_bs_ctxt);
3257                     }
3258                 }
3259 
3260                 /* Boundary strength is set to zero if deblocking is disabled for the current slice */
3261                 if(0 != ps_slice_hdr->i1_slice_disable_deblocking_filter_flag)
3262                 {
3263                     WORD32 bs_strd = (ps_sps->i2_pic_wd_in_ctb + 1) * (ctb_size * ctb_size / 8 / 16);
3264 
3265                     UWORD32 *pu4_vert_bs = (UWORD32 *)((UWORD8 *)ps_codec->s_parse.s_bs_ctxt.pu4_pic_vert_bs +
3266                                     ps_codec->s_parse.i4_ctb_x * (ctb_size * ctb_size / 8 / 16) +
3267                                     ps_codec->s_parse.i4_ctb_y * bs_strd);
3268                     UWORD32 *pu4_horz_bs = (UWORD32 *)((UWORD8 *)ps_codec->s_parse.s_bs_ctxt.pu4_pic_horz_bs +
3269                                     ps_codec->s_parse.i4_ctb_x * (ctb_size * ctb_size / 8 / 16) +
3270                                     ps_codec->s_parse.i4_ctb_y * bs_strd);
3271 
3272                     memset(pu4_vert_bs, 0, (ctb_size / 8) * (ctb_size / 4) / 8 * 2);
3273                     memset(pu4_horz_bs, 0, (ctb_size / 8) * (ctb_size / 4) / 8 * 2);
3274                 }
3275             }
3276 
3277         }
3278 
3279         DATA_SYNC();
3280 
3281         /* Update the parse status map */
3282         {
3283             sps_t *ps_sps = ps_codec->s_parse.ps_sps;
3284             UWORD8 *pu1_buf;
3285             WORD32 idx;
3286             idx = (ps_codec->s_parse.i4_ctb_x);
3287             idx += ((ps_codec->s_parse.i4_ctb_y) * ps_sps->i2_pic_wd_in_ctb);
3288             pu1_buf = (ps_codec->pu1_parse_map + idx);
3289             *pu1_buf = 1;
3290         }
3291 
3292         /* Increment CTB x and y positions */
3293         ps_codec->s_parse.i4_ctb_tile_x++;
3294         ps_codec->s_parse.i4_ctb_x++;
3295         ps_codec->s_parse.i4_ctb_slice_x++;
3296 
3297         /*If tiles are enabled, handle the slice counters differently*/
3298         if(ps_pps->i1_tiles_enabled_flag)
3299         {
3300             //Indicates multiple tiles in a slice case
3301             tile_start_ctb_idx = ps_tile->u1_pos_x
3302                             + ps_tile->u1_pos_y * (ps_sps->i2_pic_wd_in_ctb);
3303 
3304             slice_start_ctb_idx =  ps_slice_hdr->i2_ctb_x
3305                             + ps_slice_hdr->i2_ctb_y * (ps_sps->i2_pic_wd_in_ctb);
3306 
3307             if((slice_start_ctb_idx < tile_start_ctb_idx))
3308             {
3309                 if(ps_codec->s_parse.i4_ctb_slice_x == (ps_tile->u1_pos_x + ps_tile->u2_wd))
3310                 {
3311                     /* Reached end of slice row within a tile /frame */
3312                     ps_codec->s_parse.i4_ctb_slice_y++;
3313                     ps_codec->s_parse.i4_ctb_slice_x = ps_tile->u1_pos_x; //todo:Check
3314                 }
3315             }
3316             //Indicates multiple slices in a tile case - hence, reset slice_x
3317             else if(ps_codec->s_parse.i4_ctb_slice_x == (ps_tile->u2_wd))
3318             {
3319                 ps_codec->s_parse.i4_ctb_slice_y++;
3320                 ps_codec->s_parse.i4_ctb_slice_x = 0;
3321             }
3322         }
3323         else
3324         {
3325             if(ps_codec->s_parse.i4_ctb_slice_x == ps_tile->u2_wd)
3326             {
3327                 /* Reached end of slice row within a tile /frame */
3328                 ps_codec->s_parse.i4_ctb_slice_y++;
3329                 ps_codec->s_parse.i4_ctb_slice_x = 0;
3330             }
3331         }
3332 
3333 
3334         if(ps_codec->s_parse.i4_ctb_tile_x == (ps_tile->u2_wd))
3335         {
3336             /* Reached end of tile row */
3337             ps_codec->s_parse.i4_ctb_tile_x = 0;
3338             ps_codec->s_parse.i4_ctb_x = ps_tile->u1_pos_x;
3339 
3340             ps_codec->s_parse.i4_ctb_tile_y++;
3341             ps_codec->s_parse.i4_ctb_y++;
3342 
3343             if(ps_codec->s_parse.i4_ctb_tile_y == (ps_tile->u2_ht))
3344             {
3345                 /* Reached End of Tile */
3346                 ps_codec->s_parse.i4_ctb_tile_y = 0;
3347                 ps_codec->s_parse.i4_ctb_tile_x = 0;
3348                 ps_codec->s_parse.ps_tile++;
3349 
3350                 if((ps_tile->u2_ht + ps_tile->u1_pos_y  ==  ps_sps->i2_pic_ht_in_ctb) && (ps_tile->u2_wd + ps_tile->u1_pos_x  ==  ps_sps->i2_pic_wd_in_ctb))
3351                 {
3352                     /* Reached end of frame */
3353                     end_of_pic = 1;
3354                     ps_codec->s_parse.i4_ctb_x = 0;
3355                     ps_codec->s_parse.i4_ctb_y = ps_sps->i2_pic_ht_in_ctb;
3356                 }
3357                 else
3358                 {
3359                     /* Initialize ctb_x and ctb_y to start of next tile */
3360                     ps_tile = ps_codec->s_parse.ps_tile;
3361                     ps_codec->s_parse.i4_ctb_x = ps_tile->u1_pos_x;
3362                     ps_codec->s_parse.i4_ctb_y = ps_tile->u1_pos_y;
3363                     ps_codec->s_parse.i4_ctb_tile_y = 0;
3364                     ps_codec->s_parse.i4_ctb_tile_x = 0;
3365                     ps_codec->s_parse.i4_ctb_slice_x = ps_tile->u1_pos_x;
3366                     ps_codec->s_parse.i4_ctb_slice_y = ps_tile->u1_pos_y;
3367 
3368                 }
3369             }
3370 
3371         }
3372 
3373         ps_codec->s_parse.i4_next_ctb_indx = ps_codec->s_parse.i4_ctb_x +
3374                         ps_codec->s_parse.i4_ctb_y * ps_sps->i2_pic_wd_in_ctb;
3375 
3376         /* If the current slice is in error, check if the next slice's address
3377          * is reached and mark the end_of_slice flag */
3378         if(ps_codec->i4_slice_error)
3379         {
3380             slice_header_t *ps_slice_hdr_next = ps_slice_hdr + 1;
3381             WORD32 next_slice_addr = ps_slice_hdr_next->i2_ctb_x +
3382                             ps_slice_hdr_next->i2_ctb_y * ps_sps->i2_pic_wd_in_ctb;
3383 
3384             if(ps_codec->s_parse.i4_next_ctb_indx == next_slice_addr)
3385                 end_of_slice_flag = 1;
3386         }
3387 
3388         /* If the codec is running in single core mode
3389          * then call process function for current CTB
3390          */
3391         if((1 == ps_codec->i4_num_cores) && (ps_codec->s_parse.i4_ctb_tile_x == 0))
3392         {
3393             process_ctxt_t *ps_proc = &ps_codec->as_process[0];
3394 //          ps_proc->i4_ctb_cnt = ihevcd_nctb_cnt(ps_codec, ps_sps);
3395             ps_proc->i4_ctb_cnt = ps_proc->ps_tile->u2_wd;
3396             ihevcd_process(ps_proc);
3397         }
3398 
3399         /* If the bytes for the current slice are exhausted
3400          * set end_of_slice flag to 1
3401          * This slice will be treated as incomplete */
3402         if((UWORD8 *)ps_codec->s_parse.s_bitstrm.pu1_buf_max + BITSTRM_OFF_THRS <
3403                                         ((UWORD8 *)ps_codec->s_parse.s_bitstrm.pu4_buf + (ps_codec->s_parse.s_bitstrm.u4_bit_ofst / 8)))
3404         {
3405             // end_of_slice_flag = ps_codec->i4_slice_error ? 0 : 1;
3406 
3407             if(0 == ps_codec->i4_slice_error)
3408                 end_of_slice_flag = 1;
3409         }
3410 
3411 
3412         if(end_of_pic)
3413             break;
3414     } while(!end_of_slice_flag);
3415 
3416     /* Reset slice error */
3417     ps_codec->i4_slice_error = 0;
3418 
3419     /* Increment the slice index for parsing next slice */
3420     if(0 == end_of_pic)
3421     {
3422         while(1)
3423         {
3424 
3425             WORD32 parse_slice_idx;
3426             parse_slice_idx = ps_codec->s_parse.i4_cur_slice_idx;
3427             parse_slice_idx++;
3428 
3429             {
3430                 /* If the next slice header is not initialized, update cur_slice_idx and break */
3431                 if((1 == ps_codec->i4_num_cores) || (0 != (parse_slice_idx & (MAX_SLICE_HDR_CNT - 1))))
3432                 {
3433                     ps_codec->s_parse.i4_cur_slice_idx = parse_slice_idx;
3434                     break;
3435                 }
3436 
3437                 /* If the next slice header is initialised, wait for the parsed slices to be processed */
3438                 else
3439                 {
3440                     WORD32 ctb_indx = 0;
3441 
3442                     while(ctb_indx != ps_sps->i4_pic_size_in_ctb)
3443                     {
3444                         WORD32 parse_status = *(ps_codec->pu1_parse_map + ctb_indx);
3445                         volatile WORD32 proc_status = *(ps_codec->pu1_proc_map + ctb_indx) & 1;
3446 
3447                         if(parse_status == proc_status)
3448                             ctb_indx++;
3449                     }
3450                     ps_codec->s_parse.i4_cur_slice_idx = parse_slice_idx;
3451                     break;
3452                 }
3453 
3454             }
3455         }
3456 
3457     }
3458     else
3459     {
3460 #if FRAME_ILF_PAD
3461         if(FRAME_ILF_PAD && 1 == ps_codec->i4_num_cores)
3462         {
3463             if(ps_slice_hdr->i4_abs_pic_order_cnt == 0)
3464             {
3465                 DUMP_PRE_ILF(ps_codec->as_process[0].pu1_cur_pic_luma,
3466                              ps_codec->as_process[0].pu1_cur_pic_chroma,
3467                              ps_sps->i2_pic_width_in_luma_samples,
3468                              ps_sps->i2_pic_height_in_luma_samples,
3469                              ps_codec->i4_strd);
3470 
3471                 DUMP_BS(ps_codec->as_process[0].s_bs_ctxt.pu4_pic_vert_bs,
3472                         ps_codec->as_process[0].s_bs_ctxt.pu4_pic_horz_bs,
3473                         ps_sps->i2_pic_wd_in_ctb * (ctb_size * ctb_size / 8 / 16) * ps_sps->i2_pic_ht_in_ctb,
3474                         (ps_sps->i2_pic_wd_in_ctb + 1) * (ctb_size * ctb_size / 8 / 16) * ps_sps->i2_pic_ht_in_ctb);
3475 
3476                 DUMP_QP(ps_codec->as_process[0].s_bs_ctxt.pu1_pic_qp,
3477                         (ps_sps->i2_pic_height_in_luma_samples * ps_sps->i2_pic_width_in_luma_samples) / (MIN_CU_SIZE * MIN_CU_SIZE));
3478 
3479                 DUMP_QP_CONST_IN_CTB(ps_codec->as_process[0].s_bs_ctxt.pu1_pic_qp_const_in_ctb,
3480                                      (ps_sps->i2_pic_height_in_luma_samples * ps_sps->i2_pic_width_in_luma_samples) / (MIN_CTB_SIZE * MIN_CTB_SIZE) / 8);
3481 
3482                 DUMP_NO_LOOP_FILTER(ps_codec->as_process[0].pu1_pic_no_loop_filter_flag,
3483                                     (ps_sps->i2_pic_width_in_luma_samples / MIN_CU_SIZE) * (ps_sps->i2_pic_height_in_luma_samples / MIN_CU_SIZE) / 8);
3484 
3485                 DUMP_OFFSETS(ps_slice_hdr->i1_beta_offset_div2,
3486                              ps_slice_hdr->i1_tc_offset_div2,
3487                              ps_pps->i1_pic_cb_qp_offset,
3488                              ps_pps->i1_pic_cr_qp_offset);
3489             }
3490             ps_codec->s_parse.s_deblk_ctxt.ps_pps = ps_codec->s_parse.ps_pps;
3491             ps_codec->s_parse.s_deblk_ctxt.ps_sps = ps_codec->s_parse.ps_sps;
3492             ps_codec->s_parse.s_deblk_ctxt.ps_codec = ps_codec;
3493             ps_codec->s_parse.s_deblk_ctxt.ps_slice_hdr = ps_codec->s_parse.ps_slice_hdr;
3494             ps_codec->s_parse.s_deblk_ctxt.is_chroma_yuv420sp_vu = (ps_codec->e_ref_chroma_fmt == IV_YUV_420SP_VU);
3495 
3496             ps_codec->s_parse.s_sao_ctxt.ps_pps = ps_codec->s_parse.ps_pps;
3497             ps_codec->s_parse.s_sao_ctxt.ps_sps = ps_codec->s_parse.ps_sps;
3498             ps_codec->s_parse.s_sao_ctxt.ps_codec = ps_codec;
3499             ps_codec->s_parse.s_sao_ctxt.ps_slice_hdr = ps_codec->s_parse.ps_slice_hdr;
3500 
3501             ihevcd_ilf_pad_frame(&ps_codec->s_parse.s_deblk_ctxt, &ps_codec->s_parse.s_sao_ctxt);
3502 
3503         }
3504 #endif
3505         ps_codec->s_parse.i4_end_of_frame = 1;
3506     }
3507     return ret;
3508 }
3509 
3510 
3511 
3512 
3513 
3514 
3515 
3516 
3517