• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /*
2  * Copyright (c) 2011 Intel Corporation. All Rights Reserved.
3  * Copyright (c) Imagination Technologies Limited, UK
4  *
5  * Permission is hereby granted, free of charge, to any person obtaining a
6  * copy of this software and associated documentation files (the
7  * "Software"), to deal in the Software without restriction, including
8  * without limitation the rights to use, copy, modify, merge, publish,
9  * distribute, sub license, and/or sell copies of the Software, and to
10  * permit persons to whom the Software is furnished to do so, subject to
11  * the following conditions:
12  *
13  * The above copyright notice and this permission notice (including the
14  * next paragraph) shall be included in all copies or substantial portions
15  * of the Software.
16  *
17  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
18  * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
19  * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NON-INFRINGEMENT.
20  * IN NO EVENT SHALL PRECISION INSIGHT AND/OR ITS SUPPLIERS BE LIABLE FOR
21  * ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,
22  * TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE
23  * SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
24  *
25  * Authors:
26  *    Elaine Wang <elaine.wang@intel.com>
27  *    Zeng Li <zeng.li@intel.com>
28  *    Edward Lin <edward.lin@intel.com>
29  *
30  */
31 
32 #include "psb_drv_video.h"
33 //#include "tng_H263ES.h"
34 #include "tng_hostheader.h"
35 #include "tng_hostcode.h"
36 #include "psb_def.h"
37 #include "psb_drv_debug.h"
38 #include "psb_cmdbuf.h"
39 #include "psb_buffer.h"
40 #include <stdio.h>
41 #include "psb_output.h"
42 #include "tng_picmgmt.h"
43 #include "tng_hostbias.h"
44 #include "tng_hostair.h"
45 #ifdef _TOPAZHP_PDUMP_
46 #include "tng_trace.h"
47 #endif
48 #include <wsbm/wsbm_manager.h>
49 
50 #include "hwdefs/topazhp_core_regs.h"
51 #include "hwdefs/topazhp_multicore_regs_old.h"
52 #include "hwdefs/topaz_db_regs.h"
53 #include "hwdefs/topaz_vlc_regs.h"
54 #include "hwdefs/mvea_regs.h"
55 #include "hwdefs/topazhp_default_params.h"
56 
57 #define ALIGN_TO(value, align) ((value + align - 1) & ~(align - 1))
58 #define PAGE_ALIGN(value) ALIGN_TO(value, 4096)
59 #define DEFAULT_MVCALC_CONFIG   ((0x00040303)|(MASK_TOPAZHP_CR_MVCALC_JITTER_POINTER_RST))
60 #define DEFAULT_MVCALC_COLOCATED        (0x00100100)
61 #define MVEA_MV_PARAM_REGION_SIZE 16
62 #define MVEA_ABOVE_PARAM_REGION_SIZE 96
63 #define QUANT_LISTS_SIZE                (224)
64 #define _1080P_30FPS (((1920*1088)/256)*30)
65 #define tng_align_64(X)  (((X)+63) &~63)
66 #define tng_align_4(X)  (((X)+3) &~3)
67 
68 /* #define MTX_CONTEXT_ITEM_OFFSET(type, member) (size_t)&(((type*)0)->member) */
69 
70 #define DEFAULT_CABAC_DB_MARGIN    (0x190)
71 #define NOT_USED_BY_TOPAZ 0
72 /*
73 #define _TOPAZHP_CMDBUF_
74 */
75 #ifdef _TOPAZHP_CMDBUF_
tng__trace_cmdbuf_words(tng_cmdbuf_p cmdbuf)76 static void tng__trace_cmdbuf_words(tng_cmdbuf_p cmdbuf)
77 {
78     int i = 0;
79     IMG_UINT32 *ptmp = (IMG_UINT32 *)(cmdbuf->cmd_start);
80     IMG_UINT32 *pend = (IMG_UINT32 *)(cmdbuf->cmd_idx);
81     do {
82         drv_debug_msg(VIDEO_DEBUG_GENERAL, "%s: command words [%d] = 0x%08x\n", __FUNCTION__, i++, (unsigned int)(*ptmp++));
83     } while(ptmp < pend);
84     return ;
85 }
86 #endif
87 
88 #if 0
89 static IMG_UINT32 tng__get_codedbuffer_size(
90     IMG_STANDARD eStandard,
91     IMG_UINT16 ui16MBWidth,
92     IMG_UINT16 ui16MBHeight,
93     IMG_RC_PARAMS * psRCParams
94 )
95 {
96     if (eStandard == IMG_STANDARD_H264) {
97         // allocate based on worst case qp size
98         return ((IMG_UINT32)ui16MBWidth * (IMG_UINT32)ui16MBHeight * 400);
99     }
100 
101     if (psRCParams->ui32InitialQp <= 5)
102         return ((IMG_UINT32)ui16MBWidth * (IMG_UINT32)ui16MBHeight * 1600);
103 
104     return ((IMG_UINT32)ui16MBWidth * (IMG_UINT32)ui16MBHeight * 900);
105 }
106 
107 
108 static IMG_UINT32 tng__get_codedbuf_size_according_bitrate(
109     IMG_RC_PARAMS * psRCParams
110 )
111 {
112     return ((psRCParams->ui32BitsPerSecond + psRCParams->ui32FrameRate / 2) / psRCParams->ui32FrameRate) * 2;
113 }
114 
115 static IMG_UINT32 tng__get_buffer_size(IMG_UINT32 src_size)
116 {
117     return (src_size + 0x1000) & (~0xfff);
118 }
119 #endif
120 
121 //static inline
tng__alloc_init_buffer(psb_driver_data_p driver_data,unsigned int size,psb_buffer_type_t type,psb_buffer_p buf)122 VAStatus tng__alloc_init_buffer(
123     psb_driver_data_p driver_data,
124     unsigned int size,
125     psb_buffer_type_t type,
126     psb_buffer_p buf)
127 {
128     unsigned char *pch_virt_addr;
129     VAStatus vaStatus = VA_STATUS_SUCCESS;
130     vaStatus = psb_buffer_create(driver_data, size, type, buf);
131     if (VA_STATUS_SUCCESS != vaStatus) {
132         drv_debug_msg(VIDEO_DEBUG_ERROR, "alloc mem params buffer");
133         return vaStatus;
134     }
135 
136     vaStatus = psb_buffer_map(buf, &pch_virt_addr);
137     drv_debug_msg(VIDEO_DEBUG_GENERAL, "%s: phy addr 0x%08x, vir addr 0x%08x\n", __FUNCTION__, buf->drm_buf, pch_virt_addr);
138     if ((vaStatus) || (pch_virt_addr == NULL)) {
139         drv_debug_msg(VIDEO_DEBUG_ERROR, "%s: map buf 0x%08x\n", __FUNCTION__, (IMG_UINT32)pch_virt_addr);
140         psb_buffer_destroy(buf);
141     } else {
142         memset(pch_virt_addr, 0, size);
143         psb_buffer_unmap(buf);
144     }
145 
146     return vaStatus;
147 }
148 
tng__alloc_context_buffer(context_ENC_p ctx,IMG_UINT8 ui8IsJpeg,IMG_UINT32 ui32StreamID)149 static VAStatus tng__alloc_context_buffer(context_ENC_p ctx, IMG_UINT8 ui8IsJpeg, IMG_UINT32 ui32StreamID)
150 {
151     VAStatus vaStatus = VA_STATUS_SUCCESS;
152     IMG_UINT32 ui32_pic_width, ui32_pic_height;
153     IMG_UINT32 ui32_mb_per_row, ui32_mb_per_column;
154     IMG_UINT32 ui32_adj_mb_per_row = 0;
155     IMG_RC_PARAMS *psRCParams = &(ctx->sRCParams);
156     psb_driver_data_p ps_driver_data = ctx->obj_context->driver_data;
157     context_ENC_mem *ps_mem = &(ctx->ctx_mem[ui32StreamID]);
158     context_ENC_mem_size *ps_mem_size = &(ctx->ctx_mem_size);
159 
160     if (ctx->eStandard == IMG_STANDARD_H264) {
161         ctx->ui8PipesToUse = tng__min(ctx->ui8PipesToUse, ctx->ui8SlicesPerPicture);
162     } else {
163         ctx->ui8PipesToUse = 1;
164     }
165 
166     ctx->i32PicNodes  = (psRCParams->b16Hierarchical ? MAX_REF_B_LEVELS : 0) + 4;
167     ctx->i32MVStores = (ctx->i32PicNodes * 2);
168     ctx->i32CodedBuffers = (IMG_INT32)(ctx->ui8PipesToUse) * (ctx->bIsInterlaced ? 3 : 2);
169     ctx->ui8SlotsInUse = psRCParams->ui16BFrames + 2;
170 
171     if (0 != ui8IsJpeg) {
172         ctx->jpeg_pic_params_size = (sizeof(JPEG_MTX_QUANT_TABLE) + 0x3f) & (~0x3f);
173         ctx->jpeg_header_mem_size = (sizeof(JPEG_MTX_DMA_SETUP) + 0x3f) & (~0x3f);
174         ctx->jpeg_header_interface_mem_size = (sizeof(JPEG_MTX_WRITEBACK_MEMORY) + 0x3f) & (~0x3f);
175 
176         //write back region
177         ps_mem_size->writeback = tng_align_KB(COMM_WB_DATA_BUF_SIZE);
178         tng__alloc_init_buffer(ps_driver_data, WB_FIFO_SIZE * ps_mem_size->writeback, psb_bt_cpu_vpu, &(ctx->bufs_writeback));
179 
180         drv_debug_msg(VIDEO_DEBUG_GENERAL, "%s: end\n", __FUNCTION__);
181         return vaStatus;
182     }
183 
184     /* width and height should be source surface's w and h or ?? */
185     ui32_pic_width = ctx->obj_context->picture_width;
186     ui32_mb_per_row = (ctx->obj_context->picture_width + 15) >> 4;
187     ui32_pic_height = ctx->obj_context->picture_height;
188     ui32_mb_per_column = (ctx->obj_context->picture_height + 15) >> 4;
189     ui32_adj_mb_per_row = ((ui32_mb_per_row + 7)>>3)<<3;  // Ensure multiple of 8 MBs per row
190 
191     //command buffer use
192     ps_mem_size->pic_template = ps_mem_size->slice_template =
193     ps_mem_size->seq_header = tng_align_KB(TNG_HEADER_SIZE);
194     tng__alloc_init_buffer(ps_driver_data, ps_mem_size->seq_header,
195         psb_bt_cpu_vpu, &(ps_mem->bufs_seq_header));
196 
197     if (ctx->bEnableMVC)
198         tng__alloc_init_buffer(ps_driver_data, ps_mem_size->seq_header,
199             psb_bt_cpu_vpu, &(ps_mem->bufs_sub_seq_header));
200 
201     tng__alloc_init_buffer(ps_driver_data, 4 * ps_mem_size->pic_template,
202         psb_bt_cpu_vpu, &(ps_mem->bufs_pic_template));
203 
204     tng__alloc_init_buffer(ps_driver_data, NUM_SLICE_TYPES * ps_mem_size->slice_template,
205         psb_bt_cpu_vpu, &(ps_mem->bufs_slice_template));
206 
207     ps_mem_size->mtx_context = tng_align_KB(MTX_CONTEXT_SIZE);
208     tng__alloc_init_buffer(ps_driver_data, ps_mem_size->mtx_context,
209         psb_bt_cpu_vpu, &(ps_mem->bufs_mtx_context));
210 
211     //sei header(AUDHeader+SEIBufferPeriodMem+SEIPictureTimingHeaderMem)
212     ps_mem_size->sei_header = tng_align_KB(64);
213     tng__alloc_init_buffer(ps_driver_data, 3 * ps_mem_size->sei_header,
214         psb_bt_cpu_vpu, &(ps_mem->bufs_sei_header));
215 
216     //gop header
217     ps_mem_size->flat_gop = ps_mem_size->hierar_gop = tng_align_KB(64);
218     tng__alloc_init_buffer(ps_driver_data, ps_mem_size->flat_gop,
219         psb_bt_cpu_vpu, &(ps_mem->bufs_flat_gop));
220     tng__alloc_init_buffer(ps_driver_data, ps_mem_size->hierar_gop,
221         psb_bt_cpu_vpu, &(ps_mem->bufs_hierar_gop));
222 
223     //above params
224     ps_mem_size->above_params = tng_align_KB(MVEA_ABOVE_PARAM_REGION_SIZE * tng_align_64(ui32_mb_per_row));
225     tng__alloc_init_buffer(ps_driver_data, (IMG_UINT32)(ctx->ui8PipesToUse) * ps_mem_size->above_params,
226         psb_bt_cpu_vpu, &(ps_mem->bufs_above_params));
227 
228     //ctx->mv_setting_btable_size = tng_align_KB(MAX_BFRAMES * (tng_align_64(sizeof(IMG_MV_SETTINGS) * MAX_BFRAMES)));
229     ps_mem_size->mv_setting_btable = tng_align_KB(MAX_BFRAMES * MV_ROW_STRIDE);
230     tng__alloc_init_buffer(ps_driver_data, ps_mem_size->mv_setting_btable,
231         psb_bt_cpu_vpu, &(ps_mem->bufs_mv_setting_btable));
232 
233     ps_mem_size->mv_setting_hierar = tng_align_KB(MAX_BFRAMES * sizeof(IMG_MV_SETTINGS));
234     tng__alloc_init_buffer(ps_driver_data, ps_mem_size->mv_setting_hierar,
235         psb_bt_cpu_vpu, &(ps_mem->bufs_mv_setting_hierar));
236 
237     //colocated params
238     ps_mem_size->colocated = tng_align_KB(MVEA_MV_PARAM_REGION_SIZE * tng_align_4(ui32_mb_per_row * ui32_mb_per_column));
239     tng__alloc_init_buffer(ps_driver_data, ctx->i32PicNodes * ps_mem_size->colocated,
240         psb_bt_cpu_vpu, &(ps_mem->bufs_colocated));
241 
242     ps_mem_size->interview_mv = ps_mem_size->mv = ps_mem_size->colocated;
243     tng__alloc_init_buffer(ps_driver_data, ctx->i32MVStores * ps_mem_size->mv,
244         psb_bt_cpu_vpu, &(ps_mem->bufs_mv));
245 
246     if (ctx->bEnableMVC) {
247         tng__alloc_init_buffer(ps_driver_data, 2 * ps_mem_size->interview_mv,
248             psb_bt_cpu_vpu, &(ps_mem->bufs_interview_mv));
249     }
250 
251     //write back region
252     ps_mem_size->writeback = tng_align_KB(COMM_WB_DATA_BUF_SIZE);
253     tng__alloc_init_buffer(ps_driver_data, WB_FIFO_SIZE * ps_mem_size->writeback,
254         psb_bt_cpu_vpu, &(ctx->bufs_writeback));
255 
256     ps_mem_size->slice_map = tng_align_KB(0x1500); //(1 + MAX_SLICESPERPIC * 2 + 15) & ~15);
257     tng__alloc_init_buffer(ps_driver_data, ctx->ui8SlotsInUse * ps_mem_size->slice_map,
258         psb_bt_cpu_vpu, &(ps_mem->bufs_slice_map));
259 
260     ps_mem_size->weighted_prediction = tng_align_KB(sizeof(WEIGHTED_PREDICTION_VALUES));
261     tng__alloc_init_buffer(ps_driver_data, ctx->ui8SlotsInUse * ps_mem_size->weighted_prediction,
262         psb_bt_cpu_vpu, &(ps_mem->bufs_weighted_prediction));
263 
264 #ifdef LTREFHEADER
265     ps_mem_size->lt_ref_header = tng_align_KB((sizeof(MTX_HEADER_PARAMS)+63)&~63);
266     tng__alloc_init_buffer(ps_driver_data, ctx->ui8SlotsInUse * ps_mem_size->lt_ref_header,
267         psb_bt_cpu_vpu, &(ps_mem->bufs_lt_ref_header));
268 #endif
269 
270     ps_mem_size->recon_pictures = tng_align_KB((tng_align_64(ui32_pic_width)*tng_align_64(ui32_pic_height))*3/2);
271     tng__alloc_init_buffer(ps_driver_data, ctx->i32PicNodes * ps_mem_size->recon_pictures,
272         psb_bt_cpu_vpu, &(ps_mem->bufs_recon_pictures));
273 
274     ctx->ctx_mem_size.first_pass_out_params = tng_align_KB(sizeof(IMG_FIRST_STAGE_MB_PARAMS) * ui32_mb_per_row *  ui32_mb_per_column);
275     tng__alloc_init_buffer(ps_driver_data, ctx->ui8SlotsInUse * ctx->ctx_mem_size.first_pass_out_params,
276         psb_bt_cpu_vpu, &(ps_mem->bufs_first_pass_out_params));
277 
278 #ifndef EXCLUDE_BEST_MP_DECISION_DATA
279     ctx->ctx_mem_size.first_pass_out_best_multipass_param = tng_align_KB(ui32_mb_per_column * (((5*ui32_mb_per_row)+3)>>2) * 64);
280     tng__alloc_init_buffer(ps_driver_data, ctx->ui8SlotsInUse * ctx->ctx_mem_size.first_pass_out_best_multipass_param,
281         psb_bt_cpu_vpu, &(ps_mem->bufs_first_pass_out_best_multipass_param));
282 #endif
283 
284     ctx->ctx_mem_size.mb_ctrl_in_params = tng_align_KB(sizeof(IMG_FIRST_STAGE_MB_PARAMS) * ui32_adj_mb_per_row *  ui32_mb_per_column);
285     tng__alloc_init_buffer(ps_driver_data, ctx->ui8SlotsInUse * ctx->ctx_mem_size.mb_ctrl_in_params,
286         psb_bt_cpu_vpu, &(ps_mem->bufs_mb_ctrl_in_params));
287 
288     ctx->ctx_mem_size.lowpower_params = tng_align_KB(TNG_HEADER_SIZE);
289     tng__alloc_init_buffer(ps_driver_data, ps_mem_size->lowpower_params,
290         psb_bt_cpu_vpu, &(ps_mem->bufs_lowpower_params));
291 
292     ctx->ctx_mem_size.lowpower_data = tng_align_KB(0x10000);
293 
294     return vaStatus;
295 }
296 
tng__free_context_buffer(context_ENC_p ctx,unsigned char is_JPEG,unsigned int stream_id)297 static void tng__free_context_buffer(context_ENC_p ctx, unsigned char is_JPEG, unsigned int stream_id)
298 {
299     context_ENC_mem *ps_mem = &(ctx->ctx_mem[stream_id]);
300 
301     if (0 != is_JPEG) {
302         psb_buffer_destroy(&(ctx->bufs_writeback));
303         return;
304     }
305     psb_buffer_destroy(&(ps_mem->bufs_seq_header));
306     if (ctx->bEnableMVC)
307         psb_buffer_destroy(&(ps_mem->bufs_sub_seq_header));
308     psb_buffer_destroy(&(ps_mem->bufs_pic_template));
309     psb_buffer_destroy(&(ps_mem->bufs_slice_template));
310     psb_buffer_destroy(&(ps_mem->bufs_mtx_context));
311     psb_buffer_destroy(&(ps_mem->bufs_sei_header));
312 
313     psb_buffer_destroy(&(ps_mem->bufs_flat_gop));
314     psb_buffer_destroy(&(ps_mem->bufs_hierar_gop));
315     psb_buffer_destroy(&(ps_mem->bufs_above_params));
316     psb_buffer_destroy(&(ps_mem->bufs_mv_setting_btable));
317     psb_buffer_destroy(&(ps_mem->bufs_mv_setting_hierar));
318     psb_buffer_destroy(&(ps_mem->bufs_colocated));
319     psb_buffer_destroy(&(ps_mem->bufs_mv));
320     if (ctx->bEnableMVC)
321         psb_buffer_destroy(&(ps_mem->bufs_interview_mv));
322 
323     psb_buffer_destroy(&(ctx->bufs_writeback));
324     psb_buffer_destroy(&(ps_mem->bufs_slice_map));
325     psb_buffer_destroy(&(ps_mem->bufs_weighted_prediction));
326 #ifdef LTREFHEADER
327     psb_buffer_destroy(&(ps_mem->bufs_lt_ref_header));
328 #endif
329     psb_buffer_destroy(&(ps_mem->bufs_recon_pictures));
330     psb_buffer_destroy(&(ps_mem->bufs_first_pass_out_params));
331 #ifndef EXCLUDE_BEST_MP_DECISION_DATA
332     psb_buffer_destroy(&(ps_mem->bufs_first_pass_out_best_multipass_param));
333 #endif
334     psb_buffer_destroy(&(ps_mem->bufs_mb_ctrl_in_params));
335     psb_buffer_destroy(&(ps_mem->bufs_lowpower_params));
336 
337     return ;
338 }
339 
tng__get_ipe_control(IMG_CODEC eEncodingFormat)340 unsigned int tng__get_ipe_control(IMG_CODEC  eEncodingFormat)
341 {
342     unsigned int RegVal = 0;
343 
344     RegVal = F_ENCODE(2, MVEA_CR_IPE_GRID_FINE_SEARCH) |
345     F_ENCODE(0, MVEA_CR_IPE_GRID_SEARCH_SIZE) |
346     F_ENCODE(1, MVEA_CR_IPE_Y_FINE_SEARCH);
347 
348     switch (eEncodingFormat) {
349         case IMG_CODEC_H263_NO_RC:
350         case IMG_CODEC_H263_VBR:
351         case IMG_CODEC_H263_CBR:
352             RegVal |= F_ENCODE(0, MVEA_CR_IPE_BLOCKSIZE) | F_ENCODE(0, MVEA_CR_IPE_ENCODING_FORMAT);
353         break;
354         case IMG_CODEC_MPEG4_NO_RC:
355         case IMG_CODEC_MPEG4_VBR:
356         case IMG_CODEC_MPEG4_CBR:
357             RegVal |= F_ENCODE(1, MVEA_CR_IPE_BLOCKSIZE) | F_ENCODE(1, MVEA_CR_IPE_ENCODING_FORMAT);
358         default:
359         break;
360         case IMG_CODEC_H264_NO_RC:
361         case IMG_CODEC_H264_VBR:
362         case IMG_CODEC_H264_CBR:
363         case IMG_CODEC_H264_VCM:
364             RegVal |= F_ENCODE(2, MVEA_CR_IPE_BLOCKSIZE) | F_ENCODE(2, MVEA_CR_IPE_ENCODING_FORMAT);
365         break;
366     }
367     RegVal |= F_ENCODE(6, MVEA_CR_IPE_Y_CANDIDATE_NUM);
368     return RegVal;
369 }
370 
tng__setup_enc_profile_features(context_ENC_p ctx,IMG_UINT32 ui32EncProfile)371 void tng__setup_enc_profile_features(context_ENC_p ctx, IMG_UINT32 ui32EncProfile)
372 {
373     IMG_ENCODE_FEATURES * pEncFeatures = &ctx->sEncFeatures;
374     /* Set the default values first */
375     pEncFeatures->bDisableBPicRef_0 = IMG_FALSE;
376     pEncFeatures->bDisableBPicRef_1 = IMG_FALSE;
377 
378     pEncFeatures->bDisableInter8x8 = IMG_FALSE;
379     pEncFeatures->bRestrictInter4x4 = IMG_FALSE;
380 
381     pEncFeatures->bDisableIntra4x4  = IMG_FALSE;
382     pEncFeatures->bDisableIntra8x8  = IMG_FALSE;
383     pEncFeatures->bDisableIntra16x16 = IMG_FALSE;
384 
385     pEncFeatures->bEnable8x16MVDetect   = IMG_TRUE;
386     pEncFeatures->bEnable16x8MVDetect   = IMG_TRUE;
387     pEncFeatures->bDisableBFrames       = IMG_FALSE;
388 
389     pEncFeatures->eMinBlkSz = BLK_SZ_DEFAULT;
390 
391     switch (ui32EncProfile) {
392         case ENC_PROFILE_LOWCOMPLEXITY:
393             pEncFeatures->bDisableInter8x8  = IMG_TRUE;
394             pEncFeatures->bRestrictInter4x4 = IMG_TRUE;
395             pEncFeatures->bDisableIntra4x4  = IMG_TRUE;
396             pEncFeatures->bDisableIntra8x8  = IMG_TRUE;
397             pEncFeatures->bRestrictInter4x4 = IMG_TRUE;
398             pEncFeatures->eMinBlkSz         = BLK_SZ_16x16;
399             pEncFeatures->bDisableBFrames   = IMG_TRUE;
400             break;
401 
402         case ENC_PROFILE_HIGHCOMPLEXITY:
403             pEncFeatures->bDisableBPicRef_0 = IMG_FALSE;
404             pEncFeatures->bDisableBPicRef_1 = IMG_FALSE;
405 
406             pEncFeatures->bDisableInter8x8 = IMG_FALSE;
407             pEncFeatures->bRestrictInter4x4 = IMG_FALSE;
408 
409             pEncFeatures->bDisableIntra4x4  = IMG_FALSE;
410             pEncFeatures->bDisableIntra8x8  = IMG_FALSE;
411             pEncFeatures->bDisableIntra16x16 = IMG_FALSE;
412 
413             pEncFeatures->bEnable8x16MVDetect   = IMG_TRUE;
414             pEncFeatures->bEnable16x8MVDetect   = IMG_TRUE;
415             break;
416     }
417 
418     if (ctx->eStandard != IMG_STANDARD_H264) {
419 	pEncFeatures->bEnable8x16MVDetect = IMG_FALSE;
420 	pEncFeatures->bEnable16x8MVDetect = IMG_FALSE;
421     }
422 
423     return;
424 }
425 
tng__patch_hw_profile(context_ENC_p ctx)426 VAStatus tng__patch_hw_profile(context_ENC_p ctx)
427 {
428     IMG_UINT32 ui32IPEControl = 0;
429     IMG_UINT32 ui32PredCombControl = 0;
430     IMG_ENCODE_FEATURES * psEncFeatures = &(ctx->sEncFeatures);
431 
432     // bDisableIntra4x4
433     if (psEncFeatures->bDisableIntra4x4)
434         ui32PredCombControl |= F_ENCODE(1, TOPAZHP_CR_INTRA4X4_DISABLE);
435 
436     //bDisableIntra8x8
437     if (psEncFeatures->bDisableIntra8x8)
438         ui32PredCombControl |= F_ENCODE(1, TOPAZHP_CR_INTRA8X8_DISABLE);
439 
440     //bDisableIntra16x16, check if atleast one of the other Intra mode is enabled
441     if ((psEncFeatures->bDisableIntra16x16) &&
442         (!(psEncFeatures->bDisableIntra8x8) || !(psEncFeatures->bDisableIntra4x4))) {
443         ui32PredCombControl |= F_ENCODE(1, TOPAZHP_CR_INTRA16X16_DISABLE);
444     }
445 
446     if (psEncFeatures->bRestrictInter4x4) {
447 //        ui32PredCombControl |= F_ENCODE(1, TOPAZHP_CR_INTER4X4_RESTRICT);
448         ui32IPEControl |= F_ENCODE(1, TOPAZHP_CR_IPE_MV_NUMBER_RESTRICTION);
449     }
450 
451     if (psEncFeatures->bDisableInter8x8)
452         ui32PredCombControl |= F_ENCODE(1, TOPAZHP_CR_INTER8X8_DISABLE);
453 
454     if (psEncFeatures->bDisableBPicRef_1)
455         ui32PredCombControl |= F_ENCODE(1, TOPAZHP_CR_B_PIC1_DISABLE);
456     else if (psEncFeatures->bDisableBPicRef_0)
457         ui32PredCombControl |= F_ENCODE(1, TOPAZHP_CR_B_PIC0_DISABLE);
458 
459     // save predictor combiner control in video encode parameter set
460     ctx->ui32PredCombControl = ui32PredCombControl;
461 
462     // set blocksize
463     ui32IPEControl |= F_ENCODE(psEncFeatures->eMinBlkSz, TOPAZHP_CR_IPE_BLOCKSIZE);
464 
465     if (psEncFeatures->bEnable8x16MVDetect)
466         ui32IPEControl |= F_ENCODE(1, TOPAZHP_CR_IPE_8X16_ENABLE);
467 
468     if (psEncFeatures->bEnable16x8MVDetect)
469         ui32IPEControl |= F_ENCODE(1, TOPAZHP_CR_IPE_16X8_ENABLE);
470 
471     if (psEncFeatures->bDisableBFrames)
472         ctx->sRCParams.ui16BFrames = 0;
473 
474     //save IPE-control register
475     ctx->ui32IPEControl = ui32IPEControl;
476 
477     return VA_STATUS_SUCCESS;
478 }
479 
480 #ifdef _TOPAZHP_CMDBUF_
tng__trace_cmdbuf(tng_cmdbuf_p cmdbuf,int idx)481 static void tng__trace_cmdbuf(tng_cmdbuf_p cmdbuf, int idx)
482 {
483     IMG_UINT32 ui32CmdTmp[4];
484     IMG_UINT32 *ptmp = (IMG_UINT32 *)(cmdbuf->cmd_start);
485     IMG_UINT32 *pend = (IMG_UINT32 *)(cmdbuf->cmd_idx);
486     IMG_UINT32 ui32Len;
487 
488     drv_debug_msg(VIDEO_DEBUG_GENERAL, "%s: start, stream (%d), ptmp (0x%08x), pend (0x%08x}\n", __FUNCTION__, idx, (unsigned int)ptmp, (unsigned int)pend);
489 
490     if (idx)
491         return ;
492 
493     while (ptmp < pend) {
494         drv_debug_msg(VIDEO_DEBUG_GENERAL, "%s: ptmp (0x%08x}\n", __FUNCTION__, *ptmp);
495         if ((*ptmp & 0x7f) == MTX_CMDID_SW_NEW_CODEC) {
496             ptmp += 4;
497         } else if ((*ptmp & 0x7f) == MTX_CMDID_SW_LEAVE_LOWPOWER) {
498             ptmp += 2;
499         } else if ((*ptmp & 0x7f) == MTX_CMDID_SW_WRITEREG) {
500             ui32Len = *(++ptmp);
501             drv_debug_msg(VIDEO_DEBUG_GENERAL, "%s: len = %d\n", __FUNCTION__, ui32Len);
502             ptmp += (ui32Len * 3) + 1;
503             drv_debug_msg(VIDEO_DEBUG_GENERAL, "%s: reg ptmp (0x%08x}\n", __FUNCTION__, *ptmp);
504         } else if ((*ptmp & 0x7f) == MTX_CMDID_DO_HEADER) {
505             ui32CmdTmp[0] = *ptmp++;
506             ui32CmdTmp[1] = *ptmp++;
507             ui32CmdTmp[2] = *ptmp++;
508             ui32CmdTmp[3] = 0;
509             //topazhp_dump_command((unsigned int*)ui32CmdTmp);
510             ptmp += 2;
511         } else if (
512             ((*ptmp & 0x7f) == MTX_CMDID_SETVIDEO)||
513             ((*ptmp & 0x7f) == MTX_CMDID_SHUTDOWN)) {
514             ui32CmdTmp[0] = *ptmp++;
515             ui32CmdTmp[1] = *ptmp++;
516             ui32CmdTmp[2] = *ptmp++;
517             ui32CmdTmp[3] = *ptmp++;
518             //topazhp_dump_command((unsigned int*)ui32CmdTmp);
519         } else if (
520             ((*ptmp & 0x7f) == MTX_CMDID_PROVIDE_SOURCE_BUFFER) ||
521             ((*ptmp & 0x7f) == MTX_CMDID_PROVIDE_REF_BUFFER) ||
522             ((*ptmp & 0x7f) == MTX_CMDID_PROVIDE_CODED_BUFFER) ||
523             ((*ptmp & 0x7f) == MTX_CMDID_PICMGMT) ||
524             ((*ptmp & 0x7f) == MTX_CMDID_ENCODE_FRAME)) {
525             ui32CmdTmp[0] = *ptmp++;
526             ui32CmdTmp[1] = *ptmp++;
527             ui32CmdTmp[2] = *ptmp++;
528             ui32CmdTmp[3] = 0;
529             //topazhp_dump_command((unsigned int*)ui32CmdTmp);
530         } else {
531             drv_debug_msg(VIDEO_DEBUG_ERROR, "%s: error leave lowpower = 0x%08x\n", __FUNCTION__, *ptmp++);
532         }
533     }
534 
535     drv_debug_msg(VIDEO_DEBUG_GENERAL, "%s: end\n", __FUNCTION__);
536 
537     return ;
538 }
539 #endif
540 
tng_DestroyContext(object_context_p obj_context,unsigned char is_JPEG)541 void tng_DestroyContext(object_context_p obj_context, unsigned char is_JPEG)
542 {
543     context_ENC_p ctx;
544 //    tng_cmdbuf_p cmdbuf = ctx->obj_context->tng_cmdbuf;
545     ctx = (context_ENC_p)obj_context->format_data;
546     FRAME_ORDER_INFO *psFrameInfo = &(ctx->sFrameOrderInfo);
547 
548     if (psFrameInfo->slot_consume_dpy_order != NULL)
549         free(psFrameInfo->slot_consume_dpy_order);
550     if (psFrameInfo->slot_consume_enc_order != NULL)
551         free(psFrameInfo->slot_consume_enc_order);
552 
553     tng_air_buf_free(ctx);
554 
555     tng__free_context_buffer(ctx, is_JPEG, 0);
556 
557     if (ctx->bEnableMVC)
558         tng__free_context_buffer(ctx, is_JPEG, 1);
559 
560     free(obj_context->format_data);
561     obj_context->format_data = NULL;
562 }
563 
tng__init_rc_params(context_ENC_p ctx,object_config_p obj_config)564 static VAStatus tng__init_rc_params(context_ENC_p ctx, object_config_p obj_config)
565 {
566     IMG_RC_PARAMS *psRCParams = &(ctx->sRCParams);
567     unsigned int eRCmode = 0;
568     memset(psRCParams, 0, sizeof(IMG_RC_PARAMS));
569     IMG_INT32 i;
570 
571     //set RC mode
572     for (i = 0; i < obj_config->attrib_count; i++) {
573         if (obj_config->attrib_list[i].type == VAConfigAttribRateControl)
574             break;
575     }
576 
577     if (i >= obj_config->attrib_count) {
578         eRCmode = VA_RC_NONE;
579     } else {
580         eRCmode = obj_config->attrib_list[i].value;
581     }
582 
583     ctx->sRCParams.bRCEnable = IMG_TRUE;
584     ctx->sRCParams.bDisableBitStuffing = IMG_FALSE;
585 
586     if (eRCmode == VA_RC_NONE) {
587         ctx->sRCParams.bRCEnable = IMG_FALSE;
588         ctx->sRCParams.eRCMode = IMG_RCMODE_NONE;
589     } else if (eRCmode == VA_RC_CBR) {
590         ctx->sRCParams.eRCMode = IMG_RCMODE_CBR;
591     } else if (eRCmode == VA_RC_VBR) {
592         ctx->sRCParams.eRCMode = IMG_RCMODE_VBR;
593     } else if (eRCmode == VA_RC_VCM) {
594         ctx->sRCParams.eRCMode = IMG_RCMODE_VCM;
595     } else {
596         ctx->sRCParams.bRCEnable = IMG_FALSE;
597         drv_debug_msg(VIDEO_DEBUG_ERROR, "not support this RT Format\n");
598         return VA_STATUS_ERROR_UNSUPPORTED_RT_FORMAT;
599     }
600 
601     psRCParams->bScDetectDisable = IMG_FALSE;
602     psRCParams->ui32SliceByteLimit = 0;
603     psRCParams->ui32SliceMBLimit = 0;
604     psRCParams->bIsH264Codec = (ctx->eStandard == IMG_STANDARD_H264) ? IMG_TRUE : IMG_FALSE;
605     return VA_STATUS_SUCCESS;
606 }
607 
608 /**************************************************************************************************
609 * Function:             IMG_C_GetEncoderCaps
610 * Description:  Get the capabilities of the encoder for the given codec
611 *
612 ***************************************************************************************************/
613 //FIXME
614 static const IMG_UINT32 g_ui32PipesAvailable = TOPAZHP_PIPE_NUM;
615 static const IMG_UINT32 g_ui32CoreDes1 = TOPAZHP_PIPE_NUM;
616 static const IMG_UINT32 g_ui32CoreRev = 0x00030401;
617 
tng__get_num_pipes()618 static IMG_UINT32 tng__get_num_pipes()
619 {
620     return g_ui32PipesAvailable;
621 }
622 
tng__get_core_des1()623 static IMG_UINT32 tng__get_core_des1()
624 {
625     return g_ui32CoreDes1;
626 }
627 
tng__get_core_rev()628 static IMG_UINT32 tng__get_core_rev()
629 {
630     return g_ui32CoreRev;
631 }
632 
tng__get_encoder_caps(context_ENC_p ctx)633 static VAStatus tng__get_encoder_caps(context_ENC_p ctx)
634 {
635     IMG_ENC_CAPS *psCaps = &(ctx->sCapsParams);
636     IMG_UINT16 ui16Height = ctx->ui16FrameHeight;
637     IMG_UINT32 ui32NumCores = 0;
638     IMG_UINT16 ui16MBRows = 0; //MB Rows in a GOB(slice);
639 
640     ctx->ui32CoreRev = tng__get_core_rev();
641     psCaps->ui32CoreFeatures = tng__get_core_des1();
642 
643     /* get the actual number of cores */
644     ui32NumCores = tng__get_num_pipes();
645 
646     switch (ctx->eStandard) {
647         case IMG_STANDARD_JPEG:
648             psCaps->ui16MaxSlices = ui16Height / 8;
649             psCaps->ui16MinSlices = 1;
650             psCaps->ui16RecommendedSlices = ui32NumCores;
651             break;
652         case IMG_STANDARD_H264:
653             psCaps->ui16MaxSlices = ui16Height / 16;
654             psCaps->ui16MinSlices = 1;
655             psCaps->ui16RecommendedSlices = ui32NumCores;
656             break;
657         case IMG_STANDARD_MPEG2:
658             psCaps->ui16MaxSlices = 174; // Slice labelling dictates a maximum of 174 slices
659             psCaps->ui16MinSlices = 1;
660             psCaps->ui16RecommendedSlices = (ui16Height + 15) / 16;
661             break;
662         case IMG_STANDARD_H263:
663             // if the original height of the pic is less than 400 , k is 1. refer standard.
664             if (ui16Height <= 400) {
665                 ui16MBRows = 1;
666             } else if (ui16Height < 800) { // if between 400 and 800 it's 2.
667                 ui16MBRows = 2;
668             } else {
669                 ui16MBRows = 4;
670             }
671             // before rounding is done for the height.
672             // get the GOB's based on this MB Rows and not vice-versa.
673             psCaps->ui16RecommendedSlices = (ui16Height + 15) >> (4 + (ui16MBRows >> 1));
674             psCaps->ui16MaxSlices = psCaps->ui16MinSlices = psCaps->ui16RecommendedSlices;
675             break;
676         case IMG_STANDARD_MPEG4:
677             psCaps->ui16MaxSlices = 1;
678             psCaps->ui16MinSlices = 1;
679             psCaps->ui16RecommendedSlices = 1;
680             break;
681         default:
682             break;
683     }
684     return VA_STATUS_SUCCESS;
685 }
686 
tng__init_context(context_ENC_p ctx)687 static VAStatus tng__init_context(context_ENC_p ctx)
688 {
689     VAStatus vaStatus = 0;
690 
691     /* Mostly sure about the following video parameters */
692     //ctx->ui32HWProfile = pParams->ui32HWProfile;
693     ctx->ui32FrameCount[0] = ctx->ui32FrameCount[1] = 0;
694     /* Using Extended parameters */
695     ctx->ui8PipesToUse = (IMG_UINT8)(tng__get_num_pipes() & (IMG_UINT32)0xff);
696     //carc params
697     ctx->sCARCParams.bCARC             = 0;
698     ctx->sCARCParams.i32CARCBaseline   = 0;
699     ctx->sCARCParams.ui32CARCThreshold = TOPAZHP_DEFAULT_uCARCThreshold;
700     ctx->sCARCParams.ui32CARCCutoff    = TOPAZHP_DEFAULT_uCARCCutoff;
701     ctx->sCARCParams.ui32CARCNegRange  = TOPAZHP_DEFAULT_uCARCNegRange;
702     ctx->sCARCParams.ui32CARCNegScale  = TOPAZHP_DEFAULT_uCARCNegScale;
703     ctx->sCARCParams.ui32CARCPosRange  = TOPAZHP_DEFAULT_uCARCPosRange;
704     ctx->sCARCParams.ui32CARCPosScale  = TOPAZHP_DEFAULT_uCARCPosScale;
705     ctx->sCARCParams.ui32CARCShift     = TOPAZHP_DEFAULT_uCARCShift;
706 
707     ctx->bUseDefaultScalingList = IMG_FALSE;
708     ctx->ui32CabacBinLimit = TOPAZHP_DEFAULT_uCABACBinLimit; //This parameter need not be exposed
709     if (ctx->ui32CabacBinLimit == 0)
710         ctx->ui32CabacBinFlex = 0;//This parameter need not be exposed
711     else
712         ctx->ui32CabacBinFlex = TOPAZHP_DEFAULT_uCABACBinFlex;//This parameter need not be exposed
713 
714     ctx->ui32FCode = 4;                     //This parameter need not be exposed
715     ctx->iFineYSearchSize = 2;//This parameter need not be exposed
716     ctx->ui32VopTimeResolution = 15;//This parameter need not be exposed
717 //    ctx->bEnabledDynamicBPic = IMG_FALSE;//Related to Rate Control,which is no longer needed.
718     ctx->bH264IntraConstrained = IMG_FALSE;//This parameter need not be exposed
719     ctx->bEnableInpCtrl     = IMG_FALSE;//This parameter need not be exposed
720     ctx->bEnableAIR = 0;
721     ctx->bEnableCIR = 0;
722     ctx->bEnableHostBias = (ctx->bEnableAIR != 0);//This parameter need not be exposed
723     ctx->bEnableHostQP = IMG_FALSE; //This parameter need not be exposed
724     ctx->ui8CodedSkippedIndex = 3;//This parameter need not be exposed
725     ctx->ui8InterIntraIndex         = 3;//This parameter need not be exposed
726     ctx->uMaxChunks = 0xA0;//This parameter need not be exposed
727     ctx->uChunksPerMb = 0x40;//This parameter need not be exposed
728     ctx->uPriorityChunks = (0xA0 - 0x60);//This parameter need not be exposed
729     ctx->bWeightedPrediction = IMG_FALSE;//Weighted Prediction is not supported in TopazHP Version 3.0
730     ctx->ui8VPWeightedImplicitBiPred = 0;//Weighted Prediction is not supported in TopazHP Version 3.0
731     ctx->bSkipDuplicateVectors = IMG_FALSE;//By default false Newly Added
732     ctx->bEnableCumulativeBiases = IMG_FALSE;//By default false Newly Added
733     ctx->ui16UseCustomScalingLists = 0;//By default false Newly Added
734     ctx->bPpsScaling = IMG_FALSE;//By default false Newly Added
735     ctx->ui8MPEG2IntraDCPrecision = 0;//By default 0 Newly Added
736     ctx->uMBspS = 0;//By default 0 Newly Added
737     ctx->bMultiReferenceP = IMG_FALSE;//By default false Newly Added
738     ctx->ui8RefSpacing=0;//By default 0 Newly Added
739     ctx->bSpatialDirect = 0;//By default 0 Newly Added
740     ctx->ui32DebugCRCs = 0;//By default false Newly Added
741     ctx->bEnableMVC = IMG_FALSE;//By default false Newly Added
742     ctx->ui16MVCViewIdx = (IMG_UINT16)(NON_MVC_VIEW);//Newly Added
743     ctx->bSrcAllocInternally = IMG_FALSE;//By default false Newly Added
744     ctx->bCodedAllocInternally = IMG_FALSE;//By default true Newly Added
745     ctx->bHighLatency = IMG_TRUE;//Newly Added
746     ctx->i32NumAIRMBs = -1;
747     ctx->i32AIRThreshold = -1;
748     ctx->i16AIRSkipCnt = -1;
749     ctx->i32LastCIRIndex = -1;
750     //Need to check on the following parameters
751     ctx->ui8EnableSelStatsFlags  = IMG_FALSE;//Default Value ?? Extended Parameter ??
752     ctx->bH2648x8Transform = IMG_FALSE;//Default Value ?? Extended Parameter or OMX_VIDEO_PARAM_AVCTYPE -> bDirect8x8Inference??
753     //FIXME: Zhaohan, eStandard is always 0 here.
754     ctx->bNoOffscreenMv = (ctx->eStandard == IMG_STANDARD_H263) ? IMG_TRUE : IMG_FALSE; //Default Value ?? Extended Parameter and bUseOffScreenMVUserSetting
755     ctx->bNoSequenceHeaders = IMG_FALSE;
756     ctx->bTopFieldFirst = IMG_TRUE;
757     ctx->sBiasTables.ui32FCode = ctx->ui32FCode;
758     ctx->ui32pseudo_rand_seed = UNINIT_PARAM;
759     ctx->bVPAdaptiveRoundingDisable = IMG_TRUE;
760 
761     //Default fcode is 4
762     if (!ctx->sBiasTables.ui32FCode)
763 	ctx->sBiasTables.ui32FCode = 4;
764 
765     ctx->uiCbrBufferTenths = TOPAZHP_DEFAULT_uiCbrBufferTenths;
766 
767     tng__setup_enc_profile_features(ctx, ENC_PROFILE_DEFAULT);
768 
769     vaStatus = tng__patch_hw_profile(ctx);
770     if (vaStatus != VA_STATUS_SUCCESS) {
771         drv_debug_msg(VIDEO_DEBUG_ERROR, "%s: tng__patch_hw_profile\n", __FUNCTION__);
772     }
773 
774     return VA_STATUS_SUCCESS;
775 }
776 
tng_CreateContext(object_context_p obj_context,object_config_p obj_config,unsigned char is_JPEG)777 VAStatus tng_CreateContext(
778     object_context_p obj_context,
779     object_config_p obj_config,
780     unsigned char is_JPEG)
781 {
782     VAStatus vaStatus = 0;
783     unsigned short ui16Width, ui16Height;
784     context_ENC_p ctx;
785 
786     ui16Width = obj_context->picture_width;
787     ui16Height = obj_context->picture_height;
788     ctx = (context_ENC_p) calloc(1, sizeof(struct context_ENC_s));
789     if (NULL == ctx) {
790         vaStatus = VA_STATUS_ERROR_ALLOCATION_FAILED;
791         DEBUG_FAILURE;
792         return vaStatus;
793     }
794 
795     memset((void*)ctx, 0, sizeof(struct context_ENC_s));
796 
797     obj_context->format_data = (void*) ctx;
798     ctx->obj_context = obj_context;
799 
800     if (is_JPEG == 0) {
801         ctx->ui16Width = (unsigned short)(~0xf & (ui16Width + 0xf));
802         ctx->ui16FrameHeight = (unsigned short)(~0xf & (ui16Height + 0xf));
803 
804         vaStatus = tng__init_context(ctx);
805         if (vaStatus != VA_STATUS_SUCCESS) {
806             drv_debug_msg(VIDEO_DEBUG_ERROR, "init Context params");
807         }
808 
809         vaStatus = tng__init_rc_params(ctx, obj_config);
810         if (vaStatus != VA_STATUS_SUCCESS) {
811             drv_debug_msg(VIDEO_DEBUG_ERROR, "init rc params");
812         }
813     } else {
814         /*JPEG only require them are even*/
815         ctx->ui16Width = (unsigned short)(~0x1 & (ui16Width + 0x1));
816         ctx->ui16FrameHeight = (unsigned short)(~0x1 & (ui16Height + 0x1));
817     }
818 
819     ctx->eFormat = IMG_CODEC_PL12;     // use default
820 
821     tng__setup_enc_profile_features(ctx, ENC_PROFILE_DEFAULT);
822 
823     if (is_JPEG) {
824         vaStatus = tng__alloc_context_buffer(ctx, is_JPEG, 0);
825         if (vaStatus != VA_STATUS_SUCCESS) {
826             drv_debug_msg(VIDEO_DEBUG_ERROR, "setup enc profile");
827         }
828     }
829 
830     return vaStatus;
831 }
832 
tng_BeginPicture(context_ENC_p ctx)833 VAStatus tng_BeginPicture(context_ENC_p ctx)
834 {
835     VAStatus vaStatus = VA_STATUS_SUCCESS;
836     context_ENC_frame_buf *ps_buf = &(ctx->ctx_frame_buf);
837     tng_cmdbuf_p cmdbuf;
838     int ret;
839 
840     ctx->ui32StreamID = 0;
841 
842     if (ctx->ui32RawFrameCount != 0)
843         ps_buf->previous_src_surface = ps_buf->src_surface;
844     ps_buf->src_surface = ctx->obj_context->current_render_target;
845 
846     vaStatus = tng__get_encoder_caps(ctx);
847     if (vaStatus != VA_STATUS_SUCCESS) {
848         drv_debug_msg(VIDEO_DEBUG_ERROR, "%s: tng__get_encoder_caps\n", __FUNCTION__);
849     }
850 
851     /* clear frameskip flag to 0 */
852     CLEAR_SURFACE_INFO_skipped_flag(ps_buf->src_surface->psb_surface);
853 
854     /* Initialise the command buffer */
855     ret = tng_context_get_next_cmdbuf(ctx->obj_context);
856     if (ret) {
857         drv_debug_msg(VIDEO_DEBUG_ERROR, "get next cmdbuf fail\n");
858         vaStatus = VA_STATUS_ERROR_UNKNOWN;
859         return vaStatus;
860     }
861     cmdbuf = ctx->obj_context->tng_cmdbuf;
862 
863     //FIXME
864     /* only map topaz param when necessary */
865     cmdbuf->topaz_in_params_I_p = NULL;
866     cmdbuf->topaz_in_params_P_p = NULL;
867     ctx->obj_context->slice_count = 0;
868 
869     tng_cmdbuf_buffer_ref(cmdbuf, &(ctx->obj_context->current_render_target->psb_surface->buf));
870 
871     return vaStatus;
872 }
873 
tng__provide_buffer_BFrames(context_ENC_p ctx,IMG_UINT32 ui32StreamIndex)874 static VAStatus tng__provide_buffer_BFrames(context_ENC_p ctx, IMG_UINT32 ui32StreamIndex)
875 {
876     IMG_RC_PARAMS * psRCParams = &(ctx->sRCParams);
877     FRAME_ORDER_INFO *psFrameInfo = &(ctx->sFrameOrderInfo);
878     int slot_index = 0;
879     unsigned long long display_order = 0;
880     IMG_INT32  i32SlotBuf  = (IMG_INT32)(psRCParams->ui16BFrames + 2);
881     IMG_UINT32 ui32SlotBuf = (IMG_UINT32)(psRCParams->ui16BFrames + 2);
882     IMG_UINT32 ui32FrameIdx = ctx->ui32FrameCount[ui32StreamIndex];
883 
884     if (ui32StreamIndex == 0)
885         getFrameDpyOrder(ui32FrameIdx, psRCParams->ui16BFrames, ctx->ui32IntraCnt,
886              ctx->ui32IdrPeriod, psFrameInfo, &display_order);
887 
888     slot_index = psFrameInfo->last_slot;
889 
890     drv_debug_msg(VIDEO_DEBUG_GENERAL,
891         "%s: (int)ui32FrameIdx = %d, psRCParams->ui16BFrames = %d, psRCParams->ui32IntraFreq = %d, ctx->ui32IdrPeriod = %d\n",
892         __FUNCTION__, (int)ui32FrameIdx, (int)psRCParams->ui16BFrames, (int)psRCParams->ui32IntraFreq, ctx->ui32IdrPeriod);
893 
894     drv_debug_msg(VIDEO_DEBUG_GENERAL,
895         "%s: last_slot = %d, last_frame_type = %d, display_order = %d\n",
896         __FUNCTION__, psFrameInfo->last_slot, psFrameInfo->last_frame_type, display_order);
897 
898     if (ui32FrameIdx < ui32SlotBuf) {
899         if (ui32FrameIdx == 0) {
900             tng_send_source_frame(ctx, 0, 0);
901         } else if (ui32FrameIdx == 1) {
902             slot_index = 1;
903             do {
904                 tng_send_source_frame(ctx, slot_index, slot_index);
905                 ++slot_index;
906             } while(slot_index < i32SlotBuf);
907         } else {
908             slot_index = ui32FrameIdx - 1;
909             tng_send_source_frame(ctx, slot_index, slot_index);
910         }
911     } else {
912         tng_send_source_frame(ctx, slot_index , display_order);
913     }
914 
915     return VA_STATUS_SUCCESS;
916 }
917 
tng__provide_buffer_PFrames(context_ENC_p ctx,IMG_UINT32 ui32StreamIndex)918 VAStatus tng__provide_buffer_PFrames(context_ENC_p ctx, IMG_UINT32 ui32StreamIndex)
919 {
920     IMG_UINT32 ui32FrameIdx = ctx->ui32FrameCount[ui32StreamIndex];
921 
922     drv_debug_msg(VIDEO_DEBUG_GENERAL,
923         "%s: frame count = %d, SlotsInUse = %d, ui32FrameIdx = %d\n",
924         __FUNCTION__, (int)ui32FrameIdx, ctx->ui8SlotsInUse, ui32FrameIdx);
925 
926     tng_send_source_frame(ctx, ctx->ui8SlotsCoded, ui32FrameIdx);
927 /*
928     if (ctx->ui32IntraCnt == 0)
929         ctx->eFrameType = IMG_INTRA_FRAME;
930     else
931         if (ui32FrameIdx % ctx->ui32IntraCnt == 0)
932             ctx->eFrameType = IMG_INTRA_FRAME;
933         else
934             ctx->eFrameType = IMG_INTER_P;
935 
936     if (ctx->ui32IdrPeriod == 0) {
937         if (ui32FrameIdx == 0)
938             ctx->eFrameType = IMG_INTRA_IDR;
939     } else {
940         if (ctx->ui32IntraCnt == 0) {
941             if (ui32FrameIdx % ctx->ui32IdrPeriod == 0)
942                 ctx->eFrameType = IMG_INTRA_IDR;
943         } else {
944             if (ui32FrameIdx % (ctx->ui32IntraCnt * ctx->ui32IdrPeriod) == 0)
945                 ctx->eFrameType = IMG_INTRA_IDR;
946         }
947     }
948 */
949     ctx->eFrameType = IMG_INTER_P;
950 
951     if (ui32FrameIdx % ctx->ui32IntraCnt == 0)
952         ctx->eFrameType = IMG_INTRA_FRAME;
953 
954     if (ui32FrameIdx % (ctx->ui32IdrPeriod * ctx->ui32IntraCnt) == 0)
955         ctx->eFrameType = IMG_INTRA_IDR;
956 
957     drv_debug_msg(VIDEO_DEBUG_GENERAL,"%s: ctx->eFrameType = %d\n", __FUNCTION__, ctx->eFrameType);
958 
959     return VA_STATUS_SUCCESS;
960 }
961 
962 static IMG_UINT16 H264_ROUNDING_OFFSETS[18][4] = {
963     {  683, 683, 683, 683 },   /* 0  I-Slice - INTRA4  LUMA */
964     {  683, 683, 683, 683 },   /* 1  P-Slice - INTRA4  LUMA */
965     {  683, 683, 683, 683 },   /* 2  B-Slice - INTRA4  LUMA */
966 
967     {  683, 683, 683, 683 },   /* 3  I-Slice - INTRA8  LUMA */
968     {  683, 683, 683, 683 },   /* 4  P-Slice - INTRA8  LUMA */
969     {  683, 683, 683, 683 },   /* 5  B-Slice - INTRA8  LUMA */
970     {  341, 341, 341, 341 },   /* 6  P-Slice - INTER8  LUMA */
971     {  341, 341, 341, 341 },   /* 7  B-Slice - INTER8  LUMA */
972 
973     {  683, 683, 683, 000 },   /* 8  I-Slice - INTRA16 LUMA */
974     {  683, 683, 683, 000 },   /* 9  P-Slice - INTRA16 LUMA */
975     {  683, 683, 683, 000 },   /* 10 B-Slice - INTRA16 LUMA */
976     {  341, 341, 341, 341 },   /* 11 P-Slice - INTER16 LUMA */
977     {  341, 341, 341, 341 },   /* 12 B-Slice - INTER16 LUMA */
978 
979     {  683, 683, 683, 000 },   /* 13 I-Slice - INTRA16 CHROMA */
980     {  683, 683, 683, 000 },   /* 14 P-Slice - INTRA16 CHROMA */
981     {  683, 683, 683, 000 },   /* 15 B-Slice - INTRA16 CHROMA */
982     {  341, 341, 341, 000 },   /* 16 P-Slice - INTER16 CHROMA */
983     {  341, 341, 341, 000 } /* 17 B-Slice - INTER16 CHROMA */
984 };
985 
tng__create_gop_frame(IMG_UINT8 * pui8Level,IMG_BOOL bReference,IMG_UINT8 ui8Pos,IMG_UINT8 ui8Ref0Level,IMG_UINT8 ui8Ref1Level,IMG_FRAME_TYPE eFrameType)986 static IMG_UINT16 tng__create_gop_frame(
987     IMG_UINT8 * pui8Level, IMG_BOOL bReference,
988     IMG_UINT8 ui8Pos, IMG_UINT8 ui8Ref0Level,
989     IMG_UINT8 ui8Ref1Level, IMG_FRAME_TYPE eFrameType)
990 {
991     *pui8Level = ((ui8Ref0Level > ui8Ref1Level) ? ui8Ref0Level : ui8Ref1Level)  + 1;
992 
993     return F_ENCODE(bReference, GOP_REFERENCE) |
994            F_ENCODE(ui8Pos, GOP_POS) |
995            F_ENCODE(ui8Ref0Level, GOP_REF0) |
996            F_ENCODE(ui8Ref1Level, GOP_REF1) |
997            F_ENCODE(eFrameType, GOP_FRAMETYPE);
998 }
999 
tng__minigop_generate_flat(void * buffer_p,IMG_UINT32 ui32BFrameCount,IMG_UINT32 ui32RefSpacing,IMG_UINT8 aui8PicOnLevel[])1000 static void tng__minigop_generate_flat(void* buffer_p, IMG_UINT32 ui32BFrameCount, IMG_UINT32 ui32RefSpacing, IMG_UINT8 aui8PicOnLevel[])
1001 {
1002     /* B B B B P */
1003     IMG_UINT8 ui8EncodeOrderPos;
1004     IMG_UINT8 ui8Level;
1005     IMG_UINT16 * psGopStructure = (IMG_UINT16 *)buffer_p;
1006 
1007     psGopStructure[0] = tng__create_gop_frame(&ui8Level, IMG_TRUE, MAX_BFRAMES, ui32RefSpacing, 0, IMG_INTER_P);
1008     aui8PicOnLevel[ui8Level]++;
1009 
1010     for (ui8EncodeOrderPos = 1; ui8EncodeOrderPos < MAX_GOP_SIZE; ui8EncodeOrderPos++) {
1011         psGopStructure[ui8EncodeOrderPos] = tng__create_gop_frame(&ui8Level, IMG_FALSE,
1012                                             ui8EncodeOrderPos - 1, ui32RefSpacing, ui32RefSpacing + 1, IMG_INTER_B);
1013         aui8PicOnLevel[ui8Level] = ui32BFrameCount;
1014     }
1015 
1016     for( ui8EncodeOrderPos = 0; ui8EncodeOrderPos < MAX_GOP_SIZE; ui8EncodeOrderPos++) {
1017         drv_debug_msg(VIDEO_DEBUG_GENERAL,
1018             "%s: psGopStructure = 0x%06x\n", __FUNCTION__, psGopStructure[ui8EncodeOrderPos]);
1019     }
1020 
1021     return ;
1022 }
1023 
tng__gop_split(IMG_UINT16 ** pasGopStructure,IMG_INT8 i8Ref0,IMG_INT8 i8Ref1,IMG_UINT8 ui8Ref0Level,IMG_UINT8 ui8Ref1Level,IMG_UINT8 aui8PicOnLevel[])1024 static void tng__gop_split(IMG_UINT16 ** pasGopStructure, IMG_INT8 i8Ref0, IMG_INT8 i8Ref1,
1025                            IMG_UINT8 ui8Ref0Level, IMG_UINT8 ui8Ref1Level, IMG_UINT8 aui8PicOnLevel[])
1026 {
1027     IMG_UINT8 ui8Distance = i8Ref1 - i8Ref0;
1028     IMG_UINT8 ui8Position = i8Ref0 + (ui8Distance >> 1);
1029     IMG_UINT8 ui8Level;
1030 
1031     if (ui8Distance == 1)
1032         return;
1033 
1034     /* mark middle as this level */
1035 
1036     (*pasGopStructure)++;
1037     **pasGopStructure = tng__create_gop_frame(&ui8Level, ui8Distance >= 3, ui8Position, ui8Ref0Level, ui8Ref1Level, IMG_INTER_B);
1038     aui8PicOnLevel[ui8Level]++;
1039 
1040     if (ui8Distance >= 4)
1041         tng__gop_split(pasGopStructure, i8Ref0, ui8Position, ui8Ref0Level, ui8Level, aui8PicOnLevel);
1042 
1043     if (ui8Distance >= 3)
1044         tng__gop_split(pasGopStructure, ui8Position, i8Ref1, ui8Level, ui8Ref1Level, aui8PicOnLevel);
1045 }
1046 
tng_minigop_generate_hierarchical(void * buffer_p,IMG_UINT32 ui32BFrameCount,IMG_UINT32 ui32RefSpacing,IMG_UINT8 aui8PicOnLevel[])1047 static void tng_minigop_generate_hierarchical(void* buffer_p, IMG_UINT32 ui32BFrameCount,
1048         IMG_UINT32 ui32RefSpacing, IMG_UINT8 aui8PicOnLevel[])
1049 {
1050     IMG_UINT8 ui8Level;
1051     IMG_UINT16 * psGopStructure = (IMG_UINT16 *)buffer_p;
1052 
1053     psGopStructure[0] = tng__create_gop_frame(&ui8Level, IMG_TRUE, ui32BFrameCount, ui32RefSpacing, 0, IMG_INTER_P);
1054     aui8PicOnLevel[ui8Level]++;
1055 
1056     tng__gop_split(&psGopStructure, -1, ui32BFrameCount, ui32RefSpacing, ui32RefSpacing + 1, aui8PicOnLevel);
1057 }
1058 
tng__generate_scale_tables(IMG_MTX_VIDEO_CONTEXT * psMtxEncCtx)1059 static void tng__generate_scale_tables(IMG_MTX_VIDEO_CONTEXT* psMtxEncCtx)
1060 {
1061     psMtxEncCtx->ui32InterIntraScale[0] = 0x0004;  // Force intra by scaling its cost by 0
1062     psMtxEncCtx->ui32InterIntraScale[1] = 0x0103;  // favour intra by a factor 3
1063     psMtxEncCtx->ui32InterIntraScale[2] = 0x0102;  // favour intra by a factor 2
1064     psMtxEncCtx->ui32InterIntraScale[3] = 0x0101;  // no bias
1065     psMtxEncCtx->ui32InterIntraScale[4] = 0x0101;  // no bias
1066     psMtxEncCtx->ui32InterIntraScale[5] = 0x0201;  // favour inter by a factor 2
1067     psMtxEncCtx->ui32InterIntraScale[6] = 0x0301;  // favour inter by a factor 3
1068     psMtxEncCtx->ui32InterIntraScale[7] = 0x0400;  // Force inter by scaling it's cost by 0
1069 
1070     psMtxEncCtx->ui32SkippedCodedScale[0] = 0x0004;  // Force coded by scaling its cost by 0
1071     psMtxEncCtx->ui32SkippedCodedScale[1] = 0x0103;  // favour coded by a factor 3
1072     psMtxEncCtx->ui32SkippedCodedScale[2] = 0x0102;  // favour coded by a factor 2
1073     psMtxEncCtx->ui32SkippedCodedScale[3] = 0x0101;  // no bias
1074     psMtxEncCtx->ui32SkippedCodedScale[4] = 0x0101;  // no bias
1075     psMtxEncCtx->ui32SkippedCodedScale[5] = 0x0201;  // favour skipped by a factor 2
1076     psMtxEncCtx->ui32SkippedCodedScale[6] = 0x0301;  // favour skipped by a factor 3
1077     psMtxEncCtx->ui32SkippedCodedScale[7] = 0x0400;  // Force skipped by scaling it's cost by 0
1078     return ;
1079 }
1080 
1081 /*!
1082 ******************************************************************************
1083  @Function      tng_update_driver_mv_scaling
1084  @details
1085         Setup the registers for scaling candidate motion vectors to take into account
1086         how far away (temporally) the reference pictures are
1087 ******************************************************************************/
1088 
tng__abs(IMG_INT a)1089 static IMG_INT tng__abs(IMG_INT a)
1090 {
1091     if (a < 0)
1092         return -a;
1093     else
1094         return a;
1095 }
1096 
tng__abs32(IMG_INT32 a)1097 static IMG_INT tng__abs32(IMG_INT32 a)
1098 {
1099     if (a < 0)
1100         return -a;
1101     else
1102         return a;
1103 }
1104 
tng_update_driver_mv_scaling(IMG_UINT32 uFrameNum,IMG_UINT32 uRef0Num,IMG_UINT32 uRef1Num,IMG_UINT32 ui32PicFlags,IMG_BOOL bSkipDuplicateVectors,IMG_UINT32 * pui32MVCalc_Below,IMG_UINT32 * pui32MVCalc_Colocated,IMG_UINT32 * pui32MVCalc_Config)1105 void tng_update_driver_mv_scaling(
1106     IMG_UINT32 uFrameNum,
1107     IMG_UINT32 uRef0Num,
1108     IMG_UINT32 uRef1Num,
1109     IMG_UINT32 ui32PicFlags,
1110     IMG_BOOL   bSkipDuplicateVectors,
1111     IMG_UINT32 * pui32MVCalc_Below,
1112     IMG_UINT32 * pui32MVCalc_Colocated,
1113     IMG_UINT32 * pui32MVCalc_Config)
1114 {
1115     IMG_UINT32 uMvCalcConfig = 0;
1116     IMG_UINT32 uMvCalcColocated = F_ENCODE(0x10, TOPAZHP_CR_TEMPORAL_BLEND);
1117     IMG_UINT32 uMvCalcBelow = 0;
1118 
1119     //If b picture calculate scaling factor for colocated motion vectors
1120     if (ui32PicFlags & ISINTERB_FLAGS) {
1121         IMG_INT tb, td, tx;
1122         IMG_INT iDistScale;
1123 
1124         //calculation taken from H264 spec
1125         tb = (uFrameNum * 2) - (uRef1Num * 2);
1126         td = (uRef0Num  * 2) - (uRef1Num * 2);
1127         tx = (16384 + tng__abs(td / 2)) / td;
1128         iDistScale = (tb * tx + 32) >> 6;
1129         if (iDistScale > 1023) iDistScale = 1023;
1130         if (iDistScale < -1024) iDistScale = -1024;
1131         uMvCalcColocated |= F_ENCODE(iDistScale, TOPAZHP_CR_COL_DIST_SCALE_FACT);
1132 
1133         //We assume the below temporal mvs are from the latest reference frame
1134         //rather then the most recently encoded B frame (as Bs aren't reference)
1135 
1136         //Fwd temporal is same as colocated mv scale
1137         uMvCalcBelow     |= F_ENCODE(iDistScale, TOPAZHP_CR_PIC0_DIST_SCALE_FACTOR);
1138 
1139         //Bkwd temporal needs to be scaled by the recipricol amount in the other direction
1140         tb = (uFrameNum * 2) - (uRef0Num * 2);
1141         td = (uRef0Num  * 2) - (uRef1Num * 2);
1142         tx = (16384 + tng__abs(td / 2)) / td;
1143         iDistScale = (tb * tx + 32) >> 6;
1144         if (iDistScale > 1023) iDistScale = 1023;
1145         if (iDistScale < -1024) iDistScale = -1024;
1146         uMvCalcBelow |= F_ENCODE(iDistScale, TOPAZHP_CR_PIC1_DIST_SCALE_FACTOR);
1147     } else {
1148         //Don't scale the temporal below mvs
1149         uMvCalcBelow |= F_ENCODE(1 << 8, TOPAZHP_CR_PIC0_DIST_SCALE_FACTOR);
1150 
1151         if (uRef0Num != uRef1Num) {
1152             IMG_INT iRef0Dist, iRef1Dist;
1153             IMG_INT iScale;
1154 
1155             //Distance to second reference picture may be different when
1156             //using multiple reference frames on P. Scale based on difference
1157             //in temporal distance to ref pic 1 compared to distance to ref pic 0
1158             iRef0Dist = (uFrameNum - uRef0Num);
1159             iRef1Dist = (uFrameNum - uRef1Num);
1160             iScale    = (iRef1Dist << 8) / iRef0Dist;
1161 
1162             if (iScale > 1023) iScale = 1023;
1163             if (iScale < -1024) iScale = -1024;
1164 
1165             uMvCalcBelow |= F_ENCODE(iScale, TOPAZHP_CR_PIC1_DIST_SCALE_FACTOR);
1166         } else
1167             uMvCalcBelow |= F_ENCODE(1 << 8, TOPAZHP_CR_PIC1_DIST_SCALE_FACTOR);
1168     }
1169 
1170     if (uFrameNum > 0) {
1171         IMG_INT ref0_distance, ref1_distance;
1172         IMG_INT jitter0, jitter1;
1173 
1174         ref0_distance = tng__abs32((IMG_INT32)uFrameNum - (IMG_INT32)uRef0Num);
1175         ref1_distance = tng__abs32((IMG_INT32)uFrameNum - (IMG_INT32)uRef1Num);
1176 
1177         if (!(ui32PicFlags & ISINTERB_FLAGS)) {
1178             jitter0 = ref0_distance * 1;
1179             jitter1 = jitter0 > 1 ? 1 : 2;
1180         } else {
1181             jitter0 = ref1_distance * 1;
1182             jitter1 = ref0_distance * 1;
1183         }
1184 
1185         //Hardware can only cope with 1 - 4 jitter factors
1186         jitter0 = (jitter0 > 4) ? 4 : (jitter0 < 1) ? 1 : jitter0;
1187         jitter1 = (jitter1 > 4) ? 4 : (jitter1 < 1) ? 1 : jitter1;
1188 
1189         //Hardware can only cope with 1 - 4 jitter factors
1190         assert(jitter0 > 0 && jitter0 <= 4 && jitter1 > 0 && jitter1 <= 4);
1191 
1192         uMvCalcConfig |= F_ENCODE(jitter0 - 1, TOPAZHP_CR_MVCALC_IPE0_JITTER_FACTOR) |
1193                          F_ENCODE(jitter1 - 1, TOPAZHP_CR_MVCALC_IPE1_JITTER_FACTOR);
1194     }
1195 
1196     uMvCalcConfig |= F_ENCODE(1, TOPAZHP_CR_MVCALC_DUP_VEC_MARGIN);
1197     uMvCalcConfig |= F_ENCODE(7, TOPAZHP_CR_MVCALC_GRID_MB_X_STEP);
1198     uMvCalcConfig |= F_ENCODE(13, TOPAZHP_CR_MVCALC_GRID_MB_Y_STEP);
1199     uMvCalcConfig |= F_ENCODE(3, TOPAZHP_CR_MVCALC_GRID_SUB_STEP);
1200     uMvCalcConfig |= F_ENCODE(1, TOPAZHP_CR_MVCALC_GRID_DISABLE);
1201 
1202     if (bSkipDuplicateVectors)
1203         uMvCalcConfig |= F_ENCODE(1, TOPAZHP_CR_MVCALC_NO_PSEUDO_DUPLICATES);
1204 
1205     * pui32MVCalc_Below =   uMvCalcBelow;
1206     * pui32MVCalc_Colocated = uMvCalcColocated;
1207     * pui32MVCalc_Config = uMvCalcConfig;
1208 }
1209 
tng__prepare_mv_estimates(context_ENC_p ctx,IMG_UINT32 ui32StreamIndex)1210 static void tng__prepare_mv_estimates(context_ENC_p ctx, IMG_UINT32 ui32StreamIndex)
1211 {
1212     context_ENC_mem* ps_mem = &(ctx->ctx_mem[ui32StreamIndex]);
1213     IMG_MTX_VIDEO_CONTEXT* psMtxEncCtx = NULL;
1214     IMG_UINT32 ui32Distance;
1215 
1216     psb_buffer_map(&(ps_mem->bufs_mtx_context), &(ps_mem->bufs_mtx_context.virtual_addr));
1217     if (ps_mem->bufs_mtx_context.virtual_addr == NULL) {
1218         drv_debug_msg(VIDEO_DEBUG_ERROR, "%s error: mapping mtx context\n", __FUNCTION__);
1219         return ;
1220     }
1221 
1222     psMtxEncCtx = (IMG_MTX_VIDEO_CONTEXT*)(ps_mem->bufs_mtx_context.virtual_addr);
1223 
1224     /* IDR */
1225     psMtxEncCtx->sMVSettingsIdr.ui32MVCalc_Config = DEFAULT_MVCALC_CONFIG;  // default based on TRM
1226     psMtxEncCtx->sMVSettingsIdr.ui32MVCalc_Colocated = 0x00100100;// default based on TRM
1227     psMtxEncCtx->sMVSettingsIdr.ui32MVCalc_Below = 0x01000100;      // default based on TRM
1228 
1229     tng_update_driver_mv_scaling(
1230         0, 0, 0, 0, IMG_FALSE, //psMtxEncCtx->bSkipDuplicateVectors, //By default false Newly Added
1231         &psMtxEncCtx->sMVSettingsIdr.ui32MVCalc_Below,
1232         &psMtxEncCtx->sMVSettingsIdr.ui32MVCalc_Colocated,
1233         &psMtxEncCtx->sMVSettingsIdr.ui32MVCalc_Config);
1234 
1235     /* NonB (I or P) */
1236     for (ui32Distance = 1; ui32Distance <= MAX_BFRAMES + 1; ui32Distance++) {
1237         psMtxEncCtx->sMVSettingsNonB[ui32Distance - 1].ui32MVCalc_Config = DEFAULT_MVCALC_CONFIG;       // default based on TRM
1238         psMtxEncCtx->sMVSettingsNonB[ui32Distance - 1].ui32MVCalc_Colocated = 0x00100100;// default based on TRM
1239         psMtxEncCtx->sMVSettingsNonB[ui32Distance - 1].ui32MVCalc_Below = 0x01000100;   // default based on TRM
1240 
1241 
1242         tng_update_driver_mv_scaling(ui32Distance, 0, 0, 0, IMG_FALSE, //psMtxEncCtx->bSkipDuplicateVectors,
1243                                      &psMtxEncCtx->sMVSettingsNonB[ui32Distance - 1].ui32MVCalc_Below,
1244                                      &psMtxEncCtx->sMVSettingsNonB[ui32Distance - 1].ui32MVCalc_Colocated,
1245                                      &psMtxEncCtx->sMVSettingsNonB[ui32Distance - 1].ui32MVCalc_Config);
1246     }
1247 
1248     {
1249         IMG_UINT32 ui32DistanceB;
1250         IMG_UINT32 ui32Position;
1251         context_ENC_mem *ps_mem = &(ctx->ctx_mem[ui32StreamIndex]);
1252         IMG_MV_SETTINGS *pHostMVSettingsHierarchical = NULL;
1253         IMG_MV_SETTINGS *pMvElement = NULL;
1254         IMG_MV_SETTINGS *pHostMVSettingsBTable = NULL;
1255 
1256         psb_buffer_map(&(ps_mem->bufs_mv_setting_btable), &(ps_mem->bufs_mv_setting_btable.virtual_addr));
1257         if (ps_mem->bufs_mv_setting_btable.virtual_addr == NULL) {
1258             drv_debug_msg(VIDEO_DEBUG_ERROR, "%s error: mapping mv setting btable\n", __FUNCTION__);
1259             return ;
1260         }
1261 
1262         pHostMVSettingsBTable = (IMG_MV_SETTINGS *)(ps_mem->bufs_mv_setting_btable.virtual_addr);
1263 
1264         for (ui32DistanceB = 0; ui32DistanceB < MAX_BFRAMES; ui32DistanceB++) {
1265             for (ui32Position = 1; ui32Position <= ui32DistanceB + 1; ui32Position++) {
1266                 pMvElement = (IMG_MV_SETTINGS * ) ((IMG_UINT8 *) pHostMVSettingsBTable + MV_OFFSET_IN_TABLE(ui32DistanceB, ui32Position - 1));
1267                 pMvElement->ui32MVCalc_Config= (DEFAULT_MVCALC_CONFIG|MASK_TOPAZHP_CR_MVCALC_GRID_DISABLE);    // default based on TRM
1268                 pMvElement->ui32MVCalc_Colocated=0x00100100;// default based on TRM
1269                 pMvElement->ui32MVCalc_Below=0x01000100;	// default based on TRM
1270 
1271                 tng_update_driver_mv_scaling(
1272                     ui32Position, ui32DistanceB + 2, 0, ISINTERB_FLAGS, IMG_FALSE,
1273                     &pMvElement->ui32MVCalc_Below,
1274                     &pMvElement->ui32MVCalc_Colocated,
1275                     &pMvElement->ui32MVCalc_Config);
1276             }
1277         }
1278 
1279         if (ctx->b_is_mv_setting_hierar){
1280             pHostMVSettingsHierarchical = (IMG_MV_SETTINGS *)(ps_mem->bufs_mv_setting_hierar.virtual_addr);
1281 
1282             for (ui32DistanceB = 0; ui32DistanceB < MAX_BFRAMES; ui32DistanceB++) {
1283                 pMvElement = (IMG_MV_SETTINGS * ) ((IMG_UINT8 *)pHostMVSettingsBTable + MV_OFFSET_IN_TABLE(ui32DistanceB, ui32DistanceB >> 1));
1284                 //memcpy(pHostMVSettingsHierarchical + ui32DistanceB, , sizeof(IMG_MV_SETTINGS));
1285                 pHostMVSettingsHierarchical[ui32DistanceB].ui32MVCalc_Config    = pMvElement->ui32MVCalc_Config;
1286                 pHostMVSettingsHierarchical[ui32DistanceB].ui32MVCalc_Colocated = pMvElement->ui32MVCalc_Colocated;
1287                 pHostMVSettingsHierarchical[ui32DistanceB].ui32MVCalc_Below     = pMvElement->ui32MVCalc_Below;
1288             }
1289         }
1290         psb_buffer_unmap(&(ps_mem->bufs_mv_setting_btable));
1291     }
1292 
1293     psb_buffer_unmap(&(ps_mem->bufs_mtx_context));
1294 
1295     return ;
1296 }
1297 
tng__adjust_picflags(context_ENC_p ctx,IMG_RC_PARAMS * psRCParams,IMG_BOOL bFirstPic,IMG_UINT32 * pui32Flags)1298 static void tng__adjust_picflags(
1299     context_ENC_p ctx,
1300     IMG_RC_PARAMS * psRCParams,
1301     IMG_BOOL bFirstPic,
1302     IMG_UINT32 * pui32Flags)
1303 {
1304     IMG_UINT32 ui32Flags;
1305     PIC_PARAMS * psPicParams = &ctx->sPicParams;
1306     ui32Flags = psPicParams->ui32Flags;
1307 
1308     if (!psRCParams->bRCEnable || (!bFirstPic))
1309         ui32Flags = 0;
1310 
1311     switch (ctx->eStandard) {
1312     case IMG_STANDARD_NONE:
1313         break;
1314     case IMG_STANDARD_H264:
1315         break;
1316     case IMG_STANDARD_H263:
1317         ui32Flags |= ISH263_FLAGS;
1318         break;
1319     case IMG_STANDARD_MPEG4:
1320         ui32Flags |= ISMPEG4_FLAGS;
1321         break;
1322     case IMG_STANDARD_MPEG2:
1323         ui32Flags |= ISMPEG2_FLAGS;
1324         break;
1325     default:
1326         break;
1327     }
1328     * pui32Flags = ui32Flags;
1329 }
1330 
1331 #define gbLowLatency 0
1332 
tng__setup_rcdata(context_ENC_p ctx)1333 static void tng__setup_rcdata(context_ENC_p ctx)
1334 {
1335     IMG_RC_PARAMS *psRCParams = &(ctx->sRCParams);
1336     PIC_PARAMS    *psPicParams = &(ctx->sPicParams);
1337 
1338     IMG_INT32 i32FrameRate, i32TmpQp;
1339     double        L1, L2, L3,L4, L5, L6, flBpp;
1340     IMG_INT32 i32BufferSizeInFrames;
1341 
1342     if (ctx->bInsertHRDParams &&
1343        (ctx->eStandard == IMG_STANDARD_H264)) {
1344        psRCParams->ui32BufferSize = ctx->buffer_size;
1345        psRCParams->i32InitialLevel = ctx->buffer_size - ctx->initial_buffer_fullness;
1346        psRCParams->i32InitialDelay = ctx->initial_buffer_fullness;
1347     }
1348 
1349     // If Bit Rate and Basic Units are not specified then set to default values.
1350     if (psRCParams->ui32BitsPerSecond == 0 && !ctx->bEnableMVC) {
1351         psRCParams->ui32BitsPerSecond = 640000;     // kbps
1352     }
1353 
1354     if (!psRCParams->ui32BUSize) {
1355         psRCParams->ui32BUSize = (ctx->ui16PictureHeight>>4) * (ctx->ui16Width>>4);		// BU = 1 Frame
1356     }
1357 
1358     if (!psRCParams->ui32FrameRate) {
1359         psRCParams->ui32FrameRate = 30;		// fps
1360     }
1361 
1362     // Calculate Bits Per Pixel
1363     if (ctx->ui16Width <= 176 ) {
1364         i32FrameRate    = 30;
1365     } else {
1366         i32FrameRate	= psRCParams->ui32FrameRate;
1367     }
1368 
1369     flBpp = 1.0 * psRCParams->ui32BitsPerSecond / (i32FrameRate * ctx->ui16Width * ctx->ui16FrameHeight);
1370 
1371     psPicParams->sInParams.ui8SeInitQP          = psRCParams->ui32InitialQp;
1372     psPicParams->sInParams.ui8MBPerRow      = (ctx->ui16Width>>4);
1373     psPicParams->sInParams.ui16MBPerBU       = psRCParams->ui32BUSize;
1374     psPicParams->sInParams.ui16MBPerFrm     = (ctx->ui16Width>>4) * (ctx->ui16PictureHeight>>4);
1375     psPicParams->sInParams.ui16BUPerFrm      = (psPicParams->sInParams.ui16MBPerFrm) / psRCParams->ui32BUSize;
1376 
1377     psPicParams->sInParams.ui16IntraPeriod      = psRCParams->ui32IntraFreq;
1378     psPicParams->sInParams.ui16BFrames         = psRCParams->ui16BFrames;
1379     psPicParams->sInParams.i32BitRate             = psRCParams->ui32BitsPerSecond;
1380 
1381     psPicParams->sInParams.bFrmSkipDisable   = psRCParams->bDisableFrameSkipping;
1382     psPicParams->sInParams.i32BitsPerFrm       = (psRCParams->ui32BitsPerSecond + psRCParams->ui32FrameRate/2) / psRCParams->ui32FrameRate;
1383     psPicParams->sInParams.i32BitsPerBU         = psPicParams->sInParams.i32BitsPerFrm / (4 * psPicParams->sInParams.ui16BUPerFrm);
1384 
1385     // Codec-dependant fields
1386     if (ctx->eStandard == IMG_STANDARD_H264) {
1387         psPicParams->sInParams.mode.h264.i32TransferRate = (psRCParams->ui32TransferBitsPerSecond + psRCParams->ui32FrameRate/2) / psRCParams->ui32FrameRate;
1388         psPicParams->sInParams.mode.h264.bHierarchicalMode =   psRCParams->b16Hierarchical;
1389     } else {
1390         psPicParams->sInParams.mode.other.i32BitsPerGOP      = (psRCParams->ui32BitsPerSecond / psRCParams->ui32FrameRate) * psRCParams->ui32IntraFreq;
1391         psPicParams->sInParams.mode.other.ui16AvQPVal         = psRCParams->ui32InitialQp;
1392         psPicParams->sInParams.mode.other.ui16MyInitQP         = psRCParams->ui32InitialQp;
1393     }
1394 
1395 
1396     if (psPicParams->sInParams.i32BitsPerFrm) {
1397         i32BufferSizeInFrames = (psRCParams->ui32BufferSize + (psPicParams->sInParams.i32BitsPerFrm/2))/psPicParams->sInParams.i32BitsPerFrm;
1398     } else {
1399         IMG_ASSERT(ctx->bEnableMvc && "Can happen only in MVC mode");
1400         /* Asigning more or less `normal` value. To be overriden by MVC RC module */
1401         i32BufferSizeInFrames = 30;
1402     }
1403 
1404     // select thresholds and initial Qps etc that are codec dependent
1405     switch (ctx->eStandard) {
1406         case IMG_STANDARD_H264:
1407             L1 = 0.1;	L2 = 0.15;	L3 = 0.2;
1408             psPicParams->sInParams.ui8MaxQPVal = 51;
1409             ctx->ui32KickSize = psPicParams->sInParams.ui16MBPerBU;
1410 
1411             // Setup MAX and MIN Quant Values
1412             if (psRCParams->iMinQP == 0) {
1413                 if (flBpp >= 0.50)
1414                     i32TmpQp = 4;
1415                 else if (flBpp > 0.133)
1416                     i32TmpQp = (IMG_INT32)(22 - (40*flBpp));
1417                 else
1418                     i32TmpQp = (IMG_INT32)(30 - (100 * flBpp));
1419 
1420                 /* Adjust minQp up for small buffer size and down for large buffer size */
1421                 if (i32BufferSizeInFrames < 5) {
1422                     i32TmpQp += 2;
1423                 }
1424 
1425                 if (i32BufferSizeInFrames > 40) {
1426                     if(i32TmpQp>=1)
1427                         i32TmpQp -= 1;
1428                 }
1429                 /* for HD content allow a lower minQp as bitrate is more easily controlled in this case */
1430                 if (psPicParams->sInParams.ui16MBPerFrm > 2000) {
1431                         i32TmpQp -= 6;
1432                 }
1433             } else
1434                 i32TmpQp = psRCParams->iMinQP;
1435 
1436             if (i32TmpQp < 2) {
1437                 psPicParams->sInParams.ui8MinQPVal = 2;
1438             } else {
1439                 psPicParams->sInParams.ui8MinQPVal = i32TmpQp;
1440             }
1441 
1442             // Calculate Initial QP if it has not been specified
1443             i32TmpQp = psPicParams->sInParams.ui8SeInitQP;
1444             if (psPicParams->sInParams.ui8SeInitQP==0) {
1445                 L1 = 0.050568;
1446                 L2 = 0.202272;
1447                 L3 = 0.40454321;
1448                 L4 = 0.80908642;
1449                 L5 = 1.011358025;
1450 
1451                 if (flBpp < L1)
1452                     i32TmpQp = (IMG_INT32)(45 - 78.10*flBpp);
1453                 else if (flBpp>=L1 && flBpp<L2)
1454                     i32TmpQp = (IMG_INT32)(44 - 72.51*flBpp);
1455                 else if (flBpp>=L2 && flBpp<L3)
1456                     i32TmpQp = (IMG_INT32)(34 - 24.72*flBpp);
1457                 else if (flBpp>=L3 && flBpp<L4)
1458                     i32TmpQp = (IMG_INT32)(32 - 19.78*flBpp);
1459                 else if (flBpp>=L4 && flBpp<L5)
1460                     i32TmpQp = (IMG_INT32)(25 - 9.89*flBpp);
1461                 else if (flBpp>=L5)
1462                     i32TmpQp = (IMG_INT32)(18 - 4.95*flBpp);
1463 
1464                 /* Adjust ui8SeInitQP up for small buffer size or small fps */
1465                 /* Adjust ui8SeInitQP up for small gop size */
1466                 if ((i32BufferSizeInFrames < 20) || (psRCParams->ui32IntraFreq < 20)) {
1467                     i32TmpQp += 2;
1468                 }
1469 
1470 		/* for very small buffers increase initial Qp even more */
1471 		if(i32BufferSizeInFrames < 5)
1472 		{
1473 			i32TmpQp += 8;
1474 		}
1475 
1476                 /* start on a lower initial Qp for HD content as the coding is more efficient */
1477                 if (psPicParams->sInParams.ui16MBPerFrm > 2000) {
1478                     i32TmpQp -= 2;
1479                 }
1480 
1481 		if(psPicParams->sInParams.ui16IntraPeriod ==1)
1482 		{
1483 		    /* for very small GOPS start with a much higher initial Qp */
1484 		    i32TmpQp += 12;
1485 		} else if (psPicParams->sInParams.ui16IntraPeriod<5) {
1486 		    /* for very small GOPS start with a much higher initial Qp */
1487 		    i32TmpQp += 6;
1488 		}
1489             }
1490             if (i32TmpQp>49) {
1491                 i32TmpQp = 49;
1492             }
1493             if (i32TmpQp < psPicParams->sInParams.ui8MinQPVal) {
1494                 i32TmpQp = psPicParams->sInParams.ui8MinQPVal;
1495             }
1496             psPicParams->sInParams.ui8SeInitQP = i32TmpQp;
1497 
1498             if(flBpp <= 0.3)
1499                 psPicParams->ui32Flags |= ISRC_I16BIAS;
1500 
1501             break;
1502 
1503         case IMG_STANDARD_MPEG4:
1504         case IMG_STANDARD_MPEG2:
1505         case IMG_STANDARD_H263:
1506             psPicParams->sInParams.ui8MaxQPVal	 = 31;
1507             if (ctx->ui16Width == 176) {
1508                 L1 = 0.042;    L2 = 0.084;    L3 = 0.126;    L4 = 0.168;    L5 = 0.336;    L6=0.505;
1509             } else if (ctx->ui16Width == 352) {
1510                 L1 = 0.064;    L2 = 0.084;    L3 = 0.106;    L4 = 0.126;    L5 = 0.168;    L6=0.210;
1511             } else {
1512                 L1 = 0.050;    L2 = 0.0760;    L3 = 0.096;   L4 = 0.145;    L5 = 0.193;    L6=0.289;
1513             }
1514 
1515             if (psPicParams->sInParams.ui8SeInitQP==0) {
1516                 if (flBpp < L1)
1517                     psPicParams->sInParams.ui8SeInitQP = 31;
1518                 else if (flBpp>=L1 && flBpp<L2)
1519                     psPicParams->sInParams.ui8SeInitQP = 26;
1520                 else if (flBpp>=L2 && flBpp<L3)
1521                     psPicParams->sInParams.ui8SeInitQP = 22;
1522                 else if (flBpp>=L3 && flBpp<L4)
1523                     psPicParams->sInParams.ui8SeInitQP = 18;
1524                 else if (flBpp>=L4 && flBpp<L5)
1525                     psPicParams->sInParams.ui8SeInitQP = 14;
1526                 else if (flBpp>=L5 && flBpp<L6)
1527                     psPicParams->sInParams.ui8SeInitQP = 10;
1528                 else
1529                     psPicParams->sInParams.ui8SeInitQP = 8;
1530 
1531                 /* Adjust ui8SeInitQP up for small buffer size or small fps */
1532                 /* Adjust ui8SeInitQP up for small gop size */
1533                 if ((i32BufferSizeInFrames < 20) || (psRCParams->ui32IntraFreq < 20)) {
1534                     psPicParams->sInParams.ui8SeInitQP += 2;
1535                 }
1536 
1537                 if (psPicParams->sInParams.ui8SeInitQP > psPicParams->sInParams.ui8MaxQPVal) {
1538                     psPicParams->sInParams.ui8SeInitQP = psPicParams->sInParams.ui8MaxQPVal;
1539                 }
1540                 psPicParams->sInParams.mode.other.ui16AvQPVal =  psPicParams->sInParams.ui8SeInitQP;
1541             }
1542             psPicParams->sInParams.ui8MinQPVal = 2;
1543 
1544             /* Adjust minQp up for small buffer size and down for large buffer size */
1545             if (i32BufferSizeInFrames < 20) {
1546                 psPicParams->sInParams.ui8MinQPVal += 1;
1547             }
1548             break;
1549 
1550         default:
1551             /* the NO RC cases will fall here */
1552             break;
1553     }
1554 
1555     if (ctx->sRCParams.eRCMode == IMG_RCMODE_VBR) {
1556         psPicParams->sInParams.ui16MBPerBU  = psPicParams->sInParams.ui16MBPerFrm;
1557         psPicParams->sInParams.ui16BUPerFrm = 1;
1558 
1559         // Initialize the parameters of fluid flow traffic model.
1560         psPicParams->sInParams.i32BufferSize   = psRCParams->ui32BufferSize;
1561 
1562 
1563         // These scale factor are used only for rate control to avoid overflow
1564         // in fixed-point calculation these scale factors are decided by bit rate
1565         if (psRCParams->ui32BitsPerSecond < 640000) {
1566             psPicParams->sInParams.ui8ScaleFactor  = 2;						// related to complexity
1567         }
1568         else if (psRCParams->ui32BitsPerSecond < 2000000) {
1569             // 2 Mbits
1570             psPicParams->sInParams.ui8ScaleFactor  = 4;
1571         }
1572         else if(psRCParams->ui32BitsPerSecond < 8000000) {
1573             // 8 Mbits
1574             psPicParams->sInParams.ui8ScaleFactor  = 6;
1575         } else
1576             psPicParams->sInParams.ui8ScaleFactor  = 8;
1577     } else {
1578         // Set up Input Parameters that are mode dependent
1579         switch (ctx->eStandard) {
1580             case IMG_STANDARD_H264:
1581                 // ------------------- H264 CBR RC ------------------- //
1582                 // Initialize the parameters of fluid flow traffic model.
1583                 psPicParams->sInParams.i32BufferSize = psRCParams->ui32BufferSize;
1584 
1585                 // HRD consideration - These values are used by H.264 reference code.
1586                 if (psRCParams->ui32BitsPerSecond < 1000000) {
1587                 // 1 Mbits/s
1588                     psPicParams->sInParams.ui8ScaleFactor = 0;
1589                 } else if (psRCParams->ui32BitsPerSecond < 2000000) {
1590                 // 2 Mbits/s
1591                     psPicParams->sInParams.ui8ScaleFactor = 1;
1592                 } else if (psRCParams->ui32BitsPerSecond < 4000000) {
1593                 // 4 Mbits/s
1594                     psPicParams->sInParams.ui8ScaleFactor = 2;
1595                 } else if (psRCParams->ui32BitsPerSecond < 8000000) {
1596                 // 8 Mbits/s
1597                     psPicParams->sInParams.ui8ScaleFactor = 3;
1598                 } else  {
1599                     psPicParams->sInParams.ui8ScaleFactor = 4;
1600                 }
1601 
1602                 if (ctx->sRCParams.eRCMode == IMG_RCMODE_VCM) {
1603                     psPicParams->sInParams.i32BufferSize = i32BufferSizeInFrames;
1604                 }
1605                 break;
1606             case IMG_STANDARD_MPEG4:
1607             case IMG_STANDARD_MPEG2:
1608             case IMG_STANDARD_H263:
1609                 flBpp  = 256 * (psRCParams->ui32BitsPerSecond/ctx->ui16Width);
1610                 flBpp /= (ctx->ui16FrameHeight * psRCParams->ui32FrameRate);
1611 
1612                 if ((psPicParams->sInParams.ui16MBPerFrm > 1024 && flBpp < 16) || (psPicParams->sInParams.ui16MBPerFrm <= 1024 && flBpp < 24))
1613                     psPicParams->sInParams.mode.other.ui8HalfFrameRate = 1;
1614                 else
1615                     psPicParams->sInParams.mode.other.ui8HalfFrameRate = 0;
1616 
1617                 if (psPicParams->sInParams.mode.other.ui8HalfFrameRate >= 1) {
1618                     psPicParams->sInParams.ui8SeInitQP = 31;
1619                     psPicParams->sInParams.mode.other.ui16AvQPVal = 31;
1620                     psPicParams->sInParams.mode.other.ui16MyInitQP = 31;
1621                 }
1622 
1623                 psPicParams->sInParams.i32BufferSize = psRCParams->ui32BufferSize;
1624                 break;
1625             default:
1626                 break;
1627         }
1628     }
1629 
1630     if (psRCParams->bScDetectDisable)
1631         psPicParams->ui32Flags  |= ISSCENE_DISABLED;
1632 
1633     psPicParams->sInParams.i32InitialDelay	= psRCParams->i32InitialDelay;
1634     psPicParams->sInParams.i32InitialLevel	= psRCParams->i32InitialLevel;
1635     psRCParams->ui32InitialQp = psPicParams->sInParams.ui8SeInitQP;
1636 
1637     /* The rate control uses this value to adjust the reaction rate to larger than expected frames */
1638     if (ctx->eStandard == IMG_STANDARD_H264) {
1639         if (psPicParams->sInParams.i32BitsPerFrm) {
1640             const IMG_INT32 bitsPerGop = (psRCParams->ui32BitsPerSecond / psRCParams->ui32FrameRate) * psRCParams->ui32IntraFreq;
1641             psPicParams->sInParams.mode.h264.ui32RCScaleFactor = (bitsPerGop * 256) /
1642                 (psPicParams->sInParams.i32BufferSize - psPicParams->sInParams.i32InitialLevel);
1643         } else {
1644             psPicParams->sInParams.mode.h264.ui32RCScaleFactor = 0;
1645         }
1646     } else {
1647         psPicParams->sInParams.mode.other.ui16MyInitQP		= psPicParams->sInParams.ui8SeInitQP;
1648     }
1649 
1650     return ;
1651 }
1652 
tng__save_slice_params_template(context_ENC_p ctx,IMG_UINT32 ui32SliceBufIdx,IMG_UINT32 ui32SliceType,IMG_UINT32 ui32IPEControl,IMG_UINT32 ui32Flags,IMG_UINT32 ui32SliceConfig,IMG_UINT32 ui32SeqConfig,IMG_UINT32 ui32StreamIndex)1653 static void tng__save_slice_params_template(
1654     context_ENC_p ctx,
1655     IMG_UINT32  ui32SliceBufIdx,
1656     IMG_UINT32  ui32SliceType,
1657     IMG_UINT32  ui32IPEControl,
1658     IMG_UINT32  ui32Flags,
1659     IMG_UINT32  ui32SliceConfig,
1660     IMG_UINT32  ui32SeqConfig,
1661     IMG_UINT32  ui32StreamIndex
1662 )
1663 {
1664     IMG_FRAME_TEMPLATE_TYPE eSliceType = (IMG_FRAME_TEMPLATE_TYPE)ui32SliceType;
1665     context_ENC_mem *ps_mem = &(ctx->ctx_mem[ui32StreamIndex]);
1666     SLICE_PARAMS *slice_temp_p = NULL;
1667 
1668     psb_buffer_map(&(ps_mem->bufs_slice_template), &(ps_mem->bufs_slice_template.virtual_addr));
1669     if (ps_mem->bufs_slice_template.virtual_addr == NULL) {
1670         drv_debug_msg(VIDEO_DEBUG_ERROR, "%s error: mapping slice template\n", __FUNCTION__);
1671         return ;
1672     }
1673 
1674     slice_temp_p = (SLICE_PARAMS*)(ps_mem->bufs_slice_template.virtual_addr + (ctx->ctx_mem_size.slice_template * ui32SliceBufIdx));
1675 
1676     slice_temp_p->eTemplateType = eSliceType;
1677     slice_temp_p->ui32Flags = ui32Flags;
1678     slice_temp_p->ui32IPEControl = ui32IPEControl;
1679     slice_temp_p->ui32SliceConfig = ui32SliceConfig;
1680     slice_temp_p->ui32SeqConfig = ui32SeqConfig;
1681 
1682     psb_buffer_unmap(&(ps_mem->bufs_slice_template));
1683 
1684     return ;
1685 }
1686 
1687 
1688 /*****************************************************************************
1689  * Function Name        :       PrepareEncodeSliceParams
1690  *
1691  ****************************************************************************/
tng__prepare_encode_sliceparams(context_ENC_p ctx,IMG_UINT32 ui32SliceBufIdx,IMG_UINT32 ui32SliceType,IMG_UINT16 __maybe_unused ui16CurrentRow,IMG_UINT16 ui16SliceHeight,IMG_UINT8 uiDeblockIDC,IMG_BOOL bFieldMode,IMG_INT iFineYSearchSize,IMG_UINT32 ui32StreamIndex)1692 static IMG_UINT32 tng__prepare_encode_sliceparams(
1693     context_ENC_p ctx,
1694     IMG_UINT32  ui32SliceBufIdx,
1695     IMG_UINT32  ui32SliceType,
1696     IMG_UINT16  __maybe_unused ui16CurrentRow,
1697     IMG_UINT16  ui16SliceHeight,
1698     IMG_UINT8   uiDeblockIDC,
1699     IMG_BOOL    bFieldMode,
1700     IMG_INT     iFineYSearchSize,
1701     IMG_UINT32  ui32StreamIndex
1702 )
1703 {
1704     IMG_UINT32      ui32FrameStoreFormat;
1705     IMG_UINT8       ui8SwapChromas;
1706     IMG_UINT32      ui32MBsPerKick, ui32KicksPerSlice;
1707     IMG_UINT32      ui32IPEControl;
1708     IMG_UINT32      ui32Flags = 0;
1709     IMG_UINT32      ui32SliceConfig = 0;
1710     IMG_UINT32      ui32SeqConfig = 0;
1711     IMG_BOOL bIsIntra = IMG_FALSE;
1712     IMG_BOOL bIsBPicture = IMG_FALSE;
1713     IMG_BOOL bIsIDR = IMG_FALSE;
1714     IMG_IPE_MINBLOCKSIZE blkSz;
1715     IMG_FRAME_TEMPLATE_TYPE eSliceType = (IMG_FRAME_TEMPLATE_TYPE)ui32SliceType;
1716 
1717     if (!ctx) {
1718         return VA_STATUS_ERROR_INVALID_CONTEXT;
1719     }
1720 
1721     /* We want multiple ones of these so we can submit multiple slices without having to wait for the next*/
1722     ui32IPEControl = ctx->ui32IPEControl;
1723     bIsIntra = ((eSliceType == IMG_FRAME_IDR) || (eSliceType == IMG_FRAME_INTRA));
1724     bIsBPicture = (eSliceType == IMG_FRAME_INTER_B);
1725     bIsIDR = ((eSliceType == IMG_FRAME_IDR) || (eSliceType == IMG_FRAME_INTER_P_IDR));
1726 
1727     drv_debug_msg(VIDEO_DEBUG_GENERAL, "%s PTG bIsIntra  = %x\n", __FUNCTION__, bIsIntra);
1728     drv_debug_msg(VIDEO_DEBUG_GENERAL, "%s PTG bIsBFrame = %x\n", __FUNCTION__, bIsBPicture);
1729     drv_debug_msg(VIDEO_DEBUG_GENERAL, "%s PTG bIsIDR    = %x\n", __FUNCTION__, bIsIDR);
1730     /* extract block size */
1731     blkSz = F_EXTRACT(ui32IPEControl, TOPAZHP_CR_IPE_BLOCKSIZE);
1732     /* mask-out the block size bits from ui32IPEControl */
1733     ui32IPEControl &= ~(F_MASK(TOPAZHP_CR_IPE_BLOCKSIZE));
1734     switch (ctx->eStandard) {
1735     case IMG_STANDARD_NONE:
1736     case IMG_STANDARD_JPEG:
1737         break;
1738 
1739     case IMG_STANDARD_H264:
1740         if (blkSz > 2) blkSz = 2;
1741         if (bIsBPicture) {
1742             if (blkSz > 1) blkSz = 1;
1743         }
1744 #ifdef BRN_30322
1745         else if (bIsIntra) {
1746             if (blkSz == 0) blkSz = 1; // Workaround for BRN 30322
1747         }
1748 #endif
1749 
1750 #ifdef BRN_30550
1751         if (ctx->bCabacEnabled)
1752             if (blkSz == 0) blkSz = 1;
1753 #endif
1754         if (ctx->uMBspS >= _1080P_30FPS) {
1755             ui32IPEControl |= F_ENCODE(iFineYSearchSize, TOPAZHP_CR_IPE_LRITC_BOUNDARY) |
1756                               F_ENCODE(iFineYSearchSize, TOPAZHP_CR_IPE_Y_FINE_SEARCH);
1757         } else {
1758             ui32IPEControl |= F_ENCODE(iFineYSearchSize + 1, TOPAZHP_CR_IPE_LRITC_BOUNDARY) |
1759                               F_ENCODE(iFineYSearchSize, TOPAZHP_CR_IPE_Y_FINE_SEARCH);
1760 
1761         }
1762         if (ctx->bLimitNumVectors)
1763             ui32IPEControl |= F_ENCODE(1, TOPAZHP_CR_IPE_MV_NUMBER_RESTRICTION);
1764         break;
1765 
1766     case IMG_STANDARD_H263:
1767         blkSz = 0;
1768         ui32IPEControl = F_ENCODE(iFineYSearchSize + 1, TOPAZHP_CR_IPE_LRITC_BOUNDARY) |
1769                          F_ENCODE(iFineYSearchSize, TOPAZHP_CR_IPE_Y_FINE_SEARCH) |
1770                          F_ENCODE(0, TOPAZHP_CR_IPE_4X4_SEARCH);
1771         //We only support a maxium vector of 15.5 pixels in H263
1772         break;
1773 
1774     case IMG_STANDARD_MPEG4:
1775         if (blkSz > BLK_SZ_8x8) blkSz = BLK_SZ_8x8;
1776         ui32IPEControl |= F_ENCODE(iFineYSearchSize + 1, TOPAZHP_CR_IPE_LRITC_BOUNDARY) |
1777                           F_ENCODE(iFineYSearchSize, TOPAZHP_CR_IPE_Y_FINE_SEARCH) |
1778                           F_ENCODE(0, TOPAZHP_CR_IPE_4X4_SEARCH);
1779         // FIXME Should be 1, set to zero for hardware testing.
1780         break;
1781     case IMG_STANDARD_MPEG2:
1782         if (blkSz != BLK_SZ_16x16) blkSz = BLK_SZ_16x16;
1783         ui32IPEControl |= F_ENCODE(iFineYSearchSize + 1, TOPAZHP_CR_IPE_LRITC_BOUNDARY) |
1784                           F_ENCODE(iFineYSearchSize, TOPAZHP_CR_IPE_Y_FINE_SEARCH) |
1785                           F_ENCODE(0, TOPAZHP_CR_IPE_4X4_SEARCH);
1786         // FIXME Should be 1, set to zero for hardware testing.
1787         break;
1788     }
1789 
1790     {
1791         IMG_BOOL bRestrict4x4SearchSize;
1792         IMG_UINT32 uLritcBoundary;
1793 
1794         if (ctx->uMBspS >= _1080P_30FPS)
1795             bRestrict4x4SearchSize = 1;
1796         else
1797             bRestrict4x4SearchSize = 0;
1798 
1799         ui32IPEControl |= F_ENCODE(blkSz, TOPAZHP_CR_IPE_BLOCKSIZE);
1800         uLritcBoundary = (blkSz != BLK_SZ_16x16) ? (iFineYSearchSize + (bRestrict4x4SearchSize ? 0 : 1)) : 1;
1801         if (uLritcBoundary > 3) {
1802             return VA_STATUS_ERROR_UNKNOWN;
1803         }
1804 
1805         /* Minium sub block size to calculate motion vectors for. 0=16x16, 1=8x8, 2=4x4 */
1806         ui32IPEControl = F_INSERT(ui32IPEControl, blkSz, TOPAZHP_CR_IPE_BLOCKSIZE);
1807         ui32IPEControl = F_INSERT(ui32IPEControl, iFineYSearchSize, TOPAZHP_CR_IPE_Y_FINE_SEARCH);
1808         ui32IPEControl = F_INSERT(ui32IPEControl, ctx->bLimitNumVectors, TOPAZHP_CR_IPE_MV_NUMBER_RESTRICTION);
1809 
1810         ui32IPEControl = F_INSERT(ui32IPEControl, uLritcBoundary, TOPAZHP_CR_IPE_LRITC_BOUNDARY);  // 8x8 search
1811         ui32IPEControl = F_INSERT(ui32IPEControl, bRestrict4x4SearchSize ? 0 : 1, TOPAZHP_CR_IPE_4X4_SEARCH);
1812 
1813     }
1814     ui32IPEControl = F_INSERT(ui32IPEControl, ctx->bHighLatency, TOPAZHP_CR_IPE_HIGH_LATENCY);
1815 //              psSliceParams->ui32IPEControl = ui32IPEControl;
1816 
1817     if (!bIsIntra) {
1818         if (bIsBPicture)
1819             ui32Flags |= ISINTERB_FLAGS;
1820         else
1821             ui32Flags |= ISINTERP_FLAGS;
1822     }
1823     switch (ctx->eStandard)  {
1824     case IMG_STANDARD_NONE:
1825         break;
1826     case IMG_STANDARD_H263:
1827         ui32Flags |= ISH263_FLAGS;
1828         break;
1829     case IMG_STANDARD_MPEG4:
1830         ui32Flags |= ISMPEG4_FLAGS;
1831         break;
1832     case IMG_STANDARD_MPEG2:
1833         ui32Flags |= ISMPEG2_FLAGS;
1834         break;
1835     default:
1836         break;
1837     }
1838 
1839     if (ctx->bMultiReferenceP && !(bIsIntra || bIsBPicture))
1840         ui32Flags |= ISMULTIREF_FLAGS;
1841     if (ctx->bSpatialDirect && bIsBPicture)
1842         ui32Flags |= SPATIALDIRECT_FLAGS;
1843 
1844     if (bIsIntra) {
1845         ui32SliceConfig = F_ENCODE(TOPAZHP_CR_SLICE_TYPE_I_SLICE, TOPAZHP_CR_SLICE_TYPE);
1846     } else {
1847         if (bIsBPicture) {
1848             ui32SliceConfig = F_ENCODE(TOPAZHP_CR_SLICE_TYPE_B_SLICE, TOPAZHP_CR_SLICE_TYPE);
1849         } else {
1850             // p frame
1851             ui32SliceConfig = F_ENCODE(TOPAZHP_CR_SLICE_TYPE_P_SLICE, TOPAZHP_CR_SLICE_TYPE);
1852         }
1853     }
1854 
1855     ui32MBsPerKick = ctx->ui32KickSize;
1856     // we need to figure out the number of kicks and mb's per kick to use.
1857     // on H.264 we will use a MB's per kick of basic unit
1858     // on other rc varients we will use mb's per kick of width
1859     ui32KicksPerSlice = ((ui16SliceHeight / 16) * (ctx->ui16Width / 16)) / ui32MBsPerKick;
1860     assert((ui32KicksPerSlice * ui32MBsPerKick) == ((ui16SliceHeight / 16)*(ctx->ui16Width / 16)));
1861 
1862     // need some sensible ones don't look to be implemented yet...
1863     // change per stream
1864 
1865     if ((ctx->eFormat == IMG_CODEC_UY0VY1_8888) || (ctx->eFormat == IMG_CODEC_VY0UY1_8888))
1866         ui32FrameStoreFormat = 3;
1867     else if ((ctx->eFormat == IMG_CODEC_Y0UY1V_8888) || (ctx->eFormat == IMG_CODEC_Y0VY1U_8888))
1868         ui32FrameStoreFormat = 2;
1869     else if ((ctx->eFormat == IMG_CODEC_PL12) || (ctx->eFormat == IMG_CODEC_422_PL12))
1870         ui32FrameStoreFormat = 1;
1871     else
1872         ui32FrameStoreFormat = 0;
1873 
1874     if ((ctx->eFormat == IMG_CODEC_VY0UY1_8888) || (ctx->eFormat == IMG_CODEC_Y0VY1U_8888))
1875         ui8SwapChromas = 1;
1876     else
1877         ui8SwapChromas = 0;
1878 
1879     switch (ctx->eStandard) {
1880     case IMG_STANDARD_NONE:
1881     case IMG_STANDARD_JPEG:
1882         break;
1883     case IMG_STANDARD_H264:
1884         /* H264 */
1885 
1886         ui32SeqConfig = F_ENCODE(0, TOPAZHP_CR_TEMPORAL_PIC0_BELOW_IN_VALID)
1887                         | F_ENCODE(0, TOPAZHP_CR_TEMPORAL_PIC1_BELOW_IN_VALID)
1888                         | F_ENCODE(0, TOPAZHP_CR_ABOVE_OUT_OF_SLICE_VALID)
1889                         | F_ENCODE(1, TOPAZHP_CR_WRITE_TEMPORAL_PIC0_BELOW_VALID)
1890                         | F_ENCODE(0, TOPAZHP_CR_REF_PIC0_VALID)
1891                         | F_ENCODE(0, TOPAZHP_CR_REF_PIC1_VALID)
1892                         | F_ENCODE(!bIsBPicture, TOPAZHP_CR_REF_PIC1_EQUAL_PIC0)
1893                         | F_ENCODE(bFieldMode ? 1 : 0 , TOPAZHP_CR_FIELD_MODE)
1894                         | F_ENCODE(ui8SwapChromas, TOPAZHP_CR_FRAME_STORE_CHROMA_SWAP)
1895                         | F_ENCODE(ui32FrameStoreFormat, TOPAZHP_CR_FRAME_STORE_FORMAT)
1896                         | F_ENCODE(TOPAZHP_CR_ENCODER_STANDARD_H264, TOPAZHP_CR_ENCODER_STANDARD)
1897                         | F_ENCODE(uiDeblockIDC == 1 ? 0 : 1, TOPAZHP_CR_DEBLOCK_ENABLE);
1898 
1899         if (ctx->sRCParams.ui16BFrames) {
1900             ui32SeqConfig |= F_ENCODE(1, TOPAZHP_CR_WRITE_TEMPORAL_COL_VALID);
1901             if ((ui32Flags & ISINTERB_FLAGS) == ISINTERB_FLAGS)
1902                 ui32SeqConfig |= F_ENCODE(1, TOPAZHP_CR_TEMPORAL_COL_IN_VALID);
1903         }
1904 
1905         if (!bIsBPicture) {
1906             ui32SeqConfig |= F_ENCODE(1, TOPAZHP_CR_WRITE_TEMPORAL_COL_VALID);
1907         }
1908 
1909         break;
1910     case IMG_STANDARD_MPEG4:
1911         /* MPEG4 */
1912         ui32SeqConfig = F_ENCODE(1, TOPAZHP_CR_WRITE_RECON_PIC)
1913                         | F_ENCODE(0, TOPAZHP_CR_DEBLOCK_ENABLE)
1914                         | F_ENCODE(0, TOPAZHP_CR_TEMPORAL_PIC0_BELOW_IN_VALID)
1915                         | F_ENCODE(0, TOPAZHP_CR_TEMPORAL_PIC1_BELOW_IN_VALID)
1916                         | F_ENCODE(0, TOPAZHP_CR_ABOVE_OUT_OF_SLICE_VALID)
1917                         | F_ENCODE(((ui32Flags & ISINTERP_FLAGS) == ISINTERP_FLAGS), TOPAZHP_CR_WRITE_TEMPORAL_PIC0_BELOW_VALID)
1918                         | F_ENCODE(0, TOPAZHP_CR_REF_PIC0_VALID)
1919                         | F_ENCODE(0, TOPAZHP_CR_REF_PIC1_VALID)
1920                         | F_ENCODE(1, TOPAZHP_CR_REF_PIC1_EQUAL_PIC0)
1921                         | F_ENCODE(0, TOPAZHP_CR_FIELD_MODE)
1922                         | F_ENCODE(ui8SwapChromas, TOPAZHP_CR_FRAME_STORE_CHROMA_SWAP)
1923                         | F_ENCODE(ui32FrameStoreFormat, TOPAZHP_CR_FRAME_STORE_FORMAT)
1924                         | F_ENCODE(TOPAZHP_CR_ENCODER_STANDARD_MPEG4, TOPAZHP_CR_ENCODER_STANDARD);
1925         break;
1926     case IMG_STANDARD_MPEG2:
1927         /* MPEG2 */
1928         ui32SeqConfig = F_ENCODE(1, TOPAZHP_CR_WRITE_RECON_PIC)
1929                         | F_ENCODE(0, TOPAZHP_CR_DEBLOCK_ENABLE)
1930                         | F_ENCODE(0, TOPAZHP_CR_TEMPORAL_PIC0_BELOW_IN_VALID)
1931                         | F_ENCODE(0, TOPAZHP_CR_TEMPORAL_PIC1_BELOW_IN_VALID)
1932                         | F_ENCODE(0, TOPAZHP_CR_ABOVE_OUT_OF_SLICE_VALID)
1933                         | F_ENCODE(((ui32Flags & ISINTERP_FLAGS) == ISINTERP_FLAGS), TOPAZHP_CR_WRITE_TEMPORAL_PIC0_BELOW_VALID)
1934                         | F_ENCODE(1, TOPAZHP_CR_REF_PIC0_VALID)
1935                         | F_ENCODE(0, TOPAZHP_CR_REF_PIC1_VALID)
1936                         | F_ENCODE(1, TOPAZHP_CR_REF_PIC1_EQUAL_PIC0)
1937                         | F_ENCODE(bFieldMode ? 1 : 0 , TOPAZHP_CR_FIELD_MODE)
1938                         | F_ENCODE(ui8SwapChromas, TOPAZHP_CR_FRAME_STORE_CHROMA_SWAP)
1939                         | F_ENCODE(ui32FrameStoreFormat, TOPAZHP_CR_FRAME_STORE_FORMAT)
1940                         | F_ENCODE(TOPAZHP_CR_ENCODER_STANDARD_MPEG2, TOPAZHP_CR_ENCODER_STANDARD);
1941         break;
1942     case IMG_STANDARD_H263:
1943         /* H263 */
1944         ui32SeqConfig = F_ENCODE(1, TOPAZHP_CR_WRITE_RECON_PIC)
1945                         | F_ENCODE(0, TOPAZHP_CR_DEBLOCK_ENABLE)
1946                         | F_ENCODE(0, TOPAZHP_CR_TEMPORAL_PIC0_BELOW_IN_VALID)
1947                         | F_ENCODE(0, TOPAZHP_CR_TEMPORAL_PIC1_BELOW_IN_VALID)
1948                         | F_ENCODE(0, TOPAZHP_CR_ABOVE_OUT_OF_SLICE_VALID)
1949                         | F_ENCODE(((ui32Flags & ISINTERP_FLAGS) == ISINTERP_FLAGS), TOPAZHP_CR_WRITE_TEMPORAL_PIC0_BELOW_VALID)
1950                         | F_ENCODE(0, TOPAZHP_CR_REF_PIC0_VALID)
1951                         | F_ENCODE(0, TOPAZHP_CR_REF_PIC1_VALID)
1952                         | F_ENCODE(1, TOPAZHP_CR_REF_PIC1_EQUAL_PIC0)
1953                         | F_ENCODE(0, TOPAZHP_CR_FIELD_MODE)
1954                         | F_ENCODE(ui8SwapChromas, TOPAZHP_CR_FRAME_STORE_CHROMA_SWAP)
1955                         | F_ENCODE(ui32FrameStoreFormat, TOPAZHP_CR_FRAME_STORE_FORMAT)
1956                         | F_ENCODE(TOPAZHP_CR_ENCODER_STANDARD_H263, TOPAZHP_CR_ENCODER_STANDARD);
1957         break;
1958     }
1959 
1960     if (bIsBPicture)        {
1961         ui32SeqConfig |= F_ENCODE(0, TOPAZHP_CR_TEMPORAL_PIC1_BELOW_IN_VALID)
1962                          | F_ENCODE(0, TOPAZHP_CR_WRITE_TEMPORAL_PIC1_BELOW_VALID)
1963                          | F_ENCODE(1, TOPAZHP_CR_REF_PIC1_VALID)
1964                          | F_ENCODE(1, TOPAZHP_CR_TEMPORAL_COL_IN_VALID);
1965     }
1966 
1967     if (ctx->ui8EnableSelStatsFlags & ESF_FIRST_STAGE_STATS)        {
1968         ui32SeqConfig |= F_ENCODE(1, TOPAZHP_CR_WRITE_MB_FIRST_STAGE_VALID);
1969     }
1970 
1971     if (ctx->ui8EnableSelStatsFlags & ESF_MP_BEST_MB_DECISION_STATS ||
1972         ctx->ui8EnableSelStatsFlags & ESF_MP_BEST_MOTION_VECTOR_STATS)  {
1973         ui32SeqConfig |= F_ENCODE(1, TOPAZHP_CR_BEST_MULTIPASS_OUT_VALID);
1974 
1975         if (!(ctx->ui8EnableSelStatsFlags & ESF_MP_BEST_MOTION_VECTOR_STATS)) {
1976             ui32SeqConfig |= F_ENCODE(1, TOPAZHP_CR_BEST_MVS_OUT_DISABLE);// 64 Byte Best Multipass Motion Vector output disabled by default
1977         }
1978     }
1979 
1980     if (ctx->bEnableInpCtrl) {
1981         ui32SeqConfig |= F_ENCODE(1, TOPAZHP_CR_MB_CONTROL_IN_VALID);
1982     }
1983 
1984     if (eSliceType == IMG_FRAME_IDR) {
1985         ctx->sBiasTables.ui32SeqConfigInit = ui32SeqConfig;
1986     }
1987 
1988     tng__save_slice_params_template(ctx, ui32SliceBufIdx, eSliceType,
1989         ui32IPEControl, ui32Flags, ui32SliceConfig, ui32SeqConfig, ui32StreamIndex);
1990 
1991     return 0;
1992 }
1993 
tng__mpeg4_generate_pic_hdr_template(context_ENC_p ctx,IMG_FRAME_TEMPLATE_TYPE ui8SliceType,IMG_UINT8 ui8Search_range)1994 void tng__mpeg4_generate_pic_hdr_template(
1995     context_ENC_p ctx,
1996     IMG_FRAME_TEMPLATE_TYPE ui8SliceType,
1997     IMG_UINT8 ui8Search_range)
1998 {
1999     context_ENC_mem *ps_mem = &(ctx->ctx_mem[ctx->ui32StreamID]);
2000     MTX_HEADER_PARAMS * pPicHeaderMem;
2001     VOP_CODING_TYPE eVop_Coding_Type;
2002     IMG_BOOL8 b8IsVopCoded;
2003     IMG_UINT8 ui8OriginalSliceType = ui8SliceType;
2004 
2005     /* MPEG4: We do not support B-frames at the moment, so we use a spare slot, to store a template for the skipped frame */
2006     if (ui8SliceType == IMG_FRAME_INTER_B)
2007     {
2008 	ui8SliceType = IMG_FRAME_INTER_P;
2009 	b8IsVopCoded = IMG_FALSE;
2010     } else {
2011 	b8IsVopCoded = IMG_TRUE;
2012     }
2013 
2014     eVop_Coding_Type = (ui8SliceType == IMG_FRAME_INTER_P) ? P_FRAME : I_FRAME;
2015 
2016     psb_buffer_map(&(ps_mem->bufs_pic_template), &(ps_mem->bufs_pic_template.virtual_addr));
2017     if (ps_mem->bufs_pic_template.virtual_addr == NULL) {
2018         drv_debug_msg(VIDEO_DEBUG_ERROR, "%s error: mapping pic template\n", __FUNCTION__);
2019         return ;
2020     }
2021 
2022     pPicHeaderMem = (MTX_HEADER_PARAMS *)((IMG_UINT8*)(ps_mem->bufs_pic_template.virtual_addr + (ctx->ctx_mem_size.pic_template * ui8OriginalSliceType)));
2023     //todo fix time resolution
2024     tng__MPEG4_notforsims_prepare_vop_header(pPicHeaderMem, b8IsVopCoded, ui8Search_range, eVop_Coding_Type);
2025     psb_buffer_unmap(&(ps_mem->bufs_pic_template));
2026 
2027 }
2028 
tng__h263_generate_pic_hdr_template(context_ENC_p ctx,IMG_FRAME_TEMPLATE_TYPE eFrameType,IMG_UINT16 ui16Width,IMG_UINT16 ui16Heigh)2029 void tng__h263_generate_pic_hdr_template(
2030     context_ENC_p ctx,
2031     IMG_FRAME_TEMPLATE_TYPE eFrameType,
2032     IMG_UINT16 ui16Width,
2033     IMG_UINT16 ui16Heigh)
2034 
2035 {
2036     context_ENC_mem *ps_mem = &(ctx->ctx_mem[ctx->ui32StreamID]);
2037     MTX_HEADER_PARAMS * pPicHeaderMem = NULL;
2038     H263_PICTURE_CODING_TYPE ePictureCodingType = ((eFrameType == IMG_FRAME_INTRA)|| (eFrameType == IMG_FRAME_IDR)) ? I_FRAME : P_FRAME;
2039 
2040     psb_buffer_map(&(ps_mem->bufs_pic_template), &(ps_mem->bufs_pic_template.virtual_addr));
2041     if (ps_mem->bufs_pic_template.virtual_addr == NULL) {
2042         drv_debug_msg(VIDEO_DEBUG_ERROR, "%s error: mapping pic template\n", __FUNCTION__);
2043         return ;
2044     }
2045 
2046     pPicHeaderMem = (MTX_HEADER_PARAMS *)((IMG_UINT8*)(ps_mem->bufs_pic_template.virtual_addr + (ctx->ctx_mem_size.pic_template * eFrameType)));
2047 
2048     IMG_UINT8 ui8FrameRate = (IMG_UINT8)ctx->sRCParams.ui32FrameRate;
2049 
2050     // Get a pointer to the memory the header will be written to
2051     tng__H263_notforsims_prepare_video_pictureheader(
2052         pPicHeaderMem,
2053         ePictureCodingType,
2054         ctx->ui8H263SourceFormat,
2055         ui8FrameRate,
2056         ui16Width,
2057         ui16Heigh);
2058 
2059     psb_buffer_unmap(&(ps_mem->bufs_pic_template));
2060 
2061 }
2062 
2063 
tng__MPEG4ES_send_seq_header(context_ENC_p ctx,IMG_UINT32 ui32StreamIndex)2064 static void tng__MPEG4ES_send_seq_header(context_ENC_p ctx, IMG_UINT32 ui32StreamIndex)
2065 {
2066     context_ENC_mem *ps_mem = &(ctx->ctx_mem[ui32StreamIndex]);
2067     tng_cmdbuf_p cmdbuf = ctx->obj_context->tng_cmdbuf;
2068 
2069     psb_buffer_map(&(ps_mem->bufs_seq_header), &(ps_mem->bufs_seq_header.virtual_addr));
2070     if (ps_mem->bufs_seq_header.virtual_addr == NULL) {
2071         drv_debug_msg(VIDEO_DEBUG_ERROR, "%s error: mapping seq template\n", __FUNCTION__);
2072         return ;
2073     }
2074 
2075     tng__MPEG4_prepare_sequence_header(ps_mem->bufs_seq_header.virtual_addr,
2076                                        IMG_FALSE,//FIXME: Zhaohan bFrame
2077                                        ctx->ui8ProfileIdc,//profile
2078                                        ctx->ui8LevelIdc,//ui8Profile_lvl_indication
2079                                        3,//ui8Fixed_vop_time_increment
2080                                        ctx->obj_context->picture_width,//ui8Fixed_vop_time_increment
2081                                        ctx->obj_context->picture_height,//ui32Picture_Height_Pixels
2082                                        NULL,//VBVPARAMS
2083                                        ctx->ui32VopTimeResolution);
2084     psb_buffer_unmap(&(ps_mem->bufs_seq_header));
2085 
2086     cmdbuf->cmd_idx_saved[TNG_CMDBUF_SEQ_HEADER_IDX] = cmdbuf->cmd_idx;
2087 }
2088 
tng__H264ES_send_seq_header(context_ENC_p ctx,IMG_UINT32 ui32StreamIndex)2089 static void tng__H264ES_send_seq_header(context_ENC_p ctx, IMG_UINT32 ui32StreamIndex)
2090 {
2091     context_ENC_mem *ps_mem = &(ctx->ctx_mem[ui32StreamIndex]);
2092     tng_cmdbuf_p cmdbuf = ctx->obj_context->tng_cmdbuf;
2093     IMG_RC_PARAMS *psRCParams = &(ctx->sRCParams);
2094     H264_VUI_PARAMS *psVuiParams = &(ctx->sVuiParams);
2095 
2096 //    memset(psVuiParams, 0, sizeof(H264_VUI_PARAMS));
2097 
2098     if (psRCParams->eRCMode != IMG_RCMODE_NONE) {
2099         psVuiParams->vui_flag = 1;
2100         if (psVuiParams->num_units_in_tick == 0 || psVuiParams->Time_Scale == 0) {
2101             psVuiParams->num_units_in_tick = 1;
2102             psVuiParams->Time_Scale = psRCParams->ui32FrameRate * 2;
2103         }
2104         psVuiParams->bit_rate_value_minus1 = psRCParams->ui32BitsPerSecond / 64 - 1;
2105         psVuiParams->cbp_size_value_minus1 = psRCParams->ui32BufferSize / 64 - 1;
2106         psVuiParams->CBR = ((psRCParams->eRCMode == IMG_RCMODE_CBR) && (!psRCParams->bDisableBitStuffing)) ? 1 : 0;
2107         psVuiParams->initial_cpb_removal_delay_length_minus1 = BPH_SEI_NAL_INITIAL_CPB_REMOVAL_DELAY_SIZE - 1;
2108         psVuiParams->cpb_removal_delay_length_minus1 = PTH_SEI_NAL_CPB_REMOVAL_DELAY_SIZE - 1;
2109         psVuiParams->dpb_output_delay_length_minus1 = PTH_SEI_NAL_DPB_OUTPUT_DELAY_SIZE - 1;
2110         psVuiParams->time_offset_length = 24;
2111     }
2112     drv_debug_msg(VIDEO_DEBUG_GENERAL, "%s psVuiParams->vui_flag = %d\n", __FUNCTION__, psVuiParams->vui_flag);
2113 
2114     psb_buffer_map(&(ps_mem->bufs_seq_header), &(ps_mem->bufs_seq_header.virtual_addr));
2115     if (ps_mem->bufs_seq_header.virtual_addr == NULL) {
2116         drv_debug_msg(VIDEO_DEBUG_ERROR, "%s error: mapping seq header\n", __FUNCTION__);
2117         return ;
2118     }
2119 
2120     tng__H264ES_prepare_sequence_header(
2121         ps_mem->bufs_seq_header.virtual_addr,
2122         &(ctx->sVuiParams),
2123         &(ctx->sCropParams),
2124         ctx->ui16Width,         //ui8_picture_width_in_mbs
2125         ctx->ui16PictureHeight, //ui8_picture_height_in_mbs
2126         ctx->ui32CustomQuantMask,    //0,  ui8_custom_quant_mask
2127         ctx->ui8ProfileIdc,          //ui8_profile
2128         ctx->ui8LevelIdc,            //ui8_level
2129         ctx->ui8FieldCount,          //1,  ui8_field_count
2130         ctx->ui8MaxNumRefFrames,     //1,  ui8_max_num_ref_frames
2131         ctx->bPpsScaling,            //0   ui8_pps_scaling_cnt
2132         ctx->bUseDefaultScalingList, //0,  b_use_default_scaling_list
2133         ctx->bEnableLossless,        //0,  blossless
2134         ctx->bArbitrarySO
2135     );
2136     psb_buffer_unmap(&(ps_mem->bufs_seq_header));
2137 
2138     if (ctx->bEnableMVC) {
2139         psb_buffer_map(&(ps_mem->bufs_sub_seq_header), &(ps_mem->bufs_sub_seq_header.virtual_addr));
2140         if (ps_mem->bufs_sub_seq_header.virtual_addr == NULL) {
2141             drv_debug_msg(VIDEO_DEBUG_ERROR, "%s error: mapping sub seq header\n", __FUNCTION__);
2142             return ;
2143         }
2144         tng__H264ES_prepare_mvc_sequence_header(
2145             ps_mem->bufs_sub_seq_header.virtual_addr,
2146             &(ctx->sCropParams),
2147             ctx->ui16Width,         //ui8_picture_width_in_mbs
2148             ctx->ui16PictureHeight, //ui8_picture_height_in_mbs
2149             ctx->ui32CustomQuantMask,    //0,  ui8_custom_quant_mask
2150             ctx->ui8ProfileIdc,          //ui8_profile
2151             ctx->ui8LevelIdc,            //ui8_level
2152             ctx->ui8FieldCount,          //1,  ui8_field_count
2153             ctx->ui8MaxNumRefFrames,     //1,  ui8_max_num_ref_frames
2154             ctx->bPpsScaling,            //0   ui8_pps_scaling_cnt
2155             ctx->bUseDefaultScalingList, //0,  b_use_default_scaling_list
2156             ctx->bEnableLossless,        //0,  blossless
2157             ctx->bArbitrarySO
2158         );
2159         psb_buffer_unmap(&(ps_mem->bufs_sub_seq_header));
2160     }
2161 
2162     cmdbuf->cmd_idx_saved[TNG_CMDBUF_SEQ_HEADER_IDX] = cmdbuf->cmd_idx;
2163 
2164     return ;
2165 }
2166 
tng__H264ES_send_pic_header(context_ENC_p ctx,IMG_UINT32 ui32StreamIndex)2167 static void tng__H264ES_send_pic_header(context_ENC_p ctx, IMG_UINT32 ui32StreamIndex)
2168 {
2169     context_ENC_mem *ps_mem = &(ctx->ctx_mem[ui32StreamIndex]);
2170     IMG_BOOL bDepViewPPS = IMG_FALSE;
2171 
2172     if ((ctx->bEnableMVC) && (ctx->ui16MVCViewIdx != 0) &&
2173         (ctx->ui16MVCViewIdx != (IMG_UINT16)(NON_MVC_VIEW))) {
2174         bDepViewPPS = IMG_TRUE;
2175     }
2176 
2177     psb_buffer_map(&(ps_mem->bufs_pic_template), &(ps_mem->bufs_pic_template.virtual_addr));
2178     if (ps_mem->bufs_pic_template.virtual_addr == NULL) {
2179         drv_debug_msg(VIDEO_DEBUG_ERROR, "%s error: mapping pic template\n", __FUNCTION__);
2180         return ;
2181     }
2182 
2183     tng__H264ES_prepare_picture_header(
2184         ps_mem->bufs_pic_template.virtual_addr,
2185         ctx->bCabacEnabled,
2186         ctx->bH2648x8Transform,     //IMG_BOOL    b_8x8transform,
2187         ctx->bH264IntraConstrained, //IMG_BOOL    bIntraConstrained,
2188         0, //IMG_INT8    i8CQPOffset,
2189         0, //IMG_BOOL    bWeightedPrediction,
2190         0, //IMG_UINT8   ui8WeightedBiPred,
2191         bDepViewPPS, //IMG_BOOL    bMvcPPS,
2192         0, //IMG_BOOL    bScalingMatrix,
2193         0  //IMG_BOOL    bScalingLists
2194     );
2195 
2196     psb_buffer_unmap(&(ps_mem->bufs_pic_template));
2197     return ;
2198 }
2199 
tng__H264ES_send_hrd_header(context_ENC_p ctx,IMG_UINT32 ui32StreamIndex)2200 static void tng__H264ES_send_hrd_header(context_ENC_p ctx, IMG_UINT32 ui32StreamIndex)
2201 {
2202     unsigned int ui32nal_initial_cpb_removal_delay;
2203     unsigned int ui32nal_initial_cpb_removal_delay_offset;
2204     uint32_t ui32cpb_removal_delay;
2205     IMG_RC_PARAMS *psRCParams = &(ctx->sRCParams);
2206     context_ENC_mem *ps_mem = &(ctx->ctx_mem[ui32StreamIndex]);
2207     H264_VUI_PARAMS *psVuiParams = &(ctx->sVuiParams);
2208     IMG_UINT8 aui8clocktimestampflag[1];
2209     aui8clocktimestampflag[0] = IMG_FALSE;
2210 
2211     ui32nal_initial_cpb_removal_delay =
2212         90000 * (1.0 * psRCParams->i32InitialDelay / psRCParams->ui32BitsPerSecond);
2213     ui32nal_initial_cpb_removal_delay_offset =
2214         90000 * (1.0 * ctx->buffer_size / psRCParams->ui32BitsPerSecond)
2215         - ui32nal_initial_cpb_removal_delay;
2216 
2217     drv_debug_msg(VIDEO_DEBUG_GENERAL, "Insert SEI buffer period message with "
2218             "ui32nal_initial_cpb_removal_delay(%d) and "
2219             "ui32nal_initial_cpb_removal_delay_offset(%d)\n",
2220             ui32nal_initial_cpb_removal_delay,
2221             ui32nal_initial_cpb_removal_delay_offset);
2222 
2223     psb_buffer_map(&(ps_mem->bufs_sei_header), &(ps_mem->bufs_sei_header.virtual_addr));
2224     if (ps_mem->bufs_sei_header.virtual_addr == NULL) {
2225         drv_debug_msg(VIDEO_DEBUG_ERROR, "%s error: mapping sei header\n", __FUNCTION__);
2226         return ;
2227     }
2228 
2229     if ((!ctx->bEnableMVC) || (ctx->ui16MVCViewIdx == 0)) {
2230         tng__H264ES_prepare_AUD_header(ps_mem->bufs_sei_header.virtual_addr);
2231     }
2232 
2233     tng__H264ES_prepare_SEI_buffering_period_header(
2234         ps_mem->bufs_sei_header.virtual_addr + (ctx->ctx_mem_size.sei_header),
2235         0,// ui8cpb_cnt_minus1,
2236         psVuiParams->initial_cpb_removal_delay_length_minus1+1, //ui8initial_cpb_removal_delay_length,
2237         1, //ui8NalHrdBpPresentFlag,
2238         ui32nal_initial_cpb_removal_delay, // ui32nal_initial_cpb_removal_delay,
2239         ui32nal_initial_cpb_removal_delay_offset, //ui32nal_initial_cpb_removal_delay_offset,
2240         0, //ui8VclHrdBpPresentFlag - CURRENTLY HARD CODED TO ZERO IN TOPAZ
2241         NOT_USED_BY_TOPAZ, // ui32vcl_initial_cpb_removal_delay, (not used when ui8VclHrdBpPresentFlag = 0)
2242         NOT_USED_BY_TOPAZ); // ui32vcl_initial_cpb_removal_delay_offset (not used when ui8VclHrdBpPresentFlag = 0)
2243 
2244     /* ui32cpb_removal_delay is zero for 1st frame and will be reset
2245      * after a IDR frame */
2246     if (ctx->ui32FrameCount[ui32StreamIndex] == 0) {
2247         if (ctx->ui32RawFrameCount == 0)
2248             ui32cpb_removal_delay = 0;
2249         else
2250             ui32cpb_removal_delay =
2251                 ctx->ui32IdrPeriod * ctx->ui32IntraCnt * 2;
2252     } else
2253         ui32cpb_removal_delay = 2 * ctx->ui32FrameCount[ui32StreamIndex];
2254 
2255     tng__H264ES_prepare_SEI_picture_timing_header(
2256         ps_mem->bufs_sei_header.virtual_addr + (ctx->ctx_mem_size.sei_header * 2),
2257         1, //ui8CpbDpbDelaysPresentFlag,
2258         psVuiParams->cpb_removal_delay_length_minus1, //cpb_removal_delay_length_minus1,
2259         psVuiParams->dpb_output_delay_length_minus1, //dpb_output_delay_length_minus1,
2260         ui32cpb_removal_delay, //ui32cpb_removal_delay,
2261         2, //ui32dpb_output_delay,
2262         0, //ui8pic_struct_present_flag (contained in the sequence header, Topaz hard-coded default to 0)
2263         NOT_USED_BY_TOPAZ, //ui8pic_struct, (not used when ui8pic_struct_present_flag = 0)
2264         NOT_USED_BY_TOPAZ, //NumClockTS, (not used when ui8pic_struct_present_flag = 0)
2265         aui8clocktimestampflag, //abclock_timestamp_flag, (not used when ui8pic_struct_present_flag = 0)
2266         NOT_USED_BY_TOPAZ, //ui8full_timestamp_flag, (not used when ui8pic_struct_present_flag = 0)
2267         NOT_USED_BY_TOPAZ, //ui8seconds_flag, (not used when ui8pic_struct_present_flag = 0)
2268         NOT_USED_BY_TOPAZ, //ui8minutes_flag, (not used when ui8pic_struct_present_flag = 0)
2269         NOT_USED_BY_TOPAZ, //ui8hours_flag, (not used when ui8pic_struct_present_flag = 0)
2270         NOT_USED_BY_TOPAZ, //seconds_value, (not used when ui8pic_struct_present_flag = 0)
2271         NOT_USED_BY_TOPAZ, //minutes_value, (not used when ui8pic_struct_present_flag = 0)
2272         NOT_USED_BY_TOPAZ, //hours_value, (not used when ui8pic_struct_present_flag = 0)
2273         NOT_USED_BY_TOPAZ, //ct_type (2=Unknown) See TRM Table D 2 ?Mapping of ct_type to source picture scan  (not used when ui8pic_struct_present_flag = 0)
2274         NOT_USED_BY_TOPAZ, //nuit_field_based_flag, (not used when ui8pic_struct_present_flag = 0)
2275         NOT_USED_BY_TOPAZ, //counting_type (See TRM Table D 3 ?Definition of counting_type values)  (not used when ui8pic_struct_present_flag = 0)
2276         NOT_USED_BY_TOPAZ, //ui8discontinuity_flag, (not used when ui8pic_struct_present_flag = 0)
2277         NOT_USED_BY_TOPAZ, //ui8cnt_dropped_flag, (not used when ui8pic_struct_present_flag = 0)
2278         NOT_USED_BY_TOPAZ, //n_frames, (not used when ui8pic_struct_present_flag = 0)
2279         NOT_USED_BY_TOPAZ, //time_offset_length, (not used when ui8pic_struct_present_flag = 0)
2280         NOT_USED_BY_TOPAZ); //time_offset (not used when ui8pic_struct_present_flag = 0)
2281     psb_buffer_unmap(&(ps_mem->bufs_sei_header));
2282 
2283     return ;
2284 }
2285 
tng__generate_slice_params_template(context_ENC_p ctx,IMG_UINT32 slice_buf_idx,IMG_UINT32 slice_type,IMG_UINT32 ui32StreamIndex)2286 static void tng__generate_slice_params_template(
2287     context_ENC_p ctx,
2288     IMG_UINT32 slice_buf_idx,
2289     IMG_UINT32 slice_type,
2290     IMG_UINT32 ui32StreamIndex
2291 )
2292 {
2293     context_ENC_mem *ps_mem = &(ctx->ctx_mem[ui32StreamIndex]);
2294     IMG_UINT8  *slice_mem_temp_p = NULL;
2295     IMG_UINT32 ui32SliceHeight = 0;
2296     IMG_FRAME_TEMPLATE_TYPE slice_temp_type = (IMG_FRAME_TEMPLATE_TYPE)slice_type;
2297     IMG_FRAME_TEMPLATE_TYPE buf_idx = (IMG_FRAME_TEMPLATE_TYPE)slice_buf_idx;
2298 
2299     if (ctx->ui8SlicesPerPicture != 0)
2300         ui32SliceHeight = ctx->ui16PictureHeight / ctx->ui8SlicesPerPicture;
2301     else
2302         drv_debug_msg(VIDEO_DEBUG_GENERAL, "%s slice height\n", __FUNCTION__);
2303 
2304     ui32SliceHeight &= ~15;
2305 
2306     drv_debug_msg(VIDEO_DEBUG_GENERAL, "%s PTG ui8DeblockIDC    = %x\n", __FUNCTION__, ctx->ui8DeblockIDC   );
2307     drv_debug_msg(VIDEO_DEBUG_GENERAL, "%s PTG ui32SliceHeight  = %x\n", __FUNCTION__, ui32SliceHeight );
2308     drv_debug_msg(VIDEO_DEBUG_GENERAL, "%s PTG bIsInterlaced    = %x\n", __FUNCTION__, ctx->bIsInterlaced   );
2309     drv_debug_msg(VIDEO_DEBUG_GENERAL, "%s PTG iFineYSearchSize = %x\n", __FUNCTION__, ctx->iFineYSearchSize);
2310 
2311     tng__prepare_encode_sliceparams(
2312         ctx,
2313         slice_buf_idx,
2314         slice_temp_type,
2315         0,                        // ui16CurrentRow,
2316         ui32SliceHeight,
2317         ctx->ui8DeblockIDC,       // uiDeblockIDC
2318         ctx->bIsInterlaced,       // bFieldMode
2319         ctx->iFineYSearchSize,
2320         ui32StreamIndex
2321     );
2322 
2323     drv_debug_msg(VIDEO_DEBUG_GENERAL, "%s PTG bCabacEnabled  = %x\n", __FUNCTION__, ctx->bCabacEnabled );
2324     drv_debug_msg(VIDEO_DEBUG_GENERAL, "%s PTG ui16MVCViewIdx = %x\n", __FUNCTION__, ctx->ui16MVCViewIdx);
2325 
2326     if(ctx->bEnableMVC)
2327         ctx->ui16MVCViewIdx = (IMG_UINT16)ui32StreamIndex;
2328 
2329     if (ps_mem->bufs_slice_template.virtual_addr == NULL) {
2330         drv_debug_msg(VIDEO_DEBUG_ERROR, "%s error: mapping slice template\n", __FUNCTION__);
2331         return ;
2332     }
2333 
2334     slice_mem_temp_p = (IMG_UINT8*)(ps_mem->bufs_slice_template.virtual_addr + (ctx->ctx_mem_size.slice_template * buf_idx));
2335     drv_debug_msg(VIDEO_DEBUG_GENERAL, "%s: addr 0x%08x, virtual 0x%08x, size = 0x%08x, buf_idx = %x\n",
2336         __FUNCTION__, slice_mem_temp_p, ps_mem->bufs_slice_template.virtual_addr, ctx->ctx_mem_size.slice_template, buf_idx);
2337 
2338     /* Prepare Slice Header Template */
2339     switch (ctx->eStandard) {
2340     case IMG_STANDARD_NONE:
2341     case IMG_STANDARD_JPEG:
2342     case IMG_STANDARD_MPEG4:
2343         break;
2344     case IMG_STANDARD_H264:
2345         //H264_NOTFORSIMS_PrepareSliceHeader
2346         tng__H264ES_notforsims_prepare_sliceheader(
2347             slice_mem_temp_p,
2348             slice_temp_type,
2349             ctx->ui8DeblockIDC,
2350             0,                   // ui32FirstMBAddress
2351             0,                   // uiMBSkipRun
2352             ctx->bCabacEnabled,
2353             ctx->bIsInterlaced,
2354             ctx->ui16MVCViewIdx, //(IMG_UINT16)(NON_MVC_VIEW);
2355             IMG_FALSE            // bIsLongTermRef
2356         );
2357         break;
2358 
2359     case IMG_STANDARD_H263:
2360         tng__H263ES_notforsims_prepare_gobsliceheader(slice_mem_temp_p);
2361         break;
2362 
2363     case IMG_STANDARD_MPEG2:
2364         tng__MPEG2_prepare_sliceheader(slice_mem_temp_p);
2365         break;
2366     }
2367 
2368     psb_buffer_unmap(&(ps_mem->bufs_slice_template));
2369 
2370     drv_debug_msg(VIDEO_DEBUG_GENERAL, "%s: end \n", __FUNCTION__);
2371 
2372     return ;
2373 }
2374 
2375 //H264_PrepareTemplates
tng__prepare_templates(context_ENC_p ctx,IMG_UINT32 ui32StreamIndex)2376 static VAStatus tng__prepare_templates(context_ENC_p ctx, IMG_UINT32 ui32StreamIndex)
2377 {
2378     IMG_RC_PARAMS *psRCParams = &(ctx->sRCParams);
2379     PIC_PARAMS *psPicParams = &(ctx->sPicParams);
2380     IN_RC_PARAMS* psInParams = &(psPicParams->sInParams);
2381     psPicParams->ui32Flags = 0;
2382 
2383     tng__prepare_mv_estimates(ctx, ui32StreamIndex);
2384 
2385     switch (ctx->eStandard) {
2386         case IMG_STANDARD_H263:
2387             psPicParams->ui32Flags |= ISH263_FLAGS;
2388             break;
2389         case IMG_STANDARD_MPEG4:
2390             psPicParams->ui32Flags |= ISMPEG4_FLAGS;
2391             break;
2392         case IMG_STANDARD_MPEG2:
2393             psPicParams->ui32Flags |= ISMPEG2_FLAGS;
2394             break;
2395         default:
2396             break;
2397     }
2398 
2399     if (psRCParams->eRCMode) {
2400         psPicParams->ui32Flags |= ISRC_FLAGS;
2401         tng__setup_rcdata(ctx);
2402     } else {
2403         psInParams->ui8SeInitQP  = psRCParams->ui32InitialQp;
2404         psInParams->ui8MBPerRow  = (ctx->ui16Width >> 4);
2405         psInParams->ui16MBPerFrm = (ctx->ui16Width >> 4) * (ctx->ui16PictureHeight >> 4);
2406         psInParams->ui16MBPerBU  = psRCParams->ui32BUSize;
2407         psInParams->ui16BUPerFrm = (psInParams->ui16MBPerFrm) / psRCParams->ui32BUSize;
2408         ctx->ui32KickSize = psInParams->ui16MBPerBU;
2409     }
2410 
2411     // Prepare Slice header templates
2412     tng__generate_slice_params_template(ctx, (IMG_UINT32)IMG_FRAME_IDR, (IMG_UINT32)IMG_FRAME_IDR, ui32StreamIndex);
2413     tng__generate_slice_params_template(ctx, (IMG_UINT32)IMG_FRAME_INTRA, (IMG_UINT32)IMG_FRAME_INTRA, ui32StreamIndex);
2414     tng__generate_slice_params_template(ctx, (IMG_UINT32)IMG_FRAME_INTER_P, (IMG_UINT32)IMG_FRAME_INTER_P, ui32StreamIndex);
2415     switch(ctx->eStandard) {
2416 	case IMG_STANDARD_H264:
2417 	    tng__generate_slice_params_template(ctx, (IMG_UINT32)IMG_FRAME_INTER_B, (IMG_UINT32)IMG_FRAME_INTER_B, ui32StreamIndex);
2418 	    if (ctx->bEnableMVC)
2419 		tng__generate_slice_params_template(ctx, (IMG_UINT32)IMG_FRAME_INTER_P_IDR, (IMG_UINT32)IMG_FRAME_INTER_P_IDR, ui32StreamIndex);
2420             tng__H264ES_send_seq_header(ctx, 0);
2421             tng__H264ES_send_pic_header(ctx, 0);
2422             if (ctx->bInsertHRDParams)
2423                 tng__H264ES_send_hrd_header(ctx, 0);
2424 	    break;
2425 	case IMG_STANDARD_H263:
2426 	    tng__generate_slice_params_template(ctx, (IMG_UINT32)IMG_FRAME_INTER_B, (IMG_UINT32)IMG_FRAME_INTER_B, ui32StreamIndex);
2427 	    /* Here H263 uses the actual width and height */
2428 	    tng__h263_generate_pic_hdr_template(ctx, IMG_FRAME_IDR, ctx->h263_actual_width, ctx->h263_actual_height);
2429             tng__h263_generate_pic_hdr_template(ctx, IMG_FRAME_INTRA, ctx->h263_actual_width, ctx->h263_actual_height);
2430             tng__h263_generate_pic_hdr_template(ctx, IMG_FRAME_INTER_P, ctx->h263_actual_width, ctx->h263_actual_height);
2431 	    break;
2432 	case IMG_STANDARD_MPEG4:
2433 	    tng__generate_slice_params_template(ctx, (IMG_UINT32)IMG_FRAME_INTER_B, (IMG_UINT32)IMG_FRAME_INTER_P, ui32StreamIndex);
2434 	    tng__mpeg4_generate_pic_hdr_template(ctx, IMG_FRAME_IDR, 4);
2435             tng__mpeg4_generate_pic_hdr_template(ctx, IMG_FRAME_INTRA, 4);
2436             tng__mpeg4_generate_pic_hdr_template(ctx, IMG_FRAME_INTER_P, 4);
2437 	    tng__mpeg4_generate_pic_hdr_template(ctx, IMG_FRAME_INTER_B, 4);
2438 	    break;
2439 	default:
2440 	    break;
2441     }
2442 
2443     //FIXME: Zhaohan tng__mpeg2/mpeg4_generate_pic_hdr_template(IMG_FRAME_IDR\IMG_FRAME_INTRA\IMG_FRAME_INTER_P\IMG_FRAME_INTER_B);
2444 
2445 /*
2446     else {
2447         slice_mem_temp_p = (IMG_UINT8*)cmdbuf->slice_mem_p + (((IMG_UINT32)IMG_FRAME_INTER_P_IDR) * cmdbuf->mem_size);
2448         memset(slice_mem_temp_p, 0, 128);
2449     }
2450 */
2451     // Prepare Pic Params Templates
2452     tng__adjust_picflags(ctx, psRCParams, IMG_TRUE, &(ctx->ui32FirstPicFlags));
2453     tng__adjust_picflags(ctx, psRCParams, IMG_FALSE, &(ctx->ui32NonFirstPicFlags));
2454 
2455     return VA_STATUS_SUCCESS;
2456 }
2457 
2458 #if INPUT_SCALER_SUPPORTED
VIDEO_CalculateBessel0(IMG_FLOAT fX)2459 static IMG_FLOAT VIDEO_CalculateBessel0 (IMG_FLOAT fX)
2460 {
2461     IMG_FLOAT fAX, fY;
2462 
2463     fAX = (IMG_FLOAT)IMG_FABS(fX);
2464 
2465     if (fAX < 3.75) 	{
2466         fY = (IMG_FLOAT)(fX / 3.75);
2467         fY *= fY;
2468 
2469         return (IMG_FLOAT)(1.0 + fY *
2470             (3.5156229 + fY *
2471             (3.0899424 + fY *
2472             (1.2067492 + fY *
2473             (0.2659732 + fY *
2474             (0.360768e-1 + fY * 0.45813e-2))))));
2475     }
2476 
2477     fY = (IMG_FLOAT)(3.75 / fAX);
2478 
2479     return (IMG_FLOAT)((IMG_EXP(fAX) / IMG_SQRT(fAX)) *
2480         (0.39894228 + fY *
2481         (0.1328592e-1 + fY *
2482         (0.225319e-2 + fY *
2483         (-0.157565e-2 + fY *
2484         (0.916281e-2 + fY *
2485         (-0.2057706e-1 + fY *
2486         (0.2635537e-1 + fY *
2487         (-0.1647633e-1 + fY * 0.392377e-2)))))))));
2488 }
2489 
VIDEO_SincFunc(IMG_FLOAT fInput,IMG_FLOAT fScale)2490 static IMG_FLOAT VIDEO_SincFunc (IMG_FLOAT fInput, IMG_FLOAT fScale)
2491 {
2492     IMG_FLOAT fX;
2493     IMG_FLOAT fKaiser;
2494 
2495     /* Kaiser window */
2496     fX = fInput / (4.0f / 2.0f) - 1.0f;
2497     fX = (IMG_FLOAT)IMG_SQRT(1.0f - fX * fX);
2498     fKaiser = VIDEO_CalculateBessel0(2.0f * fX) / VIDEO_CalculateBessel0(2.0f);
2499 
2500     /* Sinc function */
2501     fX = 4.0f / 2.0f - fInput;
2502     if (fX == 0) {
2503         return fKaiser;
2504     }
2505 
2506     fX *= 0.9f * fScale * 3.1415926535897f;
2507 
2508     return fKaiser * (IMG_FLOAT)(IMG_SIN(fX) / fX);
2509 }
2510 
VIDEO_CalcCoefs_FromPitch(IMG_FLOAT fPitch,IMG_UINT8 aui8Table[4][16])2511 static void VIDEO_CalcCoefs_FromPitch (IMG_FLOAT	fPitch, IMG_UINT8 aui8Table[4][16])
2512 {
2513     /* Based on sim code */
2514     /* The function is symmetrical, so we only need to calculate the first half of the taps, and the middle value. */
2515 
2516     IMG_FLOAT	fScale;
2517     IMG_UINT32	ui32I, ui32Tap;
2518     IMG_FLOAT	afTable[4][16];
2519     IMG_INT32	i32Total;
2520     IMG_FLOAT	fTotal;
2521     IMG_INT32	i32MiddleTap, i32MiddleI;		/* Mirrored / middle Values for I and T */
2522 
2523     if (fPitch < 1.0f) {
2524         fScale = 1.0f;
2525     } else {
2526         fScale = 1.0f / fPitch;
2527     }
2528 
2529     for (ui32I = 0; ui32I < 16; ui32I++) {
2530         for (ui32Tap = 0; ui32Tap < 4; ui32Tap++) {
2531             afTable[ui32Tap][ui32I] = VIDEO_SincFunc(((IMG_FLOAT)ui32Tap) + ((IMG_FLOAT)ui32I) / 16.0f, fScale);
2532         }
2533     }
2534 
2535     for (ui32Tap = 0; ui32Tap < 2; ui32Tap++) {
2536         for (ui32I = 0; ui32I < 16; ui32I++) {
2537             /* Copy the table around the centre point */
2538             i32MiddleTap = (3 - ui32Tap) + (16 - ui32I) / 16;
2539             i32MiddleI = (16 - ui32I) & 15;
2540             if ((IMG_UINT32)i32MiddleTap < 4) {
2541                 afTable[i32MiddleTap][i32MiddleI] = afTable[ui32Tap][ui32I];
2542             }
2543         }
2544     }
2545 
2546     /* The middle value */
2547     afTable[2][0] = VIDEO_SincFunc(2.0f, fScale);
2548 
2549     /* Normalize this interpolation point, and convert to 2.6 format, truncating the result	*/
2550     for (ui32I = 0; ui32I < 16; ui32I++) {
2551         fTotal = 0.0f;
2552         i32Total = 0;
2553 
2554         for (ui32Tap = 0; ui32Tap < 4; ui32Tap++) {
2555             fTotal += afTable[ui32Tap][ui32I];
2556         }
2557 
2558         for (ui32Tap = 0; ui32Tap < 4; ui32Tap++) {
2559             aui8Table[ui32Tap][ui32I] = (IMG_UINT8)((afTable[ui32Tap][ui32I] * 64.0f) / fTotal);
2560             i32Total += aui8Table[ui32Tap][ui32I];
2561         }
2562 
2563         if (ui32I <= 8) { /* normalize any floating point errors */
2564             i32Total -= 64;
2565             if (ui32I == 8) {
2566                 i32Total /= 2;
2567             }
2568             /* Subtract the error from the I Point in the first tap ( this will not get
2569             mirrored, as it would go off the end). */
2570             aui8Table[0][ui32I] = (IMG_UINT8)(aui8Table[0][ui32I] - (IMG_UINT8)i32Total);
2571         }
2572     }
2573 
2574     /* Copy the normalised table around the centre point */
2575     for (ui32Tap = 0; ui32Tap < 2; ui32Tap++) {
2576         for (ui32I = 0; ui32I < 16; ui32I++) {
2577             i32MiddleTap = (3 - ui32Tap) + (16 - ui32I) / 16;
2578             i32MiddleI = (16 - ui32I) & 15;
2579             if ((IMG_UINT32)i32MiddleTap < 4) {
2580                 aui8Table[i32MiddleTap][i32MiddleI] = aui8Table[ui32Tap][ui32I];
2581             }
2582         }
2583     }
2584     return ;
2585 }
2586 #endif
2587 
tng__setvideo_params(context_ENC_p ctx,IMG_UINT32 ui32StreamIndex)2588 static void tng__setvideo_params(context_ENC_p ctx, IMG_UINT32 ui32StreamIndex)
2589 {
2590     context_ENC_mem *ps_mem = &(ctx->ctx_mem[ui32StreamIndex]);
2591     context_ENC_frame_buf *ps_buf = &(ctx->ctx_frame_buf);
2592     IMG_MTX_VIDEO_CONTEXT* psMtxEncContext = NULL;
2593     IMG_RC_PARAMS * psRCParams = &(ctx->sRCParams);
2594     //IMG_UINT16 ui16WidthInMbs = (ctx->ui16Width + 15) >> 4;
2595     //IMG_UINT16 ui16FrameHeightInMbs = (ctx->ui16FrameHeight + 15) >> 4;
2596     IMG_INT nIndex;
2597     IMG_UINT8 ui8Flag;
2598 #ifndef EXCLUDE_ADAPTIVE_ROUNDING
2599     IMG_INT32 i, j;
2600 #endif
2601 
2602     psb_buffer_map(&(ps_mem->bufs_mtx_context), &(ps_mem->bufs_mtx_context.virtual_addr));
2603     if (ps_mem->bufs_mtx_context.virtual_addr == NULL) {
2604         drv_debug_msg(VIDEO_DEBUG_ERROR, "%s error: mapping slice template\n", __FUNCTION__);
2605         return ;
2606     }
2607 
2608     psMtxEncContext = (IMG_MTX_VIDEO_CONTEXT*)(ps_mem->bufs_mtx_context.virtual_addr);
2609 
2610     ctx->i32PicNodes = (psRCParams->b16Hierarchical ? MAX_REF_B_LEVELS : 0) + ctx->ui8RefSpacing + 4;
2611     ctx->i32MVStores = (ctx->i32PicNodes * 2);
2612     ctx->ui8SlotsInUse = psRCParams->ui16BFrames + 2;
2613 
2614     psMtxEncContext->ui32InitialQp = ctx->sRCParams.ui32InitialQp;
2615     psMtxEncContext->ui32BUSize = ctx->sRCParams.ui32BUSize;
2616     psMtxEncContext->ui16CQPOffset = (ctx->sRCParams.i8QCPOffset & 0x1f) | ((ctx->sRCParams.i8QCPOffset & 0x1f) << 8);
2617     psMtxEncContext->eStandard = ctx->eStandard;
2618     psMtxEncContext->ui32WidthInMbs = ctx->ui16Width >> 4;
2619     psMtxEncContext->ui32PictureHeightInMbs = ctx->ui16PictureHeight >> 4;
2620     psMtxEncContext->bOutputReconstructed = (ps_buf->rec_surface != NULL) ? IMG_TRUE : IMG_FALSE;
2621     psMtxEncContext->ui32VopTimeResolution = ctx->ui32VopTimeResolution;
2622     psMtxEncContext->ui8MaxSlicesPerPicture = ctx->ui8SlicesPerPicture;
2623     psMtxEncContext->ui8NumPipes = ctx->ui8PipesToUse;
2624     psMtxEncContext->eFormat = ctx->eFormat;
2625 
2626     psMtxEncContext->b8IsInterlaced = ctx->bIsInterlaced;
2627     psMtxEncContext->b8TopFieldFirst = ctx->bTopFieldFirst;
2628     psMtxEncContext->b8ArbitrarySO = ctx->bArbitrarySO;
2629 
2630     psMtxEncContext->ui32IdrPeriod = ctx->ui32IdrPeriod * ctx->ui32IntraCnt;
2631     psMtxEncContext->ui32BFrameCount = ctx->sRCParams.ui16BFrames;
2632     psMtxEncContext->b8Hierarchical = (IMG_BOOL8) ctx->sRCParams.b16Hierarchical;
2633     psMtxEncContext->ui32IntraLoopCnt = ctx->ui32IntraCnt;
2634     psMtxEncContext->ui8RefSpacing = ctx->ui8RefSpacing;
2635     psMtxEncContext->ui32DebugCRCs = ctx->ui32DebugCRCs;
2636 
2637     psMtxEncContext->ui8FirstPipe = ctx->ui8BasePipe;
2638     psMtxEncContext->ui8LastPipe = ctx->ui8BasePipe + ctx->ui8PipesToUse - 1;
2639     psMtxEncContext->ui8PipesToUseFlags = 0;
2640     ui8Flag = 0x1 << psMtxEncContext->ui8FirstPipe;
2641     for (nIndex = 0; nIndex < psMtxEncContext->ui8NumPipes; nIndex++, ui8Flag<<=1)
2642         psMtxEncContext->ui8PipesToUseFlags |= ui8Flag; //Pipes used MUST be contiguous from the BasePipe offset
2643 
2644     // Only used in MPEG2, 2 bit field (0 = 8 bit, 1 = 9 bit, 2 = 10 bit and 3=11 bit precision)
2645     if (ctx->eStandard == IMG_STANDARD_MPEG2)
2646         psMtxEncContext->ui8MPEG2IntraDCPrecision = ctx->ui8MPEG2IntraDCPrecision;
2647 
2648     psMtxEncContext->b16EnableMvc = ctx->bEnableMVC;
2649     psMtxEncContext->ui16MvcViewIdx = ctx->ui16MVCViewIdx;
2650     if (ctx->eStandard == IMG_STANDARD_H264)
2651         psMtxEncContext->b16NoSequenceHeaders = ctx->bNoSequenceHeaders;
2652 
2653     {
2654         IMG_UINT16 ui16SrcYStride = 0, ui16SrcUVStride = 0;
2655         // 3 Components: Y, U, V
2656         ctx->ui16BufferStride = ps_buf->src_surface->psb_surface->stride;
2657         ui16SrcUVStride = ui16SrcYStride = ctx->ui16BufferStride;
2658         ctx->ui16BufferHeight = ctx->ui16FrameHeight;
2659         switch (ctx->eFormat) {
2660         case IMG_CODEC_YUV:
2661         case IMG_CODEC_PL8:
2662         case IMG_CODEC_YV12:
2663             ui16SrcUVStride = ui16SrcYStride / 2;
2664             break;
2665 
2666         case IMG_CODEC_PL12:            // Interleaved chroma pixels
2667         case IMG_CODEC_IMC2:            // Interleaved chroma rows
2668         case IMG_CODEC_422_YUV:         // Odd-numbered chroma rows unused
2669         case IMG_CODEC_422_YV12:        // Odd-numbered chroma rows unused
2670         case IMG_CODEC_422_PL8:         // Odd-numbered chroma rows unused
2671         case IMG_CODEC_Y0UY1V_8888: // Interleaved luma and chroma pixels
2672         case IMG_CODEC_Y0VY1U_8888: // Interleaved luma and chroma pixels
2673         case IMG_CODEC_UY0VY1_8888: // Interleaved luma and chroma pixels
2674         case IMG_CODEC_VY0UY1_8888: // Interleaved luma and chroma pixels
2675             ui16SrcUVStride = ui16SrcYStride;
2676             break;
2677 
2678         case IMG_CODEC_422_IMC2:        // Interleaved chroma pixels and unused odd-numbered chroma rows
2679         case IMG_CODEC_422_PL12:        // Interleaved chroma rows and unused odd-numbered chroma rows
2680             ui16SrcUVStride = ui16SrcYStride * 2;
2681             break;
2682 
2683         default:
2684             break;
2685         }
2686 
2687         if ((ctx->bIsInterlaced) && (ctx->bIsInterleaved)) {
2688             ui16SrcYStride *= 2;                    // ui16SrcYStride
2689             ui16SrcUVStride *= 2;           // ui16SrcUStride
2690         }
2691 
2692         psMtxEncContext->ui32PicRowStride = F_ENCODE(ui16SrcYStride >> 6, TOPAZHP_CR_CUR_PIC_LUMA_STRIDE) |
2693                                             F_ENCODE(ui16SrcUVStride >> 6, TOPAZHP_CR_CUR_PIC_CHROMA_STRIDE);
2694     }
2695 
2696     psMtxEncContext->eRCMode = ctx->sRCParams.eRCMode;
2697     psMtxEncContext->b8DisableBitStuffing = ctx->sRCParams.bDisableBitStuffing;
2698     psMtxEncContext->b8FirstPic = IMG_TRUE;
2699 
2700     /*Contents Adaptive Rate Control Parameters*/
2701     psMtxEncContext->bCARC          =  ctx->sCARCParams.bCARC;
2702     psMtxEncContext->iCARCBaseline  =  ctx->sCARCParams.i32CARCBaseline;
2703     psMtxEncContext->uCARCThreshold =  ctx->sCARCParams.ui32CARCThreshold;
2704     psMtxEncContext->uCARCCutoff    =  ctx->sCARCParams.ui32CARCCutoff;
2705     psMtxEncContext->uCARCNegRange  =  ctx->sCARCParams.ui32CARCNegRange;
2706     psMtxEncContext->uCARCNegScale  =  ctx->sCARCParams.ui32CARCNegScale;
2707     psMtxEncContext->uCARCPosRange  =  ctx->sCARCParams.ui32CARCPosRange;
2708     psMtxEncContext->uCARCPosScale  =  ctx->sCARCParams.ui32CARCPosScale;
2709     psMtxEncContext->uCARCShift     =  ctx->sCARCParams.ui32CARCShift;
2710     psMtxEncContext->ui32MVClip_Config =  F_ENCODE(ctx->bNoOffscreenMv, TOPAZHP_CR_MVCALC_RESTRICT_PICTURE);
2711     psMtxEncContext->ui32LRITC_Tile_Use_Config = 0;
2712     psMtxEncContext->ui32LRITC_Cache_Chunk_Config = 0;
2713 
2714     psMtxEncContext->ui32IPCM_0_Config = F_ENCODE(ctx->ui32CabacBinFlex, TOPAZ_VLC_CR_CABAC_BIN_FLEX) |
2715         F_ENCODE(DEFAULT_CABAC_DB_MARGIN, TOPAZ_VLC_CR_CABAC_DB_MARGIN);
2716 
2717     psMtxEncContext->ui32IPCM_1_Config = F_ENCODE(3200, TOPAZ_VLC_CR_IPCM_THRESHOLD) |
2718         F_ENCODE(ctx->ui32CabacBinLimit, TOPAZ_VLC_CR_CABAC_BIN_LIMIT);
2719 
2720     // leave alone until high profile and constrained modes are defined.
2721     psMtxEncContext->ui32H264CompControl  = F_ENCODE((ctx->bCabacEnabled ? 0 : 1), TOPAZHP_CR_H264COMP_8X8_CAVLC);
2722 
2723     psMtxEncContext->ui32H264CompControl |= F_ENCODE(ctx->bUseDefaultScalingList ? 1 : 0, TOPAZHP_CR_H264COMP_DEFAULT_SCALING_LIST);
2724 
2725     psMtxEncContext->ui32H264CompControl |= F_ENCODE(ctx->bH2648x8Transform ? 1 : 0, TOPAZHP_CR_H264COMP_8X8_TRANSFORM);
2726 
2727     psMtxEncContext->ui32H264CompControl |= F_ENCODE(ctx->bH264IntraConstrained ? 1 : 0, TOPAZHP_CR_H264COMP_CONSTRAINED_INTRA);
2728 
2729 
2730 #ifndef EXCLUDE_ADAPTIVE_ROUNDING
2731     psMtxEncContext->bMCAdaptiveRoundingDisable = ctx->bVPAdaptiveRoundingDisable;
2732     psMtxEncContext->ui32H264CompControl |= F_ENCODE(psMtxEncContext->bMCAdaptiveRoundingDisable ? 0 : 1, TOPAZHP_CR_H264COMP_ADAPT_ROUND_ENABLE);
2733 
2734     if (!psMtxEncContext->bMCAdaptiveRoundingDisable)
2735         for (i = 0; i < 4; i++)
2736             for (j = 0; j < 18; j++)
2737                 psMtxEncContext->ui16MCAdaptiveRoundingOffsets[j][i] = H264_ROUNDING_OFFSETS[j][i];
2738 #endif
2739 
2740     if ((ctx->eStandard == IMG_STANDARD_H264) && (ctx->ui32CoreRev >= MIN_34_REV)) {
2741         psMtxEncContext->ui32H264CompControl |= F_ENCODE(USE_VCM_HW_SUPPORT, TOPAZHP_CR_H264COMP_VIDEO_CONF_ENABLE);
2742     }
2743 
2744     psMtxEncContext->ui32H264CompControl |=
2745            F_ENCODE(ctx->ui16UseCustomScalingLists & 0x01 ? 1 : 0, TOPAZHP_CR_H264COMP_CUSTOM_QUANT_4X4_INTRA_LUMA_ENABLE)
2746         | F_ENCODE(ctx->ui16UseCustomScalingLists & 0x02 ? 1 : 0, TOPAZHP_CR_H264COMP_CUSTOM_QUANT_4X4_INTRA_CB_ENABLE)
2747         | F_ENCODE(ctx->ui16UseCustomScalingLists & 0x04 ? 1 : 0, TOPAZHP_CR_H264COMP_CUSTOM_QUANT_4X4_INTRA_CR_ENABLE)
2748         | F_ENCODE(ctx->ui16UseCustomScalingLists & 0x08 ? 1 : 0, TOPAZHP_CR_H264COMP_CUSTOM_QUANT_4X4_INTER_LUMA_ENABLE)
2749         | F_ENCODE(ctx->ui16UseCustomScalingLists & 0x10 ? 1 : 0, TOPAZHP_CR_H264COMP_CUSTOM_QUANT_4X4_INTER_CB_ENABLE)
2750         | F_ENCODE(ctx->ui16UseCustomScalingLists & 0x20 ? 1 : 0, TOPAZHP_CR_H264COMP_CUSTOM_QUANT_4X4_INTER_CR_ENABLE)
2751         | F_ENCODE(ctx->ui16UseCustomScalingLists & 0x40 ? 1 : 0, TOPAZHP_CR_H264COMP_CUSTOM_QUANT_8X8_INTRA_LUMA_ENABLE)
2752         | F_ENCODE(ctx->ui16UseCustomScalingLists & 0x80 ? 1 : 0, TOPAZHP_CR_H264COMP_CUSTOM_QUANT_8X8_INTER_LUMA_ENABLE);
2753 
2754     psMtxEncContext->ui32H264CompControl |=
2755            F_ENCODE(ctx->bEnableLossless ? 1 : 0, INTEL_H264_LL)
2756         | F_ENCODE(ctx->bLossless8x8Prefilter ? 1 : 0, INTEL_H264_LL8X8P);
2757 
2758     psMtxEncContext->ui32H264CompIntraPredModes = 0x3ffff;// leave at default for now.
2759     psMtxEncContext->ui32PredCombControl = ctx->ui32PredCombControl;
2760     psMtxEncContext->ui32SkipCodedInterIntra = F_ENCODE(ctx->ui8InterIntraIndex, TOPAZHP_CR_INTER_INTRA_SCALE_IDX)
2761         |F_ENCODE(ctx->ui8CodedSkippedIndex, TOPAZHP_CR_SKIPPED_CODED_SCALE_IDX);
2762 
2763     if (ctx->bEnableInpCtrl) {
2764         psMtxEncContext->ui32MBHostCtrl = F_ENCODE(ctx->bEnableHostQP, TOPAZHP_CR_MB_HOST_QP)
2765             |F_ENCODE(ctx->bEnableHostBias, TOPAZHP_CR_MB_HOST_SKIPPED_CODED_SCALE)
2766             |F_ENCODE(ctx->bEnableHostBias, TOPAZHP_CR_MB_HOST_INTER_INTRA_SCALE);
2767         psMtxEncContext->ui32PredCombControl |= F_ENCODE(1, TOPAZHP_CR_INTER_INTRA_SCALE_ENABLE)
2768             |F_ENCODE(1, TOPAZHP_CR_SKIPPED_CODED_SCALE_ENABLE);
2769     }
2770 
2771     if (ctx->bEnableCumulativeBiases)
2772         psMtxEncContext->ui32PredCombControl |= F_ENCODE(1, TOPAZHP_CR_CUMULATIVE_BIASES_ENABLE);
2773 
2774     psMtxEncContext->ui32PredCombControl |=
2775         F_ENCODE((((ctx->ui8InterIntraIndex == 3) && (ctx->ui8CodedSkippedIndex == 3)) ? 0 : 1), TOPAZHP_CR_INTER_INTRA_SCALE_ENABLE) |
2776         F_ENCODE((ctx->ui8CodedSkippedIndex == 3 ? 0 : 1), TOPAZHP_CR_SKIPPED_CODED_SCALE_ENABLE);
2777     // workaround for BRN 33252, if the Skip coded scale is set then we also have to set the inter/inter enable. We set it enabled and rely on the default value of 3 (unbiased) to keep things behaving.
2778     //      psMtxEncContext->ui32PredCombControl |= F_ENCODE((ctx->ui8InterIntraIndex==3?0:1), TOPAZHP_CR_INTER_INTRA_SCALE_ENABLE) | F_ENCODE((ctx->ui8CodedSkippedIndex==3?0:1), TOPAZHP_CR_SKIPPED_CODED_SCALE_ENABLE);
2779     //psMtxEncContext->ui32PredCombControl |= F_ENCODE(1, TOPAZHP_CR_INTER_INTRA_SCALE_ENABLE) | F_ENCODE(1, TOPAZHP_CR_SKIPPED_CODED_SCALE_ENABLE);
2780     psMtxEncContext->ui32DeblockCtrl = F_ENCODE(ctx->ui8DeblockIDC, TOPAZ_DB_CR_DISABLE_DEBLOCK_IDC);
2781     psMtxEncContext->ui32VLCControl = 0;
2782 
2783     switch (ctx->eStandard) {
2784     case IMG_STANDARD_H264:
2785         psMtxEncContext->ui32VLCControl |= F_ENCODE(1, TOPAZ_VLC_CR_CODEC); // 1 for H.264 note this is inconsistant with the sequencer value
2786         psMtxEncContext->ui32VLCControl |= F_ENCODE(0, TOPAZ_VLC_CR_CODEC_EXTEND);
2787 
2788         break;
2789     case IMG_STANDARD_H263:
2790         psMtxEncContext->ui32VLCControl |= F_ENCODE(3, TOPAZ_VLC_CR_CODEC); // 3 for H.263 note this is inconsistant with the sequencer value
2791         psMtxEncContext->ui32VLCControl |= F_ENCODE(0, TOPAZ_VLC_CR_CODEC_EXTEND);
2792 
2793         break;
2794     case IMG_STANDARD_MPEG4:
2795         psMtxEncContext->ui32VLCControl |= F_ENCODE(2, TOPAZ_VLC_CR_CODEC); // 2 for Mpeg4 note this is inconsistant with the sequencer value
2796         psMtxEncContext->ui32VLCControl |= F_ENCODE(0, TOPAZ_VLC_CR_CODEC_EXTEND);
2797         break;
2798     case IMG_STANDARD_MPEG2:
2799         psMtxEncContext->ui32VLCControl |= F_ENCODE(0, TOPAZ_VLC_CR_CODEC);
2800         psMtxEncContext->ui32VLCControl |= F_ENCODE(1, TOPAZ_VLC_CR_CODEC_EXTEND);
2801         break;
2802     default:
2803         break;
2804     }
2805 
2806     if (ctx->bCabacEnabled) {
2807         psMtxEncContext->ui32VLCControl |= F_ENCODE(1, TOPAZ_VLC_CR_CABAC_ENABLE); // 2 for Mpeg4 note this is inconsistant with the sequencer value
2808     }
2809 
2810     psMtxEncContext->ui32VLCControl |= F_ENCODE(ctx->bIsInterlaced ? 1 : 0, TOPAZ_VLC_CR_VLC_FIELD_CODED);
2811     psMtxEncContext->ui32VLCControl |= F_ENCODE(ctx->bH2648x8Transform ? 1 : 0, TOPAZ_VLC_CR_VLC_8X8_TRANSFORM);
2812     psMtxEncContext->ui32VLCControl |= F_ENCODE(ctx->bH264IntraConstrained ? 1 : 0, TOPAZ_VLC_CR_VLC_CONSTRAINED_INTRA);
2813 
2814     psMtxEncContext->ui32VLCSliceControl = F_ENCODE(ctx->sRCParams.ui32SliceByteLimit, TOPAZ_VLC_CR_SLICE_SIZE_LIMIT);
2815     psMtxEncContext->ui32VLCSliceMBControl = F_ENCODE(ctx->sRCParams.ui32SliceMBLimit, TOPAZ_VLC_CR_SLICE_MBS_LIMIT);
2816 
2817         switch (ctx->eStandard) {
2818             case IMG_STANDARD_H264: {
2819                 IMG_UINT32 ui32VertMVLimit = 255; // default to no clipping
2820                 if (ctx->ui32VertMVLimit)
2821                     ui32VertMVLimit = ctx->ui32VertMVLimit;
2822                 // as topaz can only cope with at most 255 (in the register field)
2823                 ui32VertMVLimit = tng__min(255,ui32VertMVLimit);
2824                 // workaround for BRN 29973 and 30032
2825                 {
2826 #if defined(BRN_29973) || defined(BRN_30032)
2827                     if (ctx->ui32CoreRev <= 0x30006) {
2828                         if ((ctx->ui16Width / 16) & 1) // BRN 30032, if odd number of macroblocks we need to limit vector to +-112
2829                             psMtxEncContext->ui32IPEVectorClipping = F_ENCODE(1, TOPAZHP_CR_IPE_VECTOR_CLIPPING_ENABLED)
2830                                 |F_ENCODE(112, TOPAZHP_CR_IPE_VECTOR_CLIPPING_X)
2831                                 |F_ENCODE(ui32VertMVLimit, TOPAZHP_CR_IPE_VECTOR_CLIPPING_Y);
2832                         else // for 29973 we need to limit vector to +-120
2833                             if (ctx->ui16Width >= 1920)
2834                                 psMtxEncContext->ui32IPEVectorClipping = F_ENCODE(1, TOPAZHP_CR_IPE_VECTOR_CLIPPING_ENABLED)
2835                                 |F_ENCODE(120, TOPAZHP_CR_IPE_VECTOR_CLIPPING_X)
2836                                 |F_ENCODE(ui32VertMVLimit, TOPAZHP_CR_IPE_VECTOR_CLIPPING_Y);
2837                             else
2838                                 psMtxEncContext->ui32IPEVectorClipping = F_ENCODE(1, TOPAZHP_CR_IPE_VECTOR_CLIPPING_ENABLED)
2839                                 |F_ENCODE(255, TOPAZHP_CR_IPE_VECTOR_CLIPPING_X)
2840                                 |F_ENCODE(ui32VertMVLimit, TOPAZHP_CR_IPE_VECTOR_CLIPPING_Y);
2841                     } else
2842 #endif
2843                         {
2844                             psMtxEncContext->ui32IPEVectorClipping =
2845                             F_ENCODE(1, TOPAZHP_CR_IPE_VECTOR_CLIPPING_ENABLED) |
2846                             F_ENCODE(255, TOPAZHP_CR_IPE_VECTOR_CLIPPING_X) |
2847                             F_ENCODE(ui32VertMVLimit, TOPAZHP_CR_IPE_VECTOR_CLIPPING_Y);
2848                         }
2849                     }
2850                     psMtxEncContext->ui32SPEMvdClipRange = F_ENCODE(0, TOPAZHP_CR_SPE_MVD_CLIP_ENABLE);
2851             }
2852             break;
2853             case IMG_STANDARD_H263:
2854                 {
2855                     psMtxEncContext->ui32IPEVectorClipping = F_ENCODE(1, TOPAZHP_CR_IPE_VECTOR_CLIPPING_ENABLED)
2856                         | F_ENCODE(16 - 1, TOPAZHP_CR_IPE_VECTOR_CLIPPING_X)
2857                         | F_ENCODE(16 - 1, TOPAZHP_CR_IPE_VECTOR_CLIPPING_Y);
2858 
2859                     psMtxEncContext->ui32SPEMvdClipRange = F_ENCODE(1, TOPAZHP_CR_SPE_MVD_CLIP_ENABLE)
2860                         | F_ENCODE( 62, TOPAZHP_CR_SPE_MVD_POS_CLIP)
2861                         | F_ENCODE((uint32_t)(-64), TOPAZHP_CR_SPE_MVD_NEG_CLIP);
2862                 }
2863                 break;
2864             case IMG_STANDARD_MPEG4:
2865             case IMG_STANDARD_MPEG2:
2866                 {
2867                     IMG_UINT8 uX, uY, uResidualSize;
2868                     //The maximum MPEG4 and MPEG2 motion vector differential in 1/2 pixels is
2869                     //calculated as 1 << (fcode - 1) * 32 or *16 in MPEG2
2870 
2871                     uResidualSize=(ctx->eStandard == IMG_STANDARD_MPEG4 ? 32 : 16);
2872 
2873                     uX = tng__min(128 - 1, (((1<<(ctx->sBiasTables.ui32FCode - 1)) * uResidualSize)/4) - 1);
2874                     uY = tng__min(104 - 1, (((1<<(ctx->sBiasTables.ui32FCode - 1)) * uResidualSize)/4) - 1);
2875 
2876                     //Write to register
2877                     psMtxEncContext->ui32IPEVectorClipping = F_ENCODE(1, TOPAZHP_CR_IPE_VECTOR_CLIPPING_ENABLED)
2878                         | F_ENCODE(uX, TOPAZHP_CR_IPE_VECTOR_CLIPPING_X)
2879                         | F_ENCODE(uY, TOPAZHP_CR_IPE_VECTOR_CLIPPING_Y);
2880 
2881                     psMtxEncContext->ui32SPEMvdClipRange = F_ENCODE(0, TOPAZHP_CR_SPE_MVD_CLIP_ENABLE);
2882                 }
2883                 break;
2884             case IMG_STANDARD_JPEG:
2885 			case IMG_STANDARD_NONE:
2886 			default:
2887 			    break;
2888         }
2889 #ifdef FIRMWARE_BIAS
2890     //copy the bias tables
2891     {
2892         int n;
2893         for (n = 52; n >= 0; n -= 2)    {
2894             psMtxEncContext->aui32DirectBias_P[n >> 1] = ctx->sBiasTables.aui32DirectBias_P[n];
2895             psMtxEncContext->aui32InterBias_P[n >> 1] = ctx->sBiasTables.aui32InterBias_P[n];
2896             psMtxEncContext->aui32DirectBias_B[n >> 1] = ctx->sBiasTables.aui32DirectBias_B[n];
2897             psMtxEncContext->aui32InterBias_B[n >> 1] = ctx->sBiasTables.aui32InterBias_B[n];
2898         }
2899     }
2900 #endif
2901 
2902     //copy the scale-tables
2903     tng__generate_scale_tables(psMtxEncContext);
2904 //      memcpy(psMtxEncContext->ui32InterIntraScale, ctx->ui32InterIntraScale, sizeof(IMG_UINT32)*SCALE_TBL_SZ);
2905 //      memcpy(psMtxEncContext->ui32SkippedCodedScale, ctx->ui32SkippedCodedScale, sizeof(IMG_UINT32)*SCALE_TBL_SZ);
2906 
2907     // WEIGHTED PREDICTION
2908     psMtxEncContext->b8WeightedPredictionEnabled = ctx->bWeightedPrediction;
2909     psMtxEncContext->ui8MTXWeightedImplicitBiPred = ctx->ui8VPWeightedImplicitBiPred;
2910 
2911     // SEI_INSERTION
2912     psMtxEncContext->b8InsertHRDparams = ctx->bInsertHRDParams;
2913     if (psMtxEncContext->b8InsertHRDparams & !ctx->sRCParams.ui32BitsPerSecond) {   //ctx->uBitRate
2914         /* HRD parameters are meaningless without a bitrate */
2915         psMtxEncContext->b8InsertHRDparams = IMG_FALSE;
2916     }
2917     if (psMtxEncContext->b8InsertHRDparams) {
2918         psMtxEncContext->ui64ClockDivBitrate = (90000 * 0x100000000LL);
2919         psMtxEncContext->ui64ClockDivBitrate /= ctx->sRCParams.ui32BitsPerSecond;                       //ctx->uBitRate;
2920         psMtxEncContext->ui32MaxBufferMultClockDivBitrate = (IMG_UINT32)(((IMG_UINT64)(ctx->sRCParams.ui32BufferSize) *
2921                 (IMG_UINT64) 90000) / (IMG_UINT64) ctx->sRCParams.ui32BitsPerSecond);
2922     }
2923 
2924     memcpy(&psMtxEncContext->sInParams, &ctx->sPicParams.sInParams, sizeof(IN_RC_PARAMS));
2925     // Update MV Scaling settings
2926     // IDR
2927     //      memcpy(&psMtxEncContext->sMVSettingsIdr, &ctx->sMVSettingsIdr, sizeof(IMG_MV_SETTINGS));
2928     // NonB (I or P)
2929     //      for (i = 0; i <= MAX_BFRAMES; i++)
2930     //              memcpy(&psMtxEncContext->sMVSettingsNonB[i], &ctx->sMVSettingsNonB[i], sizeof(IMG_MV_SETTINGS));
2931 
2932     psMtxEncContext->ui32LRITC_Cache_Chunk_Config =
2933         F_ENCODE(ctx->uChunksPerMb, INTEL_CH_PM) |
2934         F_ENCODE(ctx->uMaxChunks, INTEL_CH_MX) |
2935         F_ENCODE(ctx->uMaxChunks - ctx->uPriorityChunks, INTEL_CH_PY);
2936 
2937 
2938     //they would be set in function tng__prepare_templates()
2939     psMtxEncContext->ui32FirstPicFlags = ctx->ui32FirstPicFlags;
2940     psMtxEncContext->ui32NonFirstPicFlags = ctx->ui32NonFirstPicFlags;
2941 
2942 #ifdef LTREFHEADER
2943     psMtxEncContext->i8SliceHeaderSlotNum = -1;
2944 #endif
2945 
2946     {
2947         memset(psMtxEncContext->aui8PicOnLevel, 0, sizeof(psMtxEncContext->aui8PicOnLevel));
2948         psb_buffer_map(&(ps_mem->bufs_flat_gop), &(ps_mem->bufs_flat_gop.virtual_addr));
2949         if (ps_mem->bufs_flat_gop.virtual_addr == NULL) {
2950            drv_debug_msg(VIDEO_DEBUG_ERROR, "%s error: mapping flat gop\n", __FUNCTION__);
2951            return ;
2952         }
2953         tng__minigop_generate_flat(ps_mem->bufs_flat_gop.virtual_addr, psMtxEncContext->ui32BFrameCount,
2954             psMtxEncContext->ui8RefSpacing, psMtxEncContext->aui8PicOnLevel);
2955         psb_buffer_unmap(&(ps_mem->bufs_flat_gop));
2956 
2957         if (ctx->sRCParams.b16Hierarchical) {
2958             memset(psMtxEncContext->aui8PicOnLevel, 0, sizeof(psMtxEncContext->aui8PicOnLevel));
2959             psb_buffer_map(&(ps_mem->bufs_hierar_gop), &(ps_mem->bufs_hierar_gop.virtual_addr));
2960             if (ps_mem->bufs_hierar_gop.virtual_addr == NULL) {
2961                 drv_debug_msg(VIDEO_DEBUG_ERROR, "%s error: mapping sei header\n", __FUNCTION__);
2962                 return ;
2963             }
2964             tng_minigop_generate_hierarchical(ps_mem->bufs_hierar_gop.virtual_addr, psMtxEncContext->ui32BFrameCount,
2965                 psMtxEncContext->ui8RefSpacing, psMtxEncContext->aui8PicOnLevel);
2966             psb_buffer_unmap(&(ps_mem->bufs_hierar_gop));
2967         }
2968     }
2969 
2970 #if INPUT_SCALER_SUPPORTED
2971     if (ctx->bEnableScaler) {
2972         IMG_UINT8 sccCoeffs[4][16];
2973         IMG_UINT32 ui32PitchX, ui32PitchY;
2974         IMG_INT32 i32Phase, i32Tap;
2975 
2976         ui32PitchX = (((IMG_UINT32)(psVideoParams->ui16SourceWidth - psVideoParams->ui8CropLeft - psVideoParams->ui8CropRight)) << 12) / psVideoParams->ui16Width;
2977         ui32PitchY = (((IMG_UINT32)(psVideoParams->ui16SourceFrameHeight - psVideoParams->ui8CropTop - psVideoParams->ui8CropBottom)) << 12) / psVideoParams->ui16FrameHeight;
2978 
2979         // Input size
2980         psMtxEncContext->ui32ScalerInputSizeReg = F_ENCODE(psVideoParams->ui16SourceWidth - 1, TOPAZHP_EXT_CR_SCALER_INPUT_WIDTH_MIN1) |
2981             F_ENCODE((psVideoParams->ui16SourceFrameHeight >> (psVideo->bIsInterlaced ? 1 : 0)) - 1, TOPAZHP_EXT_CR_SCALER_INPUT_HEIGHT_MIN1);
2982 
2983         psMtxEncContext->ui32ScalerCropReg = F_ENCODE(psVideoParams->ui8CropLeft, TOPAZHP_EXT_CR_SCALER_INPUT_CROP_HOR) |
2984             F_ENCODE(psVideoParams->ui8CropTop, TOPAZHP_EXT_CR_SCALER_INPUT_CROP_VER);
2985 
2986         // Scale factors
2987         psMtxEncContext->ui32ScalerPitchReg = 0;
2988 
2989         if (ui32PitchX > 0x3FFF) {
2990             psMtxEncContext->ui32ScalerPitchReg |= F_ENCODE(1, TOPAZHP_EXT_CR_SCALER_HOR_BILINEAR_FILTER);
2991             ui32PitchX >>= 1;
2992         }
2993 
2994         if (ui32PitchX > 0x3FFF) {
2995             ui32PitchX = 0x3FFF;
2996         }
2997 
2998         if (ui32PitchY > 0x3FFF) {
2999             psMtxEncContext->ui32ScalerPitchReg |= F_ENCODE(1, TOPAZHP_EXT_CR_SCALER_VER_BILINEAR_FILTER);
3000             ui32PitchY >>= 1;
3001         }
3002 
3003         if (ui32PitchY > 0x3FFF) {
3004             ui32PitchY = 0x3FFF;
3005         }
3006 
3007         psMtxEncContext->ui32ScalerPitchReg |= F_ENCODE(ui32PitchX, TOPAZHP_EXT_CR_SCALER_INPUT_HOR_PITCH) |
3008             F_ENCODE(ui32PitchY, TOPAZHP_EXT_CR_SCALER_INPUT_VER_PITCH);
3009 
3010 
3011         // Coefficients
3012         VIDEO_CalcCoefs_FromPitch(((IMG_FLOAT)ui32PitchX) / 4096.0f, sccCoeffs);
3013 
3014         for (i32Phase = 0; i32Phase < 4; i32Phase++) {
3015             psMtxEncContext->asHorScalerCoeffRegs[i32Phase] = 0;
3016             for (i32Tap = 0; i32Tap < 4; i32Tap++) 	{
3017                 psMtxEncContext->asHorScalerCoeffRegs[i32Phase] |= F_ENCODE(sccCoeffs[3 - i32Tap][(i32Phase * 2) + 1], TOPAZHP_EXT_CR_SCALER_HOR_LUMA_COEFF(i32Tap));
3018             }
3019         }
3020 
3021         VIDEO_CalcCoefs_FromPitch(((IMG_FLOAT)ui32PitchY) / 4096.0f, sccCoeffs);
3022 
3023         for (i32Phase = 0; i32Phase < 4; i32Phase++) {
3024             psMtxEncContext->asVerScalerCoeffRegs[i32Phase] = 0;
3025             for (i32Tap = 0; i32Tap < 4; i32Tap++) {
3026                 psMtxEncContext->asVerScalerCoeffRegs[i32Phase] |= F_ENCODE(sccCoeffs[3 - i32Tap][(i32Phase * 2) + 1], TOPAZHP_EXT_CR_SCALER_VER_LUMA_COEFF(i32Tap));
3027             }
3028         }
3029     } else {
3030         // Disable scaling
3031         psMtxEncContext->ui32ScalerInputSizeReg = 0;
3032     }
3033 #endif // INPUT_SCALER_SUPPORTED
3034 
3035     psb_buffer_unmap(&(ps_mem->bufs_mtx_context));
3036 
3037     return ;
3038 }
3039 
tng__setvideo_cmdbuf(context_ENC_p ctx,IMG_UINT32 ui32StreamIndex)3040 static void tng__setvideo_cmdbuf(context_ENC_p ctx, IMG_UINT32 ui32StreamIndex)
3041 {
3042     context_ENC_mem *ps_mem = &(ctx->ctx_mem[ui32StreamIndex]);
3043     context_ENC_mem_size *ps_mem_size = &(ctx->ctx_mem_size);
3044 #ifndef _TNG_FRAMES_
3045     context_ENC_frame_buf *ps_buf = &(ctx->ctx_frame_buf);
3046 #endif
3047     IMG_MTX_VIDEO_CONTEXT* psMtxEncContext = NULL;
3048     IMG_INT32 i;
3049 
3050     psb_buffer_map(&(ps_mem->bufs_mtx_context), &(ps_mem->bufs_mtx_context.virtual_addr));
3051     if (ps_mem->bufs_mtx_context.virtual_addr == NULL) {
3052         drv_debug_msg(VIDEO_DEBUG_ERROR, "%s error: mapping sei header\n", __FUNCTION__);
3053         return ;
3054     }
3055     psMtxEncContext = (IMG_MTX_VIDEO_CONTEXT*)(ps_mem->bufs_mtx_context.virtual_addr);
3056 
3057     tng_cmdbuf_set_phys(&(psMtxEncContext->ui32MVSettingsBTable), 0,
3058         &(ps_mem->bufs_mv_setting_btable), 0, 0);
3059     if (ctx->sRCParams.b16Hierarchical)
3060         tng_cmdbuf_set_phys(&psMtxEncContext->ui32MVSettingsHierarchical, 0,
3061             &(ps_mem->bufs_mv_setting_hierar), 0, 0);
3062 #ifdef _TNG_FRAMES_
3063     tng_cmdbuf_set_phys(psMtxEncContext->apReconstructured, ctx->i32PicNodes,
3064         &(ps_mem->bufs_recon_pictures), 0, ps_mem_size->recon_pictures);
3065 #else
3066     for (i = 0; i < ctx->i32PicNodes; i++) {
3067         tng_cmdbuf_set_phys(&(psMtxEncContext->apReconstructured[i]), 0,
3068             &(ps_buf->ref_surface[i]->psb_surface->buf), 0, 0);
3069     }
3070 #endif
3071 
3072     tng_cmdbuf_set_phys(psMtxEncContext->apColocated, ctx->i32PicNodes,
3073         &(ps_mem->bufs_colocated), 0, ps_mem_size->colocated);
3074 
3075     tng_cmdbuf_set_phys(psMtxEncContext->apMV, ctx->i32MVStores,
3076         &(ps_mem->bufs_mv), 0, ps_mem_size->mv);
3077 
3078     if (ctx->bEnableMVC) {
3079         tng_cmdbuf_set_phys(psMtxEncContext->apInterViewMV, 2,
3080             &(ps_mem->bufs_interview_mv), 0, ps_mem_size->interview_mv);
3081     }
3082 
3083     tng_cmdbuf_set_phys(psMtxEncContext->apWritebackRegions, WB_FIFO_SIZE,
3084         &(ctx->bufs_writeback), 0, ps_mem_size->writeback);
3085 
3086     tng_cmdbuf_set_phys(psMtxEncContext->apAboveParams, (IMG_UINT32)(ctx->ui8PipesToUse),
3087         &(ps_mem->bufs_above_params), 0, ps_mem_size->above_params);
3088 
3089     // SEI_INSERTION
3090     if (ctx->bInsertHRDParams) {
3091         tng_cmdbuf_set_phys(&psMtxEncContext->pSEIBufferingPeriodTemplate, 0,
3092             &(ps_mem->bufs_sei_header), ps_mem_size->sei_header, ps_mem_size->sei_header);
3093         tng_cmdbuf_set_phys(&psMtxEncContext->pSEIPictureTimingTemplate, 0,
3094             &(ps_mem->bufs_sei_header), ps_mem_size->sei_header * 2, ps_mem_size->sei_header);
3095     }
3096 
3097     tng_cmdbuf_set_phys(psMtxEncContext->apSliceParamsTemplates, NUM_SLICE_TYPES,
3098         &(ps_mem->bufs_slice_template), 0, ps_mem_size->slice_template);
3099 
3100     tng_cmdbuf_set_phys(psMtxEncContext->aui32SliceMap, ctx->ui8SlotsInUse,
3101         &(ps_mem->bufs_slice_map), 0, ps_mem_size->slice_map);
3102 
3103     // WEIGHTED PREDICTION
3104     if (ctx->bWeightedPrediction || (ctx->ui8VPWeightedImplicitBiPred == WBI_EXPLICIT)) {
3105         tng_cmdbuf_set_phys(psMtxEncContext->aui32WeightedPredictionVirtAddr, ctx->ui8SlotsInUse,
3106             &(ps_mem->bufs_weighted_prediction), 0, ps_mem_size->weighted_prediction);
3107     }
3108 
3109     tng_cmdbuf_set_phys(&psMtxEncContext->ui32FlatGopStruct, 0, &(ps_mem->bufs_flat_gop), 0, 0);
3110     if (psMtxEncContext->b8Hierarchical)
3111         tng_cmdbuf_set_phys(&psMtxEncContext->ui32HierarGopStruct, 0, &(ps_mem->bufs_hierar_gop), 0, 0);
3112 
3113 #ifdef LTREFHEADER
3114     tng_cmdbuf_set_phys(psMtxEncContext->aui32LTRefHeader, ctx->ui8SlotsInUse,
3115         &(ps_mem->bufs_lt_ref_header), 0, ps_mem_size->lt_ref_header);
3116 #endif
3117 
3118     tng_cmdbuf_set_phys(psMtxEncContext->apPicHdrTemplates, 4,
3119         &(ps_mem->bufs_pic_template), 0, ps_mem_size->pic_template);
3120 
3121     if (ctx->eStandard == IMG_STANDARD_H264) {
3122         tng_cmdbuf_set_phys(&(psMtxEncContext->apSeqHeader), 0,
3123             &(ps_mem->bufs_seq_header), 0, ps_mem_size->seq_header);
3124         if (ctx->bEnableMVC)
3125             tng_cmdbuf_set_phys(&(psMtxEncContext->apSubSetSeqHeader), 0,
3126                 &(ps_mem->bufs_sub_seq_header), 0, ps_mem_size->seq_header);
3127     }
3128 
3129     if (ctx->ui8EnableSelStatsFlags & ESF_FIRST_STAGE_STATS) {
3130         tng_cmdbuf_set_phys(psMtxEncContext->pFirstPassOutParamAddr, ctx->ui8SlotsInUse,
3131             &(ps_mem->bufs_first_pass_out_params), 0, ps_mem_size->first_pass_out_params);
3132     }
3133 
3134 #ifndef EXCLUDE_BEST_MP_DECISION_DATA
3135     // Store the feedback memory address for all "5" slots in the context
3136     if (ctx->ui8EnableSelStatsFlags & ESF_MP_BEST_MB_DECISION_STATS
3137         || ctx->ui8EnableSelStatsFlags & ESF_MP_BEST_MOTION_VECTOR_STATS) {
3138         tng_cmdbuf_set_phys(psMtxEncContext->pFirstPassOutBestMultipassParamAddr, ctx->ui8SlotsInUse,
3139             &(ps_mem->bufs_first_pass_out_best_multipass_param), 0, ps_mem_size->first_pass_out_best_multipass_param);
3140     }
3141 #endif
3142 
3143     //Store the MB-Input control parameter memory for all the 5-slots in the context
3144     if (ctx->bEnableInpCtrl) {
3145         tng_cmdbuf_set_phys(psMtxEncContext->pMBCtrlInParamsAddr, ctx->ui8SlotsInUse,
3146             &(ps_mem->bufs_mb_ctrl_in_params), 0, ps_mem_size->mb_ctrl_in_params);
3147     }
3148 
3149     psb_buffer_unmap(&(ps_mem->bufs_mtx_context));
3150 
3151     drv_debug_msg(VIDEO_DEBUG_GENERAL, "%s end\n", __FUNCTION__);
3152 
3153     return ;
3154 }
3155 
tng__validate_params(context_ENC_p ctx)3156 static VAStatus tng__validate_params(context_ENC_p ctx)
3157 {
3158     VAStatus vaStatus = VA_STATUS_SUCCESS;
3159     IMG_UINT16 ui16WidthInMbs = (ctx->ui16Width + 15) >> 4;
3160     IMG_UINT16 ui16PictureHeight = ((ctx->ui16FrameHeight >> (ctx->bIsInterlaced ? 1 : 0)) + 15) & ~15;
3161     IMG_UINT16 ui16FrameHeightInMbs = (ctx->ui16FrameHeight + 15) >> 4;
3162 
3163     if ((ctx->ui16Width & 0xf) != 0) {
3164         return VA_STATUS_ERROR_INVALID_PARAMETER;
3165     }
3166 
3167     if ((ctx->ui16FrameHeight & 0xf) != 0) {
3168         return VA_STATUS_ERROR_INVALID_PARAMETER;
3169     }
3170 
3171     ctx->uMBspS = ui16WidthInMbs * ui16FrameHeightInMbs * ctx->sRCParams.ui32FrameRate;
3172 
3173     if (ctx->ui32CoreRev >= MIN_36_REV) {
3174         if ((ctx->ui16Width > 4096) || (ctx->ui16PictureHeight > 4096)) {
3175             return VA_STATUS_ERROR_INVALID_PARAMETER;
3176         }
3177         if ((ui16WidthInMbs << 4) * ui16PictureHeight > 2048 * 2048) {
3178             return VA_STATUS_ERROR_INVALID_PARAMETER;
3179         }
3180     } else {
3181         if ((ctx->ui16Width > 2048) || (ui16PictureHeight > 2048)) {
3182             return VA_STATUS_ERROR_INVALID_PARAMETER;
3183         }
3184     }
3185 
3186     if (ctx->eStandard == IMG_STANDARD_H264) {
3187         if ((ctx->ui8DeblockIDC == 0) && (ctx->bArbitrarySO))
3188             ctx->ui8DeblockIDC = 2;
3189 
3190         if ((ctx->ui8DeblockIDC == 0) && ((IMG_UINT32)(ctx->ui8PipesToUse) > 1) && (ctx->ui8SlicesPerPicture > 1)) {
3191             drv_debug_msg(VIDEO_DEBUG_GENERAL, "WARNING: Full deblocking with multiple pipes will cause a mismatch between reconstructed and encoded video\n");
3192             drv_debug_msg(VIDEO_DEBUG_GENERAL, "Consider using -deblockIDC 2 or -deblockIDC 1 instead if matching reconstructed video is required.\n");
3193             drv_debug_msg(VIDEO_DEBUG_GENERAL, "WARNING: Forcing -deblockIDC = 2 for HW verification.\n");
3194             ctx->ui8DeblockIDC = 2;
3195         }
3196     } else if (ctx->eStandard == IMG_STANDARD_H263) {
3197 		ctx->bArbitrarySO = IMG_FALSE;
3198 		ctx->ui8DeblockIDC = 1;
3199     } else {
3200         ctx->ui8DeblockIDC = 1;
3201     }
3202 
3203     //ctx->sRCParams.ui32SliceByteLimit = 0;
3204     ctx->sRCParams.ui32SliceMBLimit = 0;
3205     //slice params
3206     if (ctx->ui8SlicesPerPicture == 0)
3207         ctx->ui8SlicesPerPicture = ctx->sCapsParams.ui16RecommendedSlices;
3208     else {
3209         if (ctx->ui8SlicesPerPicture > ctx->sCapsParams.ui16MaxSlices)
3210             ctx->ui8SlicesPerPicture = ctx->sCapsParams.ui16MaxSlices;
3211         else if (ctx->ui8SlicesPerPicture < ctx->sCapsParams.ui16MinSlices)
3212             ctx->ui8SlicesPerPicture = ctx->sCapsParams.ui16MinSlices;
3213     }
3214 
3215     if (ctx->ui32pseudo_rand_seed == UNINIT_PARAM) {
3216         // When -randseed is uninitialised, initialise seed using other commandline values
3217         ctx->ui32pseudo_rand_seed = (IMG_UINT32) ((ctx->sRCParams.ui32InitialQp +
3218             ctx->ui16PictureHeight + ctx->ui16Width + ctx->sRCParams.ui32BitsPerSecond) & 0xffffffff);
3219         // iQP_Luma + pParams->uHeight + pParams->uWidth + pParams->uBitRate) & 0xffffffff);
3220     }
3221 
3222     if (ctx->eStandard == IMG_STANDARD_H264) {
3223         ctx->ui8PipesToUse = tng__min(ctx->ui8PipesToUse, ctx->ui8SlicesPerPicture);
3224     } else {
3225         ctx->ui8PipesToUse = 1;
3226     }
3227 
3228     return vaStatus;
3229 }
3230 
tng__validate_busize(context_ENC_p ctx)3231 static VAStatus tng__validate_busize(context_ENC_p ctx)
3232 {
3233     //IMG_RC_PARAMS *psRCParams = &(ctx->sRCParams);
3234     // if no BU size is given then pick one ourselves, if doing arbitrary slice order then make BU = width in bu's
3235     // forces slice boundaries to no be mid-row
3236     if (ctx->bArbitrarySO || (ctx->ui32BasicUnit == 0)) {
3237         ctx->ui32BasicUnit = (ctx->ui16Width / 16);
3238         drv_debug_msg(VIDEO_DEBUG_GENERAL, "Patched Basic unit to %d\n", ctx->ui32BasicUnit);
3239     } else {
3240         IMG_UINT32 ui32MBs, ui32MBsperSlice, ui32MBsLastSlice;
3241         IMG_UINT32 ui32BUs;
3242         IMG_INT32  i32SliceHeight;
3243         IMG_UINT32 ui32MaxSlicesPerPipe, ui32MaxMBsPerPipe, ui32MaxBUsPerPipe;
3244 
3245         ui32MBs  = ctx->ui16PictureHeight * ctx->ui16Width / (16 * 16);
3246 
3247         i32SliceHeight = ctx->ui16PictureHeight / ctx->ui8SlicesPerPicture;
3248         i32SliceHeight &= ~15;
3249 
3250         ui32MBsperSlice = (i32SliceHeight * ctx->ui16Width) / (16 * 16);
3251         ui32MBsLastSlice = ui32MBs - (ui32MBsperSlice * (ctx->ui8SlicesPerPicture - 1));
3252 
3253         // they have given us a basic unit so validate it
3254         if (ctx->ui32BasicUnit < 6) {
3255             drv_debug_msg(VIDEO_DEBUG_GENERAL, "\nERROR: Basic unit size too small, must be greater than 6\n");
3256             return VA_STATUS_ERROR_UNKNOWN;
3257         }
3258 
3259         if (ctx->ui32BasicUnit > ui32MBsperSlice) {
3260             drv_debug_msg(VIDEO_DEBUG_GENERAL, "\nERROR: Basic unit size(%d) too large", ctx->ui32BasicUnit);
3261             drv_debug_msg(VIDEO_DEBUG_GENERAL, " must not be greater than the number of macroblocks in a slice (%d)\n", ui32MBsperSlice);
3262             return VA_STATUS_ERROR_UNKNOWN;
3263         }
3264         if (ctx->ui32BasicUnit > ui32MBsLastSlice) {
3265             drv_debug_msg(VIDEO_DEBUG_GENERAL, "\nERROR: Basic unit size(%d) too large", ctx->ui32BasicUnit);
3266             drv_debug_msg(VIDEO_DEBUG_GENERAL, " must not be greater than the number of macroblocks in a slice (%d)\n", ui32MBsLastSlice);
3267             return VA_STATUS_ERROR_UNKNOWN;
3268         }
3269 
3270         ui32BUs = ui32MBsperSlice / ctx->ui32BasicUnit;
3271         if ((ui32BUs * ctx->ui32BasicUnit) != ui32MBsperSlice) {
3272             drv_debug_msg(VIDEO_DEBUG_GENERAL, "\nERROR: Basic unit size(%d) not an integer divisor of MB's in a slice(%d)",
3273                                      ctx->ui32BasicUnit, ui32MBsperSlice);
3274             return VA_STATUS_ERROR_UNKNOWN;
3275         }
3276 
3277         ui32BUs = ui32MBsLastSlice / ctx->ui32BasicUnit;
3278         if ((ui32BUs * ctx->ui32BasicUnit) != ui32MBsLastSlice) {
3279             drv_debug_msg(VIDEO_DEBUG_GENERAL, "\nERROR: Basic unit size(%d) not an integer divisor of MB's in the last slice(%d)",
3280                                      ctx->ui32BasicUnit, ui32MBsLastSlice);
3281             return VA_STATUS_ERROR_UNKNOWN;
3282         }
3283 
3284         // check if the number of BUs per pipe is greater than 200
3285         ui32MaxSlicesPerPipe = (IMG_UINT32)(ctx->ui8SlicesPerPicture + ctx->ui8PipesToUse - 1) / (IMG_UINT32)(ctx->ui8PipesToUse);
3286         ui32MaxMBsPerPipe = (ui32MBsperSlice * (ui32MaxSlicesPerPipe - 1)) + ui32MBsLastSlice;
3287         ui32MaxBUsPerPipe = (ui32MaxMBsPerPipe + ctx->ui32BasicUnit - 1) / ctx->ui32BasicUnit;
3288         if (ui32MaxBUsPerPipe > 200) {
3289             drv_debug_msg(VIDEO_DEBUG_GENERAL, "\nERROR: Basic unit size too small. There must be less than 201 basic units per slice");
3290             return VA_STATUS_ERROR_UNKNOWN;
3291         }
3292     }
3293 
3294     ctx->sRCParams.ui32BUSize = ctx->ui32BasicUnit;
3295     return VA_STATUS_SUCCESS;
3296 }
3297 
tng__cmdbuf_new_codec(context_ENC_p ctx)3298 static VAStatus tng__cmdbuf_new_codec(context_ENC_p ctx)
3299 {
3300      VAStatus vaStatus = VA_STATUS_SUCCESS;
3301      tng_cmdbuf_p cmdbuf = ctx->obj_context->tng_cmdbuf;
3302      psb_driver_data_p driver_data = ctx->obj_context->driver_data;
3303      context_ENC_mem *ps_mem = &(ctx->ctx_mem[0]);
3304 
3305      *cmdbuf->cmd_idx++ =
3306         ((MTX_CMDID_SW_NEW_CODEC & MTX_CMDWORD_ID_MASK) << MTX_CMDWORD_ID_SHIFT) |
3307         ((ctx->eCodec        & MTX_CMDWORD_CORE_MASK) << MTX_CMDWORD_CORE_SHIFT) |
3308         (((driver_data->context_id & MTX_CMDWORD_COUNT_MASK) << MTX_CMDWORD_COUNT_SHIFT));
3309  //       (((driver_data->drm_context & MTX_CMDWORD_COUNT_MASK) << MTX_CMDWORD_COUNT_SHIFT));
3310 
3311      tng_cmdbuf_insert_command_param((ctx->ui16Width << 16) | ctx->ui16PictureHeight);
3312 
3313     return vaStatus;
3314 }
3315 
tng__cmdbuf_doheader(context_ENC_p ctx)3316 static VAStatus tng__cmdbuf_doheader(context_ENC_p ctx)
3317 {
3318     VAStatus vaStatus = VA_STATUS_SUCCESS;
3319     context_ENC_mem *ps_mem = &(ctx->ctx_mem[ctx->ui32StreamID]);
3320      tng_cmdbuf_p cmdbuf = ctx->obj_context->tng_cmdbuf;
3321 
3322     cmdbuf->cmd_idx_saved[TNG_CMDBUF_PIC_HEADER_IDX] = cmdbuf->cmd_idx;
3323     tng_cmdbuf_insert_command(ctx->obj_context, 0,
3324                                       MTX_CMDID_DO_HEADER,
3325                                       0,
3326                                       &(ps_mem->bufs_seq_header),
3327                                       0);
3328     return vaStatus;
3329 }
3330 
tng__cmdbuf_lowpower(context_ENC_p ctx)3331 static VAStatus tng__cmdbuf_lowpower(context_ENC_p ctx)
3332 {
3333     VAStatus vaStatus = VA_STATUS_SUCCESS;
3334     tng_cmdbuf_p cmdbuf = ctx->obj_context->tng_cmdbuf;
3335     psb_driver_data_p driver_data = ctx->obj_context->driver_data;
3336 
3337     *cmdbuf->cmd_idx++ =
3338         ((MTX_CMDID_SW_LEAVE_LOWPOWER & MTX_CMDWORD_ID_MASK) << MTX_CMDWORD_ID_SHIFT) |
3339         (((ctx->ui32RawFrameCount == 0 ? 1 : 0)  & MTX_CMDWORD_CORE_MASK) << MTX_CMDWORD_CORE_SHIFT) |
3340         (((driver_data->context_id & MTX_CMDWORD_COUNT_MASK) << MTX_CMDWORD_COUNT_SHIFT));
3341 
3342     tng_cmdbuf_insert_command_param(ctx->eCodec);
3343 
3344     return vaStatus;
3345 }
3346 
tng__cmdbuf_load_bias(context_ENC_p ctx)3347 static VAStatus tng__cmdbuf_load_bias(context_ENC_p ctx)
3348 {
3349     VAStatus vaStatus = VA_STATUS_SUCCESS;
3350 
3351     //init bias parameters
3352      tng_init_bias_params(ctx);
3353 
3354      vaStatus = tng__generate_bias(ctx);
3355      if (vaStatus != VA_STATUS_SUCCESS) {
3356          drv_debug_msg(VIDEO_DEBUG_ERROR, "%s: generate bias params\n", __FUNCTION__, vaStatus);
3357      }
3358 
3359      vaStatus = tng_load_bias(ctx, IMG_INTER_P);
3360      if (vaStatus != VA_STATUS_SUCCESS) {
3361          drv_debug_msg(VIDEO_DEBUG_ERROR, "%s: load bias params\n", __FUNCTION__, vaStatus);
3362      }
3363     return vaStatus;
3364 }
3365 
tng__cmdbuf_setvideo(context_ENC_p ctx,IMG_UINT32 ui32StreamIndex)3366 static VAStatus tng__cmdbuf_setvideo(context_ENC_p ctx, IMG_UINT32 ui32StreamIndex)
3367 {
3368     VAStatus vaStatus = VA_STATUS_SUCCESS;
3369     context_ENC_mem *ps_mem = &(ctx->ctx_mem[ui32StreamIndex]);
3370 
3371     tng__setvideo_params(ctx, ui32StreamIndex);
3372     tng__setvideo_cmdbuf(ctx, ui32StreamIndex);
3373 
3374     tng_cmdbuf_insert_command(ctx->obj_context, ctx->ui32StreamID,
3375         MTX_CMDID_SETVIDEO, 0, &(ps_mem->bufs_mtx_context), 0);
3376 
3377     return vaStatus;
3378 }
3379 
tng__rc_update(context_ENC_p ctx,IMG_UINT32 ui32NewBitrate,IMG_UINT8 ui8NewFrameQP,IMG_UINT8 ui8NewFrameMinQP,IMG_UINT8 ui8NewFrameMaxQP,IMG_UINT16 ui16NewIntraPeriod)3380 static void tng__rc_update(
3381     context_ENC_p ctx,
3382     IMG_UINT32 ui32NewBitrate,
3383     IMG_UINT8 ui8NewFrameQP,
3384     IMG_UINT8 ui8NewFrameMinQP,
3385     IMG_UINT8 ui8NewFrameMaxQP,
3386     IMG_UINT16 ui16NewIntraPeriod)
3387 {
3388     psb_buffer_p buf = (psb_buffer_p)(F_ENCODE(ui8NewFrameMinQP, MTX_MSG_RC_UPDATE_MIN_QP) |
3389                         F_ENCODE(ui8NewFrameMaxQP, MTX_MSG_RC_UPDATE_MAX_QP) |
3390                         F_ENCODE(ui16NewIntraPeriod, MTX_MSG_RC_UPDATE_INTRA));
3391     tng_cmdbuf_insert_command(
3392                         ctx->obj_context,
3393                         ctx->ui32StreamID,
3394                         MTX_CMDID_RC_UPDATE,
3395                         F_ENCODE(ui8NewFrameQP, MTX_MSG_RC_UPDATE_QP) |
3396                             F_ENCODE(ui32NewBitrate, MTX_MSG_RC_UPDATE_BITRATE),
3397                         buf,
3398                         0);
3399 }
3400 
tng__update_ratecontrol(context_ENC_p ctx,IMG_UINT32 ui32StreamIndex)3401 static VAStatus tng__update_ratecontrol(context_ENC_p ctx, IMG_UINT32 ui32StreamIndex)
3402 {
3403     VAStatus vaStatus = VA_STATUS_SUCCESS;
3404     IMG_RC_PARAMS *psRCParams = &(ctx->sRCParams);
3405     IMG_UINT32 ui32CmdData = 0;
3406     IMG_UINT32 ui32NewBitsPerFrame = 0;
3407     IMG_UINT8 ui8NewVCMIFrameQP = 0;
3408 
3409     if (!(ctx->rc_update_flag))
3410         return vaStatus;
3411 
3412     tng__setup_rcdata(ctx);
3413 
3414     drv_debug_msg(VIDEO_DEBUG_GENERAL,
3415         "%s: frame[%d] bits_per_second = %d, min_qp = %d, max_qp = %d, initial_qp = %d\n",
3416         __FUNCTION__, ctx->ui32FrameCount[ui32StreamIndex], psRCParams->ui32BitsPerSecond,
3417         psRCParams->iMinQP, ctx->max_qp, psRCParams->ui32InitialQp);
3418 
3419     if (ctx->rc_update_flag & RC_MASK_frame_rate) {
3420 	tng__rc_update(ctx, psRCParams->ui32BitsPerSecond, -1, -1, -1, -1);
3421 	ctx->rc_update_flag &= ~RC_MASK_frame_rate;
3422     }
3423 
3424     if (ctx->rc_update_flag & RC_MASK_bits_per_second) {
3425 	tng__rc_update(ctx, psRCParams->ui32BitsPerSecond, -1, -1, -1, -1);
3426 	ctx->rc_update_flag &= ~RC_MASK_bits_per_second;
3427     }
3428 
3429     if (ctx->rc_update_flag & RC_MASK_min_qp) {
3430 	tng__rc_update(ctx, -1, -1, psRCParams->iMinQP, -1, -1);
3431 	ctx->rc_update_flag &= ~RC_MASK_min_qp;
3432     }
3433 
3434     if (ctx->rc_update_flag & RC_MASK_max_qp) {
3435 	tng__rc_update(ctx, -1, -1, -1, ctx->max_qp, -1);
3436 	ctx->rc_update_flag &= ~RC_MASK_max_qp;
3437     }
3438 
3439     if (ctx->rc_update_flag & RC_MASK_initial_qp) {
3440 	tng__rc_update(ctx, -1, psRCParams->ui32InitialQp, -1, -1, -1);
3441 	ctx->rc_update_flag &= ~RC_MASK_initial_qp;
3442     }
3443 
3444     if (ctx->rc_update_flag & RC_MASK_intra_period) {
3445 	tng__rc_update(ctx, -1, -1, -1, -1, ctx->ui32IntraCnt);
3446 	ctx->rc_update_flag &= ~RC_MASK_intra_period;
3447     }
3448 
3449     return vaStatus;
3450 }
3451 
tng__update_frametype(context_ENC_p ctx,IMG_FRAME_TYPE eFrameType)3452 static VAStatus tng__update_frametype(context_ENC_p ctx, IMG_FRAME_TYPE eFrameType)
3453 {
3454     VAStatus vaStatus = VA_STATUS_SUCCESS;
3455     IMG_UINT32 ui32CmdData = 0;
3456 
3457     ui32CmdData = F_ENCODE(IMG_PICMGMT_REF_TYPE, MTX_MSG_PICMGMT_SUBTYPE) |
3458                 F_ENCODE(eFrameType, MTX_MSG_PICMGMT_DATA);
3459 
3460     tng_cmdbuf_insert_command(ctx->obj_context, ctx->ui32StreamID,
3461         MTX_CMDID_PICMGMT ,
3462         ui32CmdData, 0, 0);
3463 
3464     return vaStatus;
3465 }
3466 
tng__cmdbuf_send_picmgmt(context_ENC_p ctx,IMG_UINT32 ui32StreamIndex)3467 static VAStatus tng__cmdbuf_send_picmgmt(context_ENC_p ctx, IMG_UINT32 ui32StreamIndex)
3468 {
3469     VAStatus vaStatus = VA_STATUS_SUCCESS;
3470     IMG_RC_PARAMS *psRCParams = &(ctx->sRCParams);
3471 
3472     if (!(ctx->rc_update_flag))
3473         return vaStatus;
3474 
3475     //tng__setup_rcdata(ctx);
3476     drv_debug_msg(VIDEO_DEBUG_GENERAL,
3477         "%s: ui32BitsPerSecond = %d, ui32FrameRate = %d, ui32InitialQp = %d\n",
3478         __FUNCTION__, psRCParams->ui32BitsPerSecond,
3479         psRCParams->ui32FrameRate, psRCParams->ui32InitialQp);
3480     drv_debug_msg(VIDEO_DEBUG_GENERAL,
3481         "%s: frame_count[%d] = %d\n", __FUNCTION__,
3482         ui32StreamIndex, ctx->ui32FrameCount[ui32StreamIndex]);
3483 
3484     return vaStatus;
3485 }
3486 
3487 
tng__cmdbuf_provide_buffer(context_ENC_p ctx,IMG_UINT32 ui32StreamIndex)3488 static VAStatus tng__cmdbuf_provide_buffer(context_ENC_p ctx, IMG_UINT32 ui32StreamIndex)
3489 {
3490     VAStatus vaStatus = VA_STATUS_SUCCESS;
3491 
3492     if (ctx->ui8PipesToUse == 1) {
3493         tng_send_codedbuf(ctx, ctx->ui8SlotsCoded);
3494     } else {
3495         /*Make sure DMA start is 128bits alignment*/
3496         tng_send_codedbuf(ctx, ctx->ui8SlotsCoded * 2);
3497         tng_send_codedbuf(ctx, ctx->ui8SlotsCoded * 2 + 1);
3498     }
3499 
3500     if (ctx->sRCParams.ui16BFrames > 0)
3501         tng__provide_buffer_BFrames(ctx, ui32StreamIndex);
3502     else
3503         tng__provide_buffer_PFrames(ctx, ui32StreamIndex);
3504 /*
3505     if (ctx->ui32LastPicture != 0) {
3506         drv_debug_msg(VIDEO_DEBUG_GENERAL,
3507             "%s: frame_count[%d] = %d\n", __FUNCTION__,
3508             ui32StreamIndex, ctx->ui32FrameCount[ui32StreamIndex]);
3509         tng_picmgmt_update(ctx,IMG_PICMGMT_EOS, ctx->ui32LastPicture);
3510     }
3511 */
3512 #ifdef _TOPAZHP_REC_
3513     tng_send_rec_frames(ctx, -1, 0);
3514     tng_send_ref_frames(ctx, 0, 0);
3515     tng_send_ref_frames(ctx, 1, 0);
3516 #endif
3517 
3518     ctx->ui8SlotsCoded = (ctx->ui8SlotsCoded + 1) & 1;
3519 
3520     return vaStatus;
3521 }
3522 
tng__set_ctx_buf(context_ENC_p ctx,IMG_UINT32 __maybe_unused ui32StreamID)3523 VAStatus tng__set_ctx_buf(context_ENC_p ctx, IMG_UINT32 __maybe_unused ui32StreamID)
3524 {
3525     VAStatus vaStatus = VA_STATUS_SUCCESS;
3526     IMG_UINT8 ui8IsJpeg;
3527 
3528     vaStatus = tng__validate_params(ctx);
3529     if (vaStatus != VA_STATUS_SUCCESS) {
3530         drv_debug_msg(VIDEO_DEBUG_ERROR, "validate params");
3531     }
3532 
3533     vaStatus = tng__validate_busize(ctx);
3534     if (vaStatus != VA_STATUS_SUCCESS) {
3535         drv_debug_msg(VIDEO_DEBUG_ERROR, "validate busize");
3536     }
3537     ctx->ctx_cmdbuf[0].ui32LowCmdCount = 0xa5a5a5a5 %  MAX_TOPAZ_CMD_COUNT;
3538     ctx->ctx_cmdbuf[0].ui32HighCmdCount = 0;
3539     ctx->ctx_cmdbuf[0].ui32HighWBReceived = 0;
3540 
3541     ui8IsJpeg = (ctx->eStandard == IMG_STANDARD_JPEG) ? 1 : 0;
3542     vaStatus = tng__alloc_context_buffer(ctx, ui8IsJpeg, 0);
3543     if (vaStatus != VA_STATUS_SUCCESS) {
3544         drv_debug_msg(VIDEO_DEBUG_ERROR, "setup enc profile");
3545     }
3546     return vaStatus;
3547 }
3548 
tng__set_headers(context_ENC_p ctx,IMG_UINT32 __maybe_unused ui32StreamID)3549 static VAStatus tng__set_headers (context_ENC_p ctx, IMG_UINT32 __maybe_unused ui32StreamID)
3550 {
3551     VAStatus vaStatus = VA_STATUS_SUCCESS;
3552     IMG_UINT8 ui8SlotIdx = 0;
3553 
3554     vaStatus = tng__prepare_templates(ctx, 0);
3555     if (vaStatus != VA_STATUS_SUCCESS) {
3556         drv_debug_msg(VIDEO_DEBUG_ERROR, "prepare_templates\n");
3557     }
3558 
3559     for (ui8SlotIdx = 0; ui8SlotIdx < ctx->ui8SlotsInUse; ui8SlotIdx++)
3560         tng_fill_slice_map(ctx, (IMG_UINT32)ui8SlotIdx, 0);
3561 
3562     return vaStatus;
3563 }
3564 
tng__set_cmd_buf(context_ENC_p ctx,IMG_UINT32 __maybe_unused ui32StreamID)3565 static VAStatus tng__set_cmd_buf(context_ENC_p ctx, IMG_UINT32 __maybe_unused ui32StreamID)
3566 {
3567     VAStatus vaStatus = VA_STATUS_SUCCESS;
3568 
3569     vaStatus = tng__cmdbuf_new_codec(ctx);
3570     if (vaStatus != VA_STATUS_SUCCESS) {
3571         drv_debug_msg(VIDEO_DEBUG_ERROR, "cmdbuf new codec\n");
3572     }
3573 
3574     vaStatus = tng__cmdbuf_lowpower(ctx);
3575     if (vaStatus != VA_STATUS_SUCCESS) {
3576         drv_debug_msg(VIDEO_DEBUG_ERROR, "cmdbuf lowpower\n");
3577     }
3578 
3579     vaStatus = tng__cmdbuf_load_bias(ctx);
3580     if (vaStatus != VA_STATUS_SUCCESS) {
3581         drv_debug_msg(VIDEO_DEBUG_ERROR, "cmdbuf load bias\n");
3582     }
3583 
3584     vaStatus = tng__cmdbuf_setvideo(ctx, 0);
3585     if (vaStatus != VA_STATUS_SUCCESS) {
3586         drv_debug_msg(VIDEO_DEBUG_ERROR, "cmdbuf setvideo\n");
3587     }
3588     return vaStatus;
3589 }
3590 
tng__end_one_frame(context_ENC_p ctx,IMG_UINT32 ui32StreamID)3591 VAStatus tng__end_one_frame(context_ENC_p ctx, IMG_UINT32 ui32StreamID)
3592 {
3593     VAStatus vaStatus = VA_STATUS_SUCCESS;
3594     context_ENC_frame_buf *ps_buf = &(ctx->ctx_frame_buf);
3595 
3596     drv_debug_msg(VIDEO_DEBUG_GENERAL, "ui32StreamID is %d.\n", ui32StreamID);
3597 
3598     /* save current settings */
3599     ps_buf->previous_src_surface = ps_buf->src_surface;
3600 #ifdef _TNG_FRAMES_
3601     ps_buf->previous_ref_surface = ps_buf->ref_surface;
3602 #else
3603     ps_buf->previous_ref_surface = ps_buf->ref_surface[0];
3604 #endif
3605 
3606     /*Frame Skip flag in Coded Buffer of frame N determines if frame N+2
3607     * should be skipped, which means sending encoding commands of frame N+1 doesn't
3608     * have to wait until frame N is completed encoded. It reduces the precision of
3609     * rate control but improves HD encoding performance a lot.*/
3610     ps_buf->pprevious_coded_buf = ps_buf->previous_coded_buf;
3611     ps_buf->previous_coded_buf = ps_buf->coded_buf;
3612 
3613     ctx->ePreFrameType = ctx->eFrameType;
3614 
3615     return vaStatus;
3616 }
3617 
tng_EndPicture(context_ENC_p ctx)3618 VAStatus tng_EndPicture(context_ENC_p ctx)
3619 {
3620     VAStatus vaStatus = VA_STATUS_SUCCESS;
3621     tng_cmdbuf_p cmdbuf = ctx->obj_context->tng_cmdbuf;
3622     context_ENC_mem *ps_mem = &(ctx->ctx_mem[0]);
3623     unsigned int offset;
3624     int value;
3625 
3626     drv_debug_msg(VIDEO_DEBUG_GENERAL,"%s: ctx->ui8SlicesPerPicture = %d, ctx->ui32FrameCount[0] = %d\n",
3627          __FUNCTION__, ctx->ui8SlicesPerPicture, ctx->ui32FrameCount[0]);
3628 
3629     if (ctx->ui32FrameCount[0] == 0) {
3630         vaStatus = tng__set_ctx_buf(ctx, 0);
3631         if (vaStatus != VA_STATUS_SUCCESS) {
3632             drv_debug_msg(VIDEO_DEBUG_ERROR, "set ctx buf \n");
3633         }
3634         vaStatus = tng__set_headers(ctx, 0);
3635         if (vaStatus != VA_STATUS_SUCCESS) {
3636             drv_debug_msg(VIDEO_DEBUG_ERROR, "set headers \n");
3637         }
3638 
3639         vaStatus = tng__set_cmd_buf(ctx, 0);
3640         if (vaStatus != VA_STATUS_SUCCESS) {
3641            drv_debug_msg(VIDEO_DEBUG_ERROR, "set cmd buf \n");
3642         }
3643 
3644 #ifdef _TOPAZHP_PDUMP_
3645 	tng_trace_setvideo(ctx, 0);
3646 #endif
3647     } else {
3648         vaStatus = tng__cmdbuf_lowpower(ctx);
3649         if (vaStatus != VA_STATUS_SUCCESS) {
3650             drv_debug_msg(VIDEO_DEBUG_ERROR, "cmdbuf lowpower\n");
3651         }
3652     }
3653 
3654     if (ctx->sRCParams.eRCMode != IMG_RCMODE_NONE ||
3655 	ctx->rc_update_flag) {
3656         vaStatus = tng__update_ratecontrol(ctx, ctx->ui32StreamID);
3657         if (vaStatus != VA_STATUS_SUCCESS) {
3658             drv_debug_msg(VIDEO_DEBUG_ERROR, "send picmgmt");
3659         }
3660     }
3661 
3662     if ((ctx->idr_force_flag == 1) && (ctx->sRCParams.ui16BFrames == 0)){
3663         vaStatus = tng__update_frametype(ctx, IMG_FRAME_IDR);
3664         if (vaStatus != VA_STATUS_SUCCESS) {
3665             drv_debug_msg(VIDEO_DEBUG_ERROR, "send picmgmt IDR");
3666         }
3667         ctx->idr_force_flag =0;
3668     }
3669 
3670     vaStatus = tng__cmdbuf_provide_buffer(ctx, ctx->ui32StreamID);
3671     if (vaStatus != VA_STATUS_SUCCESS) {
3672         drv_debug_msg(VIDEO_DEBUG_ERROR, "provide buffer");
3673     }
3674 
3675     if (ctx->bEnableAIR == IMG_TRUE ||
3676 	ctx->bEnableCIR == IMG_TRUE) {
3677 	tng_air_set_input_control(ctx, 0);
3678 
3679 	if (ctx->bEnableAIR == IMG_TRUE)
3680 	    tng_air_set_output_control(ctx, 0);
3681     }
3682 
3683     if (ctx->eStandard == IMG_STANDARD_MPEG4) {
3684         if (ctx->ui32FrameCount[0] == 0) {
3685             vaStatus = tng__cmdbuf_doheader(ctx);
3686             if (vaStatus != VA_STATUS_SUCCESS) {
3687                 drv_debug_msg(VIDEO_DEBUG_ERROR, "cmdbuf doheader\n");
3688             }
3689         }
3690         tng__MPEG4ES_send_seq_header(ctx, ctx->ui32StreamID);
3691     }
3692 
3693     if (ctx->bInsertHRDParams)
3694 	tng_cmdbuf_insert_command(ctx->obj_context, ctx->ui32StreamID,
3695 	    MTX_CMDID_DO_HEADER, 0, &(ps_mem->bufs_sei_header), 0);
3696 
3697     tng_cmdbuf_insert_command(ctx->obj_context, ctx->ui32StreamID,
3698         MTX_CMDID_ENCODE_FRAME, 0, 0, 0);
3699 
3700 #ifdef _TOPAZHP_CMDBUF_
3701     drv_debug_msg(VIDEO_DEBUG_GENERAL, "%s addr = 0x%08x \n", __FUNCTION__, cmdbuf);
3702     tng__trace_cmdbuf_words(cmdbuf);
3703     tng__trace_cmdbuf(cmdbuf, ctx->ui32StreamID);
3704 #endif
3705 
3706     //    tng_buffer_unmap(ctx, ctx->ui32StreamID);
3707     tng_cmdbuf_mem_unmap(cmdbuf);
3708 
3709     vaStatus = tng__end_one_frame(ctx, 0);
3710     if (vaStatus != VA_STATUS_SUCCESS) {
3711        drv_debug_msg(VIDEO_DEBUG_ERROR, "setting when one frame ends\n");
3712     }
3713 
3714     if (tng_context_flush_cmdbuf(ctx->obj_context)) {
3715         vaStatus = VA_STATUS_ERROR_UNKNOWN;
3716     }
3717 
3718 
3719     ++(ctx->ui32FrameCount[ctx->ui32StreamID]);
3720     ++(ctx->ui32RawFrameCount);
3721     return vaStatus;
3722 }
3723