/****************************************************************************** * * Copyright (C) 2018 The Android Open Source Project * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at: * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. * ***************************************************************************** * Originally developed and contributed by Ittiam Systems Pvt. Ltd, Bangalore */ /*! ****************************************************************************** * \file ihevce_frame_process_utils.c * * \brief * This file contains definitions of top level functions related to frame * processing * * \date * 18/09/2012 * * \author * Ittiam * * List of Functions * * ****************************************************************************** */ /*****************************************************************************/ /* File Includes */ /*****************************************************************************/ /* System include files */ #include #include #include #include #include #include /* User include files */ #include "ihevc_typedefs.h" #include "itt_video_api.h" #include "ihevce_api.h" #include "rc_cntrl_param.h" #include "rc_frame_info_collector.h" #include "rc_look_ahead_params.h" #include "ihevc_defs.h" #include "ihevc_debug.h" #include "ihevc_macros.h" #include "ihevc_structs.h" #include "ihevc_platform_macros.h" #include "ihevc_deblk.h" #include "ihevc_itrans_recon.h" #include "ihevc_chroma_itrans_recon.h" #include "ihevc_chroma_intra_pred.h" #include "ihevc_intra_pred.h" #include "ihevc_inter_pred.h" #include "ihevc_mem_fns.h" #include "ihevc_padding.h" #include "ihevc_weighted_pred.h" #include "ihevc_sao.h" #include "ihevc_resi_trans.h" #include "ihevc_quant_iquant_ssd.h" #include "ihevc_cabac_tables.h" #include "ihevc_common_tables.h" #include "ihevce_defs.h" #include "ihevce_hle_interface.h" #include "ihevce_hle_q_func.h" #include "ihevce_lap_enc_structs.h" #include "ihevce_multi_thrd_structs.h" #include "ihevce_multi_thrd_funcs.h" #include "ihevce_me_common_defs.h" #include "ihevce_had_satd.h" #include "ihevce_error_checks.h" #include "ihevce_error_codes.h" #include "ihevce_bitstream.h" #include "ihevce_cabac.h" #include "ihevce_function_selector.h" #include "ihevce_enc_structs.h" #include "ihevce_global_tables.h" #include "ihevce_rc_enc_structs.h" #include "ihevce_rc_interface.h" #include "ihevce_frame_process_utils.h" #include "cast_types.h" #include "osal.h" #include "osal_defaults.h" /*****************************************************************************/ /* Globals */ /*****************************************************************************/ /************** Version Number string *******************/ UWORD8 gau1_version_string[] = "i265-v4.13-218 Build "; /*****************************************************************************/ /* Function Definitions */ /*****************************************************************************/ /*! ****************************************************************************** * * @brief * API to return frame qp in constant qp mode based on init I frame qp, * slice type and current temporal layer. * * I picture is given the same qp as the init qp configure in static params * P picture is set equal to I frame qp + 1 * B picture is set equal to P frame qp + temporal layer * * @param[in] static_params_frame_qp * frame level qp set for I frames in create time params * * @param[in] slice_type * slice type for current frame (I/P/B) * * @param[in] temporal_id * temoporal layer ID of the current frame. This is associalted with B frame. * temporal layer ID. I and P frames have temporal_id set to 0. * * @param[in] min_qp * minimum qp to be allocated for this frame. * * @param[in] max_qp * maximum qp to be allocated for this frame * * @return * current frame qp * * @author * Ittiam * * @remarks * This is right place to plug in frame level RC call for current frame qp * allocation later when RC support is added * ***************************************************************************** */ WORD32 ihevce_get_cur_frame_qp( WORD32 static_params_frame_qp, WORD32 slice_type, WORD32 temporal_id, WORD32 min_qp, WORD32 max_qp, rc_quant_t *ps_rc_quant_ctxt) { WORD32 i4_curr_qp = static_params_frame_qp; /* sanity checks */ ASSERT(max_qp >= min_qp); ASSERT((min_qp >= ps_rc_quant_ctxt->i2_min_qp) && (min_qp <= ps_rc_quant_ctxt->i2_max_qp)); ASSERT( (static_params_frame_qp >= ps_rc_quant_ctxt->i2_min_qp) && (static_params_frame_qp <= ps_rc_quant_ctxt->i2_max_qp)); if(ISLICE == slice_type) { /* I frame qp is same as init qp in static params */ i4_curr_qp = static_params_frame_qp; } else if(PSLICE == slice_type) { /* P frame qp is I frame qp + 1 */ i4_curr_qp = static_params_frame_qp + 1; } else if(BSLICE == slice_type) { /* B frame qp is I frame qp + 1 + temporal layer id */ i4_curr_qp = static_params_frame_qp + temporal_id + 1; } else { /* illegal slice type */ ASSERT(0); } i4_curr_qp = CLIP3(i4_curr_qp, min_qp, max_qp); return (i4_curr_qp); } /*! ****************************************************************************** * \if Function name : calc_block_ssim \endif * * \brief * Calc Block SSIM * * \return * None * * \author * Ittiam ***************************************************************************** */ unsigned int calc_block_ssim( unsigned char *pu1_ref, unsigned char *pu1_tst, unsigned char *pu1_win, WORD32 i4_horz_jump, unsigned short u2_ref_stride, unsigned short u2_tst_stride, unsigned char u1_win_size, unsigned char u1_win_q_shift) { unsigned int u4_wtd_ref_mean, u4_wtd_tst_mean, u4_wtd_ref_sq, u4_wtd_tst_sq, u4_wtd_ref_tst; unsigned int u4_wtd_ref_mean_sq, u4_wtd_tst_mean_sq, u4_wtd_ref_tst_mean_prod; unsigned char u1_wt, u1_ref_smpl, u1_tst_smpl; unsigned short u2_wtd_ref_smpl, u2_wtd_tst_smpl, u2_win_q_rounding; int i4_row, i4_col; u4_wtd_ref_mean = 0; u4_wtd_tst_mean = 0; u4_wtd_ref_sq = 0; u4_wtd_tst_sq = 0; u4_wtd_ref_tst = 0; for(i4_row = 0; i4_row < u1_win_size; i4_row++) { for(i4_col = 0; i4_col < u1_win_size; i4_col++) { u1_wt = *pu1_win++; u1_ref_smpl = pu1_ref[i4_col * i4_horz_jump]; u1_tst_smpl = pu1_tst[i4_col * i4_horz_jump]; u2_wtd_ref_smpl = u1_wt * u1_ref_smpl; u2_wtd_tst_smpl = u1_wt * u1_tst_smpl; u4_wtd_ref_mean += u2_wtd_ref_smpl; u4_wtd_tst_mean += u2_wtd_tst_smpl; u4_wtd_ref_sq += u2_wtd_ref_smpl * u1_ref_smpl; u4_wtd_tst_sq += u2_wtd_tst_smpl * u1_tst_smpl; u4_wtd_ref_tst += u2_wtd_ref_smpl * u1_tst_smpl; } pu1_ref += u2_ref_stride; pu1_tst += u2_tst_stride; } { unsigned int u4_num, u4_den, u4_term1; u2_win_q_rounding = (1 << u1_win_q_shift) >> 1; u4_wtd_ref_mean += (u2_win_q_rounding >> 8); u4_wtd_tst_mean += (u2_win_q_rounding >> 8); /* Keep the mean terms within 16-bits before squaring */ u4_wtd_ref_mean >>= (u1_win_q_shift - 8); u4_wtd_tst_mean >>= (u1_win_q_shift - 8); /* Bring down the square of sum terms to same Q format as the sum of square terms */ u4_wtd_ref_mean_sq = (u4_wtd_ref_mean * u4_wtd_ref_mean + 16) >> (16 - u1_win_q_shift); u4_wtd_tst_mean_sq = (u4_wtd_tst_mean * u4_wtd_tst_mean + 16) >> (16 - u1_win_q_shift); u4_wtd_ref_tst_mean_prod = (u4_wtd_ref_mean * u4_wtd_tst_mean + 16) >> (16 - u1_win_q_shift); /* Compute self and cross variances */ if(u4_wtd_ref_sq > u4_wtd_ref_mean_sq) u4_wtd_ref_sq -= u4_wtd_ref_mean_sq; else u4_wtd_ref_sq = 0; if(u4_wtd_tst_sq > u4_wtd_tst_mean_sq) u4_wtd_tst_sq -= u4_wtd_tst_mean_sq; else u4_wtd_tst_sq = 0; if(u4_wtd_ref_tst > u4_wtd_ref_tst_mean_prod) u4_wtd_ref_tst -= u4_wtd_ref_tst_mean_prod; else u4_wtd_ref_tst = 0; /* Keep the numerator in Q12 format before division */ u4_num = ((u4_wtd_ref_tst_mean_prod << 1) + C1) << (12 - u1_win_q_shift); u4_den = ((u4_wtd_ref_mean_sq + u4_wtd_tst_mean_sq) + C1 + u2_win_q_rounding) >> u1_win_q_shift; u4_term1 = (u4_num) / u4_den; u4_num = (u4_wtd_ref_tst << 1) + C2; u4_den = (u4_wtd_ref_sq + u4_wtd_tst_sq) + C2; /* If numerator takes less than 20-bits, product would not overflow; so no need to normalize */ if(u4_num < 1048576) { return ((u4_num * u4_term1) / u4_den); } /* While the above should be done really with getRange calculation, for simplicity, the other cases go through a less accurate calculation */ u4_num = (u4_num + u2_win_q_rounding) >> u1_win_q_shift; u4_den = (u4_den + u2_win_q_rounding) >> u1_win_q_shift; /* What is returned is SSIM in 1Q12 */ return ((u4_term1 * u4_num) / u4_den); } } /*! ****************************************************************************** * \if Function name : ihevce_fill_sei_payload \endif * * \brief * Fills SEI Payload * * \param[in] ps_enc_ctxt * Encoder Context * * \param[in] ps_curr_inp * Current Input pointer * * \param[in] ps_curr_out * Current Output pointer * * \return * None * * \author * Ittiam * ***************************************************************************** */ void ihevce_fill_sei_payload( enc_ctxt_t *ps_enc_ctxt, ihevce_lap_enc_buf_t *ps_curr_inp, frm_proc_ent_cod_ctxt_t *ps_curr_out) { UWORD32 *pu4_length, i4_cmd_len; UWORD32 *pu4_tag, i4_pic_type; UWORD8 *pu1_user_data; pu4_tag = ((UWORD32 *)(ps_curr_inp->s_input_buf.pv_synch_ctrl_bufs)); ps_curr_out->u4_num_sei_payload = 0; i4_pic_type = ps_curr_inp->s_lap_out.i4_pic_type; (void)ps_enc_ctxt; while(1) { if(((*pu4_tag) & IHEVCE_COMMANDS_TAG_MASK) == IHEVCE_SYNCH_API_END_TAG) break; pu4_length = pu4_tag + 1; pu1_user_data = (UWORD8 *)(pu4_length + 1); i4_cmd_len = *pu4_length; if((*pu4_tag & IHEVCE_COMMANDS_TAG_MASK) == IHEVCE_SYNCH_API_REG_KEYFRAME_SEI_TAG) { if(i4_pic_type == IV_IDR_FRAME) { memcpy( (void *)((ps_curr_out->as_sei_payload[ps_curr_out->u4_num_sei_payload] .pu1_sei_payload)), (void *)pu1_user_data, i4_cmd_len); ps_curr_out->as_sei_payload[ps_curr_out->u4_num_sei_payload].u4_payload_length = (i4_cmd_len); ps_curr_out->as_sei_payload[ps_curr_out->u4_num_sei_payload].u4_payload_type = ((*pu4_tag & IHEVCE_PAYLOAD_TYPE_MASK) >> IHEVCE_PAYLOAD_TYPE_SHIFT); ps_curr_out->u4_num_sei_payload++; } } else if((*pu4_tag & IHEVCE_COMMANDS_TAG_MASK) == IHEVCE_SYNCH_API_REG_ALLFRAME_SEI_TAG) { memcpy( (void *)(( ps_curr_out->as_sei_payload[ps_curr_out->u4_num_sei_payload].pu1_sei_payload)), (void *)pu1_user_data, i4_cmd_len); ps_curr_out->as_sei_payload[ps_curr_out->u4_num_sei_payload].u4_payload_length = (i4_cmd_len); ps_curr_out->as_sei_payload[ps_curr_out->u4_num_sei_payload].u4_payload_type = ((*pu4_tag & IHEVCE_PAYLOAD_TYPE_MASK) >> IHEVCE_PAYLOAD_TYPE_SHIFT); ps_curr_out->u4_num_sei_payload++; } //The formula (((x-1)>>2)+1) gives us the ceiling of (x mod 4). Hence this will take the pointer to the next address boundary divisible by 4. //And then we add 2 bytes for the tag and the payload length. if(i4_cmd_len) pu4_tag += (((i4_cmd_len - 1) >> 2) + 1 + 2); else pu4_tag += 2; } } /*! ****************************************************************************** * \if Function name : ihevce_dyn_bitrate \endif * * \brief * Call back function to be called for changing the bitrate * * * \return * None * * \author * Ittiam * ***************************************************************************** */ void ihevce_dyn_bitrate(void *pv_hle_ctxt, void *pv_dyn_bitrate_prms) { ihevce_hle_ctxt_t *ps_hle_ctxt = (ihevce_hle_ctxt_t *)pv_hle_ctxt; ihevce_dyn_config_prms_t *ps_dyn_bitrate_prms = (ihevce_dyn_config_prms_t *)pv_dyn_bitrate_prms; enc_ctxt_t *ps_enc_ctxt = (enc_ctxt_t *)ps_hle_ctxt->apv_enc_hdl[ps_dyn_bitrate_prms->i4_tgt_res_id]; ihevce_static_cfg_params_t *ps_static_cfg_params = ps_hle_ctxt->ps_static_cfg_prms; if(ps_enc_ctxt->ps_stat_prms->i4_log_dump_level > 0) { ps_static_cfg_params->s_sys_api.ihevce_printf( ps_static_cfg_params->s_sys_api.pv_cb_handle, "\n Average Bitrate changed to %d", ps_dyn_bitrate_prms->i4_new_tgt_bitrate); ps_static_cfg_params->s_sys_api.ihevce_printf( ps_static_cfg_params->s_sys_api.pv_cb_handle, "\n Peak Bitrate changed to %d", ps_dyn_bitrate_prms->i4_new_peak_bitrate); } /* acquire mutex lock for rate control calls */ osal_mutex_lock(ps_enc_ctxt->pv_rc_mutex_lock_hdl); ihevce_rc_register_dyn_change_bitrate( ps_enc_ctxt->s_module_ctxt.apv_rc_ctxt[ps_dyn_bitrate_prms->i4_tgt_br_id], (LWORD64)ps_dyn_bitrate_prms->i4_new_tgt_bitrate, (LWORD64)ps_dyn_bitrate_prms->i4_new_peak_bitrate, ps_dyn_bitrate_prms->i4_new_rate_factor, ps_enc_ctxt->ps_stat_prms->s_config_prms.i4_rate_control_mode); /*unlock rate control context*/ osal_mutex_unlock(ps_enc_ctxt->pv_rc_mutex_lock_hdl); return; } /*! ****************************************************************************** * \if Function name : ihevce_validate_encoder_parameters \endif * * \brief * Call back function to be called for changing the bitrate * * \return * None * * \author * Ittiam ***************************************************************************** */ WORD32 ihevce_validate_encoder_parameters(ihevce_static_cfg_params_t *ps_static_cfg_prms) { return (ihevce_hle_validate_static_params(ps_static_cfg_prms)); } /*! ****************************************************************************** * \if Function name : ihevce_get_encoder_version \endif * * \brief * Call back function to be called for changing the bitrate * * \return * None * * \author * Ittiam ***************************************************************************** */ const char *ihevce_get_encoder_version() { return ((const char *)gau1_version_string); }