/****************************************************************************** * * Copyright (C) 2018 The Android Open Source Project * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at: * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. * ***************************************************************************** * Originally developed and contributed by Ittiam Systems Pvt. Ltd, Bangalore */ /****************************************************************************/ /* File Name : rc_rd_model.c */ /* */ /* Description : Implall the Functions to Model the */ /* Rate Distortion Behaviour of the Codec over the Last */ /* Few Frames. */ /* */ /* List of Functions : update_frame_rd_model */ /* estimate_mpeg2_qp_for_resbits */ /* */ /* Issues / Problems : None */ /* */ /* Revision History : */ /* DD MM YYYY Author(s) Changes (Describe the changes made) */ /* 21 06 2006 ittiam Initial Version */ /****************************************************************************/ /*****************************************************************************/ /* File Includes */ /*****************************************************************************/ /* System include files */ #include #include #include #include /* System include files */ #include "ittiam_datatypes.h" #include "rc_common.h" #include "var_q_operator.h" #include "mem_req_and_acq.h" #include "rc_rd_model.h" #include "rc_rd_model_struct.h" #if !(RC_FIXED_POINT) #if NON_STEADSTATE_CODE WORD32 rc_rd_model_num_fill_use_free_memtab( rc_rd_model_t **pps_rc_rd_model, itt_memtab_t *ps_memtab, ITT_FUNC_TYPE_E e_func_type) { WORD32 i4_mem_tab_idx = 0; static rc_rd_model_t s_rc_rd_model_temp; /* Hack for al alloc, during which we dont have any state memory. Dereferencing can cause issues */ if(e_func_type == GET_NUM_MEMTAB || e_func_type == FILL_MEMTAB) (*pps_rc_rd_model) = &s_rc_rd_model_temp; /*for src rate control state structure*/ if(e_func_type != GET_NUM_MEMTAB) { fill_memtab( &ps_memtab[i4_mem_tab_idx], sizeof(rc_rd_model_t), MEM_TAB_ALIGNMENT, PERSISTENT, DDR); use_or_fill_base(&ps_memtab[0], (void **)pps_rc_rd_model, e_func_type); } i4_mem_tab_idx++; return (i4_mem_tab_idx); } void init_frm_rc_rd_model(rc_rd_model_t *ps_rd_model, UWORD8 u1_max_frames_modelled) { /*ps_rd_model = ps_rd_model + u1_pic_type;*/ ps_rd_model->u1_num_frms_in_model = 0; ps_rd_model->u1_curr_frm_counter = 0; ps_rd_model->u1_max_frms_to_model = u1_max_frames_modelled; /* ps_rd_model->u1_min_frames_for_quad_model = u1_min_frames_for_quad_model; ps_rd_model->u1_min_frames_for_lin_model = u1_min_frames_for_lin_model; */ ps_rd_model->model_coeff_a_quad = 0; ps_rd_model->model_coeff_b_quad = 0; ps_rd_model->model_coeff_c_quad = 0; ps_rd_model->model_coeff_a_lin = 0; ps_rd_model->model_coeff_b_lin = 0; ps_rd_model->model_coeff_c_lin = 0; ps_rd_model->model_coeff_a_lin_wo_int = 0; ps_rd_model->model_coeff_b_lin_wo_int = 0; ps_rd_model->model_coeff_c_lin_wo_int = 0; } void reset_frm_rc_rd_model(rc_rd_model_t *ps_rd_model) { /*ps_rd_model = ps_rd_model + u1_pic_type;*/ ps_rd_model->u1_num_frms_in_model = 0; ps_rd_model->u1_curr_frm_counter = 0; ps_rd_model->model_coeff_a_quad = 0; ps_rd_model->model_coeff_b_quad = 0; ps_rd_model->model_coeff_c_quad = 0; ps_rd_model->model_coeff_a_lin = 0; ps_rd_model->model_coeff_b_lin = 0; ps_rd_model->model_coeff_c_lin = 0; ps_rd_model->model_coeff_a_lin_wo_int = 0; ps_rd_model->model_coeff_b_lin_wo_int = 0; ps_rd_model->model_coeff_c_lin_wo_int = 0; } #endif /* #if NON_STEADSTATE_CODE */ #if ENABLE_QUAD_MODEL static UWORD8 find_model_coeffs( UWORD32 *pi4_res_bits, UWORD32 *pi4_sad_h264, UWORD8 *pu1_num_skips, UWORD8 *pui_avg_mpeg2_qp, UWORD8 u1_num_frms, UWORD8 u1_model_used, WORD8 *pi1_frame_index, model_coeff *pmc_model_coeff, model_coeff *pmc_model_coeff_lin, model_coeff *pmc_model_coeff_lin_wo_int, rc_rd_model_t *ps_rd_model) { UWORD32 i; UWORD8 u1_num_frms_used = 0; UWORD8 u1_frm_indx; float sum_y = 0; float sum_x_y = 0; float sum_x2_y = 0; float sum_x = 0; float sum_x2 = 0; float sum_x3 = 0; float sum_x4 = 0; float var_x2_y = 0; float var_x_y = 0; float var_x2_x = 0; float var_x2_x2 = 0; float var_x_x = 0; float x0, y0; float model_coeff_a, model_coeff_b, model_coeff_c, model_coeff_den; for(i = 0; i < u1_num_frms; i++) { if(-1 == pi1_frame_index[i]) continue; u1_frm_indx = (UWORD8)pi1_frame_index[i]; y0 = (float)(pi4_res_bits[u1_frm_indx]); x0 = (float)(pi4_sad_h264[u1_frm_indx] / (float)pui_avg_mpeg2_qp[u1_frm_indx]); sum_y += y0; sum_x_y += x0 * y0; sum_x2_y += x0 * x0 * y0; sum_x += x0; sum_x2 += x0 * x0; sum_x3 += x0 * x0 * x0; sum_x4 += x0 * x0 * x0 * x0; u1_num_frms_used++; } sum_y /= u1_num_frms_used; sum_x_y /= u1_num_frms_used; sum_x2_y /= u1_num_frms_used; sum_x /= u1_num_frms_used; sum_x2 /= u1_num_frms_used; sum_x3 /= u1_num_frms_used; sum_x4 /= u1_num_frms_used; #if !QUAD u1_model_used = LIN_MODEL; #endif if((QUAD_MODEL == u1_model_used) && (u1_num_frms_used <= MIN_FRAMES_FOR_QUAD_MODEL)) { u1_model_used = LIN_MODEL; } if(QUAD_MODEL == u1_model_used) { var_x2_y = sum_x2_y - sum_x2 * sum_y; var_x_y = sum_x_y - sum_x * sum_y; var_x2_x = sum_x3 - sum_x2 * sum_x; var_x2_x2 = sum_x4 - sum_x2 * sum_x2; var_x_x = sum_x2 - sum_x * sum_x; model_coeff_den = (var_x2_x * var_x2_x - var_x2_x2 * var_x_x); if(0 != model_coeff_den) { model_coeff_b = (var_x_y * var_x2_x - var_x2_y * var_x_x); model_coeff_b /= model_coeff_den; model_coeff_a = (var_x2_y * var_x2_x - var_x_y * var_x2_x2); model_coeff_a /= model_coeff_den; model_coeff_c = sum_y - (model_coeff_a * sum_x) - (model_coeff_b * sum_x2); } pmc_model_coeff[0] = model_coeff_b; pmc_model_coeff[1] = model_coeff_a; pmc_model_coeff[2] = model_coeff_c; } if(NULL != pmc_model_coeff_lin) { var_x_y = sum_x_y - sum_x * sum_y; var_x_x = sum_x2 - sum_x * sum_x; if(0 != var_x_x) { model_coeff_a = (var_x_y / var_x_x); model_coeff_c = sum_y - (model_coeff_a * sum_x); /*model_coeff_b = 0;*/ model_coeff_b = model_coeff_a; pmc_model_coeff_lin[0] = model_coeff_b; pmc_model_coeff_lin[1] = model_coeff_a; pmc_model_coeff_lin[2] = model_coeff_c; } } if(NULL != pmc_model_coeff_lin_wo_int) { UWORD8 u1_curr_frame_index; UWORD8 u1_avgqp_prvfrm; UWORD32 u4_prevfrm_bits, u4_prevfrm_sad; u1_curr_frame_index = ps_rd_model->u1_curr_frm_counter; if(0 == u1_curr_frame_index) u1_curr_frame_index = (MAX_FRAMES_MODELLED - 1); else u1_curr_frame_index--; u1_avgqp_prvfrm = ps_rd_model->pu1_avg_qp[u1_curr_frame_index]; u4_prevfrm_bits = ps_rd_model->pi4_res_bits[u1_curr_frame_index]; u4_prevfrm_sad = ps_rd_model->pi4_sad[u1_curr_frame_index]; if(0 != u4_prevfrm_sad) model_coeff_a = (float)(u4_prevfrm_bits * u1_avgqp_prvfrm) / u4_prevfrm_sad; else model_coeff_a = 0; model_coeff_b = 0; model_coeff_c = 0; pmc_model_coeff_lin_wo_int[0] = model_coeff_b; pmc_model_coeff_lin_wo_int[1] = model_coeff_a; pmc_model_coeff_lin_wo_int[2] = model_coeff_c; } return u1_model_used; } static WORD8 refine_set_of_points( UWORD32 *pi4_res_bits, UWORD32 *pi4_sad_h264, UWORD8 *pu1_num_skips, UWORD8 *pui_avg_mpeg2_qp, UWORD8 u1_num_frms, WORD8 *pi1_frame_index, model_coeff *pmc_model_coeff, float *pfl_avg_deviation) { float fl_avg_deviation, fl_estimated_bits, fl_deviation, x_val; UWORD8 u1_return_value = 1; UWORD32 i; UWORD8 u1_num_frms_used, u1_frm_indx; u1_num_frms_used = 0; fl_avg_deviation = 0; for(i = 0; i < u1_num_frms; i++) { if(-1 == pi1_frame_index[i]) continue; u1_frm_indx = (UWORD8)pi1_frame_index[i]; x_val = pi4_sad_h264[u1_frm_indx] / (float)pui_avg_mpeg2_qp[u1_frm_indx]; fl_estimated_bits = (pmc_model_coeff[0] * x_val * x_val) + (pmc_model_coeff[1] * x_val) + (pmc_model_coeff[2]); fl_deviation = fabs(pi4_res_bits[u1_frm_indx] - fl_estimated_bits) / (float)pi4_res_bits[u1_frm_indx]; fl_deviation = fl_deviation * fl_deviation; fl_avg_deviation += fl_deviation; u1_num_frms_used++; } fl_avg_deviation /= u1_num_frms_used; /*fl_avg_deviation = sqrt(fl_avg_deviation);*/ fl_avg_deviation = (fl_avg_deviation); for(i = 0; i < u1_num_frms; i++) { if((-1 == pi1_frame_index[i]) && (i != 0)) continue; u1_frm_indx = (UWORD8)pi1_frame_index[i]; x_val = pi4_sad_h264[u1_frm_indx] / (float)pui_avg_mpeg2_qp[u1_frm_indx]; fl_estimated_bits = (pmc_model_coeff[0] * x_val * x_val) + (pmc_model_coeff[1] * x_val) + (pmc_model_coeff[2]); fl_deviation = fabs(pi4_res_bits[u1_frm_indx] - fl_estimated_bits) / (float)pi4_res_bits[u1_frm_indx]; fl_deviation = fl_deviation * fl_deviation; if(fl_deviation > (fl_avg_deviation)) { pi1_frame_index[i] = -1; } } if(fl_avg_deviation > 0.0625) u1_return_value = 0; if(fl_avg_deviation < 0.0225) u1_return_value = 2; *pfl_avg_deviation = fl_avg_deviation; return (u1_return_value); } static void calc_avg_sqr_dev_for_model( UWORD32 *pi4_res_bits, UWORD32 *pi4_sad_h264, UWORD8 *pu1_num_skips, UWORD8 *pui_avg_mpeg2_qp, UWORD8 u1_num_frms, WORD8 *pi1_frame_index, model_coeff *pmc_model_coeff, float *pfl_avg_deviation) { float fl_avg_deviation, fl_estimated_bits, fl_deviation, x_val; UWORD8 u1_return_value = 1; UWORD32 i; UWORD8 u1_num_frms_used, u1_frm_indx; u1_num_frms_used = 0; fl_avg_deviation = 0; for(i = 0; i < u1_num_frms; i++) { if(-1 == pi1_frame_index[i]) continue; u1_frm_indx = (UWORD8)pi1_frame_index[i]; u1_frm_indx = (UWORD8)i; x_val = pi4_sad_h264[u1_frm_indx] / (float)pui_avg_mpeg2_qp[u1_frm_indx]; fl_estimated_bits = (pmc_model_coeff[1] * x_val) + (pmc_model_coeff[2]); fl_deviation = fabs(pi4_res_bits[u1_frm_indx] - fl_estimated_bits) / (float)pi4_res_bits[u1_frm_indx]; fl_deviation = fl_deviation * fl_deviation; fl_avg_deviation += fl_deviation; u1_num_frms_used++; } fl_avg_deviation /= u1_num_frms_used; /*fl_avg_deviation = sqrt(fl_avg_deviation);*/ fl_avg_deviation = (fl_avg_deviation); *pfl_avg_deviation = fl_avg_deviation; /*return (u1_return_value);*/ } static void update_frame_rd_model(rc_rd_model_t *ps_rd_model) { WORD8 pi1_frame_index[MAX_FRAMES_MODELLED], pi1_frame_index_initial[MAX_FRAMES_MODELLED]; UWORD8 u1_num_skips_temp; UWORD8 u1_avg_mpeg2_qp_temp, u1_min_mpeg2_qp, u1_max_mpeg2_qp; UWORD8 u1_num_frms_input, u1_num_active_frames, u1_reject_frame; UWORD32 u4_num_skips; UWORD8 u1_min2_mpeg2_qp, u1_max2_mpeg2_qp; UWORD8 u1_min_qp_frame_indx, u1_max_qp_frame_indx; UWORD8 pu1_num_frames[MPEG2_QP_ELEM]; model_coeff model_coeff_array[3], model_coeff_array_lin[3], model_coeff_array_lin_wo_int[3]; UWORD32 i; UWORD8 u1_curr_frame_index; UWORD8 u1_quad_model_valid, u1_lin_model_valid; float fl_quad_avg_dev, fl_lin_avg_dev; UWORD8 u1_check_model; /*ps_rd_model += u1_pic_type;*/ u1_curr_frame_index = ps_rd_model->u1_curr_frm_counter; ps_rd_model->u1_model_used = QUAD_MODEL; if(0 == u1_curr_frame_index) u1_curr_frame_index = (MAX_FRAMES_MODELLED - 1); else u1_curr_frame_index--; /************************************************************************/ /* Rearrange data to be fed into a Linear Regression Module */ /* Module finds a,b,c such that */ /* y = ax + bx^2 + c */ /************************************************************************/ u4_num_skips = 0; u1_num_frms_input = 0; memset(pu1_num_frames, 0, MPEG2_QP_ELEM); memset(pi1_frame_index, -1, MAX_FRAMES_MODELLED); u1_min_mpeg2_qp = MAX_MPEG2_QP; u1_max_mpeg2_qp = 0; u1_num_active_frames = ps_rd_model->u1_num_frms_in_model; if(u1_num_active_frames > MAX_ACTIVE_FRAMES) u1_num_active_frames = MAX_ACTIVE_FRAMES; /************************************************************************/ /* Choose the set of Points to be used for MSE fit of Quadratic model */ /* Points chosen are spread across the Qp range. Max of 2 points are */ /* chosen for a Qp. */ /************************************************************************/ for(i = 0; i < u1_num_active_frames; i++) { u1_reject_frame = 0; u1_num_skips_temp = ps_rd_model->pu1_num_skips[u1_curr_frame_index]; u1_avg_mpeg2_qp_temp = ps_rd_model->pu1_avg_qp[u1_curr_frame_index]; if((0 == u4_num_skips) && (0 != u1_num_skips_temp)) u1_reject_frame = 1; if((1 == u4_num_skips) && (u1_num_skips_temp > 1)) u1_reject_frame = 1; if(pu1_num_frames[u1_avg_mpeg2_qp_temp] >= 2) u1_reject_frame = 1; if(0 == i) u1_reject_frame = 0; if(0 == u1_reject_frame) { pi1_frame_index[u1_num_frms_input] = (WORD8)u1_curr_frame_index; pu1_num_frames[u1_avg_mpeg2_qp_temp] += 1; if(u1_min_mpeg2_qp > u1_avg_mpeg2_qp_temp) u1_min_mpeg2_qp = u1_avg_mpeg2_qp_temp; if(u1_max_mpeg2_qp < u1_avg_mpeg2_qp_temp) u1_max_mpeg2_qp = u1_avg_mpeg2_qp_temp; u1_num_frms_input++; } if(0 == u1_curr_frame_index) u1_curr_frame_index = (MAX_FRAMES_MODELLED - 1); else u1_curr_frame_index--; } /************************************************************************/ /* Add Pivot Points to the Data set to be used for finding Quadratic */ /* Model Coeffs. These will help in constraining the shape of Quadratic*/ /* to adapt too much to the Local deviations. */ /************************************************************************/ u1_min2_mpeg2_qp = u1_min_mpeg2_qp; u1_max2_mpeg2_qp = u1_max_mpeg2_qp; u1_min_qp_frame_indx = INVALID_FRAME_INDEX; u1_max_qp_frame_indx = INVALID_FRAME_INDEX; /* Loop runnning over the Stored Frame Level Data to find frames of MinQp and MaxQp */ for(; i < ps_rd_model->u1_num_frms_in_model; i++) { u1_num_skips_temp = ps_rd_model->pu1_num_skips[u1_curr_frame_index]; u1_avg_mpeg2_qp_temp = ps_rd_model->pu1_avg_qp[u1_curr_frame_index]; if(((0 == u4_num_skips) && (0 != u1_num_skips_temp)) || ((1 == u4_num_skips) && (u1_num_skips_temp > 1))) continue; if(u1_min2_mpeg2_qp > u1_avg_mpeg2_qp_temp) { u1_min2_mpeg2_qp = u1_avg_mpeg2_qp_temp; u1_min_qp_frame_indx = u1_curr_frame_index; } if(u1_max2_mpeg2_qp < u1_avg_mpeg2_qp_temp) { u1_max2_mpeg2_qp = u1_avg_mpeg2_qp_temp; u1_max_qp_frame_indx = u1_curr_frame_index; } if(0 == u1_curr_frame_index) u1_curr_frame_index = (MAX_FRAMES_MODELLED - 1); else u1_curr_frame_index--; } /* Add the Chosen Points to the regression data set */ if(INVALID_FRAME_INDEX != u1_min_qp_frame_indx) { pi1_frame_index[u1_num_frms_input] = (WORD8)u1_min_qp_frame_indx; u1_num_frms_input++; } if(INVALID_FRAME_INDEX != u1_max_qp_frame_indx) { pi1_frame_index[u1_num_frms_input] = (WORD8)u1_max_qp_frame_indx; u1_num_frms_input++; } memcpy(pi1_frame_index_initial, pi1_frame_index, MAX_FRAMES_MODELLED); if(QUAD_MODEL == ps_rd_model->u1_model_used) { if(u1_num_frms_input < (MIN_FRAMES_FOR_QUAD_MODEL)) ps_rd_model->u1_model_used = LIN_MODEL; if((WORD32)u1_max_mpeg2_qp < ((WORD32)(21 * u1_min_mpeg2_qp) >> 4)) ps_rd_model->u1_model_used = LIN_MODEL; } if(LIN_MODEL == ps_rd_model->u1_model_used) { if(u1_num_frms_input < MIN_FRAMES_FOR_LIN_MODEL) ps_rd_model->u1_model_used = PREV_FRAME_MODEL; if((WORD32)u1_max_mpeg2_qp < ((WORD32)(19 * u1_min_mpeg2_qp) >> 4)) ps_rd_model->u1_model_used = PREV_FRAME_MODEL; } /***** Call the Module to Return the Coeffs for the Fed Data *****/ ps_rd_model->u1_model_used = find_model_coeffs( ps_rd_model->pi4_res_bits, ps_rd_model->pi4_sad, ps_rd_model->pu1_num_skips, ps_rd_model->pu1_avg_qp, u1_num_frms_input, ps_rd_model->u1_model_used, pi1_frame_index, model_coeff_array, model_coeff_array_lin, model_coeff_array_lin_wo_int, ps_rd_model); if((model_coeff_array_lin[2] > 0) || (model_coeff_array_lin[0] < 0)) u1_lin_model_valid = 0; else { u1_lin_model_valid = 1; /* lin deviation calculation */ calc_avg_sqr_dev_for_model( ps_rd_model->pi4_res_bits, ps_rd_model->pi4_sad, ps_rd_model->pu1_num_skips, ps_rd_model->pu1_avg_qp, u1_num_frms_input, pi1_frame_index_initial, model_coeff_array_lin, &fl_lin_avg_dev); } if(QUAD_MODEL == ps_rd_model->u1_model_used) { u1_check_model = refine_set_of_points( ps_rd_model->pi4_res_bits, ps_rd_model->pi4_sad, ps_rd_model->pu1_num_skips, ps_rd_model->pu1_avg_qp, u1_num_frms_input, pi1_frame_index, model_coeff_array, &fl_quad_avg_dev); if(2 == u1_check_model) { ps_rd_model->u1_model_used = QUAD_MODEL; } else { /*******************************************************************/ /* Make sure that some of the Pivot Points are used in the Refined */ /* data set. 1. Previous Frame */ /*******************************************************************/ /*pi1_frame_index[0] = ps_rd_model->u1_curr_frm_counter;*/ ps_rd_model->u1_model_used = find_model_coeffs( ps_rd_model->pi4_res_bits, ps_rd_model->pi4_sad, ps_rd_model->pu1_num_skips, ps_rd_model->pu1_avg_qp, u1_num_frms_input, ps_rd_model->u1_model_used, pi1_frame_index, model_coeff_array, NULL, NULL, ps_rd_model); u1_check_model = refine_set_of_points( ps_rd_model->pi4_res_bits, ps_rd_model->pi4_sad, ps_rd_model->pu1_num_skips, ps_rd_model->pu1_avg_qp, u1_num_frms_input, pi1_frame_index, model_coeff_array, &fl_quad_avg_dev); if((0 == u1_check_model)) { #if RC_MODEL_USED_BUG_FIX if((fl_lin_avg_dev < fl_quad_avg_dev) && (1 == u1_lin_model_valid)) #endif ps_rd_model->u1_model_used = LIN_MODEL; } } } if(QUAD_MODEL == ps_rd_model->u1_model_used) { /*min_res_bits = model_coeff_c - ((model_coeff_a * model_coeff_a) / (4 * model_coeff_b));*/ if(model_coeff_array[0] < 0) ps_rd_model->u1_model_used = LIN_MODEL; /*if ((model_coeff_a * model_coeff_b) > 0) u1_model_used = LIN_MODEL;*/ } if(LIN_MODEL == ps_rd_model->u1_model_used) { if((model_coeff_array_lin[2] > 0) || (model_coeff_array_lin[0] < 0)) ps_rd_model->u1_model_used = PREV_FRAME_MODEL; } #if RC_MODEL_USED_BUG_FIX /* Another threshold of .25 on deviation i.e. deviation greater than 25% */ if((QUAD_MODEL == ps_rd_model->u1_model_used) && (fl_quad_avg_dev > .25)) ps_rd_model->u1_model_used = PREV_FRAME_MODEL; if((LIN_MODEL == ps_rd_model->u1_model_used) && (fl_lin_avg_dev > .25)) ps_rd_model->u1_model_used = PREV_FRAME_MODEL; #endif /* #if RC_MODEL_USED_BUG_FIX */ ps_rd_model->model_coeff_b_quad = model_coeff_array[0]; ps_rd_model->model_coeff_a_quad = model_coeff_array[1]; ps_rd_model->model_coeff_c_quad = model_coeff_array[2]; ps_rd_model->model_coeff_b_lin = model_coeff_array_lin[0]; ps_rd_model->model_coeff_a_lin = model_coeff_array_lin[1]; ps_rd_model->model_coeff_c_lin = model_coeff_array_lin[2]; ps_rd_model->model_coeff_b_lin_wo_int = model_coeff_array_lin_wo_int[0]; ps_rd_model->model_coeff_a_lin_wo_int = model_coeff_array_lin_wo_int[1]; ps_rd_model->model_coeff_c_lin_wo_int = model_coeff_array_lin_wo_int[2]; /*ps_rd_model->u1_model_used = PREV_FRAME_MODEL;*/ } #endif /* ENABLE_QUAD_MODEL */ UWORD32 estimate_bits_for_qp(rc_rd_model_t *ps_rd_model, UWORD32 u4_estimated_sad, UWORD8 u1_avg_qp) { float fl_num_bits; /*ps_rd_model += u1_curr_pic_type;*/ { fl_num_bits = ps_rd_model->model_coeff_a_lin_wo_int * ((float)(u4_estimated_sad / u1_avg_qp)); } return ((UWORD32)fl_num_bits); } UWORD8 find_qp_for_target_bits( rc_rd_model_t *ps_rd_model, UWORD32 u4_target_res_bits, UWORD32 u4_estimated_sad, UWORD8 u1_min_qp, UWORD8 u1_max_qp) { UWORD8 u1_qp; float x_value, f_qp; /*ps_rd_model += u1_curr_pic_type;*/ #if ENABLE_QUAD_MODEL if(QUAD_MODEL == ps_rd_model->u1_model_used) { float det; det = (ps_rd_model->model_coeff_a_quad * ps_rd_model->model_coeff_a_quad) - (4 * (ps_rd_model->model_coeff_b_quad) * (ps_rd_model->model_coeff_c_quad - u4_target_res_bits)); if(det > 0) { x_value = sqrt(det); x_value = (x_value - ps_rd_model->model_coeff_a_quad) / (2 * ps_rd_model->model_coeff_b_quad); } else ps_rd_model->u1_model_used = PREV_FRAME_MODEL; } if(LIN_MODEL == ps_rd_model->u1_model_used) { x_value = ((float)u4_target_res_bits - ps_rd_model->model_coeff_c_lin) / (ps_rd_model->model_coeff_b_lin); } #else ps_rd_model->u1_model_used = PREV_FRAME_MODEL; #endif if(PREV_FRAME_MODEL == ps_rd_model->u1_model_used) { x_value = (float)u4_target_res_bits / ps_rd_model->model_coeff_a_lin_wo_int; } if(0 != x_value) f_qp = u4_estimated_sad / x_value; else f_qp = 255; if(f_qp > 255) f_qp = 255; /* Truncating the QP to the Max and Min Qp values possible */ if(f_qp < u1_min_qp) f_qp = u1_min_qp; if(f_qp > u1_max_qp) f_qp = u1_max_qp; u1_qp = (UWORD8)(f_qp + 0.5); return u1_qp; } void add_frame_to_rd_model( rc_rd_model_t *ps_rd_model, UWORD32 i4_res_bits, UWORD8 u1_avg_mp2qp, UWORD32 i4_sad_h264, UWORD8 u1_num_skips) { UWORD8 u1_curr_frame_index; /*ps_rd_model += u1_curr_pic_type;*/ u1_curr_frame_index = ps_rd_model->u1_curr_frm_counter; /*** Insert the Present Frame Data into the RD Model State Memory ***/ ps_rd_model->pi4_res_bits[u1_curr_frame_index] = i4_res_bits; ps_rd_model->pi4_sad[u1_curr_frame_index] = i4_sad_h264; ps_rd_model->pu1_num_skips[u1_curr_frame_index] = u1_num_skips; ps_rd_model->pu1_avg_qp[u1_curr_frame_index] = u1_avg_mp2qp; ps_rd_model->u1_curr_frm_counter++; if(MAX_FRAMES_MODELLED == ps_rd_model->u1_curr_frm_counter) ps_rd_model->u1_curr_frm_counter = 0; if(ps_rd_model->u1_num_frms_in_model < ps_rd_model->u1_max_frms_to_model) { ps_rd_model->u1_num_frms_in_model++; } update_frame_rd_model(ps_rd_model); } WORD32 calc_per_frm_bits( rc_rd_model_t *ps_rd_model, /* array of model structs */ UWORD16 *pu2_num_pics_of_a_pic_type, /* N1, N2,...Nk */ UWORD8 * pu1_update_pic_type_model, /* flag which tells whether or not to update model coefficients of a particular pic-type */ UWORD8 u1_num_pic_types, /* value of k */ UWORD32 * pu4_num_skip_of_a_pic_type, /* the number of skips of that pic-type. It "may" be used to update the model coefficients at a later point. Right now it is not being used at all. */ UWORD8 u1_base_pic_type, /* base pic type index wrt which alpha & beta are calculated */ float *pfl_gamma, /* gamma_i = beta_i / alpha_i */ float *pfl_eta, UWORD8 u1_curr_pic_type, /* the current pic-type for which the targetted bits need to be computed */ UWORD32 u4_bits_for_sub_gop, /* the number of bits to be consumed for the remaining part of sub-gop */ UWORD32 u4_curr_estimated_sad, UWORD8 *pu1_curr_pic_type_qp) /* output of this function */ { WORD32 i4_per_frm_bits_Ti; UWORD8 u1_i; rc_rd_model_t *ps_rd_model_of_pic_type; /* first part of this function updates all the model coefficients */ /*for all the pic-types */ { for(u1_i = 0; u1_i < u1_num_pic_types; u1_i++) { if((0 != pu2_num_pics_of_a_pic_type[u1_i]) && (1 == pu1_update_pic_type_model[u1_i])) { /* ps_rd_model_of_pic_type = ps_rd_model + u1_i; */ update_frame_rd_model(&ps_rd_model[u1_i]); } } } /* The second part of this function deals with solving the equation using all the pic-types models */ { UWORD8 u1_combined_model_used; /* first choose the model to be used */ u1_combined_model_used = QUAD_MODEL; for(u1_i = 0; u1_i < u1_num_pic_types; u1_i++) { ps_rd_model_of_pic_type = ps_rd_model + u1_i; if((0 != pu2_num_pics_of_a_pic_type[u1_i]) && (QUAD_MODEL != ps_rd_model_of_pic_type->u1_model_used)) { u1_combined_model_used = LIN_MODEL; break; } } if(u1_combined_model_used == LIN_MODEL) { for(u1_i = 0; u1_i < u1_num_pic_types; u1_i++) { ps_rd_model_of_pic_type = ps_rd_model + u1_i; if((0 != pu2_num_pics_of_a_pic_type[u1_i]) && (QUAD_MODEL != ps_rd_model_of_pic_type->u1_model_used) && (LIN_MODEL != ps_rd_model_of_pic_type->u1_model_used)) { u1_combined_model_used = PREV_FRAME_MODEL; break; } } } /* solve the equation for the */ { model_coeff eff_A; model_coeff eff_B; model_coeff eff_C; float fl_determinant; float fl_sad_by_qp_base; float fl_sad_by_qp_curr_frm; float fl_qp_curr_frm; float fl_bits_for_curr_frm; /* If the combined chosen model is quad model */ if(QUAD_MODEL == u1_combined_model_used) { eff_A = 0.0; eff_B = 0.0; eff_C = 0.0; for(u1_i = 0; u1_i < u1_num_pic_types; u1_i++) { ps_rd_model_of_pic_type = ps_rd_model + u1_i; eff_A += ((pfl_eta[u1_i] + pu2_num_pics_of_a_pic_type[u1_i] - 1) * ps_rd_model_of_pic_type->model_coeff_a_quad * pfl_gamma[u1_i]); eff_B += ((pfl_eta[u1_i] * pfl_eta[u1_i] + pu2_num_pics_of_a_pic_type[u1_i] - 1) * ps_rd_model_of_pic_type->model_coeff_b_quad * pfl_gamma[u1_i] * pfl_gamma[u1_i]); eff_C += (pu2_num_pics_of_a_pic_type[u1_i] * ps_rd_model_of_pic_type->model_coeff_c_quad); } eff_C -= u4_bits_for_sub_gop; fl_determinant = eff_A * eff_A - 4 * eff_B * eff_C; if(fl_determinant < 0) { u1_combined_model_used = PREV_FRAME_MODEL; /* TO BE replaced by LIN_MODEL later */ } else { fl_determinant = sqrt(fl_determinant); fl_sad_by_qp_base = fl_determinant - eff_A; fl_sad_by_qp_base = fl_sad_by_qp_base / (2 * eff_B); fl_sad_by_qp_curr_frm = fl_sad_by_qp_base * pfl_gamma[u1_curr_pic_type] * pfl_eta[u1_curr_pic_type]; ps_rd_model_of_pic_type = ps_rd_model + u1_curr_pic_type; fl_bits_for_curr_frm = ps_rd_model_of_pic_type->model_coeff_a_quad * fl_sad_by_qp_curr_frm + ps_rd_model_of_pic_type->model_coeff_b_quad * fl_sad_by_qp_curr_frm * fl_sad_by_qp_curr_frm + ps_rd_model_of_pic_type->model_coeff_c_quad; } } /* If the combined chosen model is linear model with an intercept */ if(LIN_MODEL == u1_combined_model_used) { eff_A = 0.0; eff_B = 0.0; eff_C = 0.0; for(u1_i = 0; u1_i < u1_num_pic_types; u1_i++) { ps_rd_model_of_pic_type = ps_rd_model + u1_i; eff_A += ((pfl_eta[u1_i] + pu2_num_pics_of_a_pic_type[u1_i] - 1) * ps_rd_model_of_pic_type->model_coeff_a_lin * pfl_gamma[u1_i]); eff_C += (pu2_num_pics_of_a_pic_type[u1_i] * ps_rd_model_of_pic_type->model_coeff_c_lin); } eff_C -= u4_bits_for_sub_gop; fl_determinant = (-(eff_C / eff_A)); if((fl_determinant) <= 0) { u1_combined_model_used = PREV_FRAME_MODEL; } else { fl_sad_by_qp_base = fl_determinant; fl_sad_by_qp_curr_frm = fl_sad_by_qp_base * pfl_gamma[u1_curr_pic_type] * pfl_eta[u1_curr_pic_type]; ps_rd_model_of_pic_type = ps_rd_model + u1_curr_pic_type; fl_bits_for_curr_frm = ps_rd_model_of_pic_type->model_coeff_a_lin * fl_sad_by_qp_curr_frm + ps_rd_model_of_pic_type->model_coeff_c_lin; } } /* If the combined chosen model is linear model without an intercept */ if(PREV_FRAME_MODEL == u1_combined_model_used) { eff_A = 0.0; eff_B = 0.0; eff_C = 0.0; for(u1_i = 0; u1_i < u1_num_pic_types; u1_i++) { ps_rd_model_of_pic_type = ps_rd_model + u1_i; eff_A += ((pfl_eta[u1_i] + pu2_num_pics_of_a_pic_type[u1_i] - 1) * ps_rd_model_of_pic_type->model_coeff_a_lin_wo_int * pfl_gamma[u1_i]); } fl_sad_by_qp_base = u4_bits_for_sub_gop / eff_A; fl_sad_by_qp_curr_frm = fl_sad_by_qp_base * pfl_gamma[u1_curr_pic_type] * pfl_eta[u1_curr_pic_type]; ps_rd_model_of_pic_type = ps_rd_model + u1_curr_pic_type; fl_bits_for_curr_frm = ps_rd_model_of_pic_type->model_coeff_a_lin_wo_int * fl_sad_by_qp_curr_frm; } /* store the model that was finally used to calculate Qp. This is so that the same model is used in further calculations for this picture. */ ps_rd_model_of_pic_type = ps_rd_model + u1_curr_pic_type; ps_rd_model_of_pic_type->u1_model_used = u1_combined_model_used; i4_per_frm_bits_Ti = (WORD32)(fl_bits_for_curr_frm + 0.5); if(fl_sad_by_qp_curr_frm > 0) fl_qp_curr_frm = (float)u4_curr_estimated_sad / fl_sad_by_qp_curr_frm; else fl_qp_curr_frm = 255; if(fl_qp_curr_frm > 255) fl_qp_curr_frm = 255; *pu1_curr_pic_type_qp = (fl_qp_curr_frm + 0.5); } } return (i4_per_frm_bits_Ti); } model_coeff get_linear_coefficient(rc_rd_model_t *ps_rd_model) { /*UWORD32 linear_coeff: linear_coeff = ps_rd_model->model_coeff_a_lin_wo_int;*/ return (ps_rd_model->model_coeff_a_lin_wo_int); } #endif /* !(RC_FIXED_POINT) */ WORD32 rc_rd_model_dummy_for_avoiding_warnings( rc_rd_model_t **pps_rc_rd_model, itt_memtab_t *ps_memtab, ITT_FUNC_TYPE_E e_func_type) { WORD32 i4_mem_tab_idx = 0; static rc_rd_model_t s_rc_rd_model_temp; /* Hack for al alloc, during which we dont have any state memory. Dereferencing can cause issues */ if(e_func_type == GET_NUM_MEMTAB || e_func_type == FILL_MEMTAB) (*pps_rc_rd_model) = &s_rc_rd_model_temp; /*for src rate control state structure*/ if(e_func_type != GET_NUM_MEMTAB) { fill_memtab( &ps_memtab[i4_mem_tab_idx], sizeof(rc_rd_model_t), MEM_TAB_ALIGNMENT, PERSISTENT, DDR); use_or_fill_base(&ps_memtab[0], (void **)pps_rc_rd_model, e_func_type); } i4_mem_tab_idx++; return (i4_mem_tab_idx); }