| /****************************************************************************** |
| * |
| * Copyright (C) 2015 The Android Open Source Project |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at: |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| * |
| ***************************************************************************** |
| * Originally developed and contributed by Ittiam Systems Pvt. Ltd, Bangalore |
| */ |
| |
| /****************************************************************************/ |
| /* File Name : irc_rd_model.c */ |
| /* */ |
| /* Description : Implall the Functions to Model the */ |
| /* Rate Distortion Behaviour of the Codec over the Last */ |
| /* Few Frames. */ |
| /* */ |
| /* List of Functions : irc_update_frame_rd_model */ |
| /* estimate_mpeg2_qp_for_resbits */ |
| /* */ |
| /* Issues / Problems : None */ |
| /* */ |
| /* Revision History : */ |
| /* DD MM YYYY Author(s) Changes (Describe the changes made) */ |
| /* 21 06 2006 Sarat Initial Version */ |
| /****************************************************************************/ |
| |
| /* System include files */ |
| #include <stdarg.h> |
| #include <stdlib.h> |
| #include <stdio.h> |
| #include <string.h> |
| #include "math.h" |
| |
| /* User include files */ |
| #include "irc_datatypes.h" |
| #include "irc_common.h" |
| #include "irc_mem_req_and_acq.h" |
| #include "irc_rd_model.h" |
| #include "irc_rd_model_struct.h" |
| |
| |
| WORD32 irc_rd_model_num_fill_use_free_memtab(rc_rd_model_t **pps_rc_rd_model, |
| itt_memtab_t *ps_memtab, |
| ITT_FUNC_TYPE_E e_func_type) |
| { |
| WORD32 i4_mem_tab_idx = 0; |
| rc_rd_model_t s_rc_rd_model_temp; |
| |
| /* |
| * Hack for al alloc, during which we don't have any state memory. |
| * Dereferencing can cause issues |
| */ |
| if(e_func_type == GET_NUM_MEMTAB || e_func_type == FILL_MEMTAB) |
| (*pps_rc_rd_model) = &s_rc_rd_model_temp; |
| |
| /*for src rate control state structure*/ |
| if(e_func_type != GET_NUM_MEMTAB) |
| { |
| fill_memtab(&ps_memtab[i4_mem_tab_idx], sizeof(rc_rd_model_t), |
| ALIGN_128_BYTE, PERSISTENT, DDR); |
| use_or_fill_base(&ps_memtab[0], (void**)pps_rc_rd_model, e_func_type); |
| } |
| i4_mem_tab_idx++; |
| |
| return (i4_mem_tab_idx); |
| } |
| |
| void irc_init_frm_rc_rd_model(rc_rd_model_t *ps_rd_model, |
| UWORD8 u1_max_frames_modelled) |
| { |
| |
| ps_rd_model->u1_num_frms_in_model = 0; |
| ps_rd_model->u1_curr_frm_counter = 0; |
| ps_rd_model->u1_max_frms_to_model = u1_max_frames_modelled; |
| |
| ps_rd_model->model_coeff_a_lin_wo_int = 0; |
| ps_rd_model->model_coeff_b_lin_wo_int = 0; |
| ps_rd_model->model_coeff_c_lin_wo_int = 0; |
| } |
| |
| void irc_reset_frm_rc_rd_model(rc_rd_model_t *ps_rd_model) |
| { |
| ps_rd_model->u1_num_frms_in_model = 0; |
| ps_rd_model->u1_curr_frm_counter = 0; |
| |
| ps_rd_model->model_coeff_a_lin_wo_int = 0; |
| ps_rd_model->model_coeff_b_lin_wo_int = 0; |
| ps_rd_model->model_coeff_c_lin_wo_int = 0; |
| } |
| |
| static UWORD8 find_model_coeffs(UWORD32 *pi4_res_bits, |
| UWORD32 *pi4_sad_h264, |
| UWORD8 *pu1_num_skips, |
| UWORD8 *pui_avg_mpeg2_qp, |
| UWORD8 u1_num_frms, |
| UWORD8 u1_model_used, |
| WORD8 *pi1_frame_index, |
| model_coeff *pmc_model_coeff, |
| model_coeff *pmc_model_coeff_lin, |
| model_coeff *pmc_model_coeff_lin_wo_int, |
| rc_rd_model_t *ps_rd_model) |
| { |
| UWORD32 i; |
| UWORD8 u1_num_frms_used = 0; |
| UWORD8 u1_frm_indx; |
| |
| float sum_y = 0; |
| float sum_x_y = 0; |
| float sum_x2_y = 0; |
| float sum_x = 0; |
| float sum_x2 = 0; |
| float sum_x3 = 0; |
| float sum_x4 = 0; |
| |
| float x0, y0; |
| float model_coeff_a = 0.0, model_coeff_b = 0.0, model_coeff_c = 0.0; |
| |
| #if !(ENABLE_QUAD_RC_MODEL||ENABLE_LIN_MODEL_WITH_INTERCEPT) |
| UNUSED(pu1_num_skips); |
| UNUSED(pmc_model_coeff); |
| UNUSED(pmc_model_coeff_lin); |
| #endif |
| |
| for(i = 0; i < u1_num_frms; i++) |
| { |
| if(-1 == pi1_frame_index[i]) |
| continue; |
| |
| u1_frm_indx = (UWORD8)pi1_frame_index[i]; |
| |
| y0 = (float)(pi4_res_bits[u1_frm_indx]); |
| x0 = (float)(pi4_sad_h264[u1_frm_indx] |
| / (float)pui_avg_mpeg2_qp[u1_frm_indx]); |
| |
| sum_y += y0; |
| sum_x_y += x0 * y0; |
| sum_x2_y += x0 * x0 * y0; |
| sum_x += x0; |
| sum_x2 += x0 * x0; |
| sum_x3 += x0 * x0 * x0; |
| sum_x4 += x0 * x0 * x0 * x0; |
| u1_num_frms_used++; |
| } |
| |
| sum_y /= u1_num_frms_used; |
| sum_x_y /= u1_num_frms_used; |
| sum_x2_y /= u1_num_frms_used; |
| sum_x /= u1_num_frms_used; |
| sum_x2 /= u1_num_frms_used; |
| sum_x3 /= u1_num_frms_used; |
| sum_x4 /= u1_num_frms_used; |
| |
| { |
| UWORD8 u1_curr_frame_index; |
| UWORD8 u1_avgqp_prvfrm; |
| UWORD32 u4_prevfrm_bits, u4_prevfrm_sad; |
| |
| u1_curr_frame_index = ps_rd_model->u1_curr_frm_counter; |
| if(0 == u1_curr_frame_index) |
| u1_curr_frame_index = (MAX_FRAMES_MODELLED - 1); |
| else |
| u1_curr_frame_index--; |
| |
| u1_avgqp_prvfrm = ps_rd_model->pu1_avg_qp[u1_curr_frame_index]; |
| u4_prevfrm_bits = ps_rd_model->pi4_res_bits[u1_curr_frame_index]; |
| u4_prevfrm_sad = ps_rd_model->pi4_sad[u1_curr_frame_index]; |
| |
| if(0 != u4_prevfrm_sad) |
| model_coeff_a = (float)(u4_prevfrm_bits * u1_avgqp_prvfrm) |
| / u4_prevfrm_sad; |
| else |
| model_coeff_a = 0; |
| |
| model_coeff_b = 0; |
| model_coeff_c = 0; |
| |
| pmc_model_coeff_lin_wo_int[0] = model_coeff_b; |
| pmc_model_coeff_lin_wo_int[1] = model_coeff_a; |
| pmc_model_coeff_lin_wo_int[2] = model_coeff_c; |
| } |
| |
| return u1_model_used; |
| } |
| |
| static void irc_update_frame_rd_model(rc_rd_model_t *ps_rd_model) |
| { |
| WORD8 pi1_frame_index[MAX_FRAMES_MODELLED], |
| pi1_frame_index_initial[MAX_FRAMES_MODELLED]; |
| |
| UWORD8 u1_num_skips_temp; |
| UWORD8 u1_avg_mpeg2_qp_temp, u1_min_mpeg2_qp, u1_max_mpeg2_qp; |
| UWORD8 u1_num_frms_input, u1_num_active_frames, u1_reject_frame; |
| UWORD32 u4_num_skips; |
| |
| UWORD8 u1_min2_mpeg2_qp, u1_max2_mpeg2_qp; |
| UWORD8 u1_min_qp_frame_indx, u1_max_qp_frame_indx; |
| UWORD8 pu1_num_frames[MPEG2_QP_ELEM]; |
| model_coeff model_coeff_array[3], model_coeff_array_lin[3], |
| model_coeff_array_lin_wo_int[3]; |
| UWORD32 i; |
| UWORD8 u1_curr_frame_index; |
| |
| u1_curr_frame_index = ps_rd_model->u1_curr_frm_counter; |
| |
| ps_rd_model->u1_model_used = PREV_FRAME_MODEL; |
| |
| if(0 == u1_curr_frame_index) |
| u1_curr_frame_index = (MAX_FRAMES_MODELLED - 1); |
| else |
| u1_curr_frame_index--; |
| |
| /************************************************************************/ |
| /* Rearrange data to be fed into a Linear Regression Module */ |
| /* Module finds a,b,c such that */ |
| /* y = ax + bx^2 + c */ |
| /************************************************************************/ |
| u4_num_skips = 0; |
| u1_num_frms_input = 0; |
| memset(pu1_num_frames, 0, MPEG2_QP_ELEM); |
| memset(pi1_frame_index, -1, MAX_FRAMES_MODELLED); |
| u1_min_mpeg2_qp = MAX_MPEG2_QP; |
| u1_max_mpeg2_qp = 0; |
| |
| u1_num_active_frames = ps_rd_model->u1_num_frms_in_model; |
| if(u1_num_active_frames > MAX_ACTIVE_FRAMES) |
| { |
| u1_num_active_frames = MAX_ACTIVE_FRAMES; |
| } |
| |
| /************************************************************************/ |
| /* Choose the set of Points to be used for MSE fit of Quadratic model */ |
| /* Points chosen are spread across the Qp range. Max of 2 points are */ |
| /* chosen for a Qp. */ |
| /************************************************************************/ |
| for(i = 0; i < u1_num_active_frames; i++) |
| { |
| u1_reject_frame = 0; |
| u1_num_skips_temp = ps_rd_model->pu1_num_skips[u1_curr_frame_index]; |
| u1_avg_mpeg2_qp_temp = ps_rd_model->pu1_avg_qp[u1_curr_frame_index]; |
| |
| if((0 == u4_num_skips) && (0 != u1_num_skips_temp)) |
| u1_reject_frame = 1; |
| if((1 == u4_num_skips) && (u1_num_skips_temp > 1)) |
| u1_reject_frame = 1; |
| if(pu1_num_frames[u1_avg_mpeg2_qp_temp] >= 2) |
| u1_reject_frame = 1; |
| |
| if(0 == i) |
| u1_reject_frame = 0; |
| |
| if(0 == u1_reject_frame) |
| { |
| pi1_frame_index[u1_num_frms_input] = (WORD8)u1_curr_frame_index; |
| pu1_num_frames[u1_avg_mpeg2_qp_temp] += 1; |
| |
| if(u1_min_mpeg2_qp > u1_avg_mpeg2_qp_temp) |
| u1_min_mpeg2_qp = u1_avg_mpeg2_qp_temp; |
| if(u1_max_mpeg2_qp < u1_avg_mpeg2_qp_temp) |
| u1_max_mpeg2_qp = u1_avg_mpeg2_qp_temp; |
| |
| u1_num_frms_input++; |
| } |
| |
| if(0 == u1_curr_frame_index) |
| u1_curr_frame_index = (MAX_FRAMES_MODELLED - 1); |
| else |
| u1_curr_frame_index--; |
| } |
| |
| /************************************************************************/ |
| /* Add Pivot Points to the Data set to be used for finding Quadratic */ |
| /* Model Coeffs. These will help in constraining the shape of Quadratic*/ |
| /* to adapt too much to the Local deviations. */ |
| /************************************************************************/ |
| u1_min2_mpeg2_qp = u1_min_mpeg2_qp; |
| u1_max2_mpeg2_qp = u1_max_mpeg2_qp; |
| u1_min_qp_frame_indx = INVALID_FRAME_INDEX; |
| u1_max_qp_frame_indx = INVALID_FRAME_INDEX; |
| |
| /* Loop runnning over the Stored Frame Level Data |
| to find frames of MinQp and MaxQp */ |
| for(; i < ps_rd_model->u1_num_frms_in_model; i++) |
| { |
| u1_num_skips_temp = ps_rd_model->pu1_num_skips[u1_curr_frame_index]; |
| u1_avg_mpeg2_qp_temp = ps_rd_model->pu1_avg_qp[u1_curr_frame_index]; |
| |
| if(((0 == u4_num_skips) && (0 != u1_num_skips_temp)) |
| || ((1 == u4_num_skips) && (u1_num_skips_temp > 1))) |
| continue; |
| |
| if(u1_min2_mpeg2_qp > u1_avg_mpeg2_qp_temp) |
| { |
| u1_min2_mpeg2_qp = u1_avg_mpeg2_qp_temp; |
| u1_min_qp_frame_indx = u1_curr_frame_index; |
| } |
| if(u1_max2_mpeg2_qp < u1_avg_mpeg2_qp_temp) |
| { |
| u1_max2_mpeg2_qp = u1_avg_mpeg2_qp_temp; |
| u1_max_qp_frame_indx = u1_curr_frame_index; |
| } |
| if(0 == u1_curr_frame_index) |
| u1_curr_frame_index = (MAX_FRAMES_MODELLED - 1); |
| else |
| u1_curr_frame_index--; |
| } |
| |
| /* Add the Chosen Points to the regression data set */ |
| if(INVALID_FRAME_INDEX != u1_min_qp_frame_indx) |
| { |
| pi1_frame_index[u1_num_frms_input] = (WORD8)u1_min_qp_frame_indx; |
| u1_num_frms_input++; |
| } |
| if(INVALID_FRAME_INDEX != u1_max_qp_frame_indx) |
| { |
| pi1_frame_index[u1_num_frms_input] = (WORD8)u1_max_qp_frame_indx; |
| u1_num_frms_input++; |
| } |
| memcpy(pi1_frame_index_initial, pi1_frame_index, MAX_FRAMES_MODELLED); |
| |
| /***** Call the Module to Return the Coeffs for the Fed Data *****/ |
| ps_rd_model->u1_model_used = find_model_coeffs(ps_rd_model->pi4_res_bits, |
| ps_rd_model->pi4_sad, |
| ps_rd_model->pu1_num_skips, |
| ps_rd_model->pu1_avg_qp, |
| u1_num_frms_input, |
| ps_rd_model->u1_model_used, |
| pi1_frame_index, |
| model_coeff_array, |
| model_coeff_array_lin, |
| model_coeff_array_lin_wo_int, |
| ps_rd_model); |
| |
| ps_rd_model->model_coeff_b_lin_wo_int = model_coeff_array_lin_wo_int[0]; |
| ps_rd_model->model_coeff_a_lin_wo_int = model_coeff_array_lin_wo_int[1]; |
| ps_rd_model->model_coeff_c_lin_wo_int = model_coeff_array_lin_wo_int[2]; |
| } |
| |
| UWORD32 irc_estimate_bits_for_qp(rc_rd_model_t *ps_rd_model, |
| UWORD32 u4_estimated_sad, |
| UWORD8 u1_avg_qp) |
| { |
| float fl_num_bits = 0; |
| |
| fl_num_bits = ps_rd_model->model_coeff_a_lin_wo_int |
| * ((float)(u4_estimated_sad / u1_avg_qp)); |
| |
| return ((UWORD32)fl_num_bits); |
| } |
| |
| UWORD8 irc_find_qp_for_target_bits(rc_rd_model_t *ps_rd_model, |
| UWORD32 u4_target_res_bits, |
| UWORD32 u4_estimated_sad, |
| UWORD8 u1_min_qp, |
| UWORD8 u1_max_qp) |
| { |
| UWORD8 u1_qp; |
| float x_value = 1.0, f_qp; |
| |
| ps_rd_model->u1_model_used = PREV_FRAME_MODEL; |
| |
| { |
| x_value = (float)u4_target_res_bits |
| / ps_rd_model->model_coeff_a_lin_wo_int; |
| } |
| |
| if(0 != x_value) |
| f_qp = u4_estimated_sad / x_value; |
| else |
| f_qp = 255; |
| |
| if(f_qp > 255) |
| f_qp = 255; |
| |
| /* Truncating the QP to the Max and Min Qp values possible */ |
| if(f_qp < u1_min_qp) |
| f_qp = u1_min_qp; |
| if(f_qp > u1_max_qp) |
| f_qp = u1_max_qp; |
| |
| u1_qp = (UWORD8)(f_qp + 0.5); |
| |
| return u1_qp; |
| } |
| |
| void irc_add_frame_to_rd_model(rc_rd_model_t *ps_rd_model, |
| UWORD32 i4_res_bits, |
| UWORD8 u1_avg_mp2qp, |
| UWORD32 i4_sad_h264, |
| UWORD8 u1_num_skips) |
| { |
| UWORD8 u1_curr_frame_index; |
| u1_curr_frame_index = ps_rd_model->u1_curr_frm_counter; |
| |
| /*Insert the Present Frame Data into the RD Model State Memory*/ |
| ps_rd_model->pi4_res_bits[u1_curr_frame_index] = i4_res_bits; |
| ps_rd_model->pi4_sad[u1_curr_frame_index] = i4_sad_h264; |
| ps_rd_model->pu1_num_skips[u1_curr_frame_index] = u1_num_skips; |
| ps_rd_model->pu1_avg_qp[u1_curr_frame_index] = u1_avg_mp2qp; |
| |
| ps_rd_model->u1_curr_frm_counter++; |
| if(MAX_FRAMES_MODELLED == ps_rd_model->u1_curr_frm_counter) |
| ps_rd_model->u1_curr_frm_counter = 0; |
| |
| if(ps_rd_model->u1_num_frms_in_model < ps_rd_model->u1_max_frms_to_model) |
| { |
| ps_rd_model->u1_num_frms_in_model++; |
| } |
| irc_update_frame_rd_model(ps_rd_model); |
| } |
| |
| /***************************************************************************** |
| *Function Name : irc_calc_per_frm_bits |
| *Description : |
| *Inputs : pu2_num_pics_of_a_pic_type |
| * - pointer to RC api pointer |
| * pu2_num_pics_of_a_pic_type |
| * - N1, N2,...Nk |
| * pu1_update_pic_type_model |
| * - flag which tells whether or not to update model |
| * coefficients of a particular pic-type |
| * u1_num_pic_types |
| * - value of k |
| * pu4_num_skip_of_a_pic_type |
| * - the number of skips of that pic-type. It "may" be used to |
| * update the model coefficients at a later point. Right now |
| * it is not being used at all. |
| * u1_base_pic_type |
| * - base pic type index wrt which alpha & beta are calculated |
| * pfl_gamma |
| * - gamma_i = beta_i / alpha_i |
| * pfl_eta |
| * - |
| * u1_curr_pic_type |
| * - the current pic-type for which the targetted bits need to |
| * be computed |
| * u4_bits_for_sub_gop |
| * - the number of bits to be consumed for the remaining part of |
| * sub-gop |
| * u4_curr_estimated_sad |
| * - |
| * pu1_curr_pic_type_qp |
| * - output of this function |
| *****************************************************************************/ |
| |
| WORD32 irc_calc_per_frm_bits(rc_rd_model_t *ps_rd_model, |
| UWORD16 *pu2_num_pics_of_a_pic_type, |
| UWORD8 *pu1_update_pic_type_model, |
| UWORD8 u1_num_pic_types, |
| UWORD32 *pu4_num_skip_of_a_pic_type, |
| UWORD8 u1_base_pic_type, |
| float *pfl_gamma, |
| float *pfl_eta, |
| UWORD8 u1_curr_pic_type, |
| UWORD32 u4_bits_for_sub_gop, |
| UWORD32 u4_curr_estimated_sad, |
| UWORD8 *pu1_curr_pic_type_qp) |
| { |
| WORD32 i4_per_frm_bits_Ti; |
| UWORD8 u1_i; |
| rc_rd_model_t *ps_rd_model_of_pic_type; |
| |
| UNUSED(pu4_num_skip_of_a_pic_type); |
| UNUSED(u1_base_pic_type); |
| |
| /* First part of this function updates all the model coefficients */ |
| /*for all the pic-types */ |
| { |
| for(u1_i = 0; u1_i < u1_num_pic_types; u1_i++) |
| { |
| if((0 != pu2_num_pics_of_a_pic_type[u1_i]) |
| && (1 == pu1_update_pic_type_model[u1_i])) |
| { |
| irc_update_frame_rd_model(&ps_rd_model[u1_i]); |
| } |
| } |
| } |
| |
| /* |
| * The second part of this function deals with solving the |
| * equation using all the pic-types models |
| */ |
| { |
| UWORD8 u1_combined_model_used; |
| |
| /* solve the equation */ |
| { |
| model_coeff eff_A; |
| float fl_sad_by_qp_base; |
| float fl_sad_by_qp_curr_frm = 1.0; |
| float fl_qp_curr_frm; |
| float fl_bits_for_curr_frm = 0; |
| |
| |
| |
| /* If the combined chosen model is linear model without an intercept */ |
| |
| u1_combined_model_used = PREV_FRAME_MODEL; |
| { |
| eff_A = 0.0; |
| |
| for(u1_i = 0; u1_i < u1_num_pic_types; u1_i++) |
| { |
| ps_rd_model_of_pic_type = ps_rd_model + u1_i; |
| |
| eff_A += ((pfl_eta[u1_i] |
| + pu2_num_pics_of_a_pic_type[u1_i]- 1) |
| * ps_rd_model_of_pic_type->model_coeff_a_lin_wo_int |
| * pfl_gamma[u1_i]); |
| } |
| |
| fl_sad_by_qp_base = u4_bits_for_sub_gop / eff_A; |
| |
| fl_sad_by_qp_curr_frm = fl_sad_by_qp_base |
| * pfl_gamma[u1_curr_pic_type] |
| * pfl_eta[u1_curr_pic_type]; |
| |
| ps_rd_model_of_pic_type = ps_rd_model + u1_curr_pic_type; |
| |
| fl_bits_for_curr_frm = |
| ps_rd_model_of_pic_type->model_coeff_a_lin_wo_int |
| * fl_sad_by_qp_curr_frm; |
| } |
| |
| /* |
| * Store the model that was finally used to calculate Qp. |
| * This is so that the same model is used in further calculations |
| * for this picture. |
| */ |
| ps_rd_model_of_pic_type = ps_rd_model + u1_curr_pic_type; |
| ps_rd_model_of_pic_type->u1_model_used = u1_combined_model_used; |
| |
| i4_per_frm_bits_Ti = (WORD32)(fl_bits_for_curr_frm + 0.5); |
| |
| if(fl_sad_by_qp_curr_frm > 0) |
| fl_qp_curr_frm = (float)u4_curr_estimated_sad |
| / fl_sad_by_qp_curr_frm; |
| else |
| fl_qp_curr_frm = 255; |
| |
| if(fl_qp_curr_frm > 255) |
| fl_qp_curr_frm = 255; |
| |
| *pu1_curr_pic_type_qp = (fl_qp_curr_frm + 0.5); |
| |
| } |
| } |
| return (i4_per_frm_bits_Ti); |
| } |
| |
| model_coeff irc_get_linear_coefficient(rc_rd_model_t *ps_rd_model) |
| { |
| return (ps_rd_model->model_coeff_a_lin_wo_int); |
| } |
| |
| |