libavc/encoder/irc_rd_model.c
Ram Mohan M 50fd862b8d libavcenc: Remove duplicate code and improve readability
This commit does not introduce any new functionality w.r.t previous
commit. But it fixes few things. They are listed below:
1. Guard Bands in header files are fixed
2. Header files contains function definition comments. These are same
as in source file. Maintaining same comment at two locations is
unnecessary. These are removed.
3. Improved consistency and code indentation
4. Removed comments that dont align with implementation
5. Grouped headers of a workspace together
2023-10-01 01:37:17 +05:30

564 lines
20 KiB
C

/******************************************************************************
*
* Copyright (C) 2015 The Android Open Source Project
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at:
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*
*****************************************************************************
* Originally developed and contributed by Ittiam Systems Pvt. Ltd, Bangalore
*/
/****************************************************************************/
/* File Name : irc_rd_model.c */
/* */
/* Description : Implall the Functions to Model the */
/* Rate Distortion Behaviour of the Codec over the Last */
/* Few Frames. */
/* */
/* List of Functions : irc_update_frame_rd_model */
/* estimate_mpeg2_qp_for_resbits */
/* */
/* Issues / Problems : None */
/* */
/* Revision History : */
/* DD MM YYYY Author(s) Changes (Describe the changes made) */
/* 21 06 2006 Sarat Initial Version */
/****************************************************************************/
/* System include files */
#include <stdarg.h>
#include <stdlib.h>
#include <stdio.h>
#include <string.h>
#include "math.h"
/* User include files */
#include "irc_datatypes.h"
#include "irc_common.h"
#include "irc_mem_req_and_acq.h"
#include "irc_rd_model.h"
#include "irc_rd_model_struct.h"
WORD32 irc_rd_model_num_fill_use_free_memtab(rc_rd_model_t **pps_rc_rd_model,
itt_memtab_t *ps_memtab,
ITT_FUNC_TYPE_E e_func_type)
{
WORD32 i4_mem_tab_idx = 0;
rc_rd_model_t s_rc_rd_model_temp;
/*
* Hack for al alloc, during which we don't have any state memory.
* Dereferencing can cause issues
*/
if(e_func_type == GET_NUM_MEMTAB || e_func_type == FILL_MEMTAB)
(*pps_rc_rd_model) = &s_rc_rd_model_temp;
/*for src rate control state structure*/
if(e_func_type != GET_NUM_MEMTAB)
{
fill_memtab(&ps_memtab[i4_mem_tab_idx], sizeof(rc_rd_model_t),
ALIGN_128_BYTE, PERSISTENT, DDR);
use_or_fill_base(&ps_memtab[0], (void**)pps_rc_rd_model, e_func_type);
}
i4_mem_tab_idx++;
return (i4_mem_tab_idx);
}
void irc_init_frm_rc_rd_model(rc_rd_model_t *ps_rd_model,
UWORD8 u1_max_frames_modelled)
{
ps_rd_model->u1_num_frms_in_model = 0;
ps_rd_model->u1_curr_frm_counter = 0;
ps_rd_model->u1_max_frms_to_model = u1_max_frames_modelled;
ps_rd_model->model_coeff_a_lin_wo_int = 0;
ps_rd_model->model_coeff_b_lin_wo_int = 0;
ps_rd_model->model_coeff_c_lin_wo_int = 0;
}
void irc_reset_frm_rc_rd_model(rc_rd_model_t *ps_rd_model)
{
ps_rd_model->u1_num_frms_in_model = 0;
ps_rd_model->u1_curr_frm_counter = 0;
ps_rd_model->model_coeff_a_lin_wo_int = 0;
ps_rd_model->model_coeff_b_lin_wo_int = 0;
ps_rd_model->model_coeff_c_lin_wo_int = 0;
}
static UWORD8 find_model_coeffs(UWORD32 *pi4_res_bits,
UWORD32 *pi4_sad_h264,
UWORD8 *pu1_num_skips,
UWORD8 *pui_avg_mpeg2_qp,
UWORD8 u1_num_frms,
UWORD8 u1_model_used,
WORD8 *pi1_frame_index,
model_coeff *pmc_model_coeff,
model_coeff *pmc_model_coeff_lin,
model_coeff *pmc_model_coeff_lin_wo_int,
rc_rd_model_t *ps_rd_model)
{
UWORD32 i;
UWORD8 u1_num_frms_used = 0;
UWORD8 u1_frm_indx;
float sum_y = 0;
float sum_x_y = 0;
float sum_x2_y = 0;
float sum_x = 0;
float sum_x2 = 0;
float sum_x3 = 0;
float sum_x4 = 0;
float x0, y0;
float model_coeff_a = 0.0, model_coeff_b = 0.0, model_coeff_c = 0.0;
UNUSED(pu1_num_skips);
UNUSED(pmc_model_coeff);
UNUSED(pmc_model_coeff_lin);
for(i = 0; i < u1_num_frms; i++)
{
if(-1 == pi1_frame_index[i])
continue;
u1_frm_indx = (UWORD8)pi1_frame_index[i];
y0 = (float)(pi4_res_bits[u1_frm_indx]);
x0 = (float)(pi4_sad_h264[u1_frm_indx]
/ (float)pui_avg_mpeg2_qp[u1_frm_indx]);
sum_y += y0;
sum_x_y += x0 * y0;
sum_x2_y += x0 * x0 * y0;
sum_x += x0;
sum_x2 += x0 * x0;
sum_x3 += x0 * x0 * x0;
sum_x4 += x0 * x0 * x0 * x0;
u1_num_frms_used++;
}
sum_y /= u1_num_frms_used;
sum_x_y /= u1_num_frms_used;
sum_x2_y /= u1_num_frms_used;
sum_x /= u1_num_frms_used;
sum_x2 /= u1_num_frms_used;
sum_x3 /= u1_num_frms_used;
sum_x4 /= u1_num_frms_used;
{
UWORD8 u1_curr_frame_index;
UWORD8 u1_avgqp_prvfrm;
UWORD32 u4_prevfrm_bits, u4_prevfrm_sad;
u1_curr_frame_index = ps_rd_model->u1_curr_frm_counter;
if(0 == u1_curr_frame_index)
u1_curr_frame_index = (MAX_FRAMES_MODELLED - 1);
else
u1_curr_frame_index--;
u1_avgqp_prvfrm = ps_rd_model->pu1_avg_qp[u1_curr_frame_index];
u4_prevfrm_bits = ps_rd_model->pi4_res_bits[u1_curr_frame_index];
u4_prevfrm_sad = ps_rd_model->pi4_sad[u1_curr_frame_index];
if(0 != u4_prevfrm_sad)
model_coeff_a = (float)(u4_prevfrm_bits * u1_avgqp_prvfrm)
/ u4_prevfrm_sad;
else
model_coeff_a = 0;
model_coeff_b = 0;
model_coeff_c = 0;
pmc_model_coeff_lin_wo_int[0] = model_coeff_b;
pmc_model_coeff_lin_wo_int[1] = model_coeff_a;
pmc_model_coeff_lin_wo_int[2] = model_coeff_c;
}
return u1_model_used;
}
static void irc_update_frame_rd_model(rc_rd_model_t *ps_rd_model)
{
WORD8 pi1_frame_index[MAX_FRAMES_MODELLED],
pi1_frame_index_initial[MAX_FRAMES_MODELLED];
UWORD8 u1_num_skips_temp;
UWORD8 u1_avg_mpeg2_qp_temp, u1_min_mpeg2_qp, u1_max_mpeg2_qp;
UWORD8 u1_num_frms_input, u1_num_active_frames, u1_reject_frame;
UWORD32 u4_num_skips;
UWORD8 u1_min2_mpeg2_qp, u1_max2_mpeg2_qp;
UWORD8 u1_min_qp_frame_indx, u1_max_qp_frame_indx;
UWORD8 pu1_num_frames[MPEG2_QP_ELEM];
model_coeff model_coeff_array[3], model_coeff_array_lin[3],
model_coeff_array_lin_wo_int[3];
UWORD32 i;
UWORD8 u1_curr_frame_index;
u1_curr_frame_index = ps_rd_model->u1_curr_frm_counter;
ps_rd_model->u1_model_used = PREV_FRAME_MODEL;
if(0 == u1_curr_frame_index)
u1_curr_frame_index = (MAX_FRAMES_MODELLED - 1);
else
u1_curr_frame_index--;
/************************************************************************/
/* Rearrange data to be fed into a Linear Regression Module */
/* Module finds a,b,c such that */
/* y = ax + bx^2 + c */
/************************************************************************/
u4_num_skips = 0;
u1_num_frms_input = 0;
memset(pu1_num_frames, 0, MPEG2_QP_ELEM);
memset(pi1_frame_index, -1, MAX_FRAMES_MODELLED);
u1_min_mpeg2_qp = MAX_MPEG2_QP;
u1_max_mpeg2_qp = 0;
u1_num_active_frames = ps_rd_model->u1_num_frms_in_model;
if(u1_num_active_frames > MAX_ACTIVE_FRAMES)
{
u1_num_active_frames = MAX_ACTIVE_FRAMES;
}
/************************************************************************/
/* Choose the set of Points to be used for MSE fit of Quadratic model */
/* Points chosen are spread across the Qp range. Max of 2 points are */
/* chosen for a Qp. */
/************************************************************************/
for(i = 0; i < u1_num_active_frames; i++)
{
u1_reject_frame = 0;
u1_num_skips_temp = ps_rd_model->pu1_num_skips[u1_curr_frame_index];
u1_avg_mpeg2_qp_temp = ps_rd_model->pu1_avg_qp[u1_curr_frame_index];
if((0 == u4_num_skips) && (0 != u1_num_skips_temp))
u1_reject_frame = 1;
if((1 == u4_num_skips) && (u1_num_skips_temp > 1))
u1_reject_frame = 1;
if(pu1_num_frames[u1_avg_mpeg2_qp_temp] >= 2)
u1_reject_frame = 1;
if(0 == i)
u1_reject_frame = 0;
if(0 == u1_reject_frame)
{
pi1_frame_index[u1_num_frms_input] = (WORD8)u1_curr_frame_index;
pu1_num_frames[u1_avg_mpeg2_qp_temp] += 1;
if(u1_min_mpeg2_qp > u1_avg_mpeg2_qp_temp)
u1_min_mpeg2_qp = u1_avg_mpeg2_qp_temp;
if(u1_max_mpeg2_qp < u1_avg_mpeg2_qp_temp)
u1_max_mpeg2_qp = u1_avg_mpeg2_qp_temp;
u1_num_frms_input++;
}
if(0 == u1_curr_frame_index)
u1_curr_frame_index = (MAX_FRAMES_MODELLED - 1);
else
u1_curr_frame_index--;
}
/************************************************************************/
/* Add Pivot Points to the Data set to be used for finding Quadratic */
/* Model Coeffs. These will help in constraining the shape of Quadratic*/
/* to adapt too much to the Local deviations. */
/************************************************************************/
u1_min2_mpeg2_qp = u1_min_mpeg2_qp;
u1_max2_mpeg2_qp = u1_max_mpeg2_qp;
u1_min_qp_frame_indx = INVALID_FRAME_INDEX;
u1_max_qp_frame_indx = INVALID_FRAME_INDEX;
/* Loop runnning over the Stored Frame Level Data
to find frames of MinQp and MaxQp */
for(; i < ps_rd_model->u1_num_frms_in_model; i++)
{
u1_num_skips_temp = ps_rd_model->pu1_num_skips[u1_curr_frame_index];
u1_avg_mpeg2_qp_temp = ps_rd_model->pu1_avg_qp[u1_curr_frame_index];
if(((0 == u4_num_skips) && (0 != u1_num_skips_temp))
|| ((1 == u4_num_skips) && (u1_num_skips_temp > 1)))
continue;
if(u1_min2_mpeg2_qp > u1_avg_mpeg2_qp_temp)
{
u1_min2_mpeg2_qp = u1_avg_mpeg2_qp_temp;
u1_min_qp_frame_indx = u1_curr_frame_index;
}
if(u1_max2_mpeg2_qp < u1_avg_mpeg2_qp_temp)
{
u1_max2_mpeg2_qp = u1_avg_mpeg2_qp_temp;
u1_max_qp_frame_indx = u1_curr_frame_index;
}
if(0 == u1_curr_frame_index)
u1_curr_frame_index = (MAX_FRAMES_MODELLED - 1);
else
u1_curr_frame_index--;
}
/* Add the Chosen Points to the regression data set */
if(INVALID_FRAME_INDEX != u1_min_qp_frame_indx)
{
pi1_frame_index[u1_num_frms_input] = (WORD8)u1_min_qp_frame_indx;
u1_num_frms_input++;
}
if(INVALID_FRAME_INDEX != u1_max_qp_frame_indx)
{
pi1_frame_index[u1_num_frms_input] = (WORD8)u1_max_qp_frame_indx;
u1_num_frms_input++;
}
memcpy(pi1_frame_index_initial, pi1_frame_index, MAX_FRAMES_MODELLED);
/***** Call the Module to Return the Coeffs for the Fed Data *****/
ps_rd_model->u1_model_used = find_model_coeffs(ps_rd_model->pi4_res_bits,
ps_rd_model->pi4_sad,
ps_rd_model->pu1_num_skips,
ps_rd_model->pu1_avg_qp,
u1_num_frms_input,
ps_rd_model->u1_model_used,
pi1_frame_index,
model_coeff_array,
model_coeff_array_lin,
model_coeff_array_lin_wo_int,
ps_rd_model);
ps_rd_model->model_coeff_b_lin_wo_int = model_coeff_array_lin_wo_int[0];
ps_rd_model->model_coeff_a_lin_wo_int = model_coeff_array_lin_wo_int[1];
ps_rd_model->model_coeff_c_lin_wo_int = model_coeff_array_lin_wo_int[2];
}
UWORD32 irc_estimate_bits_for_qp(rc_rd_model_t *ps_rd_model,
UWORD32 u4_estimated_sad,
UWORD8 u1_avg_qp)
{
float fl_num_bits = 0;
fl_num_bits = ps_rd_model->model_coeff_a_lin_wo_int
* ((float)(u4_estimated_sad / u1_avg_qp));
return ((UWORD32)fl_num_bits);
}
UWORD8 irc_find_qp_for_target_bits(rc_rd_model_t *ps_rd_model,
UWORD32 u4_target_res_bits,
UWORD32 u4_estimated_sad,
UWORD8 u1_min_qp,
UWORD8 u1_max_qp)
{
UWORD8 u1_qp;
float x_value = 1.0, f_qp;
ps_rd_model->u1_model_used = PREV_FRAME_MODEL;
{
x_value = (float)u4_target_res_bits
/ ps_rd_model->model_coeff_a_lin_wo_int;
}
if(0 != x_value)
f_qp = u4_estimated_sad / x_value;
else
f_qp = 255;
if(f_qp > 255)
f_qp = 255;
/* Truncating the QP to the Max and Min Qp values possible */
if(f_qp < u1_min_qp)
f_qp = u1_min_qp;
if(f_qp > u1_max_qp)
f_qp = u1_max_qp;
u1_qp = (UWORD8)(f_qp + 0.5);
return u1_qp;
}
void irc_add_frame_to_rd_model(rc_rd_model_t *ps_rd_model,
UWORD32 i4_res_bits,
UWORD8 u1_avg_mp2qp,
UWORD32 i4_sad_h264,
UWORD8 u1_num_skips)
{
UWORD8 u1_curr_frame_index;
u1_curr_frame_index = ps_rd_model->u1_curr_frm_counter;
/*Insert the Present Frame Data into the RD Model State Memory*/
ps_rd_model->pi4_res_bits[u1_curr_frame_index] = i4_res_bits;
ps_rd_model->pi4_sad[u1_curr_frame_index] = i4_sad_h264;
ps_rd_model->pu1_num_skips[u1_curr_frame_index] = u1_num_skips;
ps_rd_model->pu1_avg_qp[u1_curr_frame_index] = u1_avg_mp2qp;
ps_rd_model->u1_curr_frm_counter++;
if(MAX_FRAMES_MODELLED == ps_rd_model->u1_curr_frm_counter)
ps_rd_model->u1_curr_frm_counter = 0;
if(ps_rd_model->u1_num_frms_in_model < ps_rd_model->u1_max_frms_to_model)
{
ps_rd_model->u1_num_frms_in_model++;
}
irc_update_frame_rd_model(ps_rd_model);
}
/*****************************************************************************
*Function Name : irc_calc_per_frm_bits
*Description :
*Inputs : pu2_num_pics_of_a_pic_type
* - pointer to RC api pointer
* pu2_num_pics_of_a_pic_type
* - N1, N2,...Nk
* pu1_update_pic_type_model
* - flag which tells whether or not to update model
* coefficients of a particular pic-type
* u1_num_pic_types
* - value of k
* pu4_num_skip_of_a_pic_type
* - the number of skips of that pic-type. It "may" be used to
* update the model coefficients at a later point. Right now
* it is not being used at all.
* u1_base_pic_type
* - base pic type index wrt which alpha & beta are calculated
* pfl_gamma
* - gamma_i = beta_i / alpha_i
* pfl_eta
* -
* u1_curr_pic_type
* - the current pic-type for which the targetted bits need to
* be computed
* u4_bits_for_sub_gop
* - the number of bits to be consumed for the remaining part of
* sub-gop
* u4_curr_estimated_sad
* -
* pu1_curr_pic_type_qp
* - output of this function
*****************************************************************************/
WORD32 irc_calc_per_frm_bits(rc_rd_model_t *ps_rd_model,
UWORD16 *pu2_num_pics_of_a_pic_type,
UWORD8 *pu1_update_pic_type_model,
UWORD8 u1_num_pic_types,
UWORD32 *pu4_num_skip_of_a_pic_type,
UWORD8 u1_base_pic_type,
float *pfl_gamma,
float *pfl_eta,
UWORD8 u1_curr_pic_type,
UWORD32 u4_bits_for_sub_gop,
UWORD32 u4_curr_estimated_sad,
UWORD8 *pu1_curr_pic_type_qp)
{
WORD32 i4_per_frm_bits_Ti;
UWORD8 u1_i;
rc_rd_model_t *ps_rd_model_of_pic_type;
UNUSED(pu4_num_skip_of_a_pic_type);
UNUSED(u1_base_pic_type);
/* First part of this function updates all the model coefficients */
/*for all the pic-types */
{
for(u1_i = 0; u1_i < u1_num_pic_types; u1_i++)
{
if((0 != pu2_num_pics_of_a_pic_type[u1_i])
&& (1 == pu1_update_pic_type_model[u1_i]))
{
irc_update_frame_rd_model(&ps_rd_model[u1_i]);
}
}
}
/*
* The second part of this function deals with solving the
* equation using all the pic-types models
*/
{
UWORD8 u1_combined_model_used;
/* solve the equation */
{
model_coeff eff_A;
float fl_sad_by_qp_base;
float fl_sad_by_qp_curr_frm = 1.0;
float fl_qp_curr_frm;
float fl_bits_for_curr_frm = 0;
/* If the combined chosen model is linear model without an intercept */
u1_combined_model_used = PREV_FRAME_MODEL;
{
eff_A = 0.0;
for(u1_i = 0; u1_i < u1_num_pic_types; u1_i++)
{
ps_rd_model_of_pic_type = ps_rd_model + u1_i;
eff_A += ((pfl_eta[u1_i]
+ pu2_num_pics_of_a_pic_type[u1_i]- 1)
* ps_rd_model_of_pic_type->model_coeff_a_lin_wo_int
* pfl_gamma[u1_i]);
}
fl_sad_by_qp_base = u4_bits_for_sub_gop / eff_A;
fl_sad_by_qp_curr_frm = fl_sad_by_qp_base
* pfl_gamma[u1_curr_pic_type]
* pfl_eta[u1_curr_pic_type];
ps_rd_model_of_pic_type = ps_rd_model + u1_curr_pic_type;
fl_bits_for_curr_frm =
ps_rd_model_of_pic_type->model_coeff_a_lin_wo_int
* fl_sad_by_qp_curr_frm;
}
/*
* Store the model that was finally used to calculate Qp.
* This is so that the same model is used in further calculations
* for this picture.
*/
ps_rd_model_of_pic_type = ps_rd_model + u1_curr_pic_type;
ps_rd_model_of_pic_type->u1_model_used = u1_combined_model_used;
i4_per_frm_bits_Ti = (WORD32)(fl_bits_for_curr_frm + 0.5);
if(fl_sad_by_qp_curr_frm > 0)
fl_qp_curr_frm = (float)u4_curr_estimated_sad
/ fl_sad_by_qp_curr_frm;
else
fl_qp_curr_frm = 255;
if(fl_qp_curr_frm > 255)
fl_qp_curr_frm = 255;
*pu1_curr_pic_type_qp = (fl_qp_curr_frm + 0.5);
}
}
return (i4_per_frm_bits_Ti);
}
model_coeff irc_get_linear_coefficient(rc_rd_model_t *ps_rd_model)
{
return (ps_rd_model->model_coeff_a_lin_wo_int);
}