aosp12/external/libhevc/encoder/rc_rd_model.c

1023 lines
35 KiB
C

/******************************************************************************
*
* Copyright (C) 2018 The Android Open Source Project
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at:
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*
*****************************************************************************
* Originally developed and contributed by Ittiam Systems Pvt. Ltd, Bangalore
*/
/****************************************************************************/
/* File Name : rc_rd_model.c */
/* */
/* Description : Implall the Functions to Model the */
/* Rate Distortion Behaviour of the Codec over the Last */
/* Few Frames. */
/* */
/* List of Functions : update_frame_rd_model */
/* estimate_mpeg2_qp_for_resbits */
/* */
/* Issues / Problems : None */
/* */
/* Revision History : */
/* DD MM YYYY Author(s) Changes (Describe the changes made) */
/* 21 06 2006 ittiam Initial Version */
/****************************************************************************/
/*****************************************************************************/
/* File Includes */
/*****************************************************************************/
/* System include files */
#include <stdarg.h>
#include <stdlib.h>
#include <stdio.h>
#include <math.h>
/* System include files */
#include "ittiam_datatypes.h"
#include "rc_common.h"
#include "var_q_operator.h"
#include "mem_req_and_acq.h"
#include "rc_rd_model.h"
#include "rc_rd_model_struct.h"
#if !(RC_FIXED_POINT)
#if NON_STEADSTATE_CODE
WORD32 rc_rd_model_num_fill_use_free_memtab(
rc_rd_model_t **pps_rc_rd_model, itt_memtab_t *ps_memtab, ITT_FUNC_TYPE_E e_func_type)
{
WORD32 i4_mem_tab_idx = 0;
static rc_rd_model_t s_rc_rd_model_temp;
/* Hack for al alloc, during which we dont have any state memory.
Dereferencing can cause issues */
if(e_func_type == GET_NUM_MEMTAB || e_func_type == FILL_MEMTAB)
(*pps_rc_rd_model) = &s_rc_rd_model_temp;
/*for src rate control state structure*/
if(e_func_type != GET_NUM_MEMTAB)
{
fill_memtab(
&ps_memtab[i4_mem_tab_idx], sizeof(rc_rd_model_t), MEM_TAB_ALIGNMENT, PERSISTENT, DDR);
use_or_fill_base(&ps_memtab[0], (void **)pps_rc_rd_model, e_func_type);
}
i4_mem_tab_idx++;
return (i4_mem_tab_idx);
}
void init_frm_rc_rd_model(rc_rd_model_t *ps_rd_model, UWORD8 u1_max_frames_modelled)
{
/*ps_rd_model = ps_rd_model + u1_pic_type;*/
ps_rd_model->u1_num_frms_in_model = 0;
ps_rd_model->u1_curr_frm_counter = 0;
ps_rd_model->u1_max_frms_to_model = u1_max_frames_modelled;
/*
ps_rd_model->u1_min_frames_for_quad_model = u1_min_frames_for_quad_model;
ps_rd_model->u1_min_frames_for_lin_model = u1_min_frames_for_lin_model;
*/
ps_rd_model->model_coeff_a_quad = 0;
ps_rd_model->model_coeff_b_quad = 0;
ps_rd_model->model_coeff_c_quad = 0;
ps_rd_model->model_coeff_a_lin = 0;
ps_rd_model->model_coeff_b_lin = 0;
ps_rd_model->model_coeff_c_lin = 0;
ps_rd_model->model_coeff_a_lin_wo_int = 0;
ps_rd_model->model_coeff_b_lin_wo_int = 0;
ps_rd_model->model_coeff_c_lin_wo_int = 0;
}
void reset_frm_rc_rd_model(rc_rd_model_t *ps_rd_model)
{
/*ps_rd_model = ps_rd_model + u1_pic_type;*/
ps_rd_model->u1_num_frms_in_model = 0;
ps_rd_model->u1_curr_frm_counter = 0;
ps_rd_model->model_coeff_a_quad = 0;
ps_rd_model->model_coeff_b_quad = 0;
ps_rd_model->model_coeff_c_quad = 0;
ps_rd_model->model_coeff_a_lin = 0;
ps_rd_model->model_coeff_b_lin = 0;
ps_rd_model->model_coeff_c_lin = 0;
ps_rd_model->model_coeff_a_lin_wo_int = 0;
ps_rd_model->model_coeff_b_lin_wo_int = 0;
ps_rd_model->model_coeff_c_lin_wo_int = 0;
}
#endif /* #if NON_STEADSTATE_CODE */
#if ENABLE_QUAD_MODEL
static UWORD8 find_model_coeffs(
UWORD32 *pi4_res_bits,
UWORD32 *pi4_sad_h264,
UWORD8 *pu1_num_skips,
UWORD8 *pui_avg_mpeg2_qp,
UWORD8 u1_num_frms,
UWORD8 u1_model_used,
WORD8 *pi1_frame_index,
model_coeff *pmc_model_coeff,
model_coeff *pmc_model_coeff_lin,
model_coeff *pmc_model_coeff_lin_wo_int,
rc_rd_model_t *ps_rd_model)
{
UWORD32 i;
UWORD8 u1_num_frms_used = 0;
UWORD8 u1_frm_indx;
float sum_y = 0;
float sum_x_y = 0;
float sum_x2_y = 0;
float sum_x = 0;
float sum_x2 = 0;
float sum_x3 = 0;
float sum_x4 = 0;
float var_x2_y = 0;
float var_x_y = 0;
float var_x2_x = 0;
float var_x2_x2 = 0;
float var_x_x = 0;
float x0, y0;
float model_coeff_a, model_coeff_b, model_coeff_c, model_coeff_den;
for(i = 0; i < u1_num_frms; i++)
{
if(-1 == pi1_frame_index[i])
continue;
u1_frm_indx = (UWORD8)pi1_frame_index[i];
y0 = (float)(pi4_res_bits[u1_frm_indx]);
x0 = (float)(pi4_sad_h264[u1_frm_indx] / (float)pui_avg_mpeg2_qp[u1_frm_indx]);
sum_y += y0;
sum_x_y += x0 * y0;
sum_x2_y += x0 * x0 * y0;
sum_x += x0;
sum_x2 += x0 * x0;
sum_x3 += x0 * x0 * x0;
sum_x4 += x0 * x0 * x0 * x0;
u1_num_frms_used++;
}
sum_y /= u1_num_frms_used;
sum_x_y /= u1_num_frms_used;
sum_x2_y /= u1_num_frms_used;
sum_x /= u1_num_frms_used;
sum_x2 /= u1_num_frms_used;
sum_x3 /= u1_num_frms_used;
sum_x4 /= u1_num_frms_used;
#if !QUAD
u1_model_used = LIN_MODEL;
#endif
if((QUAD_MODEL == u1_model_used) && (u1_num_frms_used <= MIN_FRAMES_FOR_QUAD_MODEL))
{
u1_model_used = LIN_MODEL;
}
if(QUAD_MODEL == u1_model_used)
{
var_x2_y = sum_x2_y - sum_x2 * sum_y;
var_x_y = sum_x_y - sum_x * sum_y;
var_x2_x = sum_x3 - sum_x2 * sum_x;
var_x2_x2 = sum_x4 - sum_x2 * sum_x2;
var_x_x = sum_x2 - sum_x * sum_x;
model_coeff_den = (var_x2_x * var_x2_x - var_x2_x2 * var_x_x);
if(0 != model_coeff_den)
{
model_coeff_b = (var_x_y * var_x2_x - var_x2_y * var_x_x);
model_coeff_b /= model_coeff_den;
model_coeff_a = (var_x2_y * var_x2_x - var_x_y * var_x2_x2);
model_coeff_a /= model_coeff_den;
model_coeff_c = sum_y - (model_coeff_a * sum_x) - (model_coeff_b * sum_x2);
}
pmc_model_coeff[0] = model_coeff_b;
pmc_model_coeff[1] = model_coeff_a;
pmc_model_coeff[2] = model_coeff_c;
}
if(NULL != pmc_model_coeff_lin)
{
var_x_y = sum_x_y - sum_x * sum_y;
var_x_x = sum_x2 - sum_x * sum_x;
if(0 != var_x_x)
{
model_coeff_a = (var_x_y / var_x_x);
model_coeff_c = sum_y - (model_coeff_a * sum_x);
/*model_coeff_b = 0;*/
model_coeff_b = model_coeff_a;
pmc_model_coeff_lin[0] = model_coeff_b;
pmc_model_coeff_lin[1] = model_coeff_a;
pmc_model_coeff_lin[2] = model_coeff_c;
}
}
if(NULL != pmc_model_coeff_lin_wo_int)
{
UWORD8 u1_curr_frame_index;
UWORD8 u1_avgqp_prvfrm;
UWORD32 u4_prevfrm_bits, u4_prevfrm_sad;
u1_curr_frame_index = ps_rd_model->u1_curr_frm_counter;
if(0 == u1_curr_frame_index)
u1_curr_frame_index = (MAX_FRAMES_MODELLED - 1);
else
u1_curr_frame_index--;
u1_avgqp_prvfrm = ps_rd_model->pu1_avg_qp[u1_curr_frame_index];
u4_prevfrm_bits = ps_rd_model->pi4_res_bits[u1_curr_frame_index];
u4_prevfrm_sad = ps_rd_model->pi4_sad[u1_curr_frame_index];
if(0 != u4_prevfrm_sad)
model_coeff_a = (float)(u4_prevfrm_bits * u1_avgqp_prvfrm) / u4_prevfrm_sad;
else
model_coeff_a = 0;
model_coeff_b = 0;
model_coeff_c = 0;
pmc_model_coeff_lin_wo_int[0] = model_coeff_b;
pmc_model_coeff_lin_wo_int[1] = model_coeff_a;
pmc_model_coeff_lin_wo_int[2] = model_coeff_c;
}
return u1_model_used;
}
static WORD8 refine_set_of_points(
UWORD32 *pi4_res_bits,
UWORD32 *pi4_sad_h264,
UWORD8 *pu1_num_skips,
UWORD8 *pui_avg_mpeg2_qp,
UWORD8 u1_num_frms,
WORD8 *pi1_frame_index,
model_coeff *pmc_model_coeff,
float *pfl_avg_deviation)
{
float fl_avg_deviation, fl_estimated_bits, fl_deviation, x_val;
UWORD8 u1_return_value = 1;
UWORD32 i;
UWORD8 u1_num_frms_used, u1_frm_indx;
u1_num_frms_used = 0;
fl_avg_deviation = 0;
for(i = 0; i < u1_num_frms; i++)
{
if(-1 == pi1_frame_index[i])
continue;
u1_frm_indx = (UWORD8)pi1_frame_index[i];
x_val = pi4_sad_h264[u1_frm_indx] / (float)pui_avg_mpeg2_qp[u1_frm_indx];
fl_estimated_bits = (pmc_model_coeff[0] * x_val * x_val) + (pmc_model_coeff[1] * x_val) +
(pmc_model_coeff[2]);
fl_deviation =
fabs(pi4_res_bits[u1_frm_indx] - fl_estimated_bits) / (float)pi4_res_bits[u1_frm_indx];
fl_deviation = fl_deviation * fl_deviation;
fl_avg_deviation += fl_deviation;
u1_num_frms_used++;
}
fl_avg_deviation /= u1_num_frms_used;
/*fl_avg_deviation = sqrt(fl_avg_deviation);*/
fl_avg_deviation = (fl_avg_deviation);
for(i = 0; i < u1_num_frms; i++)
{
if((-1 == pi1_frame_index[i]) && (i != 0))
continue;
u1_frm_indx = (UWORD8)pi1_frame_index[i];
x_val = pi4_sad_h264[u1_frm_indx] / (float)pui_avg_mpeg2_qp[u1_frm_indx];
fl_estimated_bits = (pmc_model_coeff[0] * x_val * x_val) + (pmc_model_coeff[1] * x_val) +
(pmc_model_coeff[2]);
fl_deviation =
fabs(pi4_res_bits[u1_frm_indx] - fl_estimated_bits) / (float)pi4_res_bits[u1_frm_indx];
fl_deviation = fl_deviation * fl_deviation;
if(fl_deviation > (fl_avg_deviation))
{
pi1_frame_index[i] = -1;
}
}
if(fl_avg_deviation > 0.0625)
u1_return_value = 0;
if(fl_avg_deviation < 0.0225)
u1_return_value = 2;
*pfl_avg_deviation = fl_avg_deviation;
return (u1_return_value);
}
static void calc_avg_sqr_dev_for_model(
UWORD32 *pi4_res_bits,
UWORD32 *pi4_sad_h264,
UWORD8 *pu1_num_skips,
UWORD8 *pui_avg_mpeg2_qp,
UWORD8 u1_num_frms,
WORD8 *pi1_frame_index,
model_coeff *pmc_model_coeff,
float *pfl_avg_deviation)
{
float fl_avg_deviation, fl_estimated_bits, fl_deviation, x_val;
UWORD8 u1_return_value = 1;
UWORD32 i;
UWORD8 u1_num_frms_used, u1_frm_indx;
u1_num_frms_used = 0;
fl_avg_deviation = 0;
for(i = 0; i < u1_num_frms; i++)
{
if(-1 == pi1_frame_index[i])
continue;
u1_frm_indx = (UWORD8)pi1_frame_index[i];
u1_frm_indx = (UWORD8)i;
x_val = pi4_sad_h264[u1_frm_indx] / (float)pui_avg_mpeg2_qp[u1_frm_indx];
fl_estimated_bits = (pmc_model_coeff[1] * x_val) + (pmc_model_coeff[2]);
fl_deviation =
fabs(pi4_res_bits[u1_frm_indx] - fl_estimated_bits) / (float)pi4_res_bits[u1_frm_indx];
fl_deviation = fl_deviation * fl_deviation;
fl_avg_deviation += fl_deviation;
u1_num_frms_used++;
}
fl_avg_deviation /= u1_num_frms_used;
/*fl_avg_deviation = sqrt(fl_avg_deviation);*/
fl_avg_deviation = (fl_avg_deviation);
*pfl_avg_deviation = fl_avg_deviation;
/*return (u1_return_value);*/
}
static void update_frame_rd_model(rc_rd_model_t *ps_rd_model)
{
WORD8 pi1_frame_index[MAX_FRAMES_MODELLED], pi1_frame_index_initial[MAX_FRAMES_MODELLED];
UWORD8 u1_num_skips_temp;
UWORD8 u1_avg_mpeg2_qp_temp, u1_min_mpeg2_qp, u1_max_mpeg2_qp;
UWORD8 u1_num_frms_input, u1_num_active_frames, u1_reject_frame;
UWORD32 u4_num_skips;
UWORD8 u1_min2_mpeg2_qp, u1_max2_mpeg2_qp;
UWORD8 u1_min_qp_frame_indx, u1_max_qp_frame_indx;
UWORD8 pu1_num_frames[MPEG2_QP_ELEM];
model_coeff model_coeff_array[3], model_coeff_array_lin[3], model_coeff_array_lin_wo_int[3];
UWORD32 i;
UWORD8 u1_curr_frame_index;
UWORD8 u1_quad_model_valid, u1_lin_model_valid;
float fl_quad_avg_dev, fl_lin_avg_dev;
UWORD8 u1_check_model;
/*ps_rd_model += u1_pic_type;*/
u1_curr_frame_index = ps_rd_model->u1_curr_frm_counter;
ps_rd_model->u1_model_used = QUAD_MODEL;
if(0 == u1_curr_frame_index)
u1_curr_frame_index = (MAX_FRAMES_MODELLED - 1);
else
u1_curr_frame_index--;
/************************************************************************/
/* Rearrange data to be fed into a Linear Regression Module */
/* Module finds a,b,c such that */
/* y = ax + bx^2 + c */
/************************************************************************/
u4_num_skips = 0;
u1_num_frms_input = 0;
memset(pu1_num_frames, 0, MPEG2_QP_ELEM);
memset(pi1_frame_index, -1, MAX_FRAMES_MODELLED);
u1_min_mpeg2_qp = MAX_MPEG2_QP;
u1_max_mpeg2_qp = 0;
u1_num_active_frames = ps_rd_model->u1_num_frms_in_model;
if(u1_num_active_frames > MAX_ACTIVE_FRAMES)
u1_num_active_frames = MAX_ACTIVE_FRAMES;
/************************************************************************/
/* Choose the set of Points to be used for MSE fit of Quadratic model */
/* Points chosen are spread across the Qp range. Max of 2 points are */
/* chosen for a Qp. */
/************************************************************************/
for(i = 0; i < u1_num_active_frames; i++)
{
u1_reject_frame = 0;
u1_num_skips_temp = ps_rd_model->pu1_num_skips[u1_curr_frame_index];
u1_avg_mpeg2_qp_temp = ps_rd_model->pu1_avg_qp[u1_curr_frame_index];
if((0 == u4_num_skips) && (0 != u1_num_skips_temp))
u1_reject_frame = 1;
if((1 == u4_num_skips) && (u1_num_skips_temp > 1))
u1_reject_frame = 1;
if(pu1_num_frames[u1_avg_mpeg2_qp_temp] >= 2)
u1_reject_frame = 1;
if(0 == i)
u1_reject_frame = 0;
if(0 == u1_reject_frame)
{
pi1_frame_index[u1_num_frms_input] = (WORD8)u1_curr_frame_index;
pu1_num_frames[u1_avg_mpeg2_qp_temp] += 1;
if(u1_min_mpeg2_qp > u1_avg_mpeg2_qp_temp)
u1_min_mpeg2_qp = u1_avg_mpeg2_qp_temp;
if(u1_max_mpeg2_qp < u1_avg_mpeg2_qp_temp)
u1_max_mpeg2_qp = u1_avg_mpeg2_qp_temp;
u1_num_frms_input++;
}
if(0 == u1_curr_frame_index)
u1_curr_frame_index = (MAX_FRAMES_MODELLED - 1);
else
u1_curr_frame_index--;
}
/************************************************************************/
/* Add Pivot Points to the Data set to be used for finding Quadratic */
/* Model Coeffs. These will help in constraining the shape of Quadratic*/
/* to adapt too much to the Local deviations. */
/************************************************************************/
u1_min2_mpeg2_qp = u1_min_mpeg2_qp;
u1_max2_mpeg2_qp = u1_max_mpeg2_qp;
u1_min_qp_frame_indx = INVALID_FRAME_INDEX;
u1_max_qp_frame_indx = INVALID_FRAME_INDEX;
/* Loop runnning over the Stored Frame Level Data
to find frames of MinQp and MaxQp */
for(; i < ps_rd_model->u1_num_frms_in_model; i++)
{
u1_num_skips_temp = ps_rd_model->pu1_num_skips[u1_curr_frame_index];
u1_avg_mpeg2_qp_temp = ps_rd_model->pu1_avg_qp[u1_curr_frame_index];
if(((0 == u4_num_skips) && (0 != u1_num_skips_temp)) ||
((1 == u4_num_skips) && (u1_num_skips_temp > 1)))
continue;
if(u1_min2_mpeg2_qp > u1_avg_mpeg2_qp_temp)
{
u1_min2_mpeg2_qp = u1_avg_mpeg2_qp_temp;
u1_min_qp_frame_indx = u1_curr_frame_index;
}
if(u1_max2_mpeg2_qp < u1_avg_mpeg2_qp_temp)
{
u1_max2_mpeg2_qp = u1_avg_mpeg2_qp_temp;
u1_max_qp_frame_indx = u1_curr_frame_index;
}
if(0 == u1_curr_frame_index)
u1_curr_frame_index = (MAX_FRAMES_MODELLED - 1);
else
u1_curr_frame_index--;
}
/* Add the Chosen Points to the regression data set */
if(INVALID_FRAME_INDEX != u1_min_qp_frame_indx)
{
pi1_frame_index[u1_num_frms_input] = (WORD8)u1_min_qp_frame_indx;
u1_num_frms_input++;
}
if(INVALID_FRAME_INDEX != u1_max_qp_frame_indx)
{
pi1_frame_index[u1_num_frms_input] = (WORD8)u1_max_qp_frame_indx;
u1_num_frms_input++;
}
memcpy(pi1_frame_index_initial, pi1_frame_index, MAX_FRAMES_MODELLED);
if(QUAD_MODEL == ps_rd_model->u1_model_used)
{
if(u1_num_frms_input < (MIN_FRAMES_FOR_QUAD_MODEL))
ps_rd_model->u1_model_used = LIN_MODEL;
if((WORD32)u1_max_mpeg2_qp < ((WORD32)(21 * u1_min_mpeg2_qp) >> 4))
ps_rd_model->u1_model_used = LIN_MODEL;
}
if(LIN_MODEL == ps_rd_model->u1_model_used)
{
if(u1_num_frms_input < MIN_FRAMES_FOR_LIN_MODEL)
ps_rd_model->u1_model_used = PREV_FRAME_MODEL;
if((WORD32)u1_max_mpeg2_qp < ((WORD32)(19 * u1_min_mpeg2_qp) >> 4))
ps_rd_model->u1_model_used = PREV_FRAME_MODEL;
}
/***** Call the Module to Return the Coeffs for the Fed Data *****/
ps_rd_model->u1_model_used = find_model_coeffs(
ps_rd_model->pi4_res_bits,
ps_rd_model->pi4_sad,
ps_rd_model->pu1_num_skips,
ps_rd_model->pu1_avg_qp,
u1_num_frms_input,
ps_rd_model->u1_model_used,
pi1_frame_index,
model_coeff_array,
model_coeff_array_lin,
model_coeff_array_lin_wo_int,
ps_rd_model);
if((model_coeff_array_lin[2] > 0) || (model_coeff_array_lin[0] < 0))
u1_lin_model_valid = 0;
else
{
u1_lin_model_valid = 1;
/* lin deviation calculation */
calc_avg_sqr_dev_for_model(
ps_rd_model->pi4_res_bits,
ps_rd_model->pi4_sad,
ps_rd_model->pu1_num_skips,
ps_rd_model->pu1_avg_qp,
u1_num_frms_input,
pi1_frame_index_initial,
model_coeff_array_lin,
&fl_lin_avg_dev);
}
if(QUAD_MODEL == ps_rd_model->u1_model_used)
{
u1_check_model = refine_set_of_points(
ps_rd_model->pi4_res_bits,
ps_rd_model->pi4_sad,
ps_rd_model->pu1_num_skips,
ps_rd_model->pu1_avg_qp,
u1_num_frms_input,
pi1_frame_index,
model_coeff_array,
&fl_quad_avg_dev);
if(2 == u1_check_model)
{
ps_rd_model->u1_model_used = QUAD_MODEL;
}
else
{
/*******************************************************************/
/* Make sure that some of the Pivot Points are used in the Refined */
/* data set. 1. Previous Frame */
/*******************************************************************/
/*pi1_frame_index[0] = ps_rd_model->u1_curr_frm_counter;*/
ps_rd_model->u1_model_used = find_model_coeffs(
ps_rd_model->pi4_res_bits,
ps_rd_model->pi4_sad,
ps_rd_model->pu1_num_skips,
ps_rd_model->pu1_avg_qp,
u1_num_frms_input,
ps_rd_model->u1_model_used,
pi1_frame_index,
model_coeff_array,
NULL,
NULL,
ps_rd_model);
u1_check_model = refine_set_of_points(
ps_rd_model->pi4_res_bits,
ps_rd_model->pi4_sad,
ps_rd_model->pu1_num_skips,
ps_rd_model->pu1_avg_qp,
u1_num_frms_input,
pi1_frame_index,
model_coeff_array,
&fl_quad_avg_dev);
if((0 == u1_check_model))
{
#if RC_MODEL_USED_BUG_FIX
if((fl_lin_avg_dev < fl_quad_avg_dev) && (1 == u1_lin_model_valid))
#endif
ps_rd_model->u1_model_used = LIN_MODEL;
}
}
}
if(QUAD_MODEL == ps_rd_model->u1_model_used)
{
/*min_res_bits = model_coeff_c -
((model_coeff_a * model_coeff_a) / (4 * model_coeff_b));*/
if(model_coeff_array[0] < 0)
ps_rd_model->u1_model_used = LIN_MODEL;
/*if ((model_coeff_a * model_coeff_b) > 0)
u1_model_used = LIN_MODEL;*/
}
if(LIN_MODEL == ps_rd_model->u1_model_used)
{
if((model_coeff_array_lin[2] > 0) || (model_coeff_array_lin[0] < 0))
ps_rd_model->u1_model_used = PREV_FRAME_MODEL;
}
#if RC_MODEL_USED_BUG_FIX
/* Another threshold of .25 on deviation i.e. deviation greater than 25% */
if((QUAD_MODEL == ps_rd_model->u1_model_used) && (fl_quad_avg_dev > .25))
ps_rd_model->u1_model_used = PREV_FRAME_MODEL;
if((LIN_MODEL == ps_rd_model->u1_model_used) && (fl_lin_avg_dev > .25))
ps_rd_model->u1_model_used = PREV_FRAME_MODEL;
#endif /* #if RC_MODEL_USED_BUG_FIX */
ps_rd_model->model_coeff_b_quad = model_coeff_array[0];
ps_rd_model->model_coeff_a_quad = model_coeff_array[1];
ps_rd_model->model_coeff_c_quad = model_coeff_array[2];
ps_rd_model->model_coeff_b_lin = model_coeff_array_lin[0];
ps_rd_model->model_coeff_a_lin = model_coeff_array_lin[1];
ps_rd_model->model_coeff_c_lin = model_coeff_array_lin[2];
ps_rd_model->model_coeff_b_lin_wo_int = model_coeff_array_lin_wo_int[0];
ps_rd_model->model_coeff_a_lin_wo_int = model_coeff_array_lin_wo_int[1];
ps_rd_model->model_coeff_c_lin_wo_int = model_coeff_array_lin_wo_int[2];
/*ps_rd_model->u1_model_used = PREV_FRAME_MODEL;*/
}
#endif /* ENABLE_QUAD_MODEL */
UWORD32 estimate_bits_for_qp(rc_rd_model_t *ps_rd_model, UWORD32 u4_estimated_sad, UWORD8 u1_avg_qp)
{
float fl_num_bits;
/*ps_rd_model += u1_curr_pic_type;*/
{
fl_num_bits =
ps_rd_model->model_coeff_a_lin_wo_int * ((float)(u4_estimated_sad / u1_avg_qp));
}
return ((UWORD32)fl_num_bits);
}
UWORD8 find_qp_for_target_bits(
rc_rd_model_t *ps_rd_model,
UWORD32 u4_target_res_bits,
UWORD32 u4_estimated_sad,
UWORD8 u1_min_qp,
UWORD8 u1_max_qp)
{
UWORD8 u1_qp;
float x_value, f_qp;
/*ps_rd_model += u1_curr_pic_type;*/
#if ENABLE_QUAD_MODEL
if(QUAD_MODEL == ps_rd_model->u1_model_used)
{
float det;
det = (ps_rd_model->model_coeff_a_quad * ps_rd_model->model_coeff_a_quad) -
(4 * (ps_rd_model->model_coeff_b_quad) *
(ps_rd_model->model_coeff_c_quad - u4_target_res_bits));
if(det > 0)
{
x_value = sqrt(det);
x_value =
(x_value - ps_rd_model->model_coeff_a_quad) / (2 * ps_rd_model->model_coeff_b_quad);
}
else
ps_rd_model->u1_model_used = PREV_FRAME_MODEL;
}
if(LIN_MODEL == ps_rd_model->u1_model_used)
{
x_value = ((float)u4_target_res_bits - ps_rd_model->model_coeff_c_lin) /
(ps_rd_model->model_coeff_b_lin);
}
#else
ps_rd_model->u1_model_used = PREV_FRAME_MODEL;
#endif
if(PREV_FRAME_MODEL == ps_rd_model->u1_model_used)
{
x_value = (float)u4_target_res_bits / ps_rd_model->model_coeff_a_lin_wo_int;
}
if(0 != x_value)
f_qp = u4_estimated_sad / x_value;
else
f_qp = 255;
if(f_qp > 255)
f_qp = 255;
/* Truncating the QP to the Max and Min Qp values possible */
if(f_qp < u1_min_qp)
f_qp = u1_min_qp;
if(f_qp > u1_max_qp)
f_qp = u1_max_qp;
u1_qp = (UWORD8)(f_qp + 0.5);
return u1_qp;
}
void add_frame_to_rd_model(
rc_rd_model_t *ps_rd_model,
UWORD32 i4_res_bits,
UWORD8 u1_avg_mp2qp,
UWORD32 i4_sad_h264,
UWORD8 u1_num_skips)
{
UWORD8 u1_curr_frame_index;
/*ps_rd_model += u1_curr_pic_type;*/
u1_curr_frame_index = ps_rd_model->u1_curr_frm_counter;
/*** Insert the Present Frame Data into the RD Model State Memory ***/
ps_rd_model->pi4_res_bits[u1_curr_frame_index] = i4_res_bits;
ps_rd_model->pi4_sad[u1_curr_frame_index] = i4_sad_h264;
ps_rd_model->pu1_num_skips[u1_curr_frame_index] = u1_num_skips;
ps_rd_model->pu1_avg_qp[u1_curr_frame_index] = u1_avg_mp2qp;
ps_rd_model->u1_curr_frm_counter++;
if(MAX_FRAMES_MODELLED == ps_rd_model->u1_curr_frm_counter)
ps_rd_model->u1_curr_frm_counter = 0;
if(ps_rd_model->u1_num_frms_in_model < ps_rd_model->u1_max_frms_to_model)
{
ps_rd_model->u1_num_frms_in_model++;
}
update_frame_rd_model(ps_rd_model);
}
WORD32 calc_per_frm_bits(
rc_rd_model_t *ps_rd_model, /* array of model structs */
UWORD16 *pu2_num_pics_of_a_pic_type, /* N1, N2,...Nk */
UWORD8 *
pu1_update_pic_type_model, /* flag which tells whether or not to update model coefficients of a particular pic-type */
UWORD8 u1_num_pic_types, /* value of k */
UWORD32 *
pu4_num_skip_of_a_pic_type, /* the number of skips of that pic-type. It "may" be used to update the model coefficients at a later point. Right now it is not being used at all. */
UWORD8 u1_base_pic_type, /* base pic type index wrt which alpha & beta are calculated */
float *pfl_gamma, /* gamma_i = beta_i / alpha_i */
float *pfl_eta,
UWORD8
u1_curr_pic_type, /* the current pic-type for which the targetted bits need to be computed */
UWORD32
u4_bits_for_sub_gop, /* the number of bits to be consumed for the remaining part of sub-gop */
UWORD32 u4_curr_estimated_sad,
UWORD8 *pu1_curr_pic_type_qp) /* output of this function */
{
WORD32 i4_per_frm_bits_Ti;
UWORD8 u1_i;
rc_rd_model_t *ps_rd_model_of_pic_type;
/* first part of this function updates all the model coefficients */
/*for all the pic-types */
{
for(u1_i = 0; u1_i < u1_num_pic_types; u1_i++)
{
if((0 != pu2_num_pics_of_a_pic_type[u1_i]) && (1 == pu1_update_pic_type_model[u1_i]))
{
/* ps_rd_model_of_pic_type = ps_rd_model + u1_i; */
update_frame_rd_model(&ps_rd_model[u1_i]);
}
}
}
/* The second part of this function deals with solving the
equation using all the pic-types models */
{
UWORD8 u1_combined_model_used;
/* first choose the model to be used */
u1_combined_model_used = QUAD_MODEL;
for(u1_i = 0; u1_i < u1_num_pic_types; u1_i++)
{
ps_rd_model_of_pic_type = ps_rd_model + u1_i;
if((0 != pu2_num_pics_of_a_pic_type[u1_i]) &&
(QUAD_MODEL != ps_rd_model_of_pic_type->u1_model_used))
{
u1_combined_model_used = LIN_MODEL;
break;
}
}
if(u1_combined_model_used == LIN_MODEL)
{
for(u1_i = 0; u1_i < u1_num_pic_types; u1_i++)
{
ps_rd_model_of_pic_type = ps_rd_model + u1_i;
if((0 != pu2_num_pics_of_a_pic_type[u1_i]) &&
(QUAD_MODEL != ps_rd_model_of_pic_type->u1_model_used) &&
(LIN_MODEL != ps_rd_model_of_pic_type->u1_model_used))
{
u1_combined_model_used = PREV_FRAME_MODEL;
break;
}
}
}
/* solve the equation for the */
{
model_coeff eff_A;
model_coeff eff_B;
model_coeff eff_C;
float fl_determinant;
float fl_sad_by_qp_base;
float fl_sad_by_qp_curr_frm;
float fl_qp_curr_frm;
float fl_bits_for_curr_frm;
/* If the combined chosen model is quad model */
if(QUAD_MODEL == u1_combined_model_used)
{
eff_A = 0.0;
eff_B = 0.0;
eff_C = 0.0;
for(u1_i = 0; u1_i < u1_num_pic_types; u1_i++)
{
ps_rd_model_of_pic_type = ps_rd_model + u1_i;
eff_A +=
((pfl_eta[u1_i] + pu2_num_pics_of_a_pic_type[u1_i] - 1) *
ps_rd_model_of_pic_type->model_coeff_a_quad * pfl_gamma[u1_i]);
eff_B +=
((pfl_eta[u1_i] * pfl_eta[u1_i] + pu2_num_pics_of_a_pic_type[u1_i] - 1) *
ps_rd_model_of_pic_type->model_coeff_b_quad * pfl_gamma[u1_i] *
pfl_gamma[u1_i]);
eff_C +=
(pu2_num_pics_of_a_pic_type[u1_i] *
ps_rd_model_of_pic_type->model_coeff_c_quad);
}
eff_C -= u4_bits_for_sub_gop;
fl_determinant = eff_A * eff_A - 4 * eff_B * eff_C;
if(fl_determinant < 0)
{
u1_combined_model_used =
PREV_FRAME_MODEL; /* TO BE replaced by LIN_MODEL later */
}
else
{
fl_determinant = sqrt(fl_determinant);
fl_sad_by_qp_base = fl_determinant - eff_A;
fl_sad_by_qp_base = fl_sad_by_qp_base / (2 * eff_B);
fl_sad_by_qp_curr_frm =
fl_sad_by_qp_base * pfl_gamma[u1_curr_pic_type] * pfl_eta[u1_curr_pic_type];
ps_rd_model_of_pic_type = ps_rd_model + u1_curr_pic_type;
fl_bits_for_curr_frm =
ps_rd_model_of_pic_type->model_coeff_a_quad * fl_sad_by_qp_curr_frm +
ps_rd_model_of_pic_type->model_coeff_b_quad * fl_sad_by_qp_curr_frm *
fl_sad_by_qp_curr_frm +
ps_rd_model_of_pic_type->model_coeff_c_quad;
}
}
/* If the combined chosen model is linear model with an intercept */
if(LIN_MODEL == u1_combined_model_used)
{
eff_A = 0.0;
eff_B = 0.0;
eff_C = 0.0;
for(u1_i = 0; u1_i < u1_num_pic_types; u1_i++)
{
ps_rd_model_of_pic_type = ps_rd_model + u1_i;
eff_A +=
((pfl_eta[u1_i] + pu2_num_pics_of_a_pic_type[u1_i] - 1) *
ps_rd_model_of_pic_type->model_coeff_a_lin * pfl_gamma[u1_i]);
eff_C +=
(pu2_num_pics_of_a_pic_type[u1_i] *
ps_rd_model_of_pic_type->model_coeff_c_lin);
}
eff_C -= u4_bits_for_sub_gop;
fl_determinant = (-(eff_C / eff_A));
if((fl_determinant) <= 0)
{
u1_combined_model_used = PREV_FRAME_MODEL;
}
else
{
fl_sad_by_qp_base = fl_determinant;
fl_sad_by_qp_curr_frm =
fl_sad_by_qp_base * pfl_gamma[u1_curr_pic_type] * pfl_eta[u1_curr_pic_type];
ps_rd_model_of_pic_type = ps_rd_model + u1_curr_pic_type;
fl_bits_for_curr_frm =
ps_rd_model_of_pic_type->model_coeff_a_lin * fl_sad_by_qp_curr_frm +
ps_rd_model_of_pic_type->model_coeff_c_lin;
}
}
/* If the combined chosen model is linear model without an intercept */
if(PREV_FRAME_MODEL == u1_combined_model_used)
{
eff_A = 0.0;
eff_B = 0.0;
eff_C = 0.0;
for(u1_i = 0; u1_i < u1_num_pic_types; u1_i++)
{
ps_rd_model_of_pic_type = ps_rd_model + u1_i;
eff_A +=
((pfl_eta[u1_i] + pu2_num_pics_of_a_pic_type[u1_i] - 1) *
ps_rd_model_of_pic_type->model_coeff_a_lin_wo_int * pfl_gamma[u1_i]);
}
fl_sad_by_qp_base = u4_bits_for_sub_gop / eff_A;
fl_sad_by_qp_curr_frm =
fl_sad_by_qp_base * pfl_gamma[u1_curr_pic_type] * pfl_eta[u1_curr_pic_type];
ps_rd_model_of_pic_type = ps_rd_model + u1_curr_pic_type;
fl_bits_for_curr_frm =
ps_rd_model_of_pic_type->model_coeff_a_lin_wo_int * fl_sad_by_qp_curr_frm;
}
/* store the model that was finally used to calculate Qp.
This is so that the same model is used in further calculations for this picture. */
ps_rd_model_of_pic_type = ps_rd_model + u1_curr_pic_type;
ps_rd_model_of_pic_type->u1_model_used = u1_combined_model_used;
i4_per_frm_bits_Ti = (WORD32)(fl_bits_for_curr_frm + 0.5);
if(fl_sad_by_qp_curr_frm > 0)
fl_qp_curr_frm = (float)u4_curr_estimated_sad / fl_sad_by_qp_curr_frm;
else
fl_qp_curr_frm = 255;
if(fl_qp_curr_frm > 255)
fl_qp_curr_frm = 255;
*pu1_curr_pic_type_qp = (fl_qp_curr_frm + 0.5);
}
}
return (i4_per_frm_bits_Ti);
}
model_coeff get_linear_coefficient(rc_rd_model_t *ps_rd_model)
{
/*UWORD32 linear_coeff:
linear_coeff = ps_rd_model->model_coeff_a_lin_wo_int;*/
return (ps_rd_model->model_coeff_a_lin_wo_int);
}
#endif /* !(RC_FIXED_POINT) */
WORD32 rc_rd_model_dummy_for_avoiding_warnings(
rc_rd_model_t **pps_rc_rd_model, itt_memtab_t *ps_memtab, ITT_FUNC_TYPE_E e_func_type)
{
WORD32 i4_mem_tab_idx = 0;
static rc_rd_model_t s_rc_rd_model_temp;
/* Hack for al alloc, during which we dont have any state memory.
Dereferencing can cause issues */
if(e_func_type == GET_NUM_MEMTAB || e_func_type == FILL_MEMTAB)
(*pps_rc_rd_model) = &s_rc_rd_model_temp;
/*for src rate control state structure*/
if(e_func_type != GET_NUM_MEMTAB)
{
fill_memtab(
&ps_memtab[i4_mem_tab_idx], sizeof(rc_rd_model_t), MEM_TAB_ALIGNMENT, PERSISTENT, DDR);
use_or_fill_base(&ps_memtab[0], (void **)pps_rc_rd_model, e_func_type);
}
i4_mem_tab_idx++;
return (i4_mem_tab_idx);
}