diff options
| author | Ram Mohan <ram.mohan@ittiam.com> | 2018-10-05 18:05:06 +0530 |
|---|---|---|
| committer | Ray Essick <essick@google.com> | 2019-02-18 07:43:11 -0800 |
| commit | 69da5e22f66880b785b8d9d9b2b0ca706ac24d91 (patch) | |
| tree | f74d679fa97b370f412b864781c3bc03bde0e256 /encoder/cbr_buffer_control.c | |
| parent | e9568e04fc0749e3b3ad8bdcce61163f0f08d894 (diff) | |
| download | platform_external_libhevc-69da5e22f66880b785b8d9d9b2b0ca706ac24d91.tar.gz platform_external_libhevc-69da5e22f66880b785b8d9d9b2b0ca706ac24d91.tar.bz2 platform_external_libhevc-69da5e22f66880b785b8d9d9b2b0ca706ac24d91.zip | |
libhevcenc: Initial commit
Test: hevcenc -c vid_enc_cfg.txt
Bug: 110456253
Test: CtsMediaTests/VideoEncoder
Change-Id: I9df8143709c3fe5d2c8398974a16529a3f8b8ebc
Diffstat (limited to 'encoder/cbr_buffer_control.c')
| -rw-r--r-- | encoder/cbr_buffer_control.c | 1384 |
1 files changed, 1384 insertions, 0 deletions
diff --git a/encoder/cbr_buffer_control.c b/encoder/cbr_buffer_control.c new file mode 100644 index 0000000..29aebf3 --- /dev/null +++ b/encoder/cbr_buffer_control.c @@ -0,0 +1,1384 @@ +/****************************************************************************** + * + * Copyright (C) 2018 The Android Open Source Project + * + * Licensed under the Apache License, Version 2.0 (the "License"); + * you may not use this file except in compliance with the License. + * You may obtain a copy of the License at: + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, software + * distributed under the License is distributed on an "AS IS" BASIS, + * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. + * See the License for the specific language governing permissions and + * limitations under the License. + * + ***************************************************************************** + * Originally developed and contributed by Ittiam Systems Pvt. Ltd, Bangalore +*/ +/*! +****************************************************************************** +* \file cbr_buffer_control.c +* +* \brief +* This file contains all functions needed for cbr buffer control +* \date +* 06/05/2008 +* +* \author +* ittiam +* +* \List of Functions +* init_cbr_buffer +* cbr_buffer_constraint_check +* get_cbr_buffer_status +* update_cbr_buffer +* +****************************************************************************** +*/ +/*****************************************************************************/ +/* File Includes */ +/*****************************************************************************/ + +/* System include files */ +#include <stdio.h> + +/* User include files */ +#include "assert.h" +#include "ittiam_datatypes.h" +#include "rc_cntrl_param.h" +#include "rc_common.h" +#include "mem_req_and_acq.h" +#include "fixed_point_error_bits.h" +#include "cbr_buffer_control.h" +#include "trace_support.h" +#include "var_q_operator.h" + +#define MIN(x, y) ((x) < (y)) ? (x) : (y) +/*allow a maximum of 20 percent deviation when input is very large*/ +#define VBR_MAX_BIT_DEV_SEC 50LL + +typedef struct cbr_buffer_t +{ + WORD32 i4_buffer_size; /* Buffer size = Delay * Bitrate*/ + WORD32 + i4_drain_bits_per_frame[MAX_NUM_DRAIN_RATES]; /* Constant drain rate */ + WORD32 i4_ebf; /* Encoder Buffer Fullness */ + LWORD64 + i8_ebf_bit_alloc; /* current encoder buffer fulness that accounts precise bit consumption (not truncated to max buffer size at skip)*/ + LWORD64 i8_credit_level; + WORD32 i4_upr_thr[MAX_PIC_TYPE]; /* Upper threshold of the Buffer */ + WORD32 i4_low_thr[MAX_PIC_TYPE]; /* Lower threshold of the Buffer */ + error_bits_handle + aps_bpf_error_bits[MAX_NUM_DRAIN_RATES]; /* For error due to bits per frame calculation */ + WORD32 + i4_is_cbr_mode; /* Whether the buffer model is used for CBR or VBR streaming */ + /* Input parameters stored for initialisation */ + WORD32 ai4_bit_rate[MAX_NUM_DRAIN_RATES]; + WORD32 i4_max_delay; + WORD32 ai4_num_pics_in_delay_period[MAX_PIC_TYPE]; + WORD32 i4_tgt_frm_rate; + UWORD32 u4_max_vbv_buf_size; + WORD32 i4_peak_drain_rate_frame; + WORD32 u4_num_frms_in_delay; + UWORD32 u4_vbr_max_bit_deviation; + rc_type_e e_rc_type; + WORD32 i4_vbr_no_peak_rate_duration_limit; + LWORD64 i8_tot_frm_to_be_encoded; + LWORD64 + i8_num_frames_encoded; /*need to track the number of frames encoded to calculate possible deviaiton allowed*/ + WORD32 i4_cbr_rc_pass; + WORD32 i4_inter_frame_int; + WORD32 i4_intra_frame_int; + WORD32 i4_capped_vbr_on; + float f_max_dur_peak_rate; + LWORD64 i4_ebf_estimate; +} cbr_buffer_t; + +#if NON_STEADSTATE_CODE +WORD32 cbr_buffer_num_fill_use_free_memtab( + cbr_buffer_t **pps_cbr_buffer, itt_memtab_t *ps_memtab, ITT_FUNC_TYPE_E e_func_type) +{ + WORD32 i4_mem_tab_idx = 0, i; + static cbr_buffer_t s_cbr_buffer_temp; + + /* Hack for al alloc, during which we dont have any state memory. + Dereferencing can cause issues */ + if(e_func_type == GET_NUM_MEMTAB || e_func_type == FILL_MEMTAB) + (*pps_cbr_buffer) = &s_cbr_buffer_temp; + + if(e_func_type != GET_NUM_MEMTAB) + { + fill_memtab( + &ps_memtab[i4_mem_tab_idx], sizeof(cbr_buffer_t), MEM_TAB_ALIGNMENT, PERSISTENT, DDR); + use_or_fill_base(&ps_memtab[0], (void **)pps_cbr_buffer, e_func_type); + } + i4_mem_tab_idx++; + + for(i = 0; i < MAX_NUM_DRAIN_RATES; i++) + { + i4_mem_tab_idx += error_bits_num_fill_use_free_memtab( + &pps_cbr_buffer[0]->aps_bpf_error_bits[i], &ps_memtab[i4_mem_tab_idx], e_func_type); + } + return (i4_mem_tab_idx); +} +static void set_upper_lower_vbv_threshold(cbr_buffer_t *ps_cbr_buffer, WORD32 i4_bits_per_frm) +{ + WORD32 i; + for(i = 0; i < MAX_PIC_TYPE; i++) + { + ps_cbr_buffer->i4_upr_thr[i] = + (WORD32)(((LWORD64)ps_cbr_buffer->i4_buffer_size >> 4) * UPPER_THRESHOLD_EBF_Q4); + if(ps_cbr_buffer->e_rc_type == VBR_STREAMING) + { + /*lower threshold can be zero as there is no problem of studffing in this mode (VBR STORAGE)*/ + if(ps_cbr_buffer->i4_vbr_no_peak_rate_duration_limit) + ps_cbr_buffer->i4_low_thr[i] = 0; + else + ps_cbr_buffer->i4_low_thr[i] = ps_cbr_buffer->i4_inter_frame_int * i4_bits_per_frm; + } + else + { + if(ps_cbr_buffer->i4_inter_frame_int == 1) + ps_cbr_buffer->i4_low_thr[i] = 0; + else + { + ps_cbr_buffer->i4_low_thr[i] = ps_cbr_buffer->i4_inter_frame_int * i4_bits_per_frm; + } + } + /*For huge buffer low limit can be higher*/ + + if(ps_cbr_buffer->i4_low_thr[i] < (ps_cbr_buffer->i4_buffer_size >> 6)) + ps_cbr_buffer->i4_low_thr[i] = (ps_cbr_buffer->i4_buffer_size >> 6); + + if(ps_cbr_buffer->i4_low_thr[i] > (ps_cbr_buffer->i4_buffer_size >> 3)) //KISH_DEBUG + ps_cbr_buffer->i4_low_thr[i] = (ps_cbr_buffer->i4_buffer_size >> 3); + ASSERT(ps_cbr_buffer->i4_upr_thr[i] > ps_cbr_buffer->i4_low_thr[i]); + } +} +/* ******************************************************************************/ +/** + * @brief Initialise the CBR VBV buffer state. + * This could however be used for VBR streaming VBV also + * + * @param ps_cbr_buffer + * @param i4_buffer_delay + * @param i4_tgt_frm_rate + * @param i4_bit_rate + * @param u4_num_pics_in_delay_prd + * @param u4_vbv_buf_size + */ +/* ******************************************************************************/ +void init_cbr_buffer( + cbr_buffer_t *ps_cbr_buffer, + WORD32 i4_buffer_delay, + WORD32 i4_tgt_frm_rate, + UWORD32 u4_bit_rate, + UWORD32 *u4_num_pics_in_delay_prd, + UWORD32 u4_vbv_buf_size, + UWORD32 u4_intra_frm_int, + rc_type_e e_rc_type, + UWORD32 u4_peak_bit_rate, + UWORD32 u4_num_frames_in_delay, + float f_max_dur_peak_rate, + LWORD64 i8_num_frames_to_encode, + WORD32 i4_inter_frm_int, + WORD32 i4_cbr_rc_pass, + WORD32 i4_capped_vbr_flag) + +{ + WORD32 i4_bits_per_frm[MAX_NUM_DRAIN_RATES]; + int i; + + /* Initially Encoder buffer fullness is zero */ + ps_cbr_buffer->i4_ebf = 0; + ps_cbr_buffer->i4_ebf_estimate = 0; + ps_cbr_buffer->i8_ebf_bit_alloc = 0; + ps_cbr_buffer->i8_credit_level = 0; + ps_cbr_buffer->e_rc_type = e_rc_type; + ps_cbr_buffer->i4_capped_vbr_on = i4_capped_vbr_flag; + /*If this is set to 1, it acts similar to storage VBR which allows peak rate to be sustained for infinite duration*/ + ps_cbr_buffer->i4_vbr_no_peak_rate_duration_limit = 0; + ps_cbr_buffer->i8_num_frames_encoded = 0; + ps_cbr_buffer->i8_tot_frm_to_be_encoded = i8_num_frames_to_encode; + ps_cbr_buffer->i4_cbr_rc_pass = i4_cbr_rc_pass; + ps_cbr_buffer->i4_inter_frame_int = i4_inter_frm_int; + ps_cbr_buffer->i4_intra_frame_int = u4_intra_frm_int; + ps_cbr_buffer->f_max_dur_peak_rate = f_max_dur_peak_rate; + + for(i = 0; i < MAX_NUM_DRAIN_RATES; i++) + { + X_PROD_Y_DIV_Z(u4_bit_rate, 1000, i4_tgt_frm_rate, i4_bits_per_frm[i]); + /* Drain rate = bitrate/(framerate/1000) */ + ps_cbr_buffer->i4_drain_bits_per_frame[i] = i4_bits_per_frm[i]; + /* initialise the bits per frame error bits calculation */ + init_error_bits(ps_cbr_buffer->aps_bpf_error_bits[i], i4_tgt_frm_rate, u4_bit_rate); + } + + /* Bitrate * delay = buffer size, divide by 1000 as delay is in ms*/ + if(e_rc_type == CBR_NLDRC) /* This would mean CBR mode */ + { + //buffer size should be independent of initial delay + //X_PROD_Y_DIV_Z(u4_bit_rate,i4_buffer_delay,1000,ps_cbr_buffer->i4_buffer_size); + ps_cbr_buffer->i4_buffer_size = (WORD32)u4_vbv_buf_size; + ps_cbr_buffer->i4_is_cbr_mode = 1; + ps_cbr_buffer->i4_peak_drain_rate_frame = i4_bits_per_frm[0]; + /*In CBR the max file size deviaiton allowed is specified by buffer size*/ + ps_cbr_buffer->u4_vbr_max_bit_deviation = ps_cbr_buffer->i4_buffer_size; + } + else if(e_rc_type == VBR_STREAMING) + { + /*this is raw vbv buffer size, also initilize the buffer window to bit alloc (credit limit)*/ + ps_cbr_buffer->i4_buffer_size = (WORD32)u4_vbv_buf_size; + /*if there is no limit on duration for which peak bitrate can be sustained, bits can be moved from any region to other region + giving better quality*/ + if(f_max_dur_peak_rate < 0) + ps_cbr_buffer->i4_vbr_no_peak_rate_duration_limit = 1; + /*To avoid file size deviation in case of VBR mode of rate control, clip the max deviaiton allowed based on number of frames to enode*/ + { + ULWORD64 u8_vbr_max_bit_deviation; + ULWORD64 file_size = (ULWORD64)( + (((LWORD64)u4_bit_rate * 1000) / i4_tgt_frm_rate) * i8_num_frames_to_encode); + + /*When f_max_dur_peak_rate is -ve, it implies user is not worried about duration for which peak is sustained, hence go with max possible value*/ + if(f_max_dur_peak_rate > 0) + u8_vbr_max_bit_deviation = (ULWORD64)(f_max_dur_peak_rate * u4_bit_rate); + else + u8_vbr_max_bit_deviation = (ULWORD64)(VBR_MAX_BIT_DEV_SEC * u4_bit_rate); + + /*when num frames to encode is negative is -ve it implies total frames data is not available (as in case of live encoding)*/ + if(i8_num_frames_to_encode > 0) + { + /*allow atleast one second deviation or 12% of total file size whichever is higher*/ + if(u8_vbr_max_bit_deviation > (file_size >> 3)) + u8_vbr_max_bit_deviation = (UWORD32)(file_size >> 3); + + /*allow atleast one second for shorter sequence*/ + if(u8_vbr_max_bit_deviation < u4_bit_rate) + u8_vbr_max_bit_deviation = u4_bit_rate; + } + else + { + /*the data of number of frames to be encoded is not available*/ + /*start off with one second delay, this will be later adjusted once large number of frames are encoded*/ + u8_vbr_max_bit_deviation = u4_bit_rate; + } + ps_cbr_buffer->u4_vbr_max_bit_deviation = u8_vbr_max_bit_deviation; + } + ps_cbr_buffer->i4_is_cbr_mode = 0; + X_PROD_Y_DIV_Z( + u4_peak_bit_rate, 1000, i4_tgt_frm_rate, ps_cbr_buffer->i4_peak_drain_rate_frame); + } + else + { + /*currently only two modes are supported*/ + ASSERT(e_rc_type == CONST_QP); + } + + if(ps_cbr_buffer->i4_buffer_size > (WORD32)u4_vbv_buf_size) + { + ps_cbr_buffer->i4_buffer_size = u4_vbv_buf_size; + } + + /* Uppr threshold for + I frame = 1 * bits per frame + P Frame = 4 * bits per frame. + The threshold for I frame is only 1 * bits per frame as the threshold should + only account for error in estimated bits. + In P frame it should account for difference bets bits consumed by I(Scene change) + and P frame I to P complexity is assumed to be 5. */ + /*HEVC_hierarchy*/ + if(e_rc_type != CONST_QP) + set_upper_lower_vbv_threshold(ps_cbr_buffer, i4_bits_per_frm[0]); + /* Storing the input parameters for using it for change functions */ + for(i = 0; i < MAX_NUM_DRAIN_RATES; i++) + ps_cbr_buffer->ai4_bit_rate[i] = u4_bit_rate; + for(i = 0; i < MAX_PIC_TYPE; i++) + { + ps_cbr_buffer->ai4_num_pics_in_delay_period[i] = u4_num_pics_in_delay_prd[i]; + } + ps_cbr_buffer->i4_tgt_frm_rate = i4_tgt_frm_rate; + ps_cbr_buffer->i4_max_delay = i4_buffer_delay; + ps_cbr_buffer->u4_max_vbv_buf_size = u4_vbv_buf_size; + ps_cbr_buffer->u4_num_frms_in_delay = u4_num_frames_in_delay; +} +#endif /* #if NON_STEADSTATE_CODE */ + +/* ******************************************************************************/ +/** + * @brief Condition check for constrining the number of bits allocated based on bufer size + * + * @param ps_cbr_buffer + * @param i4_tgt_bits + * @param e_pic_type + * + * @return + */ +/* ******************************************************************************/ +WORD32 cbr_buffer_constraint_check( + cbr_buffer_t *ps_cbr_buffer, + WORD32 i4_tgt_bits, + picture_type_e e_pic_type, + WORD32 *pi4_max_tgt_bits, + WORD32 *pi4_min_tgt_bits) +{ + WORD32 i4_max_tgt_bits, i4_min_tgt_bits; + WORD32 i4_drain_bits_per_frame = (e_pic_type == I_PIC) + ? ps_cbr_buffer->i4_drain_bits_per_frame[0] + : ps_cbr_buffer->i4_drain_bits_per_frame[1]; + WORD32 i4_error_bits = (e_pic_type == I_PIC) + ? get_error_bits(ps_cbr_buffer->aps_bpf_error_bits[0]) + : get_error_bits(ps_cbr_buffer->aps_bpf_error_bits[1]); + + /*trace_printf(" ebf = %d bebf = %d ",ps_cbr_buffer->i4_ebf,ps_cbr_buffer->i8_ebf_bit_alloc);*/ + /* Max tgt bits = Upper threshold - current encoder buffer fullness */ + i4_max_tgt_bits = + (WORD32)(ps_cbr_buffer->i4_upr_thr[e_pic_type] - ps_cbr_buffer->i4_ebf_estimate); + /* Max tgt bits cannot be negative */ + if(i4_max_tgt_bits < 0) + i4_max_tgt_bits = 0; + + /* Min tgt bits , least number of bits in the Encoder after + draining such that it is greater than lower threshold */ + i4_min_tgt_bits = (WORD32)( + ps_cbr_buffer->i4_low_thr[e_pic_type] - + (ps_cbr_buffer->i4_ebf_estimate - i4_drain_bits_per_frame - i4_error_bits)); + /*Min tgt bits cannot be negative*/ + if(i4_min_tgt_bits < 0) + i4_min_tgt_bits = 0; + + /* current tgt bits should be between max and min tgt bits*/ + CLIP(i4_tgt_bits, i4_max_tgt_bits, i4_min_tgt_bits); + pi4_min_tgt_bits[0] = i4_min_tgt_bits; + pi4_max_tgt_bits[0] = i4_max_tgt_bits; + return i4_tgt_bits; +} + +/* ******************************************************************************/ +/** + * @brief constaints the bit allocation based on buffer size + * + * @param ps_cbr_buffer + * @param i4_tgt_bits + * @param e_pic_type + * + * @return + */ +/* ******************************************************************************/ +WORD32 vbr_stream_buffer_constraint_check( + cbr_buffer_t *ps_cbr_buffer, + WORD32 i4_tgt_bits, + picture_type_e e_pic_type, + WORD32 *pi4_max_bits, + WORD32 *pi4_min_bits) +{ + WORD32 i4_max_tgt_bits, i4_min_tgt_bits = 0; + + /* Max tgt bits = Upper threshold - current encoder buffer fullness */ + /*maximum target for a pic is amount of bits that can be transmitted to decoder buffer in delay assuming max drain rate + This above limit has to be constrained wrt a single frame being accomodated in the buffer*/ + i4_max_tgt_bits = (WORD32)( + (ps_cbr_buffer->u4_num_frms_in_delay * ps_cbr_buffer->i4_peak_drain_rate_frame) - + ps_cbr_buffer->i4_ebf_estimate); + /*the below check is necessary to make sure that a single frame to be accomodated in encoder buffer*/ + if(i4_max_tgt_bits > ps_cbr_buffer->i4_upr_thr[e_pic_type] - ps_cbr_buffer->i4_ebf_estimate) + { + i4_max_tgt_bits = + (WORD32)(ps_cbr_buffer->i4_upr_thr[e_pic_type] - ps_cbr_buffer->i4_ebf_estimate); + } + + /*In VBR streaming though encoder buffer underflow is not a problem, at any point of time the bitrate underconsumption + cannot go below specified limit. Hence it is limited based on possible bitrate deviation allowed*/ + /*Enabling movement of stuffing bits always*/ + if(ps_cbr_buffer->i4_vbr_no_peak_rate_duration_limit) + { + /*If the content has underconsumed force it to consume atleast per frame bits so that end of encoding there wont be too much undersonsumption*/ + if(ps_cbr_buffer->i8_ebf_bit_alloc < 0 && ps_cbr_buffer->i4_cbr_rc_pass != 2) + i4_min_tgt_bits = (ps_cbr_buffer->i4_drain_bits_per_frame[0] >> 1); + } + else + { + /*In this case buffer is always guranteed to be positive, to avoid stuffing give decent amount of min bits*/ + i4_min_tgt_bits = (WORD32)(ps_cbr_buffer->i4_low_thr[0] - ps_cbr_buffer->i8_ebf_bit_alloc); + } + + /*Clip min target bit*/ + if(i4_min_tgt_bits < 0) + i4_min_tgt_bits = 0; + if(i4_tgt_bits < i4_min_tgt_bits) + i4_tgt_bits = i4_min_tgt_bits; + pi4_min_bits[0] = i4_min_tgt_bits; + /* Max tgt bits cannot be negative */ + if(i4_max_tgt_bits < 0) + i4_max_tgt_bits = 0; + if(i4_tgt_bits > i4_max_tgt_bits) + i4_tgt_bits = i4_max_tgt_bits; + pi4_max_bits[0] = i4_max_tgt_bits; + + return i4_tgt_bits; +} + +/* ******************************************************************************/ +/** + * @brief Verifies the buffer state and returns whether it is overflowing, underflowing or normal + * + * @param ps_cbr_buffer + * @param i4_tot_consumed_bits + * @param pi4_num_bits_to_prevent_overflow + * @param e_pic_type + * + * @return + */ +/* ******************************************************************************/ +vbv_buf_status_e get_cbr_buffer_status( + cbr_buffer_t *ps_cbr_buffer, + WORD32 i4_tot_consumed_bits, + WORD32 *pi4_num_bits_to_prevent_overflow, + picture_type_e e_pic_type, + rc_type_e e_rc_type) +{ + vbv_buf_status_e e_buf_status; + WORD32 i4_cur_enc_buf; + WORD32 i4_error_bits = (e_pic_type == I_PIC) + ? get_error_bits(ps_cbr_buffer->aps_bpf_error_bits[0]) + : get_error_bits(ps_cbr_buffer->aps_bpf_error_bits[1]); + WORD32 i4_drain_bits_per_frame = (e_pic_type == I_PIC) + ? ps_cbr_buffer->i4_drain_bits_per_frame[0] + : ps_cbr_buffer->i4_drain_bits_per_frame[1]; + + /* Add the tot consumed bits to the Encoder Buffer*/ + i4_cur_enc_buf = ps_cbr_buffer->i4_ebf + i4_tot_consumed_bits; + + /* If the Encoder exceeds the Buffer Size signal an Overflow*/ + if(i4_cur_enc_buf > ps_cbr_buffer->i4_buffer_size) + { + e_buf_status = VBV_OVERFLOW; + i4_cur_enc_buf = ps_cbr_buffer->i4_buffer_size; + } + else + { + /* Subtract the constant drain bits and error bits due to fixed point implementation*/ + i4_cur_enc_buf -= (i4_drain_bits_per_frame + i4_error_bits); + + if(e_rc_type == VBR_STREAMING) + { + /*In VBR suffing scenerio will not occur*/ + if(i4_cur_enc_buf < 0) + i4_cur_enc_buf = 0; + } + /* If the buffer is less than stuffing threshold an Underflow is signaled else its NORMAL*/ + if(i4_cur_enc_buf < 0) + { + e_buf_status = VBV_UNDERFLOW; + } + else + { + e_buf_status = VBV_NORMAL; + } + + if(i4_cur_enc_buf < 0) + i4_cur_enc_buf = 0; + } + + /* The RC lib models the encoder buffer, but the VBV buffer characterises the decoder buffer */ + if(e_buf_status == VBV_OVERFLOW) + { + e_buf_status = VBV_UNDERFLOW; + } + else if(e_buf_status == VBV_UNDERFLOW) + { + e_buf_status = VBV_OVERFLOW; + } + + pi4_num_bits_to_prevent_overflow[0] = (ps_cbr_buffer->i4_buffer_size - i4_cur_enc_buf); + + return e_buf_status; +} + +/* ******************************************************************************/ +/** + * @brief Based on the bits consumed the buffer model is updated + * + * @param ps_cbr_buffer + * @param i4_tot_consumed_bits + * @param e_pic_type + */ +/* ******************************************************************************/ +void update_cbr_buffer( + cbr_buffer_t *ps_cbr_buffer, WORD32 i4_tot_consumed_bits, picture_type_e e_pic_type) +{ + WORD32 i; + WORD32 i4_error_bits = (e_pic_type == I_PIC) + ? get_error_bits(ps_cbr_buffer->aps_bpf_error_bits[0]) + : get_error_bits(ps_cbr_buffer->aps_bpf_error_bits[1]); + WORD32 i4_drain_bits_per_frame = (e_pic_type == I_PIC) + ? ps_cbr_buffer->i4_drain_bits_per_frame[0] + : ps_cbr_buffer->i4_drain_bits_per_frame[1]; + + ps_cbr_buffer->i8_num_frames_encoded++; + if(ps_cbr_buffer->e_rc_type == VBR_STREAMING && ps_cbr_buffer->i8_tot_frm_to_be_encoded < 0) + { + LWORD64 i8_max_bit_dev_allowed = ps_cbr_buffer->ai4_bit_rate[0]; + LWORD64 approx_file_size = ps_cbr_buffer->i8_num_frames_encoded * + ps_cbr_buffer->ai4_bit_rate[0] * 1000 / + ps_cbr_buffer->i4_tgt_frm_rate; + if(i8_max_bit_dev_allowed < (approx_file_size >> 4)) + i8_max_bit_dev_allowed = (approx_file_size >> 4); + + /*have a max limit so that bit dev does not grow for very long sequence like 24 hours of encoding (max can be 20 second)*/ + if(i8_max_bit_dev_allowed > (VBR_MAX_BIT_DEV_SEC * ps_cbr_buffer->ai4_bit_rate[0])) + i8_max_bit_dev_allowed = (VBR_MAX_BIT_DEV_SEC * ps_cbr_buffer->ai4_bit_rate[0]); + + ps_cbr_buffer->u4_max_vbv_buf_size = (UWORD32)i8_max_bit_dev_allowed; + } + /* Update the Encoder buffer with the total consumed bits*/ + if(ps_cbr_buffer->i4_is_cbr_mode != 0) + { + ps_cbr_buffer->i4_ebf += i4_tot_consumed_bits; + ps_cbr_buffer->i8_ebf_bit_alloc += i4_tot_consumed_bits; + + /* Subtract the drain bits and error bits due to fixed point implementation*/ + ps_cbr_buffer->i4_ebf -= (i4_drain_bits_per_frame + i4_error_bits); + ps_cbr_buffer->i8_ebf_bit_alloc -= (i4_drain_bits_per_frame + i4_error_bits); + } + else + { + ps_cbr_buffer->i4_ebf += i4_tot_consumed_bits; + ps_cbr_buffer->i4_ebf -= + ((MIN(ps_cbr_buffer->i4_peak_drain_rate_frame, ps_cbr_buffer->i4_ebf)) + i4_error_bits); + + ps_cbr_buffer->i8_ebf_bit_alloc += i4_tot_consumed_bits; + ps_cbr_buffer->i8_ebf_bit_alloc -= + (ps_cbr_buffer->i4_drain_bits_per_frame[0] + i4_error_bits); + + ps_cbr_buffer->i8_credit_level += i4_tot_consumed_bits; + ps_cbr_buffer->i8_credit_level -= + (ps_cbr_buffer->i4_drain_bits_per_frame[0] + i4_error_bits); + /*To keep limit on duration for which peak rate can be sustained limit the accumulation of bits from simpler regions*/ + if(!ps_cbr_buffer->i4_vbr_no_peak_rate_duration_limit) + { + if(ps_cbr_buffer->i8_ebf_bit_alloc < 0) + ps_cbr_buffer->i8_ebf_bit_alloc = + 0; /*This will make VBR buffer believe that the bits are lost*/ + } + } + + /*SS - Fix for lack of stuffing*/ + if(ps_cbr_buffer->i4_ebf < 0) + { + //trace_printf("Error: Should not be coming here with bit stuffing \n"); + ps_cbr_buffer->i4_ebf = 0; + } + + if(ps_cbr_buffer->i4_ebf > ps_cbr_buffer->i4_buffer_size) + { + //trace_printf("Error: Frame should be skipped\n"); + ps_cbr_buffer->i4_ebf = ps_cbr_buffer->i4_buffer_size; + } + + ps_cbr_buffer->i4_ebf_estimate = ps_cbr_buffer->i4_ebf; + + trace_printf( + "VBR ebf = %d bebf = %d ", ps_cbr_buffer->i4_ebf, ps_cbr_buffer->i8_ebf_bit_alloc); + /* Update the error bits */ + for(i = 0; i < MAX_NUM_DRAIN_RATES; i++) + update_error_bits(ps_cbr_buffer->aps_bpf_error_bits[i]); +} + +/* ******************************************************************************/ +/** + * @brief If the buffer underflows then return the number of bits to prevent underflow + * + * @param ps_cbr_buffer + * @param i4_tot_consumed_bits + * @param e_pic_type + * + * @return + */ +/* ******************************************************************************/ +WORD32 get_cbr_bits_to_stuff( + cbr_buffer_t *ps_cbr_buffer, WORD32 i4_tot_consumed_bits, picture_type_e e_pic_type) +{ + WORD32 i4_bits_to_stuff; + WORD32 i4_error_bits = (e_pic_type == I_PIC) + ? get_error_bits(ps_cbr_buffer->aps_bpf_error_bits[0]) + : get_error_bits(ps_cbr_buffer->aps_bpf_error_bits[1]); + WORD32 i4_drain_bits_per_frame = (e_pic_type == I_PIC) + ? ps_cbr_buffer->i4_drain_bits_per_frame[0] + : ps_cbr_buffer->i4_drain_bits_per_frame[1]; + + /* Stuffing bits got from the following equation + Stuffing_threshold = ebf + tcb - drain bits - error bits + stuff_bits*/ + i4_bits_to_stuff = + i4_drain_bits_per_frame + i4_error_bits - (ps_cbr_buffer->i4_ebf + i4_tot_consumed_bits); + + return i4_bits_to_stuff; +} + +/* ******************************************************************************/ +/** + * @brief Change the state for change in bit rate + * + * @param ps_cbr_buffer + * @param i4_bit_rate + */ +/* ******************************************************************************/ +void change_cbr_vbv_bit_rate( + cbr_buffer_t *ps_cbr_buffer, WORD32 *i4_bit_rate, WORD32 i4_peak_bitrate) +{ + WORD32 i4_bits_per_frm[MAX_NUM_DRAIN_RATES]; + int i; + + for(i = 0; i < MAX_NUM_DRAIN_RATES; i++) + { + X_PROD_Y_DIV_Z(i4_bit_rate[i], 1000, ps_cbr_buffer->i4_tgt_frm_rate, i4_bits_per_frm[i]); + /* Drain rate = bitrate/(framerate/1000) */ + ps_cbr_buffer->i4_drain_bits_per_frame[i] = i4_bits_per_frm[i]; + + /* initialise the bits per frame error bits calculation */ + change_bitrate_in_error_bits(ps_cbr_buffer->aps_bpf_error_bits[i], i4_bit_rate[i]); + } + X_PROD_Y_DIV_Z( + i4_peak_bitrate, + 1000, + ps_cbr_buffer->i4_tgt_frm_rate, + ps_cbr_buffer->i4_peak_drain_rate_frame); + /* Bitrate * delay = buffer size, divide by 1000 as delay is in ms*/ + //if(i4_bit_rate[0] == i4_bit_rate[1]) /* This would mean CBR mode */ + { + X_PROD_Y_DIV_Z( + i4_bit_rate[0], + ps_cbr_buffer->i4_max_delay, + 1000, + ps_cbr_buffer->i4_buffer_size); //the delay term is supposed to remain constant + //ps_cbr_buffer->i4_is_cbr_mode = 1; + ps_cbr_buffer->u4_max_vbv_buf_size = ps_cbr_buffer->i4_buffer_size; + } + if(ps_cbr_buffer->i4_buffer_size > (WORD32)ps_cbr_buffer->u4_max_vbv_buf_size) + { + ps_cbr_buffer->i4_buffer_size = ps_cbr_buffer->u4_max_vbv_buf_size; + } + set_upper_lower_vbv_threshold(ps_cbr_buffer, i4_bits_per_frm[0]); + if(ps_cbr_buffer->e_rc_type == CBR_NLDRC) + { + ps_cbr_buffer->u4_vbr_max_bit_deviation = ps_cbr_buffer->i4_buffer_size; + } + else + { + /*DCB: the deviaiton must be altered for VBR case, when bitrate is lowered quality might be bad because of this*/ + { + ULWORD64 u8_vbr_max_bit_deviation = + (ULWORD64)(ps_cbr_buffer->f_max_dur_peak_rate * i4_bit_rate[0]); + ULWORD64 file_size = (ULWORD64)( + (((LWORD64)i4_bit_rate[0] * 1000) / ps_cbr_buffer->i4_tgt_frm_rate) * + (ps_cbr_buffer->i8_tot_frm_to_be_encoded - ps_cbr_buffer->i8_num_frames_encoded)); + /*When f_max_dur_peak_rate is -ve, it implies user is not worried about duration for which peak is sustained, hence go with max possible value*/ + if(ps_cbr_buffer->f_max_dur_peak_rate > 0) + u8_vbr_max_bit_deviation = + (ULWORD64)(ps_cbr_buffer->f_max_dur_peak_rate * i4_bit_rate[0]); + else + u8_vbr_max_bit_deviation = VBR_MAX_BIT_DEV_SEC * i4_bit_rate[0]; + + /*when num frames to encode is negative is -ve it implies total frames data is not available (as in case of live encoding)*/ + if(ps_cbr_buffer->i8_tot_frm_to_be_encoded > 0) + { + /*allow atleast one second deviation or 12% of total file size whichever is higher*/ + if(u8_vbr_max_bit_deviation > (file_size >> 3)) + u8_vbr_max_bit_deviation = (UWORD32)(file_size >> 3); + } + else + { + u8_vbr_max_bit_deviation = (UWORD32)(file_size >> 3); + } + /*allow atleast one second for shorter sequence*/ + if(u8_vbr_max_bit_deviation < (ULWORD64)i4_bit_rate[0]) + u8_vbr_max_bit_deviation = (ULWORD64)i4_bit_rate[0]; + ps_cbr_buffer->u4_vbr_max_bit_deviation = u8_vbr_max_bit_deviation; + } + } + + /* Storing the input parameters for using it for change functions */ + for(i = 0; i < MAX_NUM_DRAIN_RATES; i++) + ps_cbr_buffer->ai4_bit_rate[i] = i4_bit_rate[i]; +} +/* ******************************************************************************/ +/** + * @brief Update the state for change in number of pics in the delay period + * + * @param ps_cbr_buffer + * @param u4_num_pics_in_delay_prd + */ +/* ******************************************************************************/ +void change_cbr_vbv_num_pics_in_delay_period( + cbr_buffer_t *ps_cbr_buffer, UWORD32 *u4_num_pics_in_delay_prd) +{ + WORD32 i; + + if(!ps_cbr_buffer->i4_is_cbr_mode) + { + ps_cbr_buffer->i4_buffer_size = + u4_num_pics_in_delay_prd[0] * ps_cbr_buffer->i4_drain_bits_per_frame[0] + + u4_num_pics_in_delay_prd[1] * ps_cbr_buffer->i4_drain_bits_per_frame[1]; + + if(ps_cbr_buffer->i4_buffer_size > (WORD32)ps_cbr_buffer->u4_max_vbv_buf_size) + { + ps_cbr_buffer->i4_buffer_size = ps_cbr_buffer->u4_max_vbv_buf_size; + } + for(i = 0; i < MAX_PIC_TYPE; i++) + { + ps_cbr_buffer->i4_upr_thr[i] = + ps_cbr_buffer->i4_buffer_size - (ps_cbr_buffer->i4_buffer_size >> 3); + } + + /* Re-initilise the number of pics in delay period */ + for(i = 0; i < MAX_PIC_TYPE; i++) + { + ps_cbr_buffer->ai4_num_pics_in_delay_period[i] = u4_num_pics_in_delay_prd[i]; + } + } +} +/* ******************************************************************************/ +/** + * @ modifies the ebf estimated parameter based on error + * + * @param ps_cbr_buffer + * @param i4_bit_error + */ +/* ******************************************************************************/ +void cbr_modify_ebf_estimate(cbr_buffer_t *ps_cbr_buffer, WORD32 i4_bit_error) +{ + ps_cbr_buffer->i4_ebf_estimate = ps_cbr_buffer->i4_ebf + i4_bit_error; + if(ps_cbr_buffer->i4_ebf_estimate < 0) + { + ps_cbr_buffer->i4_ebf_estimate = 0; + } + else if(ps_cbr_buffer->i4_ebf_estimate > ps_cbr_buffer->i4_buffer_size) + { + ps_cbr_buffer->i4_ebf_estimate = ps_cbr_buffer->i4_buffer_size; + } +} + +/* ******************************************************************************/ +/** + * @ get the buffer size + * + * @param ps_cbr_buffer + */ +/* ******************************************************************************/ + +WORD32 get_cbr_buffer_size(cbr_buffer_t *ps_cbr_buffer) +{ + return (ps_cbr_buffer->i4_buffer_size); +} + +#if NON_STEADSTATE_CODE +/* ******************************************************************************/ +/** + * @brief update the state for change in target frame rate + * + * @param ps_cbr_buffer + * @param i4_tgt_frm_rate + */ +/* ******************************************************************************/ +void change_cbr_vbv_tgt_frame_rate(cbr_buffer_t *ps_cbr_buffer, WORD32 i4_tgt_frm_rate) +{ + WORD32 i4_i, i4_bits_per_frm[MAX_NUM_DRAIN_RATES]; + int i; + + for(i = 0; i < MAX_NUM_DRAIN_RATES; i++) + { + X_PROD_Y_DIV_Z(ps_cbr_buffer->ai4_bit_rate[i], 1000, i4_tgt_frm_rate, i4_bits_per_frm[i]); + /* Drain rate = bitrate/(framerate/1000) */ + ps_cbr_buffer->i4_drain_bits_per_frame[i] = i4_bits_per_frm[i]; + /* initialise the bits per frame error bits calculation */ + change_frm_rate_in_error_bits(ps_cbr_buffer->aps_bpf_error_bits[i], i4_tgt_frm_rate); + } + + /* Bitrate * delay = buffer size, divide by 1000 as delay is in ms*/ + if(!ps_cbr_buffer->i4_is_cbr_mode) + { + /* VBR streaming case which has different drain rates for I and P */ + ps_cbr_buffer->i4_buffer_size = ps_cbr_buffer->ai4_num_pics_in_delay_period[0] * + ps_cbr_buffer->i4_drain_bits_per_frame[0] + + ps_cbr_buffer->ai4_num_pics_in_delay_period[1] * + ps_cbr_buffer->i4_drain_bits_per_frame[1]; + } + + if(ps_cbr_buffer->i4_buffer_size > (WORD32)ps_cbr_buffer->u4_max_vbv_buf_size) + { + ps_cbr_buffer->i4_buffer_size = ps_cbr_buffer->u4_max_vbv_buf_size; + } + + for(i4_i = 0; i4_i < MAX_PIC_TYPE; i4_i++) + { + /* Uppr threshold for + I frame = 1 * bits per frame + P Frame = 4 * bits per frame. + The threshold for I frame is only 1 * bits per frame as the threshold should + only account for error in estimated bits. + In P frame it should account for difference bets bits consumed by I(Scene change) + and P frame I to P complexity is assumed to be 5. */ + WORD32 i4_index; + i4_index = i4_i > 0 ? 1 : 0; + ps_cbr_buffer->i4_upr_thr[i4_i] = + ps_cbr_buffer->i4_buffer_size - (ps_cbr_buffer->i4_buffer_size >> 3); + + /* For both I and P frame Lower threshold is equal to drain rate. + Even if the encoder consumes zero bits it should have enough bits to drain*/ + ps_cbr_buffer->i4_low_thr[i4_i] = i4_bits_per_frm[i4_index]; + } + + /* Storing the input parameters for using it for change functions */ + ps_cbr_buffer->i4_tgt_frm_rate = i4_tgt_frm_rate; +} +/* ******************************************************************************/ +/** + * @brief update the state for change in buffer delay + * + * @param ps_cbr_buffer + * @param i4_buffer_delay + */ +/* ******************************************************************************/ +void change_cbr_buffer_delay(cbr_buffer_t *ps_cbr_buffer, WORD32 i4_buffer_delay) +{ + WORD32 i4_i; + + /* Bitrate * delay = buffer size, divide by 1000 as delay is in ms*/ + if(ps_cbr_buffer->i4_is_cbr_mode) + { + X_PROD_Y_DIV_Z( + ps_cbr_buffer->ai4_bit_rate[0], i4_buffer_delay, 1000, ps_cbr_buffer->i4_buffer_size); + } + + if(ps_cbr_buffer->i4_buffer_size > (WORD32)ps_cbr_buffer->u4_max_vbv_buf_size) + { + ps_cbr_buffer->i4_buffer_size = ps_cbr_buffer->u4_max_vbv_buf_size; + } + + for(i4_i = 0; i4_i < MAX_PIC_TYPE; i4_i++) + { + /* Uppr threshold for + I frame = 1 * bits per frame + P Frame = 4 * bits per frame. + The threshold for I frame is only 1 * bits per frame as the threshold should + only account for error in estimated bits. + In P frame it should account for difference bets bits consumed by I(Scene change) + and P frame I to P complexity is assumed to be 5. */ + ps_cbr_buffer->i4_upr_thr[i4_i] = + ps_cbr_buffer->i4_buffer_size - (ps_cbr_buffer->i4_buffer_size >> 3); + } + + /* Storing the input parameters for using it for change functions */ + ps_cbr_buffer->i4_max_delay = i4_buffer_delay; +} +/* ******************************************************************************/ +/** + * @brief update the state for change in buffer delay + * + * @param ps_cbr_buffer + * @param i4_buffer_delay + */ +/* ******************************************************************************/ +WORD32 get_cbr_buffer_delay(cbr_buffer_t *ps_cbr_buffer) +{ + return (ps_cbr_buffer->i4_max_delay); +} +/* ******************************************************************************/ +/** + * @brief get_cbr_ebf + * + * @param ps_cbr_buffer + */ +/* ******************************************************************************/ +WORD32 get_cbr_ebf(cbr_buffer_t *ps_cbr_buffer) +{ + return (ps_cbr_buffer->i4_ebf); +} +/* ******************************************************************************/ +/** + * @brief get_cbr_max_ebf + * + * @param ps_cbr_buffer + */ +/* ******************************************************************************/ +WORD32 get_cbr_max_ebf(cbr_buffer_t *ps_cbr_buffer) +{ + return (ps_cbr_buffer->i4_upr_thr[0]); +} +/* ******************************************************************************/ +/** + * @brief set_cbr_ebf + * + * @param ps_cbr_buffer + * @param i32_init_ebf + */ +/* ******************************************************************************/ +void set_cbr_ebf(cbr_buffer_t *ps_cbr_buffer, WORD32 i32_init_ebf) +{ + ps_cbr_buffer->i4_ebf = i32_init_ebf; +} +/* ******************************************************************************/ +/** + * @brief update_cbr_buf_mismatch_bit + * + * @param ps_cbr_buffer + * @param i4_error_bits + */ +/* ******************************************************************************/ +void update_cbr_buf_mismatch_bit(cbr_buffer_t *ps_cbr_buffer, WORD32 i4_error_bits) +{ + ps_cbr_buffer->i4_ebf -= i4_error_bits; + ps_cbr_buffer->i8_ebf_bit_alloc -= i4_error_bits; + ps_cbr_buffer->i8_credit_level -= i4_error_bits; +} +/* ******************************************************************************/ +/** + * @brief get encoded number of frames + * + * @param ps_cbr_buffer + */ +/* ******************************************************************************/ +LWORD64 get_num_frms_encoded(cbr_buffer_t *ps_cbr_buffer) +{ + return ps_cbr_buffer->i8_num_frames_encoded; +} +/* ******************************************************************************/ +/** + * @brief get num frames to encode + * + * @param ps_cbr_buffer + */ +/* ******************************************************************************/ +LWORD64 get_num_frms_to_encode(cbr_buffer_t *ps_cbr_buffer) +{ + return ps_cbr_buffer->i8_tot_frm_to_be_encoded; +} +/* ******************************************************************************/ +/** + * @brief get peak drain rate + * + * @param ps_cbr_buffer + */ +/* ******************************************************************************/ +/* The buffer limit in bit allocation should be according to peak bitrate */ +WORD32 get_buf_max_drain_rate(cbr_buffer_t *ps_cbr_buffer) +{ + if(ps_cbr_buffer->e_rc_type == VBR_STREAMING) + return ps_cbr_buffer->i4_peak_drain_rate_frame; + else if(ps_cbr_buffer->e_rc_type != CONST_QP) + { + ASSERT( + ps_cbr_buffer->i4_peak_drain_rate_frame == ps_cbr_buffer->i4_drain_bits_per_frame[0]); + return ps_cbr_buffer->i4_drain_bits_per_frame[0]; + } + return ps_cbr_buffer->i4_drain_bits_per_frame[0]; +} +/* ******************************************************************************/ +/** + * @brief get excess bits by moving in VBV buffer to enable bitrate greater than peak rate for shorter duration in very + * complex contents + * + * @param ps_cbr_buffer + * @param i4_tgt_frm_rate + */ +/* ******************************************************************************/ +WORD32 get_vbv_buffer_based_excess( + cbr_buffer_t *ps_cbr_buffer, + float f_complexity_peak_rate, + float f_cur_bits_complexity, + WORD32 bit_alloc_period, + WORD32 i4_num_gops_for_excess) +{ + LWORD64 max_buffer_level = (LWORD64)((float)ps_cbr_buffer->i4_buffer_size * 0.8f); + LWORD64 i8_excess_bits; + /*LWORD64target_buf_level;*/ + WORD32 + num_frm_to_be_distributed; //Number of frames for which excess bits should be distributed, using number of frames corresponding to buffer size for now + + if(ps_cbr_buffer->i4_upr_thr[0] < + max_buffer_level) /*choose max allowed level to min(upper_threshold,80% of buffer*/ + max_buffer_level = ps_cbr_buffer->i4_upr_thr[0]; + + if(ps_cbr_buffer->e_rc_type == VBR_STREAMING) + max_buffer_level = (LWORD64)( + ps_cbr_buffer->i4_peak_drain_rate_frame * ps_cbr_buffer->u4_num_frms_in_delay * 0.8f); + + if(f_cur_bits_complexity > + 0.9f) /*clip current to max of 80% of buffer size to avoid dangerous buffer level by end of GOP*/ + f_cur_bits_complexity = 0.9f; + + if(f_cur_bits_complexity < f_complexity_peak_rate || f_cur_bits_complexity < 0.1f || + ps_cbr_buffer->i4_buffer_size < + ps_cbr_buffer->ai4_bit_rate + [0]) //For buffer size less than 1 sec disable any contribution from buffer based for extra complex contents + { + /*For very low compleity content or Cavg do not allow buffer movement*/ + return 0; + } + + i8_excess_bits = (LWORD64)( + ((f_cur_bits_complexity - f_complexity_peak_rate) / (0.9f - f_complexity_peak_rate)) * + (max_buffer_level - ps_cbr_buffer->i4_ebf)); + + if(i8_excess_bits < 0) + i8_excess_bits = 0; + + num_frm_to_be_distributed = (WORD32)( + ((float)ps_cbr_buffer->i4_buffer_size / ps_cbr_buffer->ai4_bit_rate[0] * + ps_cbr_buffer->i4_tgt_frm_rate / 1000) + + 0.5); + /*Excess bits should be proportional to bit alloc period, shorter intra period should get in small incentives*/ + if(bit_alloc_period < num_frm_to_be_distributed) + i8_excess_bits = + (LWORD64)((float)i8_excess_bits * bit_alloc_period / num_frm_to_be_distributed); + + if(ps_cbr_buffer->e_rc_type == VBR_STREAMING) + { + if(i4_num_gops_for_excess > 1) + i8_excess_bits = i8_excess_bits * i4_num_gops_for_excess; + + if(i8_excess_bits > (LWORD64)( + (float)ps_cbr_buffer->i4_peak_drain_rate_frame * + ps_cbr_buffer->u4_num_frms_in_delay * 0.8f)) + i8_excess_bits = (LWORD64)( + (float)ps_cbr_buffer->i4_peak_drain_rate_frame * + ps_cbr_buffer->u4_num_frms_in_delay * 0.8f); + } + trace_printf( + "Excess bits %d %f %f num gops %d", + i8_excess_bits, + f_cur_bits_complexity, + f_complexity_peak_rate, + i4_num_gops_for_excess); + + return ((WORD32)i8_excess_bits); +} +/* ******************************************************************************/ +/** + * @brief get gop correction error bits for the current gop. This will be added to rbip. + * + * @param ps_cbr_buffer + * @param i4_lap_complexity_q7 + * @param i4_bit_alloc_period + */ +/* ******************************************************************************/ +WORD32 get_error_bits_for_desired_buf( + cbr_buffer_t *ps_cbr_buffer, WORD32 i4_lap_complexity_q7, WORD32 i4_bit_alloc_period) +{ + if(ps_cbr_buffer->e_rc_type == CBR_NLDRC) + { + LWORD64 error_bits = 0, complexity_mov_buf_size = 0; + LWORD64 i8_default_bits_in_period, i8_max_additional_bits_in_period; + LWORD64 i8_buf_based_limit_red, i8_buf_based_limit_inc, i8_buf_diff_bits; + float buf_diff, abs_lap_complexity; + + /*calculate default allocation*/ + i8_default_bits_in_period = (LWORD64)ps_cbr_buffer->ai4_bit_rate[0] * 1000 * + i4_bit_alloc_period / ps_cbr_buffer->i4_tgt_frm_rate; + + /*In case of VBR give additional bits according to peak bitrate*/ + if(ps_cbr_buffer->e_rc_type == VBR_STREAMING) + { + i8_max_additional_bits_in_period = + ((LWORD64)ps_cbr_buffer->i4_peak_drain_rate_frame * i4_bit_alloc_period) - + i8_default_bits_in_period; + ASSERT(i8_max_additional_bits_in_period >= 0); + if(i8_max_additional_bits_in_period > (i8_default_bits_in_period)) + { + /*clip max bits that can be given to 2x bitrate since its too riskly to give more than that in single pass encoding + where long future is not known*/ + i8_max_additional_bits_in_period = (i8_default_bits_in_period); + } + } + else + { + i8_max_additional_bits_in_period = i8_default_bits_in_period; + } + { + float X = ((float)i4_lap_complexity_q7 / 128); + float desired_buf_level; + /*For CBR VBV buffer size is "complexity_mov_buf_size" and In case of VBR it is determined by bit deviaiton*/ + if(ps_cbr_buffer->e_rc_type == CBR_NLDRC) + { + complexity_mov_buf_size = (LWORD64)ps_cbr_buffer->i4_upr_thr[0]; + } + else if(ps_cbr_buffer->e_rc_type == VBR_STREAMING) + { + complexity_mov_buf_size = ps_cbr_buffer->u4_vbr_max_bit_deviation; + } + abs_lap_complexity = X; + + if(ps_cbr_buffer->i4_cbr_rc_pass == 2) + desired_buf_level = COMP_TO_BITS_MAP_2_PASS(X, complexity_mov_buf_size); + else + desired_buf_level = COMP_TO_BITS_MAP(X, complexity_mov_buf_size); + + if(desired_buf_level < 0) + desired_buf_level = 0; + /*map complexity to buffer level*/ + + error_bits = (LWORD64)(desired_buf_level - ps_cbr_buffer->i8_ebf_bit_alloc); + i8_buf_diff_bits = error_bits; + /*For VBR its possible that i8_ebf_bit_alloc can go below 0, that the extent of giving should only be desired - cur( = 0 for cur < 0)*/ + buf_diff = (float)error_bits / complexity_mov_buf_size; + + /*clipping based on buffer size should depend on gop size. Assuming 7% of gop of gop = 32, calculate for other GOP intervals max 7% while giving from buffer and 10% + while stealing from buffer(for GOP of 32)*/ + /*try to be conservative when giving extra bits to gop and limit while reducing bits to GOP needs to be higher inorder to be buffer compliant if necessary*/ + i8_buf_based_limit_red = + ((LWORD64)complexity_mov_buf_size * i4_bit_alloc_period * 12) >> 12; + i8_buf_based_limit_inc = ((LWORD64)complexity_mov_buf_size * i4_bit_alloc_period * 8) >> + 12; + + /*(shd be 7 even if GOP size goes lesser)*/ + if(i8_buf_based_limit_red < (((LWORD64)complexity_mov_buf_size * 10) >> 7)) + i8_buf_based_limit_red = (((LWORD64)complexity_mov_buf_size * 10) >> 7); + if(i8_buf_based_limit_inc < (((LWORD64)complexity_mov_buf_size * 10) >> 7)) + i8_buf_based_limit_inc = (((LWORD64)complexity_mov_buf_size * 10) >> 7); + + /*if error bits is too high it is given in stages so that buffer is utilized for entire complex content*/ + /*error bits should not exceed ten 7% of buffer*/ + /*error bits can be max equal to bitrate*/ + if(error_bits > 0) + { + /*if lap compleixty is higher and buffer allows give the bits*/ + error_bits = (WORD32)(abs_lap_complexity * i8_max_additional_bits_in_period); + /*if lap complexity is too simple do not give additional bits to make sure that simple scenes never get additional bits whatsoever*/ + if(abs_lap_complexity < 0.2f && ps_cbr_buffer->i8_ebf_bit_alloc >= 0) + { + error_bits = 0; + } + if(error_bits > i8_buf_diff_bits) + error_bits = i8_buf_diff_bits; + + if(error_bits > i8_buf_based_limit_inc) + { + error_bits = i8_buf_based_limit_inc; + } + /*If buffer is already half filled be conservative. Allocate 1.5 times bits + else allocate twice the bits*/ + if(ps_cbr_buffer->i8_ebf_bit_alloc > + (LWORD64)(ps_cbr_buffer->i4_buffer_size * 0.75)) + { + if(error_bits > (i8_max_additional_bits_in_period >> 1)) + { + error_bits = (i8_max_additional_bits_in_period >> 1); + } + } + else + { + if(error_bits > i8_max_additional_bits_in_period) + { + error_bits = i8_max_additional_bits_in_period; + } + } + } + else + { + error_bits = (WORD32)(buf_diff * (i8_default_bits_in_period >> 1)); + if(error_bits < -i8_buf_based_limit_red) + { + error_bits = -i8_buf_based_limit_red; + } + /*when buffer level needs to reduce bits in period*/ + /*If current level is less than half min bits in period = 70% of constant bit in period else 50%*/ + if(ps_cbr_buffer->i8_ebf_bit_alloc > (ps_cbr_buffer->i4_buffer_size >> 1)) + { + if(error_bits < -(i8_default_bits_in_period >> 1)) + { + error_bits = -(i8_default_bits_in_period >> 1); + } + } + else + { + if(error_bits < -((i8_default_bits_in_period * 5) >> 4)) + { + error_bits = -((i8_default_bits_in_period * 5) >> 4); + } + } + } + } + return (WORD32)error_bits; + } + else + { + LWORD64 max_excess_bits, default_allocation_for_period, comp_based_excess = 0; + LWORD64 i8_excess_bits = 0, bit_dev_so_far, credit_limit_level; + LWORD64 Ravg_dur, num_intra_period_in_Ravg_dur, + num_intra_in_clip; //duration for which Ravg has to be met, for shorter slips this can be equal to clip duration + LWORD64 i8_buf_based_limit_red, i8_buf_based_limit_inc; + float comp_to_bit_mapped, X; + + /*default allocation for period in absence of complexity based bit allocation*/ + default_allocation_for_period = + ps_cbr_buffer->i4_drain_bits_per_frame[0] * i4_bit_alloc_period; + + bit_dev_so_far = ps_cbr_buffer->i8_ebf_bit_alloc; + credit_limit_level = ps_cbr_buffer->i8_credit_level; + Ravg_dur = + ps_cbr_buffer->u4_vbr_max_bit_deviation * 5 / ps_cbr_buffer->i4_drain_bits_per_frame[0]; + if(Ravg_dur > 20 * ps_cbr_buffer->i8_tot_frm_to_be_encoded / 100) + Ravg_dur = 20 * ps_cbr_buffer->i8_tot_frm_to_be_encoded / 100; + if(Ravg_dur <= 0) + Ravg_dur = 1; + /*map the complexity to bits ratio*/ + X = (float)i4_lap_complexity_q7 / 128; + if(ps_cbr_buffer->i4_cbr_rc_pass == 2) + comp_to_bit_mapped = COMP_TO_BITS_MAP_2_PASS(X, 1.0f); + else + comp_to_bit_mapped = COMP_TO_BITS_MAP(X, 1.0f); + + comp_to_bit_mapped *= 10; //mapping it to absolute peak bitrate + + /*calculate the number of bit alloc periods over which the credit limit needs to build up*/ + num_intra_in_clip = ps_cbr_buffer->i8_tot_frm_to_be_encoded / i4_bit_alloc_period; + num_intra_period_in_Ravg_dur = Ravg_dur / i4_bit_alloc_period; + //ASSERT(ps_cbr_buffer->i8_tot_frm_to_be_encoded > i4_bit_alloc_period); + if(ps_cbr_buffer->i8_tot_frm_to_be_encoded < i4_bit_alloc_period) + { + num_intra_period_in_Ravg_dur = 1; + num_intra_in_clip = 1; + } + if(num_intra_period_in_Ravg_dur <= 0) + { + num_intra_period_in_Ravg_dur = 1; + } + /*max excess bits possible according to given peak bitrate*/ + { + max_excess_bits = (ps_cbr_buffer->i4_peak_drain_rate_frame - + ps_cbr_buffer->i4_drain_bits_per_frame[0]) * + i4_bit_alloc_period; + /*constrain max excess bits allocated to a region if buffer is already at critical level*/ + /*assume room for 20% over-consumption due to mismatch between allocation and consumption*/ + if(ps_cbr_buffer->i4_ebf > + (ps_cbr_buffer->i4_upr_thr[0] - (WORD32)(max_excess_bits * 0.2))) + { + max_excess_bits = (LWORD64)(max_excess_bits * 0.8); + } + } + /*clipping based on buffer size should depend on gop size. Assuming 7% of gop of gop = 32, calculate for other GOP intervals max 7% while giving from buffer and 10% + while stealing from buffer(for GOP of 32)*/ + /*try to be conservative when giving extra bits to gop and limit while reducing bits to GOP needs to be higher inorder to be buffer compliant if necessary*/ + i8_buf_based_limit_red = + ((LWORD64)ps_cbr_buffer->u4_vbr_max_bit_deviation * i4_bit_alloc_period * 12) >> 12; + i8_buf_based_limit_inc = + ((LWORD64)ps_cbr_buffer->u4_vbr_max_bit_deviation * i4_bit_alloc_period * 8) >> 12; + + /*(shd be 7 even if GOP size goes lesser)*/ + if(i8_buf_based_limit_red < (((LWORD64)ps_cbr_buffer->u4_vbr_max_bit_deviation * 10) >> 7)) + i8_buf_based_limit_red = (((LWORD64)ps_cbr_buffer->u4_vbr_max_bit_deviation * 10) >> 7); + if(i8_buf_based_limit_inc < (((LWORD64)ps_cbr_buffer->u4_vbr_max_bit_deviation * 10) >> 7)) + i8_buf_based_limit_inc = (((LWORD64)ps_cbr_buffer->u4_vbr_max_bit_deviation * 10) >> 7); + + /*The credit limit is not completly built, hence the average operating bitrate will be lesser than average*/ + //if(ps_cbr_buffer->i8_ebf_bit_alloc >= 0) + //Disabling this to avoid under-consumption of bits since mostly contents will end with simpler sequence + if(1 != ps_cbr_buffer->i4_capped_vbr_on) + { + /*adjust the excess bits to account for deviation in bitrate + If bit deviation is positive then overconsumption, hence resuce the default bit allocation*/ + + /* In capped vbr mode this is not calculated as there is no constraint to meet the configured bitrate */ + i8_excess_bits -= (bit_dev_so_far / num_intra_period_in_Ravg_dur); + } + /*allocate bits based on complexity*/ + /*comp_to_bit_mapped less than 1 implies a content that requires less than average bitrate, + hence due to sign reversal we tend to steal bits*/ + comp_based_excess = (LWORD64)((comp_to_bit_mapped - 1) * default_allocation_for_period); + + if(1 != ps_cbr_buffer->i4_capped_vbr_on) + { + /*clip the complexity based on intra period and credit limit buffer size so that when credit limit is lower not everything is used for first GOP*/ + if(comp_based_excess > i8_buf_based_limit_inc) + { + comp_based_excess = i8_buf_based_limit_inc; + } + else if(comp_based_excess < -i8_buf_based_limit_red) + { + comp_based_excess = -i8_buf_based_limit_red; + } + + /*when the credit limit is fully used, stop giving extra*/ + if(credit_limit_level > ps_cbr_buffer->u4_vbr_max_bit_deviation) + { + if(comp_based_excess < 0) + i8_excess_bits += comp_based_excess; + } + /*when credit limit is almost full (80 percent full)*/ + else if(credit_limit_level > (LWORD64)(ps_cbr_buffer->u4_vbr_max_bit_deviation * 0.8f)) + { + /*follow smooth transition, at 80% utilized the excess should be 100 percent, it should move to zero percent as it approaches 100% utlization*/ + if(comp_based_excess > 0) + i8_excess_bits += (LWORD64)( + ((ps_cbr_buffer->u4_vbr_max_bit_deviation - credit_limit_level) / + (0.2f * ps_cbr_buffer->u4_vbr_max_bit_deviation)) * + comp_based_excess); + else + i8_excess_bits += comp_based_excess; + } + else if(credit_limit_level > (LWORD64)(ps_cbr_buffer->u4_vbr_max_bit_deviation * 0.2f)) + { + i8_excess_bits += comp_based_excess; + } + /*When credit limit is almost unutilized*/ + else if( + credit_limit_level < (WORD32)(ps_cbr_buffer->u4_vbr_max_bit_deviation * 0.2f) && + credit_limit_level > 0) + { + if(comp_based_excess < 0) + i8_excess_bits += (LWORD64)( + (credit_limit_level / (0.2f * ps_cbr_buffer->u4_vbr_max_bit_deviation)) * + comp_based_excess); + else + i8_excess_bits += comp_based_excess; + } + /*If the credit limit still uutilized stop drawing bits from simpler content*/ + else if(credit_limit_level <= 0) + { + if(comp_based_excess > 0) + i8_excess_bits += comp_based_excess; + } + else + ASSERT(0); + } + else + { + /* In capped vbr mode excess bits will be based on complexity of content alone*/ + i8_excess_bits = comp_based_excess; + } + + /*Clip the excess bits such that it will never violate peak bitrate and also Rmin*/ + if(i8_excess_bits > max_excess_bits) + i8_excess_bits = max_excess_bits; + /*assuming atleast 0.4 times average bitrate even for the simplest content*/ + if(i8_excess_bits < -(default_allocation_for_period * 0.6f)) + i8_excess_bits = (LWORD64)(-(default_allocation_for_period * 0.6f)); + + ASSERT(i8_excess_bits <= 0x7FFFFFFF); + return (WORD32)i8_excess_bits; + } +} +/* ******************************************************************************/ +/** + * @brief get_rc_type. + * + * @param ps_cbr_buffer + */ +/* ******************************************************************************/ +rc_type_e get_rc_type(cbr_buffer_t *ps_cbr_buffer) +{ + return (ps_cbr_buffer->e_rc_type); +} +/* ******************************************************************************/ +/** + * @brief cbr_get_delay_frames + * + * @param ps_cbr_buffer + */ +/* ******************************************************************************/ +UWORD32 cbr_get_delay_frames(cbr_buffer_t *ps_cbr_buffer) +{ + return (ps_cbr_buffer->u4_num_frms_in_delay); +} +#endif /* #if NON_STEADSTATE_CODE */ |
