/* * Copyright 2015 Rockchip Electronics Co. LTD * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ #define MODULE_TAG "vp8e_rc" #include #include "mpp_env.h" #include "mpp_mem.h" #include "mpp_common.h" #include "mpp_rc.h" #include "vp8e_syntax.h" #include "vp8e_debug.h" #include "vp8e_rc.h" #define DSCY 64 #define UPSCALE 8000 #define I32_MPP_MAX 0x7fffffff #define QINDEX_RANGE 128 #define RC_ERROR_RESET 0x7fffffff #define BIT_COUNT_MAX 0x1fffffff #define BIT_COUNT_MIN (-BIT_COUNT_MAX) static const RK_S32 ac_q_lookup_tbl[QINDEX_RANGE] = { 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 60, 62, 64, 66, 68, 70, 72, 74, 76, 78, 80, 82, 84, 86, 88, 90, 92, 94, 96, 98, 100, 102, 104, 106, 108, 110, 112, 114, 116, 119, 122, 125, 128, 131, 134, 137, 140, 143, 146, 149, 152, 155, 158, 161, 164, 167, 170, 173, 177, 181, 185, 189, 193, 197, 201, 205, 209, 213, 217, 221, 225, 229, 234, 239, 245, 249, 254, 259, 264, 269, 274, 279, 284 }; static RK_S32 initial_qp(RK_S32 bits, RK_S32 pels) { RK_S32 i = -1; static const RK_S32 qp_tbl[2][12] = { {47, 57, 73, 93, 122, 155, 214, 294, 373, 506, 781, 0x7FFFFFFF}, {120, 110, 100, 90, 80, 70, 60, 50, 40, 30, 20, 10} }; if (bits > 1000000) return 10; pels >>= 8; bits >>= 5; bits *= pels + 250; bits /= 350 + (3 * pels) / 4; bits = axb_div_c(bits, UPSCALE, pels << 6); while (qp_tbl[0][++i] < bits); return qp_tbl[1][i]; } static MPP_RET update_rc_error(Vp8eLinReg *p, RK_S32 bits) { p->len = 3; if (bits >= (RK_S32)I32_MPP_MAX) { p->bits[0] = 0; p->bits[1] = 0; p->bits[2] = 0; return MPP_NOK; } p->bits[0] = bits - p->bits[2]; p->bits[1] = bits + p->bits[1]; p->bits[2] = bits; return MPP_OK; } static RK_S32 lin_sxy(RK_S32 *qp, RK_S32 *r, RK_S32 n) { RK_S32 tmp, sum = 0; while (n--) { tmp = qp[n] * qp[n] * qp[n]; if (tmp > r[n]) { sum += MPP_DIV_SIGN(tmp, DSCY) * r[n]; } else { sum += tmp * MPP_DIV_SIGN(r[n], DSCY); } if (sum < 0) { return I32_MPP_MAX; } } return sum; } static RK_S32 lin_sx(RK_S32 *qp, RK_S32 n) { RK_S32 tmp = 0; while (n--) { tmp += qp[n]; } return tmp; } static RK_S32 lin_sy(RK_S32 *qp, RK_S32 *r, RK_S32 n) { RK_S32 sum = 0; while (n--) { sum += qp[n] * qp[n] * r[n]; if (sum < 0) { return 2147483647 / 64; } } return MPP_DIV_SIGN(sum, DSCY); } static RK_S32 lin_nsxx(RK_S32 *qp, RK_S32 n) { RK_S32 tmp = 0; RK_S32 sum = 0; RK_S32 d = n; while (n--) { tmp = qp[n]; tmp *= tmp; sum += d * tmp; } return sum; } static void update_model(Vp8eLinReg *p) { RK_S32 a1, a2; RK_S32 *qs = p->qs; RK_S32 *r = p->bits; RK_S32 n = p->len; RK_S32 sx = lin_sx(qs, n); RK_S32 sy = lin_sy(qs, r, n); a1 = lin_sxy(qs, r, n); a1 = (a1 < (I32_MPP_MAX / n)) ? (a1 * n) : I32_MPP_MAX; if (sy == 0) { a1 = 0; } else { a1 -= (sx < I32_MPP_MAX / sy) ? (sx * sy) : I32_MPP_MAX; } a2 = (lin_nsxx(qs, n) - (sx * sx)); if (a2 == 0) { if (p->a1 == 0) { a1 = 0; } else { a1 = (p->a1 * 2) / 3; } } else { a1 = axb_div_c(a1, DSCY, a2); } a1 = MPP_MAX(a1, -4096 * DSCY); a1 = MPP_MIN(a1, 4096 * DSCY - 1); a2 = MPP_DIV_SIGN(sy * DSCY, n) - MPP_DIV_SIGN(a1 * sx, n); if (p->len > 0) { p->a1 = a1; p->a2 = a2; } } static RK_S32 get_vir_buffer_bitcnt(Vp8eVirBuf *vb, RK_S32 time_inc) { RK_S32 drift = 0; RK_S32 target = 0; /* Saturate realBitCnt, this is to prevent overflows caused by much greater bitrate setting than is really possible to reach */ if (vb->real_bit_cnt > BIT_COUNT_MAX) vb->real_bit_cnt = BIT_COUNT_MAX; if (vb->real_bit_cnt < BIT_COUNT_MIN) vb->real_bit_cnt = BIT_COUNT_MIN; vb->pic_time_inc += time_inc; vb->virtual_bit_cnt += axb_div_c(vb->bit_rate, time_inc, vb->time_scale); target = vb->virtual_bit_cnt - vb->real_bit_cnt; /* Saturate target, prevents rc going totally out of control. This situation should never happen. */ if (target > BIT_COUNT_MAX) target = BIT_COUNT_MAX; if (target < BIT_COUNT_MIN) target = BIT_COUNT_MIN; while (vb->pic_time_inc >= vb->time_scale) { vb->pic_time_inc -= vb->time_scale; vb->virtual_bit_cnt -= vb->bit_rate; vb->real_bit_cnt -= vb->bit_rate; } drift = axb_div_c(vb->bit_rate, vb->pic_time_inc, vb->time_scale); drift -= vb->virtual_bit_cnt; vb->virtual_bit_cnt += drift; return target; } static MPP_RET skip_pic(Vp8eRc *rc) { Vp8eVirBuf *vb = &rc->virbuf; RK_S32 skip_inc_limit = -vb->bit_per_pic / 3; RK_S32 skip_dec_limit = vb->bit_per_pic / 3; RK_S32 bit_available = vb->virtual_bit_cnt - vb->real_bit_cnt; if (((rc->pic_rc_enable == 0) || (vb->skip_frame_target == 0)) && (bit_available < skip_inc_limit)) vb->skip_frame_target++; if ((bit_available > skip_dec_limit) && vb->skip_frame_target > 0) vb->skip_frame_target--; if (vb->skipped_frames < vb->skip_frame_target) { vb->skipped_frames++; rc->frame_coded = 0; } else { vb->skipped_frames = 0; } return MPP_OK; } static RK_S32 new_pic_quant(Vp8eLinReg *p, RK_S32 bits, RK_U8 use_qp_delta_limit) { RK_S32 tmp, diff; RK_S32 qp = p->qp_prev; RK_S32 qp_best = p->qp_prev; RK_S32 diff_best = I32_MPP_MAX; if (p->a1 == 0 && p->a2 == 0) { return qp; } if (bits <= 0) { if (use_qp_delta_limit) qp = MPP_MIN(QINDEX_RANGE - 1, MPP_MAX(0, qp + 4)); else qp = MPP_MIN(QINDEX_RANGE - 1, MPP_MAX(0, qp + 10)); return qp; } do { tmp = MPP_DIV_SIGN(p->a1, ac_q_lookup_tbl[qp]); tmp += MPP_DIV_SIGN(p->a2, ac_q_lookup_tbl[qp] * ac_q_lookup_tbl[qp]); diff = MPP_ABS(tmp - bits); if (diff < diff_best) { diff_best = diff; qp_best = qp; if ((tmp - bits) <= 0) { if (qp < 1) { break; } qp--; } else { if (qp >= QINDEX_RANGE - 1) { break; } qp++; } } else { break; } } while ((qp >= 0) && (qp < QINDEX_RANGE)); qp = qp_best; if (use_qp_delta_limit) { tmp = qp - p->qp_prev; if (tmp > 4) { qp = p->qp_prev + 4; } else if (tmp < -4) { qp = p->qp_prev - 4; } } return qp; } static RK_S32 avg_rc_error(Vp8eLinReg *p) { return MPP_DIV_SIGN(p->bits[2] * 4 + p->bits[1] * 6 + p->bits[0] * 0, 100); } static MPP_RET cal_pic_quant(Vp8eRc *rc) { RK_S32 tmp = 0; RK_S32 tmp_value = 0; RK_S32 tmp_avg_rc_error; RK_U8 use_qp_delta_limit = 1; if (!rc->pic_rc_enable) { rc->qp_hdr = rc->fixed_qp; return MPP_OK; } if (rc->curr_frame_intra) { if (rc->gop_len == 1 || rc->gop_len == 2) { tmp = new_pic_quant(&rc->lin_reg, axb_div_c(rc->target_pic_size, 256, rc->mb_per_pic), use_qp_delta_limit); } else { if (rc->gop_qp_sum) { tmp = MPP_DIV_SIGN(rc->gop_qp_sum, rc->gop_qp_div); } rc->gop_qp_sum = 0; rc->gop_qp_div = 0; } if (tmp) { rc->qp_hdr = tmp; } } else if (rc->prev_frame_intra) { rc->qp_hdr = rc->qp_hdr_prev; } else { tmp_avg_rc_error = avg_rc_error(&rc->r_error); tmp_value = axb_div_c(rc->target_pic_size - tmp_avg_rc_error, 256, rc->mb_per_pic); rc->qp_hdr = new_pic_quant(&rc->lin_reg, tmp_value, use_qp_delta_limit); } vp8e_rc_dbg_rc("frame_cnt = %d, qp = %d\n", rc->frame_cnt, rc->qp_hdr); rc->qp_hdr = MPP_MIN(rc->qp_max, MPP_MAX(rc->qp_min, rc->qp_hdr)); rc->qp_hdr_prev = rc->qp_hdr; if (rc->curr_frame_intra) { if (rc->fixed_intra_qp) rc->qp_hdr = rc->fixed_intra_qp; else if (!rc->prev_frame_intra) rc->qp_hdr += rc->intra_qp_delta; rc->qp_hdr = MPP_MIN(rc->qp_max, MPP_MAX(rc->qp_min, rc->qp_hdr)); } else { rc->gop_qp_sum += rc->qp_hdr; rc->gop_qp_div++; } return MPP_OK; } static void update_tables(Vp8eLinReg *p, RK_S32 qp, RK_S32 bits) { RK_S32 len = 10; RK_S32 tmp = p->pos; p->qp_prev = qp; p->qs[tmp] = ac_q_lookup_tbl[qp]; p->bits[tmp] = bits; if ((++p->pos) >= len) { p->pos = 0; } if (p->len < len) { p->len++; } } MPP_RET vp8e_update_rc_cfg(Vp8eRc *rc, MppEncRcCfg *cfg) { RK_U32 change = cfg->change; Vp8eVirBuf *vb = &rc->virbuf; if (change & MPP_ENC_RC_CFG_CHANGE_BPS) { vp8e_rc_dbg_cfg("bps: %d [%d %d]\n", cfg->bps_target, cfg->bps_min, cfg->bps_max); vb->bps_min = cfg->bps_min; vb->bps_max = cfg->bps_max; vb->bit_rate = cfg->bps_target; } if (change & MPP_ENC_RC_CFG_CHANGE_FPS_OUT) { vp8e_rc_dbg_cfg("fps: %d / %d\n", cfg->fps_out_num, cfg->fps_out_denorm); rc->fps_out_num = cfg->fps_out_num; rc->fps_out_denorm = cfg->fps_out_denorm; if (rc->fps_out_denorm == 0) { mpp_err("denorm can not be 0, change to default 1"); rc->fps_out_denorm = 1; } rc->fps_out = rc->fps_out_num / rc->fps_out_denorm; if (rc->fps_out == 0) { rc->fps_out = 30; rc->fps_out_num = 30; rc->fps_out_denorm = 1; mpp_err("fps out can not be 0, change to default 30"); } } if ((change & MPP_ENC_RC_CFG_CHANGE_GOP) && (rc->gop_len != cfg->gop)) { rc->gop_len = cfg->gop; vp8e_rc_dbg_cfg("gop: %d\n", cfg->gop); } vb->bit_per_pic = axb_div_c(vb->bit_rate, rc->fps_out_denorm, rc->fps_out_num); cfg->change = 0; return MPP_OK; } MPP_RET vp8e_init_rc(Vp8eRc *rc, MppEncCfgSet *cfg) { RK_S32 max_bps; Vp8eVirBuf *vb = &rc->virbuf; rc->qp_hdr = -1; rc->qp_min = 0; rc->qp_max = QINDEX_RANGE; rc->pic_skip = 0; rc->pic_rc_enable = 1; rc->gop_len = cfg->rc.gop; rc->intra_qp_delta = 0; rc->fixed_intra_qp = 0; rc->intra_picture_rate = 30; rc->golden_picture_rate = 0; rc->altref_picture_rate = 0; rc->virbuf.bit_rate = cfg->rc.bps_target; rc->fps_out_denorm = cfg->rc.fps_out_denorm; rc->fps_out_num = cfg->rc.fps_out_num; rc->mb_per_pic = ((cfg->prep.width + 15) / 16) * ((cfg->prep.height + 15) / 16); if (rc->qp_max >= QINDEX_RANGE) rc->qp_max = QINDEX_RANGE - 1; if (rc->qp_min < 0) rc->qp_min = 0; max_bps = rc->mb_per_pic * 16 * 16 * 6; max_bps = axb_div_c(max_bps, rc->fps_out_num, rc->fps_out_denorm); if (max_bps < 0) max_bps = I32_MPP_MAX; vb->bit_rate = MPP_MIN(vb->bit_rate, max_bps); vb->bit_per_pic = axb_div_c(vb->bit_rate, rc->fps_out_denorm, rc->fps_out_num); if (rc->qp_hdr == -1) rc->qp_hdr = initial_qp(vb->bit_per_pic, rc->mb_per_pic * 16 * 16); rc->qp_hdr = MPP_MIN(rc->qp_max, MPP_MAX(rc->qp_min, rc->qp_hdr)); vp8e_rc_dbg_rc("init qp, qp = %d, bitRate = %d, bitPerPic = %d\n", rc->qp_hdr, vb->bit_rate, vb->bit_per_pic); rc->qp_hdr_prev = rc->qp_hdr; rc->fixed_qp = rc->qp_hdr; rc->frame_coded = 1; rc->curr_frame_intra = 1; rc->prev_frame_intra = 0; rc->frame_cnt = 0; rc->gop_qp_sum = 0; rc->gop_qp_div = 0; rc->target_pic_size = 0; rc->frame_bit_cnt = 0; rc->time_inc = 0; memset(&rc->lin_reg, 0, sizeof(rc->lin_reg)); rc->lin_reg.qs[0] = ac_q_lookup_tbl[QINDEX_RANGE - 1]; rc->lin_reg.qp_prev = rc->qp_hdr; vb->gop_rem = rc->gop_len; vb->time_scale = rc->fps_out_num; update_rc_error(&rc->r_error, RC_ERROR_RESET); return MPP_OK; } MPP_RET vp8e_before_pic_rc(Vp8eRc *rc) { RK_S32 tmp = 0; Vp8eVirBuf *vb = &rc->virbuf; rc->frame_coded = 1; if (rc->curr_frame_intra || vb->gop_rem == 1) { vb->gop_rem = rc->gop_len; } else { vb->gop_rem--; } tmp = get_vir_buffer_bitcnt(&rc->virbuf, (RK_S32)rc->time_inc); rc->target_pic_size = vb->bit_per_pic + MPP_DIV_SIGN(tmp, MPP_MAX(vb->gop_rem, 3)); rc->target_pic_size = MPP_MAX(0, rc->target_pic_size); if (rc->pic_skip) skip_pic(rc); cal_pic_quant(rc); return MPP_OK; } MPP_RET vp8e_after_pic_rc(Vp8eRc *rc, RK_S32 bitcnt) { Vp8eVirBuf *vb = &rc->virbuf; rc->time_inc = 1; rc->frame_cnt++; rc->frame_bit_cnt = bitcnt; rc->prev_frame_intra = rc->curr_frame_intra; vb->real_bit_cnt += bitcnt; if ((!rc->curr_frame_intra) || (rc->gop_len == 1)) { update_tables(&rc->lin_reg, rc->qp_hdr_prev, axb_div_c(bitcnt, 256, rc->mb_per_pic)); if (vb->gop_rem == rc->gop_len - 1) { update_rc_error(&rc->r_error, RC_ERROR_RESET); } else { update_rc_error(&rc->r_error, MPP_MIN(bitcnt - rc->target_pic_size, 2 * rc->target_pic_size)); } update_model(&rc->lin_reg); } return MPP_OK; }