/*
|
* Copyright 2021 Rockchip Electronics Co. LTD
|
*
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
* you may not use this file except in compliance with the License.
|
* You may obtain a copy of the License at
|
*
|
* http://www.apache.org/licenses/LICENSE-2.0
|
*
|
* Unless required by applicable law or agreed to in writing, software
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
* See the License for the specific language governing permissions and
|
* limitations under the License.
|
*/
|
|
#define MODULE_TAG "hal_h265e_v580"
|
|
#include <string.h>
|
#include <math.h>
|
#include <limits.h>
|
|
#include "mpp_env.h"
|
#include "mpp_mem.h"
|
#include "mpp_soc.h"
|
#include "mpp_common.h"
|
#include "mpp_frame_impl.h"
|
|
#include "hal_h265e_debug.h"
|
#include "h265e_syntax_new.h"
|
#include "hal_bufs.h"
|
#include "rkv_enc_def.h"
|
#include "vepu541_common.h"
|
#include "hal_h265e_vepu580.h"
|
#include "hal_h265e_vepu580_reg.h"
|
#include "mpp_enc_cb_param.h"
|
|
#include "mpp_service.h"
|
|
#define MAX_TILE_NUM 2
|
|
#define hal_h265e_err(fmt, ...) \
|
do {\
|
mpp_err_f(fmt, ## __VA_ARGS__);\
|
} while (0)
|
|
typedef struct vepu580_h265_fbk_t {
|
RK_U32 hw_status; /* 0:corret, 1:error */
|
RK_U32 qp_sum;
|
RK_U32 out_strm_size;
|
RK_U32 out_hw_strm_size;
|
RK_S64 sse_sum;
|
RK_U32 st_lvl64_inter_num;
|
RK_U32 st_lvl32_inter_num;
|
RK_U32 st_lvl16_inter_num;
|
RK_U32 st_lvl8_inter_num;
|
RK_U32 st_lvl32_intra_num;
|
RK_U32 st_lvl16_intra_num;
|
RK_U32 st_lvl8_intra_num;
|
RK_U32 st_lvl4_intra_num;
|
RK_U32 st_cu_num_qp[52];
|
RK_U32 st_madp;
|
RK_U32 st_madi;
|
RK_U32 st_md_sad_b16num0;
|
RK_U32 st_md_sad_b16num1;
|
RK_U32 st_md_sad_b16num2;
|
RK_U32 st_md_sad_b16num3;
|
RK_U32 st_madi_b16num0;
|
RK_U32 st_madi_b16num1;
|
RK_U32 st_madi_b16num2;
|
RK_U32 st_madi_b16num3;
|
RK_U32 st_mb_num;
|
RK_U32 st_ctu_num;
|
} vepu580_h265_fbk;
|
|
typedef struct H265eV580HalContext_t {
|
MppEncHalApi api;
|
MppDev dev;
|
void *regs[MAX_TILE_NUM];
|
void *reg_out[MAX_TILE_NUM];
|
|
vepu580_h265_fbk feedback;
|
void *dump_files;
|
RK_U32 frame_cnt_gen_ready;
|
|
RK_S32 frame_type;
|
RK_S32 last_frame_type;
|
|
/* @frame_cnt starts from ZERO */
|
RK_U32 frame_cnt;
|
Vepu541OsdCfg osd_cfg;
|
MppDevRegOffCfgs *reg_cfg;
|
void *roi_data;
|
MppEncCfgSet *cfg;
|
|
MppBufferGroup tile_grp;
|
MppBuffer hw_tile_buf[2];
|
MppBuffer hw_tile_stream;
|
MppBuffer buf_pass1;
|
|
RK_U32 enc_mode;
|
RK_U32 frame_size;
|
RK_S32 max_buf_cnt;
|
RK_S32 hdr_status;
|
void *input_fmt;
|
RK_U8 *src_buf;
|
RK_U8 *dst_buf;
|
RK_S32 buf_size;
|
RK_U32 frame_num;
|
HalBufs dpb_bufs;
|
RK_S32 fbc_header_len;
|
RK_U32 tile_num;
|
RK_U32 tile_parall_en;
|
RK_U32 tile_dump_err;
|
|
RK_S32 poll_slice_max;
|
RK_S32 poll_cfg_size;
|
MppDevPollCfg *poll_cfgs;
|
MppCbCtx *output_cb;
|
|
/* finetune */
|
void *tune;
|
} H265eV580HalContext;
|
|
#define TILE_BUF_SIZE MPP_ALIGN(128 * 1024, 256)
|
|
static RK_U32 klut_weight[24] = {
|
0x50800080, 0x00330000, 0xA1000100, 0x00660000, 0x42000200, 0x00CC0001,
|
0x84000400, 0x01980002, 0x08000800, 0x03300005, 0x10001000, 0x0660000A,
|
0x20002000, 0x0CC00014, 0x40004000, 0x19800028, 0x80008000, 0x33000050,
|
0x00010000, 0x660000A1, 0x00020000, 0xCC000142, 0xFF83FFFF, 0x000001FF
|
};
|
|
static RK_U32 aq_thd_default[16] = {
|
0, 0, 0, 0,
|
3, 3, 5, 5,
|
8, 8, 8, 15,
|
15, 20, 25, 35
|
};
|
|
static RK_S32 aq_qp_dealt_default[16] = {
|
-8, -7, -6, -5,
|
-4, -3, -2, -1,
|
0, 1, 2, 3,
|
4, 5, 6, 8,
|
};
|
|
static RK_U16 lvl32_intra_cst_thd[4] = {2, 6, 16, 36};
|
|
static RK_U16 lvl16_intra_cst_thd[4] = {2, 6, 16, 36};
|
|
static RK_U8 lvl32_intra_cst_wgt[8] = {23, 22, 21, 20, 22, 24, 26};
|
|
static RK_U8 lvl16_intra_cst_wgt[8] = {17, 17, 17, 18, 17, 18, 18};
|
|
static RK_U32 lamd_satd_qp[52] = {
|
0x00000183, 0x000001b2, 0x000001e7, 0x00000223, 0x00000266, 0x000002b1, 0x00000305, 0x00000364,
|
0x000003ce, 0x00000445, 0x000004cb, 0x00000562, 0x0000060a, 0x000006c8, 0x0000079c, 0x0000088b,
|
0x00000996, 0x00000ac3, 0x00000c14, 0x00000d8f, 0x00000f38, 0x00001115, 0x0000132d, 0x00001586,
|
0x00001829, 0x00001b1e, 0x00001e70, 0x0000222b, 0x0000265a, 0x00002b0c, 0x00003052, 0x0000363c,
|
0x00003ce1, 0x00004455, 0x00004cb4, 0x00005618, 0x000060a3, 0x00006c79, 0x000079c2, 0x000088ab,
|
0x00009967, 0x0000ac30, 0x0000c147, 0x0000d8f2, 0x0000f383, 0x00011155, 0x000132ce, 0x00015861,
|
0x0001828d, 0x0001b1e4, 0x0001e706, 0x000222ab
|
};
|
|
static RK_U32 lamd_moda_qp[52] = {
|
0x00000049, 0x0000005c, 0x00000074, 0x00000092, 0x000000b8, 0x000000e8, 0x00000124, 0x00000170,
|
0x000001cf, 0x00000248, 0x000002df, 0x0000039f, 0x0000048f, 0x000005bf, 0x0000073d, 0x0000091f,
|
0x00000b7e, 0x00000e7a, 0x0000123d, 0x000016fb, 0x00001cf4, 0x0000247b, 0x00002df6, 0x000039e9,
|
0x000048f6, 0x00005bed, 0x000073d1, 0x000091ec, 0x0000b7d9, 0x0000e7a2, 0x000123d7, 0x00016fb2,
|
0x0001cf44, 0x000247ae, 0x0002df64, 0x00039e89, 0x00048f5c, 0x0005bec8, 0x00073d12, 0x00091eb8,
|
0x000b7d90, 0x000e7a23, 0x00123d71, 0x0016fb20, 0x001cf446, 0x00247ae1, 0x002df640, 0x0039e88c,
|
0x0048f5c3, 0x005bec81, 0x0073d119, 0x0091eb85
|
};
|
|
static RK_U32 lamd_modb_qp[52] = {
|
0x00000070, 0x00000089, 0x000000b0, 0x000000e0, 0x00000112, 0x00000160, 0x000001c0, 0x00000224,
|
0x000002c0, 0x00000380, 0x00000448, 0x00000580, 0x00000700, 0x00000890, 0x00000b00, 0x00000e00,
|
0x00001120, 0x00001600, 0x00001c00, 0x00002240, 0x00002c00, 0x00003800, 0x00004480, 0x00005800,
|
0x00007000, 0x00008900, 0x0000b000, 0x0000e000, 0x00011200, 0x00016000, 0x0001c000, 0x00022400,
|
0x0002c000, 0x00038000, 0x00044800, 0x00058000, 0x00070000, 0x00089000, 0x000b0000, 0x000e0000,
|
0x00112000, 0x00160000, 0x001c0000, 0x00224000, 0x002c0000, 0x00380000, 0x00448000, 0x00580000,
|
0x00700000, 0x00890000, 0x00b00000, 0x00e00000
|
};
|
|
#include "hal_h265e_vepu580_tune.c"
|
|
static void vepu580_h265_set_me_ram(H265eSyntax_new *syn, hevc_vepu580_base *regs, RK_U32 index)
|
{
|
RK_S32 frm_sta = 0, frm_end = 0, pic_w = 0;
|
RK_S32 srch_w = regs->reg0220_me_rnge.cme_srch_h * 4;
|
RK_S32 srch_h = regs->reg0220_me_rnge.cme_srch_v * 4;
|
RK_S32 x_gmv = regs->reg0224_gmv.gmv_x;
|
RK_S32 y_gmv = regs->reg0224_gmv.gmv_y;
|
RK_U32 pic_wd64 = ((regs->reg0196_enc_rsl.pic_wd8_m1 + 1) * 8 + 63) / 64;
|
|
if (!syn->pp.tiles_enabled_flag) {
|
if (x_gmv - srch_w < 0) {
|
frm_sta = (x_gmv - srch_w - 15) / 16;
|
} else {
|
frm_sta = (x_gmv - srch_w) / 16;
|
}
|
frm_sta = mpp_clip(frm_sta, 0, pic_wd64 - 1);
|
if (x_gmv + srch_w < 0) {
|
frm_end = pic_wd64 - 1 + (x_gmv + srch_w) / 16;
|
} else {
|
frm_end = pic_wd64 - 1 + (x_gmv + srch_w + 15) / 16;
|
}
|
frm_end = mpp_clip(frm_end, 0, pic_wd64 - 1);
|
} else {
|
RK_S32 tile_ctu_stax = index * pic_wd64 / (syn->pp.num_tile_columns_minus1 + 1);
|
RK_S32 tile_ctu_endx = 0;
|
|
if (index == syn->pp.num_tile_columns_minus1) {
|
tile_ctu_endx = ((regs->reg0196_enc_rsl.pic_wd8_m1 + 1) * 8 + 63) / 64 - 1;
|
} else {
|
tile_ctu_endx = (index + 1) * pic_wd64 / (syn->pp.num_tile_columns_minus1 + 1) - 1;
|
}
|
|
if (x_gmv - srch_w < 0) {
|
frm_sta = tile_ctu_stax + (x_gmv - srch_w - 15) / 16;
|
} else {
|
frm_sta = tile_ctu_stax + (x_gmv - srch_w) / 16;
|
}
|
frm_sta = mpp_clip(frm_sta, 0, pic_wd64 - 1);
|
|
if (x_gmv + srch_w < 0) {
|
frm_end = tile_ctu_endx + (x_gmv + srch_w) / 16;
|
} else {
|
frm_end = tile_ctu_endx + (x_gmv + srch_w + 15) / 16;
|
}
|
frm_end = mpp_clip(frm_end, 0, pic_wd64 - 1);
|
}
|
pic_w = (frm_end - frm_sta + 1) * 64;
|
regs->reg0222_me_cach.cme_linebuf_w = (pic_w ? pic_w : 64) / 64;
|
{
|
RK_U32 cime_rama_max = 2464;
|
RK_U32 ctu_4_h = 4, ramb_h;
|
RK_U32 cur_srch_16_w, cur_srch_4_h, cur_srch_max;
|
RK_U32 cime_rama_h = ctu_4_h;
|
|
if ((x_gmv % 16 - srch_w % 16) < 0) {
|
cur_srch_16_w = (16 + (x_gmv % 16 - srch_w % 16) % 16 + srch_w * 2 + 15) / 16 + 1;
|
} else {
|
cur_srch_16_w = ((x_gmv % 16 - srch_w % 16) % 16 + srch_w * 2 + 15) / 16 + 1;
|
}
|
if ((y_gmv % 4 - srch_h % 4) < 0) {
|
cur_srch_4_h = (4 + (y_gmv % 4 - srch_h % 4) % 4 + srch_h * 2 + 3) / 4 + ctu_4_h;
|
} else {
|
cur_srch_4_h = ((y_gmv % 4 - srch_h % 4) % 4 + srch_h * 2 + 3) / 4 + ctu_4_h;
|
}
|
cur_srch_max = MPP_ALIGN(cur_srch_4_h, 4);
|
if (regs->reg0222_me_cach.cme_linebuf_w < cur_srch_16_w) {
|
cur_srch_16_w = regs->reg0222_me_cach.cme_linebuf_w;
|
}
|
ramb_h = cur_srch_4_h;
|
while ((cime_rama_h < cur_srch_max) && (cime_rama_max >
|
((cime_rama_h - ctu_4_h) * regs->reg0222_me_cach.cme_linebuf_w * 4 + (ramb_h * 4 * cur_srch_16_w)))) {
|
cime_rama_h = cime_rama_h + ctu_4_h;
|
if (ramb_h > 2 * ctu_4_h) {
|
ramb_h = ramb_h - ctu_4_h;
|
} else {
|
ramb_h = ctu_4_h;
|
}
|
}
|
if (cur_srch_4_h == ctu_4_h) {
|
cime_rama_h = cime_rama_h + ctu_4_h;
|
ramb_h = 0;
|
}
|
if (cime_rama_max < ((cime_rama_h - ctu_4_h) * regs->reg0222_me_cach.cme_linebuf_w * 4 + (ramb_h * 4 * cur_srch_16_w))) {
|
cime_rama_h = cime_rama_h - ctu_4_h;
|
}
|
regs->reg0222_me_cach.cme_rama_h = cime_rama_h; /* cime_rama_max */
|
|
{
|
RK_U32 ram_col_h = (cime_rama_h - ctu_4_h) / ctu_4_h;
|
regs->reg0222_me_cach.cme_rama_max = ram_col_h * regs->reg0222_me_cach.cme_linebuf_w + cur_srch_16_w;
|
}
|
|
}
|
|
hal_h265e_dbg_detail("cime_rama_h %d, cime_rama_max %d, cime_linebuf_w %d",
|
regs->reg0222_me_cach.cme_rama_h, regs->reg0222_me_cach.cme_rama_max, regs->reg0222_me_cach.cme_linebuf_w);
|
}
|
|
static MPP_RET vepu580_h265_setup_hal_bufs(H265eV580HalContext *ctx)
|
{
|
MPP_RET ret = MPP_OK;
|
VepuFmtCfg *fmt = (VepuFmtCfg *)ctx->input_fmt;
|
RK_U32 frame_size;
|
RK_S32 mb_wd64, mb_h64;
|
MppEncRefCfg ref_cfg = ctx->cfg->ref_cfg;
|
MppEncPrepCfg *prep = &ctx->cfg->prep;
|
RK_S32 old_max_cnt = ctx->max_buf_cnt;
|
RK_S32 new_max_cnt = 2;
|
|
hal_h265e_enter();
|
|
mb_wd64 = (prep->width + 63) / 64;
|
mb_h64 = (prep->height + 63) / 64 + 1;
|
|
frame_size = MPP_ALIGN(prep->width, 16) * MPP_ALIGN(prep->height, 16);
|
vepu541_set_fmt(fmt, ctx->cfg->prep.format);
|
|
if (ref_cfg) {
|
MppEncCpbInfo *info = mpp_enc_ref_cfg_get_cpb_info(ref_cfg);
|
new_max_cnt = MPP_MAX(new_max_cnt, info->dpb_size + 1);
|
}
|
|
if (frame_size > ctx->frame_size || new_max_cnt > old_max_cnt) {
|
size_t size[3] = {0};
|
|
hal_bufs_deinit(ctx->dpb_bufs);
|
hal_bufs_init(&ctx->dpb_bufs);
|
|
ctx->fbc_header_len = MPP_ALIGN(((mb_wd64 * mb_h64) << 6), SZ_8K);
|
size[0] = ctx->fbc_header_len + ((mb_wd64 * mb_h64) << 12) * 3 / 2; //fbc_h + fbc_b
|
size[1] = (mb_wd64 * mb_h64 << 8);
|
size[2] = MPP_ALIGN(mb_wd64 * mb_h64 * 16 * 6, 256);
|
new_max_cnt = MPP_MAX(new_max_cnt, old_max_cnt);
|
|
hal_h265e_dbg_detail("frame size %d -> %d max count %d -> %d\n",
|
ctx->frame_size, frame_size, old_max_cnt, new_max_cnt);
|
|
hal_bufs_setup(ctx->dpb_bufs, new_max_cnt, 3, size);
|
|
ctx->frame_size = frame_size;
|
ctx->max_buf_cnt = new_max_cnt;
|
}
|
hal_h265e_leave();
|
return ret;
|
}
|
|
static void vepu580_h265_sobel_cfg(hevc_vepu580_wgt *reg)
|
{
|
reg->pre_intra_cla0_B0.pre_intra_cla0_m0 = 10;
|
reg->pre_intra_cla0_B0.pre_intra_cla0_m1 = 11;
|
reg->pre_intra_cla0_B0.pre_intra_cla0_m2 = 12;
|
reg->pre_intra_cla0_B0.pre_intra_cla0_m3 = 13;
|
reg->pre_intra_cla0_B0.pre_intra_cla0_m4 = 14;
|
|
reg->pre_intra_cla0_B1.pre_intra_cla0_m5 = 9;
|
reg->pre_intra_cla0_B1.pre_intra_cla0_m6 = 15;
|
reg->pre_intra_cla0_B1.pre_intra_cla0_m7 = 8;
|
reg->pre_intra_cla0_B1.pre_intra_cla0_m8 = 16;
|
reg->pre_intra_cla0_B1.pre_intra_cla0_m9 = 7;
|
|
reg->pre_intra_cla1_B0.pre_intra_cla1_m0 = 10;
|
reg->pre_intra_cla1_B0.pre_intra_cla1_m1 = 9;
|
reg->pre_intra_cla1_B0.pre_intra_cla1_m2 = 8;
|
reg->pre_intra_cla1_B0.pre_intra_cla1_m3 = 7;
|
reg->pre_intra_cla1_B0.pre_intra_cla1_m4 = 6;
|
reg->pre_intra_cla1_B1.pre_intra_cla1_m5 = 11;
|
reg->pre_intra_cla1_B1.pre_intra_cla1_m6 = 5;
|
reg->pre_intra_cla1_B1.pre_intra_cla1_m7 = 12;
|
reg->pre_intra_cla1_B1.pre_intra_cla1_m8 = 4;
|
reg->pre_intra_cla1_B1.pre_intra_cla1_m9 = 13;
|
|
reg->pre_intra_cla2_B0.pre_intra_cla2_m0 = 18;
|
reg->pre_intra_cla2_B0.pre_intra_cla2_m1 = 17;
|
reg->pre_intra_cla2_B0.pre_intra_cla2_m2 = 16;
|
reg->pre_intra_cla2_B0.pre_intra_cla2_m3 = 15;
|
reg->pre_intra_cla2_B0.pre_intra_cla2_m4 = 14;
|
reg->pre_intra_cla2_B1.pre_intra_cla2_m5 = 19;
|
reg->pre_intra_cla2_B1.pre_intra_cla2_m6 = 13;
|
reg->pre_intra_cla2_B1.pre_intra_cla2_m7 = 20;
|
reg->pre_intra_cla2_B1.pre_intra_cla2_m8 = 12;
|
reg->pre_intra_cla2_B1.pre_intra_cla2_m9 = 21;
|
|
reg->pre_intra_cla3_B0.pre_intra_cla3_m0 = 18;
|
reg->pre_intra_cla3_B0.pre_intra_cla3_m1 = 19;
|
reg->pre_intra_cla3_B0.pre_intra_cla3_m2 = 20;
|
reg->pre_intra_cla3_B0.pre_intra_cla3_m3 = 21;
|
reg->pre_intra_cla3_B0.pre_intra_cla3_m4 = 22;
|
reg->pre_intra_cla3_B1.pre_intra_cla3_m5 = 17;
|
reg->pre_intra_cla3_B1.pre_intra_cla3_m6 = 23;
|
reg->pre_intra_cla3_B1.pre_intra_cla3_m7 = 16;
|
reg->pre_intra_cla3_B1.pre_intra_cla3_m8 = 24;
|
reg->pre_intra_cla3_B1.pre_intra_cla3_m9 = 15;
|
|
reg->pre_intra_cla4_B0.pre_intra_cla4_m0 = 25;
|
reg->pre_intra_cla4_B0.pre_intra_cla4_m1 = 26;
|
reg->pre_intra_cla4_B0.pre_intra_cla4_m2 = 24;
|
reg->pre_intra_cla4_B0.pre_intra_cla4_m3 = 23;
|
reg->pre_intra_cla4_B0.pre_intra_cla4_m4 = 22;
|
reg->pre_intra_cla4_B1.pre_intra_cla4_m5 = 27;
|
reg->pre_intra_cla4_B1.pre_intra_cla4_m6 = 21;
|
reg->pre_intra_cla4_B1.pre_intra_cla4_m7 = 28;
|
reg->pre_intra_cla4_B1.pre_intra_cla4_m8 = 20;
|
reg->pre_intra_cla4_B1.pre_intra_cla4_m9 = 29;
|
|
reg->pre_intra_cla5_B0.pre_intra_cla5_m0 = 27;
|
reg->pre_intra_cla5_B0.pre_intra_cla5_m1 = 26;
|
reg->pre_intra_cla5_B0.pre_intra_cla5_m2 = 28;
|
reg->pre_intra_cla5_B0.pre_intra_cla5_m3 = 29;
|
reg->pre_intra_cla5_B0.pre_intra_cla5_m4 = 30;
|
reg->pre_intra_cla5_B1.pre_intra_cla5_m5 = 25;
|
reg->pre_intra_cla5_B1.pre_intra_cla5_m6 = 31;
|
reg->pre_intra_cla5_B1.pre_intra_cla5_m7 = 24;
|
reg->pre_intra_cla5_B1.pre_intra_cla5_m8 = 32;
|
reg->pre_intra_cla5_B1.pre_intra_cla5_m9 = 23;
|
|
reg->pre_intra_cla6_B0.pre_intra_cla6_m0 = 34;
|
reg->pre_intra_cla6_B0.pre_intra_cla6_m1 = 33;
|
reg->pre_intra_cla6_B0.pre_intra_cla6_m2 = 32;
|
reg->pre_intra_cla6_B0.pre_intra_cla6_m3 = 31;
|
reg->pre_intra_cla6_B0.pre_intra_cla6_m4 = 30;
|
reg->pre_intra_cla6_B1.pre_intra_cla6_m5 = 2;
|
reg->pre_intra_cla6_B1.pre_intra_cla6_m6 = 29;
|
reg->pre_intra_cla6_B1.pre_intra_cla6_m7 = 3;
|
reg->pre_intra_cla6_B1.pre_intra_cla6_m8 = 28;
|
reg->pre_intra_cla6_B1.pre_intra_cla6_m9 = 4;
|
|
reg->pre_intra_cla7_B0.pre_intra_cla7_m0 = 34;
|
reg->pre_intra_cla7_B0.pre_intra_cla7_m1 = 2;
|
reg->pre_intra_cla7_B0.pre_intra_cla7_m2 = 3;
|
reg->pre_intra_cla7_B0.pre_intra_cla7_m3 = 4;
|
reg->pre_intra_cla7_B0.pre_intra_cla7_m4 = 5;
|
reg->pre_intra_cla7_B1.pre_intra_cla7_m5 = 33;
|
reg->pre_intra_cla7_B1.pre_intra_cla7_m6 = 6;
|
reg->pre_intra_cla7_B1.pre_intra_cla7_m7 = 32;
|
reg->pre_intra_cla7_B1.pre_intra_cla7_m8 = 7;
|
reg->pre_intra_cla7_B1.pre_intra_cla7_m9 = 31;
|
|
reg->pre_intra_cla8_B0.pre_intra_cla8_m0 = 10;
|
reg->pre_intra_cla8_B0.pre_intra_cla8_m1 = 26;
|
reg->pre_intra_cla8_B0.pre_intra_cla8_m2 = 18;
|
reg->pre_intra_cla8_B0.pre_intra_cla8_m3 = 34;
|
reg->pre_intra_cla8_B0.pre_intra_cla8_m4 = 6;
|
reg->pre_intra_cla8_B1.pre_intra_cla8_m5 = 14;
|
reg->pre_intra_cla8_B1.pre_intra_cla8_m6 = 22;
|
reg->pre_intra_cla8_B1.pre_intra_cla8_m7 = 30;
|
reg->pre_intra_cla8_B1.pre_intra_cla8_m8 = 2;
|
reg->pre_intra_cla8_B1.pre_intra_cla8_m9 = 24;
|
|
reg->pre_intra_cla9_B0.pre_intra_cla9_m0 = 0;
|
reg->pre_intra_cla9_B0.pre_intra_cla9_m1 = 0;
|
reg->pre_intra_cla9_B0.pre_intra_cla9_m2 = 0;
|
reg->pre_intra_cla9_B0.pre_intra_cla9_m3 = 0;
|
reg->pre_intra_cla9_B0.pre_intra_cla9_m4 = 0;
|
reg->pre_intra_cla9_B1.pre_intra_cla9_m5 = 0;
|
reg->pre_intra_cla9_B1.pre_intra_cla9_m6 = 0;
|
reg->pre_intra_cla9_B1.pre_intra_cla9_m7 = 0;
|
reg->pre_intra_cla9_B1.pre_intra_cla9_m8 = 0;
|
reg->pre_intra_cla9_B1.pre_intra_cla9_m9 = 0;
|
|
reg->pre_intra_cla10_B0.pre_intra_cla10_m0 = 0;
|
reg->pre_intra_cla10_B0.pre_intra_cla10_m1 = 0;
|
reg->pre_intra_cla10_B0.pre_intra_cla10_m2 = 0;
|
reg->pre_intra_cla10_B0.pre_intra_cla10_m3 = 0;
|
reg->pre_intra_cla10_B0.pre_intra_cla10_m4 = 0;
|
reg->pre_intra_cla10_B1.pre_intra_cla10_m5 = 0;
|
reg->pre_intra_cla10_B1.pre_intra_cla10_m6 = 0;
|
reg->pre_intra_cla10_B1.pre_intra_cla10_m7 = 0;
|
reg->pre_intra_cla10_B1.pre_intra_cla10_m8 = 0;
|
reg->pre_intra_cla10_B1.pre_intra_cla10_m9 = 0;
|
|
reg->pre_intra_cla11_B0.pre_intra_cla11_m0 = 0;
|
reg->pre_intra_cla11_B0.pre_intra_cla11_m1 = 0;
|
reg->pre_intra_cla11_B0.pre_intra_cla11_m2 = 0;
|
reg->pre_intra_cla11_B0.pre_intra_cla11_m3 = 0;
|
reg->pre_intra_cla11_B0.pre_intra_cla11_m4 = 0;
|
reg->pre_intra_cla11_B1.pre_intra_cla11_m5 = 0;
|
reg->pre_intra_cla11_B1.pre_intra_cla11_m6 = 0;
|
reg->pre_intra_cla11_B1.pre_intra_cla11_m7 = 0;
|
reg->pre_intra_cla11_B1.pre_intra_cla11_m8 = 0;
|
reg->pre_intra_cla11_B1.pre_intra_cla11_m9 = 0;
|
|
reg->pre_intra_cla12_B0.pre_intra_cla12_m0 = 0;
|
reg->pre_intra_cla12_B0.pre_intra_cla12_m1 = 0;
|
reg->pre_intra_cla12_B0.pre_intra_cla12_m2 = 0;
|
reg->pre_intra_cla12_B0.pre_intra_cla12_m3 = 0;
|
reg->pre_intra_cla12_B0.pre_intra_cla12_m4 = 0;
|
reg->pre_intra_cla12_B1.pre_intra_cla12_m5 = 0;
|
reg->pre_intra_cla12_B1.pre_intra_cla12_m6 = 0;
|
reg->pre_intra_cla12_B1.pre_intra_cla12_m7 = 0;
|
reg->pre_intra_cla12_B1.pre_intra_cla12_m8 = 0;
|
reg->pre_intra_cla12_B1.pre_intra_cla12_m9 = 0;
|
|
reg->pre_intra_cla13_B0.pre_intra_cla13_m0 = 0;
|
reg->pre_intra_cla13_B0.pre_intra_cla13_m1 = 0;
|
reg->pre_intra_cla13_B0.pre_intra_cla13_m2 = 0;
|
reg->pre_intra_cla13_B0.pre_intra_cla13_m3 = 0;
|
reg->pre_intra_cla13_B0.pre_intra_cla13_m4 = 0;
|
reg->pre_intra_cla13_B1.pre_intra_cla13_m5 = 0;
|
reg->pre_intra_cla13_B1.pre_intra_cla13_m6 = 0;
|
reg->pre_intra_cla13_B1.pre_intra_cla13_m7 = 0;
|
reg->pre_intra_cla13_B1.pre_intra_cla13_m8 = 0;
|
reg->pre_intra_cla13_B1.pre_intra_cla13_m9 = 0;
|
|
reg->pre_intra_cla14_B0.pre_intra_cla14_m0 = 0;
|
reg->pre_intra_cla14_B0.pre_intra_cla14_m1 = 0;
|
reg->pre_intra_cla14_B0.pre_intra_cla14_m2 = 0;
|
reg->pre_intra_cla14_B0.pre_intra_cla14_m3 = 0;
|
reg->pre_intra_cla14_B0.pre_intra_cla14_m4 = 0;
|
reg->pre_intra_cla14_B1.pre_intra_cla14_m5 = 0;
|
reg->pre_intra_cla14_B1.pre_intra_cla14_m6 = 0;
|
reg->pre_intra_cla14_B1.pre_intra_cla14_m7 = 0;
|
reg->pre_intra_cla14_B1.pre_intra_cla14_m8 = 0;
|
reg->pre_intra_cla14_B1.pre_intra_cla14_m9 = 0;
|
|
reg->pre_intra_cla15_B0.pre_intra_cla15_m0 = 0;
|
reg->pre_intra_cla15_B0.pre_intra_cla15_m1 = 0;
|
reg->pre_intra_cla15_B0.pre_intra_cla15_m2 = 0;
|
reg->pre_intra_cla15_B0.pre_intra_cla15_m3 = 0;
|
reg->pre_intra_cla15_B0.pre_intra_cla15_m4 = 0;
|
reg->pre_intra_cla15_B1.pre_intra_cla15_m5 = 0;
|
reg->pre_intra_cla15_B1.pre_intra_cla15_m6 = 0;
|
reg->pre_intra_cla15_B1.pre_intra_cla15_m7 = 0;
|
reg->pre_intra_cla15_B1.pre_intra_cla15_m8 = 0;
|
reg->pre_intra_cla15_B1.pre_intra_cla15_m9 = 0;
|
|
reg->pre_intra_cla16_B0.pre_intra_cla16_m0 = 0;
|
reg->pre_intra_cla16_B0.pre_intra_cla16_m1 = 0;
|
reg->pre_intra_cla16_B0.pre_intra_cla16_m2 = 0;
|
reg->pre_intra_cla16_B0.pre_intra_cla16_m3 = 0;
|
reg->pre_intra_cla16_B0.pre_intra_cla16_m4 = 0;
|
reg->pre_intra_cla16_B1.pre_intra_cla16_m5 = 0;
|
reg->pre_intra_cla16_B1.pre_intra_cla16_m6 = 0;
|
reg->pre_intra_cla16_B1.pre_intra_cla16_m7 = 0;
|
reg->pre_intra_cla16_B1.pre_intra_cla16_m8 = 0;
|
reg->pre_intra_cla16_B1.pre_intra_cla16_m9 = 0;
|
|
reg->i16_sobel_t.intra_l16_sobel_t0 = 64;
|
reg->i16_sobel_t.intra_l16_sobel_t1 = 200;
|
reg->i16_sobel_a_00.intra_l16_sobel_a0_qp0 = 32;
|
reg->i16_sobel_a_00.intra_l16_sobel_a0_qp1 = 32;
|
reg->i16_sobel_a_00.intra_l16_sobel_a0_qp2 = 32;
|
reg->i16_sobel_a_00.intra_l16_sobel_a0_qp3 = 32;
|
reg->i16_sobel_a_00.intra_l16_sobel_a0_qp4 = 32;
|
reg->i16_sobel_a_01.intra_l16_sobel_a0_qp5 = 32;
|
reg->i16_sobel_a_01.intra_l16_sobel_a0_qp6 = 32;
|
reg->i16_sobel_a_01.intra_l16_sobel_a0_qp7 = 32;
|
reg->i16_sobel_a_01.intra_l16_sobel_a0_qp8 = 32;
|
reg->i16_sobel_b_00.intra_l16_sobel_b0_qp0 = 0;
|
reg->i16_sobel_b_00.intra_l16_sobel_b0_qp1 = 0;
|
reg->i16_sobel_b_01.intra_l16_sobel_b0_qp2 = 0;
|
reg->i16_sobel_b_01.intra_l16_sobel_b0_qp3 = 0;
|
reg->i16_sobel_b_02.intra_l16_sobel_b0_qp4 = 0;
|
reg->i16_sobel_b_02.intra_l16_sobel_b0_qp5 = 0;
|
reg->i16_sobel_b_03.intra_l16_sobel_b0_qp6 = 0;
|
reg->i16_sobel_b_03.intra_l16_sobel_b0_qp7 = 0;
|
reg->i16_sobel_b_04.intra_l16_sobel_b0_qp8 = 0;
|
reg->i16_sobel_c_00.intra_l16_sobel_c0_qp0 = 13;
|
reg->i16_sobel_c_00.intra_l16_sobel_c0_qp1 = 13;
|
reg->i16_sobel_c_00.intra_l16_sobel_c0_qp2 = 13;
|
reg->i16_sobel_c_00.intra_l16_sobel_c0_qp3 = 13;
|
reg->i16_sobel_c_00.intra_l16_sobel_c0_qp4 = 13;
|
reg->i16_sobel_c_01.intra_l16_sobel_c0_qp5 = 13;
|
reg->i16_sobel_c_01.intra_l16_sobel_c0_qp6 = 13;
|
reg->i16_sobel_c_01.intra_l16_sobel_c0_qp7 = 13;
|
reg->i16_sobel_c_01.intra_l16_sobel_c0_qp8 = 13;
|
reg->i16_sobel_d_00.intra_l16_sobel_d0_qp0 = 23750;
|
reg->i16_sobel_d_00.intra_l16_sobel_d0_qp1 = 23750;
|
reg->i16_sobel_d_01.intra_l16_sobel_d0_qp2 = 23750;
|
reg->i16_sobel_d_01.intra_l16_sobel_d0_qp3 = 23750;
|
reg->i16_sobel_d_02.intra_l16_sobel_d0_qp4 = 23750;
|
reg->i16_sobel_d_02.intra_l16_sobel_d0_qp5 = 23750;
|
reg->i16_sobel_d_03.intra_l16_sobel_d0_qp6 = 23750;
|
reg->i16_sobel_d_03.intra_l16_sobel_d0_qp7 = 23750;
|
reg->i16_sobel_d_04.intra_l16_sobel_d0_qp8 = 23750;
|
|
reg->intra_l16_sobel_e0_qp0_low = 20000;
|
reg->intra_l16_sobel_e0_qp1_low = 20000;
|
reg->intra_l16_sobel_e0_qp2_low = 20000;
|
reg->intra_l16_sobel_e0_qp3_low = 20000;
|
reg->intra_l16_sobel_e0_qp4_low = 20000;
|
reg->intra_l16_sobel_e0_qp5_low = 20000;
|
reg->intra_l16_sobel_e0_qp6_low = 20000;
|
reg->intra_l16_sobel_e0_qp7_low = 20000;
|
reg->intra_l16_sobel_e0_qp8_low = 20000;
|
reg->i16_sobel_e_01.intra_l16_sobel_e0_qp0_high = 0;
|
reg->i16_sobel_e_03.intra_l16_sobel_e0_qp1_high = 0;
|
reg->i16_sobel_e_05.intra_l16_sobel_e0_qp2_high = 0;
|
reg->i16_sobel_e_07.intra_l16_sobel_e0_qp3_high = 0;
|
reg->i16_sobel_e_09.intra_l16_sobel_e0_qp4_high = 0;
|
reg->i16_sobel_e_11.intra_l16_sobel_e0_qp5_high = 0;
|
reg->i16_sobel_e_13.intra_l16_sobel_e0_qp6_high = 0;
|
reg->i16_sobel_e_15.intra_l16_sobel_e0_qp7_high = 0;
|
reg->i16_sobel_e_17.intra_l16_sobel_e0_qp8_high = 0;
|
|
reg->i32_sobel_t_00.intra_l32_sobel_t2 = 64;
|
reg->i32_sobel_t_00.intra_l32_sobel_t3 = 400;
|
reg->i32_sobel_t_01.intra_l32_sobel_t4 = 8;
|
reg->i32_sobel_t_02.intra_l32_sobel_t5 = 100;
|
reg->i32_sobel_t_02.intra_l32_sobel_t6 = 100;
|
|
reg->i32_sobel_a.intra_l32_sobel_a1_qp0 = 18;
|
reg->i32_sobel_a.intra_l32_sobel_a1_qp1 = 18;
|
reg->i32_sobel_a.intra_l32_sobel_a1_qp2 = 18;
|
reg->i32_sobel_a.intra_l32_sobel_a1_qp3 = 18;
|
reg->i32_sobel_a.intra_l32_sobel_a1_qp4 = 18;
|
|
reg->i32_sobel_b_00.intra_l32_sobel_b1_qp0 = 0;
|
reg->i32_sobel_b_00.intra_l32_sobel_b1_qp1 = 0;
|
reg->i32_sobel_b_01.intra_l32_sobel_b1_qp2 = 0;
|
reg->i32_sobel_b_01.intra_l32_sobel_b1_qp3 = 0;
|
reg->i32_sobel_b_02.intra_l32_sobel_b1_qp4 = 0;
|
|
reg->i32_sobel_c.intra_l32_sobel_c1_qp0 = 16;
|
reg->i32_sobel_c.intra_l32_sobel_c1_qp1 = 16;
|
reg->i32_sobel_c.intra_l32_sobel_c1_qp2 = 16;
|
reg->i32_sobel_c.intra_l32_sobel_c1_qp3 = 16;
|
reg->i32_sobel_c.intra_l32_sobel_c1_qp4 = 16;
|
|
reg->i32_sobel_d_00.intra_l32_sobel_d1_qp0 = 0;
|
reg->i32_sobel_d_00.intra_l32_sobel_d1_qp1 = 0;
|
reg->i32_sobel_d_01.intra_l32_sobel_d1_qp2 = 0;
|
reg->i32_sobel_d_01.intra_l32_sobel_d1_qp3 = 0;
|
reg->i32_sobel_d_02.intra_l32_sobel_d1_qp4 = 0;
|
|
reg->intra_l32_sobel_e1_qp0_low = 20000;
|
reg->intra_l32_sobel_e1_qp1_low = 20000;
|
reg->intra_l32_sobel_e1_qp2_low = 20000;
|
reg->intra_l32_sobel_e1_qp3_low = 20000;
|
reg->intra_l32_sobel_e1_qp4_low = 20000;
|
|
reg->i32_sobel_e_01.intra_l32_sobel_e1_qp0_high = 0;
|
reg->i32_sobel_e_03.intra_l32_sobel_e1_qp1_high = 0;
|
reg->i32_sobel_e_05.intra_l32_sobel_e1_qp2_high = 0;
|
reg->i32_sobel_e_07.intra_l32_sobel_e1_qp3_high = 0;
|
reg->i32_sobel_e_09.intra_l32_sobel_e1_qp4_high = 0;
|
}
|
|
static void vepu580_h265_rdo_cfg (vepu580_rdo_cfg *reg)
|
{
|
RdoAtfCfg* p_rdo_atf;
|
RdoAtfSkipCfg* p_rdo_atf_skip;
|
reg->rdo_sqi_cfg.rdo_segment_en = 1;
|
reg->rdo_sqi_cfg.rdo_smear_en = 1;
|
p_rdo_atf = ®->rdo_b64_inter_atf;
|
p_rdo_atf->rdo_b_cime_thd0.cu_rdo_cime_thd0 = 32;
|
p_rdo_atf->rdo_b_cime_thd0.cu_rdo_cime_thd1 = 144;
|
p_rdo_atf->rdo_b_cime_thd1.cu_rdo_cime_thd2 = 300;
|
p_rdo_atf->rdo_b_var_thd0.cu_rdo_var_thd00 = 31;
|
p_rdo_atf->rdo_b_var_thd0.cu_rdo_var_thd01 = 400;
|
p_rdo_atf->rdo_b_var_thd1.cu_rdo_var_thd10 = 31;
|
p_rdo_atf->rdo_b_var_thd1.cu_rdo_var_thd11 = 400;
|
p_rdo_atf->rdo_b_var_thd2.cu_rdo_var_thd20 = 31;
|
p_rdo_atf->rdo_b_var_thd2.cu_rdo_var_thd21 = 400;
|
p_rdo_atf->rdo_b_var_thd3.cu_rdo_var_thd30 = 31;
|
p_rdo_atf->rdo_b_var_thd3.cu_rdo_var_thd31 = 400;
|
p_rdo_atf->rdo_b_atf_wgt0.cu_rdo_atf_wgt00 = 16;
|
p_rdo_atf->rdo_b_atf_wgt0.cu_rdo_atf_wgt01 = 16;
|
p_rdo_atf->rdo_b_atf_wgt0.cu_rdo_atf_wgt02 = 16;
|
p_rdo_atf->rdo_b_atf_wgt1.cu_rdo_atf_wgt10 = 16;
|
p_rdo_atf->rdo_b_atf_wgt1.cu_rdo_atf_wgt11 = 16;
|
p_rdo_atf->rdo_b_atf_wgt1.cu_rdo_atf_wgt12 = 16;
|
p_rdo_atf->rdo_b_atf_wgt2.cu_rdo_atf_wgt20 = 16;
|
p_rdo_atf->rdo_b_atf_wgt2.cu_rdo_atf_wgt21 = 16;
|
p_rdo_atf->rdo_b_atf_wgt2.cu_rdo_atf_wgt22 = 16;
|
p_rdo_atf->rdo_b_atf_wgt3.cu_rdo_atf_wgt30 = 16;
|
p_rdo_atf->rdo_b_atf_wgt3.cu_rdo_atf_wgt31 = 16;
|
p_rdo_atf->rdo_b_atf_wgt3.cu_rdo_atf_wgt32 = 16;
|
|
p_rdo_atf_skip = ®->rdo_b64_skip_atf;
|
p_rdo_atf_skip->rdo_b_cime_thd0.cu_rdo_cime_thd0 = 24;
|
p_rdo_atf_skip->rdo_b_cime_thd0.cu_rdo_cime_thd1 = 4;
|
p_rdo_atf_skip->rdo_b_cime_thd1.cu_rdo_cime_thd2 = 6;
|
p_rdo_atf_skip->rdo_b_cime_thd1.cu_rdo_cime_thd3 = 8;
|
p_rdo_atf_skip->rdo_b_var_thd0.cu_rdo_var_thd10 = 31;
|
p_rdo_atf_skip->rdo_b_var_thd0.cu_rdo_var_thd11 = 400;
|
p_rdo_atf_skip->rdo_b_var_thd1.cu_rdo_var_thd20 = 31;
|
p_rdo_atf_skip->rdo_b_var_thd1.cu_rdo_var_thd21 = 400;
|
p_rdo_atf_skip->rdo_b_var_thd2.cu_rdo_var_thd30 = 31;
|
p_rdo_atf_skip->rdo_b_var_thd2.cu_rdo_var_thd31 = 400;
|
p_rdo_atf_skip->rdo_b_var_thd3.cu_rdo_var_thd40 = 31;
|
p_rdo_atf_skip->rdo_b_var_thd3.cu_rdo_var_thd41 = 400;
|
p_rdo_atf_skip->rdo_b_atf_wgt0.cu_rdo_atf_wgt00 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt0.cu_rdo_atf_wgt10 = 10;
|
p_rdo_atf_skip->rdo_b_atf_wgt0.cu_rdo_atf_wgt11 = 10;
|
p_rdo_atf_skip->rdo_b_atf_wgt0.cu_rdo_atf_wgt12 = 10;
|
p_rdo_atf_skip->rdo_b_atf_wgt1.cu_rdo_atf_wgt20 = 14;
|
p_rdo_atf_skip->rdo_b_atf_wgt1.cu_rdo_atf_wgt21 = 14;
|
p_rdo_atf_skip->rdo_b_atf_wgt1.cu_rdo_atf_wgt22 = 15;
|
p_rdo_atf_skip->rdo_b_atf_wgt2.cu_rdo_atf_wgt30 = 15;
|
p_rdo_atf_skip->rdo_b_atf_wgt2.cu_rdo_atf_wgt31 = 15;
|
p_rdo_atf_skip->rdo_b_atf_wgt2.cu_rdo_atf_wgt32 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt3.cu_rdo_atf_wgt40 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt3.cu_rdo_atf_wgt41 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt3.cu_rdo_atf_wgt42 = 16;
|
|
p_rdo_atf = ®->rdo_b32_intra_atf;
|
p_rdo_atf->rdo_b_cime_thd0.cu_rdo_cime_thd0 = 24;
|
p_rdo_atf->rdo_b_cime_thd0.cu_rdo_cime_thd1 = 48;
|
p_rdo_atf->rdo_b_cime_thd1.cu_rdo_cime_thd2 = 64;
|
p_rdo_atf->rdo_b_var_thd0.cu_rdo_var_thd00 = 31;
|
p_rdo_atf->rdo_b_var_thd0.cu_rdo_var_thd01 = 400;
|
p_rdo_atf->rdo_b_var_thd1.cu_rdo_var_thd10 = 31;
|
p_rdo_atf->rdo_b_var_thd1.cu_rdo_var_thd11 = 400;
|
p_rdo_atf->rdo_b_var_thd2.cu_rdo_var_thd20 = 31;
|
p_rdo_atf->rdo_b_var_thd2.cu_rdo_var_thd21 = 400;
|
p_rdo_atf->rdo_b_var_thd3.cu_rdo_var_thd30 = 31;
|
p_rdo_atf->rdo_b_var_thd3.cu_rdo_var_thd31 = 400;
|
p_rdo_atf->rdo_b_atf_wgt0.cu_rdo_atf_wgt00 = 26;
|
p_rdo_atf->rdo_b_atf_wgt0.cu_rdo_atf_wgt01 = 25;
|
p_rdo_atf->rdo_b_atf_wgt0.cu_rdo_atf_wgt02 = 25;
|
p_rdo_atf->rdo_b_atf_wgt1.cu_rdo_atf_wgt10 = 25;
|
p_rdo_atf->rdo_b_atf_wgt1.cu_rdo_atf_wgt11 = 24;
|
p_rdo_atf->rdo_b_atf_wgt1.cu_rdo_atf_wgt12 = 23;
|
p_rdo_atf->rdo_b_atf_wgt2.cu_rdo_atf_wgt20 = 21;
|
p_rdo_atf->rdo_b_atf_wgt2.cu_rdo_atf_wgt21 = 19;
|
p_rdo_atf->rdo_b_atf_wgt2.cu_rdo_atf_wgt22 = 18;
|
p_rdo_atf->rdo_b_atf_wgt3.cu_rdo_atf_wgt30 = 16;
|
p_rdo_atf->rdo_b_atf_wgt3.cu_rdo_atf_wgt31 = 16;
|
p_rdo_atf->rdo_b_atf_wgt3.cu_rdo_atf_wgt32 = 16;
|
|
p_rdo_atf = ®->rdo_b32_inter_atf;
|
p_rdo_atf->rdo_b_cime_thd0.cu_rdo_cime_thd0 = 32;
|
p_rdo_atf->rdo_b_cime_thd0.cu_rdo_cime_thd1 = 144;
|
p_rdo_atf->rdo_b_cime_thd1.cu_rdo_cime_thd2 = 300;
|
p_rdo_atf->rdo_b_var_thd0.cu_rdo_var_thd00 = 31;
|
p_rdo_atf->rdo_b_var_thd0.cu_rdo_var_thd01 = 400;
|
p_rdo_atf->rdo_b_var_thd1.cu_rdo_var_thd10 = 31;
|
p_rdo_atf->rdo_b_var_thd1.cu_rdo_var_thd11 = 400;
|
p_rdo_atf->rdo_b_var_thd2.cu_rdo_var_thd20 = 31;
|
p_rdo_atf->rdo_b_var_thd2.cu_rdo_var_thd21 = 400;
|
p_rdo_atf->rdo_b_var_thd3.cu_rdo_var_thd30 = 31;
|
p_rdo_atf->rdo_b_var_thd3.cu_rdo_var_thd31 = 400;
|
p_rdo_atf->rdo_b_atf_wgt0.cu_rdo_atf_wgt00 = 16;
|
p_rdo_atf->rdo_b_atf_wgt0.cu_rdo_atf_wgt01 = 16;
|
p_rdo_atf->rdo_b_atf_wgt0.cu_rdo_atf_wgt02 = 16;
|
p_rdo_atf->rdo_b_atf_wgt1.cu_rdo_atf_wgt10 = 16;
|
p_rdo_atf->rdo_b_atf_wgt1.cu_rdo_atf_wgt11 = 16;
|
p_rdo_atf->rdo_b_atf_wgt1.cu_rdo_atf_wgt12 = 16;
|
p_rdo_atf->rdo_b_atf_wgt2.cu_rdo_atf_wgt20 = 16;
|
p_rdo_atf->rdo_b_atf_wgt2.cu_rdo_atf_wgt21 = 16;
|
p_rdo_atf->rdo_b_atf_wgt2.cu_rdo_atf_wgt22 = 16;
|
p_rdo_atf->rdo_b_atf_wgt3.cu_rdo_atf_wgt30 = 16;
|
p_rdo_atf->rdo_b_atf_wgt3.cu_rdo_atf_wgt31 = 16;
|
p_rdo_atf->rdo_b_atf_wgt3.cu_rdo_atf_wgt32 = 16;
|
|
p_rdo_atf_skip = ®->rdo_b32_skip_atf;
|
p_rdo_atf_skip->rdo_b_cime_thd0.cu_rdo_cime_thd0 = 24;
|
p_rdo_atf_skip->rdo_b_cime_thd0.cu_rdo_cime_thd1 = 4;
|
p_rdo_atf_skip->rdo_b_cime_thd1.cu_rdo_cime_thd2 = 6;
|
p_rdo_atf_skip->rdo_b_cime_thd1.cu_rdo_cime_thd3 = 8;
|
p_rdo_atf_skip->rdo_b_var_thd0.cu_rdo_var_thd10 = 31;
|
p_rdo_atf_skip->rdo_b_var_thd0.cu_rdo_var_thd11 = 400;
|
p_rdo_atf_skip->rdo_b_var_thd1.cu_rdo_var_thd20 = 31;
|
p_rdo_atf_skip->rdo_b_var_thd1.cu_rdo_var_thd21 = 400;
|
p_rdo_atf_skip->rdo_b_var_thd2.cu_rdo_var_thd30 = 31;
|
p_rdo_atf_skip->rdo_b_var_thd2.cu_rdo_var_thd31 = 400;
|
p_rdo_atf_skip->rdo_b_var_thd3.cu_rdo_var_thd40 = 31;
|
p_rdo_atf_skip->rdo_b_var_thd3.cu_rdo_var_thd41 = 400;
|
p_rdo_atf_skip->rdo_b_atf_wgt0.cu_rdo_atf_wgt00 = 18;
|
p_rdo_atf_skip->rdo_b_atf_wgt0.cu_rdo_atf_wgt10 = 11;
|
p_rdo_atf_skip->rdo_b_atf_wgt0.cu_rdo_atf_wgt11 = 11;
|
p_rdo_atf_skip->rdo_b_atf_wgt0.cu_rdo_atf_wgt12 = 11;
|
p_rdo_atf_skip->rdo_b_atf_wgt1.cu_rdo_atf_wgt20 = 13;
|
p_rdo_atf_skip->rdo_b_atf_wgt1.cu_rdo_atf_wgt21 = 13;
|
p_rdo_atf_skip->rdo_b_atf_wgt1.cu_rdo_atf_wgt22 = 13;
|
p_rdo_atf_skip->rdo_b_atf_wgt2.cu_rdo_atf_wgt30 = 15;
|
p_rdo_atf_skip->rdo_b_atf_wgt2.cu_rdo_atf_wgt31 = 15;
|
p_rdo_atf_skip->rdo_b_atf_wgt2.cu_rdo_atf_wgt32 = 15;
|
p_rdo_atf_skip->rdo_b_atf_wgt3.cu_rdo_atf_wgt40 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt3.cu_rdo_atf_wgt41 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt3.cu_rdo_atf_wgt42 = 16;
|
|
p_rdo_atf = ®->rdo_b16_intra_atf;
|
p_rdo_atf->rdo_b_cime_thd0.cu_rdo_cime_thd0 = 24;
|
p_rdo_atf->rdo_b_cime_thd0.cu_rdo_cime_thd1 = 48;
|
p_rdo_atf->rdo_b_cime_thd1.cu_rdo_cime_thd2 = 64;
|
p_rdo_atf->rdo_b_var_thd0.cu_rdo_var_thd00 = 31;
|
p_rdo_atf->rdo_b_var_thd0.cu_rdo_var_thd01 = 400;
|
p_rdo_atf->rdo_b_var_thd1.cu_rdo_var_thd10 = 31;
|
p_rdo_atf->rdo_b_var_thd1.cu_rdo_var_thd11 = 400;
|
p_rdo_atf->rdo_b_var_thd2.cu_rdo_var_thd20 = 31;
|
p_rdo_atf->rdo_b_var_thd2.cu_rdo_var_thd21 = 400;
|
p_rdo_atf->rdo_b_var_thd3.cu_rdo_var_thd30 = 31;
|
p_rdo_atf->rdo_b_var_thd3.cu_rdo_var_thd31 = 400;
|
p_rdo_atf->rdo_b_atf_wgt0.cu_rdo_atf_wgt00 = 26;
|
p_rdo_atf->rdo_b_atf_wgt0.cu_rdo_atf_wgt01 = 25;
|
p_rdo_atf->rdo_b_atf_wgt0.cu_rdo_atf_wgt02 = 25;
|
p_rdo_atf->rdo_b_atf_wgt1.cu_rdo_atf_wgt10 = 25;
|
p_rdo_atf->rdo_b_atf_wgt1.cu_rdo_atf_wgt11 = 24;
|
p_rdo_atf->rdo_b_atf_wgt1.cu_rdo_atf_wgt12 = 23;
|
p_rdo_atf->rdo_b_atf_wgt2.cu_rdo_atf_wgt20 = 21;
|
p_rdo_atf->rdo_b_atf_wgt2.cu_rdo_atf_wgt21 = 19;
|
p_rdo_atf->rdo_b_atf_wgt2.cu_rdo_atf_wgt22 = 18;
|
p_rdo_atf->rdo_b_atf_wgt3.cu_rdo_atf_wgt30 = 16;
|
p_rdo_atf->rdo_b_atf_wgt3.cu_rdo_atf_wgt31 = 16;
|
p_rdo_atf->rdo_b_atf_wgt3.cu_rdo_atf_wgt32 = 16;
|
|
p_rdo_atf = ®->rdo_b16_inter_atf;
|
p_rdo_atf->rdo_b_cime_thd0.cu_rdo_cime_thd0 = 32;
|
p_rdo_atf->rdo_b_cime_thd0.cu_rdo_cime_thd1 = 144;
|
p_rdo_atf->rdo_b_cime_thd1.cu_rdo_cime_thd2 = 300;
|
p_rdo_atf->rdo_b_var_thd0.cu_rdo_var_thd00 = 31;
|
p_rdo_atf->rdo_b_var_thd0.cu_rdo_var_thd01 = 400;
|
p_rdo_atf->rdo_b_var_thd1.cu_rdo_var_thd10 = 31;
|
p_rdo_atf->rdo_b_var_thd1.cu_rdo_var_thd11 = 400;
|
p_rdo_atf->rdo_b_var_thd2.cu_rdo_var_thd20 = 31;
|
p_rdo_atf->rdo_b_var_thd2.cu_rdo_var_thd21 = 400;
|
p_rdo_atf->rdo_b_var_thd3.cu_rdo_var_thd30 = 31;
|
p_rdo_atf->rdo_b_var_thd3.cu_rdo_var_thd31 = 400;
|
p_rdo_atf->rdo_b_atf_wgt0.cu_rdo_atf_wgt00 = 16;
|
p_rdo_atf->rdo_b_atf_wgt0.cu_rdo_atf_wgt01 = 16;
|
p_rdo_atf->rdo_b_atf_wgt0.cu_rdo_atf_wgt02 = 16;
|
p_rdo_atf->rdo_b_atf_wgt1.cu_rdo_atf_wgt10 = 16;
|
p_rdo_atf->rdo_b_atf_wgt1.cu_rdo_atf_wgt11 = 16;
|
p_rdo_atf->rdo_b_atf_wgt1.cu_rdo_atf_wgt12 = 16;
|
p_rdo_atf->rdo_b_atf_wgt2.cu_rdo_atf_wgt20 = 16;
|
p_rdo_atf->rdo_b_atf_wgt2.cu_rdo_atf_wgt21 = 16;
|
p_rdo_atf->rdo_b_atf_wgt2.cu_rdo_atf_wgt22 = 16;
|
p_rdo_atf->rdo_b_atf_wgt3.cu_rdo_atf_wgt30 = 16;
|
p_rdo_atf->rdo_b_atf_wgt3.cu_rdo_atf_wgt31 = 16;
|
p_rdo_atf->rdo_b_atf_wgt3.cu_rdo_atf_wgt32 = 16;
|
|
p_rdo_atf_skip = ®->rdo_b16_skip_atf;
|
p_rdo_atf_skip->rdo_b_cime_thd0.cu_rdo_cime_thd0 = 24;
|
p_rdo_atf_skip->rdo_b_cime_thd0.cu_rdo_cime_thd1 = 24;
|
p_rdo_atf_skip->rdo_b_cime_thd1.cu_rdo_cime_thd2 = 48;
|
p_rdo_atf_skip->rdo_b_cime_thd1.cu_rdo_cime_thd3 = 96;
|
p_rdo_atf_skip->rdo_b_var_thd0.cu_rdo_var_thd10 = 31;
|
p_rdo_atf_skip->rdo_b_var_thd0.cu_rdo_var_thd11 = 400;
|
p_rdo_atf_skip->rdo_b_var_thd1.cu_rdo_var_thd20 = 31;
|
p_rdo_atf_skip->rdo_b_var_thd1.cu_rdo_var_thd21 = 400;
|
p_rdo_atf_skip->rdo_b_var_thd2.cu_rdo_var_thd30 = 31;
|
p_rdo_atf_skip->rdo_b_var_thd2.cu_rdo_var_thd31 = 400;
|
p_rdo_atf_skip->rdo_b_var_thd3.cu_rdo_var_thd40 = 31;
|
p_rdo_atf_skip->rdo_b_var_thd3.cu_rdo_var_thd41 = 400;
|
p_rdo_atf_skip->rdo_b_atf_wgt0.cu_rdo_atf_wgt00 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt0.cu_rdo_atf_wgt10 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt0.cu_rdo_atf_wgt11 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt0.cu_rdo_atf_wgt12 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt1.cu_rdo_atf_wgt20 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt1.cu_rdo_atf_wgt21 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt1.cu_rdo_atf_wgt22 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt2.cu_rdo_atf_wgt30 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt2.cu_rdo_atf_wgt31 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt2.cu_rdo_atf_wgt32 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt3.cu_rdo_atf_wgt40 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt3.cu_rdo_atf_wgt41 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt3.cu_rdo_atf_wgt42 = 16;
|
|
p_rdo_atf = ®->rdo_b8_intra_atf;
|
p_rdo_atf->rdo_b_cime_thd0.cu_rdo_cime_thd0 = 24;
|
p_rdo_atf->rdo_b_cime_thd0.cu_rdo_cime_thd1 = 48;
|
p_rdo_atf->rdo_b_cime_thd1.cu_rdo_cime_thd2 = 64;
|
p_rdo_atf->rdo_b_var_thd0.cu_rdo_var_thd00 = 31;
|
p_rdo_atf->rdo_b_var_thd0.cu_rdo_var_thd01 = 400;
|
p_rdo_atf->rdo_b_var_thd1.cu_rdo_var_thd10 = 31;
|
p_rdo_atf->rdo_b_var_thd1.cu_rdo_var_thd11 = 400;
|
p_rdo_atf->rdo_b_var_thd2.cu_rdo_var_thd20 = 31;
|
p_rdo_atf->rdo_b_var_thd2.cu_rdo_var_thd21 = 400;
|
p_rdo_atf->rdo_b_var_thd3.cu_rdo_var_thd30 = 31;
|
p_rdo_atf->rdo_b_var_thd3.cu_rdo_var_thd31 = 400;
|
p_rdo_atf->rdo_b_atf_wgt0.cu_rdo_atf_wgt00 = 26;
|
p_rdo_atf->rdo_b_atf_wgt0.cu_rdo_atf_wgt01 = 25;
|
p_rdo_atf->rdo_b_atf_wgt0.cu_rdo_atf_wgt02 = 25;
|
p_rdo_atf->rdo_b_atf_wgt1.cu_rdo_atf_wgt10 = 25;
|
p_rdo_atf->rdo_b_atf_wgt1.cu_rdo_atf_wgt11 = 24;
|
p_rdo_atf->rdo_b_atf_wgt1.cu_rdo_atf_wgt12 = 23;
|
p_rdo_atf->rdo_b_atf_wgt2.cu_rdo_atf_wgt20 = 21;
|
p_rdo_atf->rdo_b_atf_wgt2.cu_rdo_atf_wgt21 = 19;
|
p_rdo_atf->rdo_b_atf_wgt2.cu_rdo_atf_wgt22 = 18;
|
p_rdo_atf->rdo_b_atf_wgt3.cu_rdo_atf_wgt30 = 16;
|
p_rdo_atf->rdo_b_atf_wgt3.cu_rdo_atf_wgt31 = 16;
|
p_rdo_atf->rdo_b_atf_wgt3.cu_rdo_atf_wgt32 = 16;
|
|
p_rdo_atf = ®->rdo_b8_inter_atf;
|
p_rdo_atf->rdo_b_cime_thd0.cu_rdo_cime_thd0 = 32;
|
p_rdo_atf->rdo_b_cime_thd0.cu_rdo_cime_thd1 = 144;
|
p_rdo_atf->rdo_b_cime_thd1.cu_rdo_cime_thd2 = 300;
|
p_rdo_atf->rdo_b_var_thd0.cu_rdo_var_thd00 = 31;
|
p_rdo_atf->rdo_b_var_thd0.cu_rdo_var_thd01 = 400;
|
p_rdo_atf->rdo_b_var_thd1.cu_rdo_var_thd10 = 31;
|
p_rdo_atf->rdo_b_var_thd1.cu_rdo_var_thd11 = 400;
|
p_rdo_atf->rdo_b_var_thd2.cu_rdo_var_thd20 = 31;
|
p_rdo_atf->rdo_b_var_thd2.cu_rdo_var_thd21 = 400;
|
p_rdo_atf->rdo_b_var_thd3.cu_rdo_var_thd30 = 31;
|
p_rdo_atf->rdo_b_var_thd3.cu_rdo_var_thd31 = 400;
|
p_rdo_atf->rdo_b_atf_wgt0.cu_rdo_atf_wgt00 = 16;
|
p_rdo_atf->rdo_b_atf_wgt0.cu_rdo_atf_wgt01 = 16;
|
p_rdo_atf->rdo_b_atf_wgt0.cu_rdo_atf_wgt02 = 16;
|
p_rdo_atf->rdo_b_atf_wgt1.cu_rdo_atf_wgt10 = 16;
|
p_rdo_atf->rdo_b_atf_wgt1.cu_rdo_atf_wgt11 = 16;
|
p_rdo_atf->rdo_b_atf_wgt1.cu_rdo_atf_wgt12 = 16;
|
p_rdo_atf->rdo_b_atf_wgt2.cu_rdo_atf_wgt20 = 16;
|
p_rdo_atf->rdo_b_atf_wgt2.cu_rdo_atf_wgt21 = 16;
|
p_rdo_atf->rdo_b_atf_wgt2.cu_rdo_atf_wgt22 = 16;
|
p_rdo_atf->rdo_b_atf_wgt3.cu_rdo_atf_wgt30 = 16;
|
p_rdo_atf->rdo_b_atf_wgt3.cu_rdo_atf_wgt31 = 16;
|
p_rdo_atf->rdo_b_atf_wgt3.cu_rdo_atf_wgt32 = 16;
|
|
p_rdo_atf_skip = ®->rdo_b8_skip_atf;
|
p_rdo_atf_skip->rdo_b_cime_thd0.cu_rdo_cime_thd0 = 24;
|
p_rdo_atf_skip->rdo_b_cime_thd0.cu_rdo_cime_thd1 = 24;
|
p_rdo_atf_skip->rdo_b_cime_thd1.cu_rdo_cime_thd2 = 48;
|
p_rdo_atf_skip->rdo_b_cime_thd1.cu_rdo_cime_thd3 = 96;
|
p_rdo_atf_skip->rdo_b_var_thd0.cu_rdo_var_thd10 = 31;
|
p_rdo_atf_skip->rdo_b_var_thd0.cu_rdo_var_thd11 = 400;
|
p_rdo_atf_skip->rdo_b_var_thd1.cu_rdo_var_thd20 = 31;
|
p_rdo_atf_skip->rdo_b_var_thd1.cu_rdo_var_thd21 = 400;
|
p_rdo_atf_skip->rdo_b_var_thd2.cu_rdo_var_thd30 = 31;
|
p_rdo_atf_skip->rdo_b_var_thd2.cu_rdo_var_thd31 = 400;
|
p_rdo_atf_skip->rdo_b_var_thd3.cu_rdo_var_thd40 = 31;
|
p_rdo_atf_skip->rdo_b_var_thd3.cu_rdo_var_thd41 = 400;
|
p_rdo_atf_skip->rdo_b_atf_wgt0.cu_rdo_atf_wgt00 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt0.cu_rdo_atf_wgt10 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt0.cu_rdo_atf_wgt11 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt0.cu_rdo_atf_wgt12 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt1.cu_rdo_atf_wgt20 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt1.cu_rdo_atf_wgt21 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt1.cu_rdo_atf_wgt22 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt2.cu_rdo_atf_wgt30 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt2.cu_rdo_atf_wgt31 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt2.cu_rdo_atf_wgt32 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt3.cu_rdo_atf_wgt40 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt3.cu_rdo_atf_wgt41 = 16;
|
p_rdo_atf_skip->rdo_b_atf_wgt3.cu_rdo_atf_wgt42 = 16;
|
|
reg->rdo_segment_b64_thd0.rdo_segment_cu64_th0 = 160;
|
reg->rdo_segment_b64_thd0.rdo_segment_cu64_th1 = 96;
|
reg->rdo_segment_b64_thd1.rdo_segment_cu64_th2 = 30;
|
reg->rdo_segment_b64_thd1.rdo_segment_cu64_th3 = 0;
|
reg->rdo_segment_b64_thd1.rdo_segment_cu64_th4 = 1;
|
reg->rdo_segment_b64_thd1.rdo_segment_cu64_th5_minus1 = 4;
|
reg->rdo_segment_b64_thd1.rdo_segment_cu64_th6_minus1 = 11;
|
|
reg->rdo_segment_b32_thd0.rdo_segment_cu32_th0 = 160;
|
reg->rdo_segment_b32_thd0.rdo_segment_cu32_th1 = 96;
|
reg->rdo_segment_b32_thd1.rdo_segment_cu32_th2 = 30;
|
reg->rdo_segment_b32_thd1.rdo_segment_cu32_th3 = 0;
|
reg->rdo_segment_b32_thd1.rdo_segment_cu32_th4 = 1;
|
reg->rdo_segment_b32_thd1.rdo_segment_cu32_th5_minus1 = 2;
|
reg->rdo_segment_b32_thd1.rdo_segment_cu32_th6_minus1 = 3;
|
|
reg->rdo_segment_multi.rdo_segment_cu64_multi = 22;
|
reg->rdo_segment_multi.rdo_segment_cu32_multi = 22;
|
reg->rdo_segment_multi.rdo_smear_cu16_multi = 6;
|
|
reg->rdo_b16_smear_thd0.rdo_smear_cu16_cime_sad_th0 = 64;
|
reg->rdo_b16_smear_thd0.rdo_smear_cu16_cime_sad_th1 = 32;
|
reg->rdo_b16_smear_thd1.rdo_smear_cu16_cime_sad_th2 = 36;
|
reg->rdo_b16_smear_thd1.rdo_smear_cu16_cime_sad_th3 = 64;
|
|
|
reg->preintra_b32_cst_var_thd.pre_intra32_cst_var_th00 = 9;
|
reg->preintra_b32_cst_var_thd.pre_intra32_cst_var_th01 = 4;
|
reg->preintra_b32_cst_var_thd.pre_intra32_mode_th = 5;
|
|
reg->preintra_b32_cst_wgt.pre_intra32_cst_wgt00 = 31;
|
reg->preintra_b32_cst_wgt.pre_intra32_cst_wgt01 = 25;
|
|
reg->preintra_b16_cst_var_thd.pre_intra16_cst_var_th00 = 9;
|
reg->preintra_b16_cst_var_thd.pre_intra16_cst_var_th01 = 4;
|
reg->preintra_b16_cst_var_thd.pre_intra16_mode_th = 5;
|
|
reg->preintra_b16_cst_wgt.pre_intra16_cst_wgt00 = 31;
|
reg->preintra_b16_cst_wgt.pre_intra16_cst_wgt01 = 25;
|
}
|
|
static void vepu580_h265_scl_cfg(vepu580_rdo_cfg *reg)
|
{
|
static RK_U32 vepu580_h265_scl_tab[] = {
|
/* 0x2200 */
|
0x10001000, 0x10001000, 0x0e390f0f, 0x0aab0c31, 0x10001000, 0x10001000, 0x0d790f0f, 0x0a3d0ba3,
|
0x10001000, 0x0e390f0f, 0x0ba30ccd, 0x08d40a3d, 0x10001000, 0x0c310e39, 0x097b0aab, 0x071c0842,
|
0x0f0f0f0f, 0x0aab0ccd, 0x07500889, 0x0572063e, 0x0d790e39, 0x097b0ba3, 0x05d10750, 0x03f004be,
|
0x0ba30c31, 0x08420a3d, 0x04be063e, 0x02e903a8, 0x0a3d0aab, 0x071c08d4, 0x03f00572, 0x023a02e9,
|
0x10001000, 0x10001000, 0x0e390f0f, 0x0aab0c31, 0x10001000, 0x10001000, 0x0d790f0f, 0x0a3d0ba3,
|
0x10001000, 0x0e390f0f, 0x0ba30ccd, 0x08d40a3d, 0x10001000, 0x0c310e39, 0x097b0aab, 0x071c0842,
|
0x0f0f0f0f, 0x0aab0ccd, 0x07500889, 0x0572063e, 0x0d790e39, 0x097b0ba3, 0x05d10750, 0x03f004be,
|
0x0ba30c31, 0x08420a3d, 0x04be063e, 0x02e903a8, 0x0a3d0aab, 0x071c08d4, 0x03f00572, 0x023a02e9,
|
0x10001000, 0x10001000, 0x0e390f0f, 0x0aab0c31, 0x10001000, 0x10001000, 0x0d790f0f, 0x0a3d0ba3,
|
0x10001000, 0x0e390f0f, 0x0ba30ccd, 0x08d40a3d, 0x10001000, 0x0c310e39, 0x097b0aab, 0x071c0842,
|
0x0f0f0f0f, 0x0aab0ccd, 0x07500889, 0x0572063e, 0x0d790e39, 0x097b0ba3, 0x05d10750, 0x03f004be,
|
0x0ba30c31, 0x08420a3d, 0x04be063e, 0x02e903a8, 0x0a3d0aab, 0x071c08d4, 0x03f00572, 0x023a02e9,
|
0x10001000, 0x10001000, 0x0e390f0f, 0x0aab0ccd, 0x10001000, 0x0f0f1000, 0x0ccd0e39, 0x0a3d0aab,
|
0x10001000, 0x0e390f0f, 0x0aab0ccd, 0x09250a3d, 0x0f0f1000, 0x0ccd0e39, 0x0a3d0aab, 0x07c20925,
|
0x0e390f0f, 0x0aab0ccd, 0x09250a3d, 0x063e07c2, 0x0ccd0e39, 0x0a3d0aab, 0x07c20925, 0x04be063e,
|
0x0aab0ccd, 0x09250a3d, 0x063e07c2, 0x039b04be, 0x0a3d0aab, 0x07c20925, 0x04be063e, 0x02d0039b,
|
0x10001000, 0x10001000, 0x0e390f0f, 0x0aab0ccd, 0x10001000, 0x0f0f1000, 0x0ccd0e39, 0x0a3d0aab,
|
0x10001000, 0x0e390f0f, 0x0aab0ccd, 0x09250a3d, 0x0f0f1000, 0x0ccd0e39, 0x0a3d0aab, 0x07c20925,
|
0x0e390f0f, 0x0aab0ccd, 0x09250a3d, 0x063e07c2, 0x0ccd0e39, 0x0a3d0aab, 0x07c20925, 0x04be063e,
|
0x0aab0ccd, 0x09250a3d, 0x063e07c2, 0x039b04be, 0x0a3d0aab, 0x07c20925, 0x04be063e, 0x02d0039b,
|
0x10001000, 0x10001000, 0x0e390f0f, 0x0aab0ccd, 0x10001000, 0x0f0f1000, 0x0ccd0e39, 0x0a3d0aab,
|
0x10001000, 0x0e390f0f, 0x0aab0ccd, 0x09250a3d, 0x0f0f1000, 0x0ccd0e39, 0x0a3d0aab, 0x07c20925,
|
0x0e390f0f, 0x0aab0ccd, 0x09250a3d, 0x063e07c2, 0x0ccd0e39, 0x0a3d0aab, 0x07c20925, 0x04be063e,
|
0x0aab0ccd, 0x09250a3d, 0x063e07c2, 0x039b04be, 0x0a3d0aab, 0x07c20925, 0x04be063e, 0x02d0039b,
|
0x10001000, 0x10001000, 0x10001000, 0x10101010, 0x0e390f0f, 0x0aab0c31, 0x10001000, 0x18151211,
|
0x10001000, 0x10001000, 0x0e390f0f, 0x10101010, 0x0d790f0f, 0x0a3d0ba3, 0x0aab0c31, 0x19161311,
|
0x10001000, 0x0e390f0f, 0x10001000, 0x12111010, 0x0ba30ccd, 0x08d40a3d, 0x10001000, 0x1d191614,
|
0x10001000, 0x0c310e39, 0x0d790f0f, 0x15121010, 0x097b0aab, 0x071c0842, 0x0a3d0ba3, 0x241f1b18,
|
0x0f0f0f0f, 0x0aab0ccd, 0x10001000, 0x18141111, 0x07500889, 0x0572063e, 0x0e390f0f, 0x2f29231e,
|
0x0d790e39, 0x097b0ba3, 0x0ba30ccd, 0x1b161312, 0x05d10750, 0x03f004be, 0x08d40a3d, 0x41362c23,
|
0x0ba30c31, 0x08420a3d, 0x10001000, 0x1f191615, 0x04be063e, 0x02e903a8, 0x0c310e39, 0x58463629,
|
0x0a3d0aab, 0x071c08d4, 0x097b0aab, 0x241d1918, 0x03f00572, 0x023a02e9, 0x071c0842, 0x7358412f,
|
0x10001000, 0x10001000, 0x0f0f0f0f, 0x10101010, 0x0e390f0f, 0x0aab0c31, 0x0aab0ccd, 0x18151211,
|
0x10001000, 0x10001000, 0x07500889, 0x10101010, 0x0d790f0f, 0x0a3d0ba3, 0x0572063e, 0x19161311,
|
0x10001000, 0x0e390f0f, 0x0d790e39, 0x12111010, 0x0ba30ccd, 0x08d40a3d, 0x097b0ba3, 0x1d191614,
|
0x10001000, 0x0c310e39, 0x05d10750, 0x15121010, 0x097b0aab, 0x071c0842, 0x03f004be, 0x241f1b18,
|
0x0f0f0f0f, 0x0aab0ccd, 0x0ba30c31, 0x18141111, 0x07500889, 0x0572063e, 0x08420a3d, 0x2f29231e,
|
0x0d790e39, 0x097b0ba3, 0x04be063e, 0x1b161312, 0x05d10750, 0x03f004be, 0x02e903a8, 0x41362c23,
|
0x0ba30c31, 0x08420a3d, 0x0a3d0aab, 0x1f191615, 0x04be063e, 0x02e903a8, 0x071c08d4, 0x58463629,
|
0x0a3d0aab, 0x071c08d4, 0x03f00572, 0x241d1918, 0x03f00572, 0x023a02e9, 0x023a02e9, 0x7358412f,
|
0x10001000, 0x10001000, 0x10001000, 0x10101010, 0x0e390f0f, 0x0aab0c31, 0x10001000, 0x18151211,
|
0x10001000, 0x10001000, 0x0e390f0f, 0x10101010, 0x0d790f0f, 0x0a3d0ba3, 0x0aab0ccd, 0x19161311,
|
0x10001000, 0x0e390f0f, 0x10001000, 0x12111010, 0x0ba30ccd, 0x08d40a3d, 0x0f0f1000, 0x1d191614,
|
0x10001000, 0x0c310e39, 0x0ccd0e39, 0x15121010, 0x097b0aab, 0x071c0842, 0x0a3d0aab, 0x241f1b18,
|
0x0f0f0f0f, 0x0aab0ccd, 0x10001000, 0x18141111, 0x07500889, 0x0572063e, 0x0e390f0f, 0x2f29231e,
|
0x0d790e39, 0x097b0ba3, 0x0aab0ccd, 0x1b161312, 0x05d10750, 0x03f004be, 0x09250a3d, 0x41362c23,
|
0x0ba30c31, 0x08420a3d, 0x0f0f1000, 0x1f191615, 0x04be063e, 0x02e903a8, 0x0ccd0e39, 0x58463629,
|
0x0a3d0aab, 0x071c08d4, 0x0a3d0aab, 0x241d1918, 0x03f00572, 0x023a02e9, 0x07c20925, 0x7358412f,
|
0x10001000, 0x10001000, 0x0e390f0f, 0x10101010, 0x0e390f0f, 0x0aab0ccd, 0x0aab0ccd, 0x18141211,
|
0x10001000, 0x0f0f1000, 0x09250a3d, 0x11101010, 0x0ccd0e39, 0x0a3d0aab, 0x063e07c2, 0x19181412,
|
0x10001000, 0x0e390f0f, 0x0ccd0e39, 0x12111010, 0x0aab0ccd, 0x09250a3d, 0x0a3d0aab, 0x1c191814,
|
0x0f0f1000, 0x0ccd0e39, 0x07c20925, 0x14121110, 0x0a3d0aab, 0x07c20925, 0x04be063e, 0x211c1918,
|
0x0e390f0f, 0x0aab0ccd, 0x0aab0ccd, 0x18141211, 0x09250a3d, 0x063e07c2, 0x09250a3d, 0x29211c19,
|
0x0ccd0e39, 0x0a3d0aab, 0x063e07c2, 0x19181412, 0x07c20925, 0x04be063e, 0x039b04be, 0x3629211c,
|
0x0aab0ccd, 0x09250a3d, 0x0a3d0aab, 0x1c191814, 0x063e07c2, 0x039b04be, 0x07c20925, 0x47362921,
|
0x0a3d0aab, 0x07c20925, 0x04be063e, 0x211c1918, 0x04be063e, 0x02d0039b, 0x02d0039b, 0x5b473629,
|
0x10001000, 0x10001000, 0x10101010, 0x10101010, 0x0e390f0f, 0x0aab0ccd, 0x10101010, 0x18141211,
|
0x10001000, 0x0f0f1000, 0x12111211, 0x11101010, 0x0ccd0e39, 0x0a3d0aab, 0x18141815, 0x19181412,
|
0x10001000, 0x0e390f0f, 0x10101010, 0x12111010, 0x0aab0ccd, 0x09250a3d, 0x11101010, 0x1c191814,
|
0x0f0f1000, 0x0ccd0e39, 0x14121311, 0x14121110, 0x0a3d0aab, 0x07c20925, 0x19181916, 0x211c1918,
|
0x0e390f0f, 0x0aab0ccd, 0x10101010, 0x18141211, 0x09250a3d, 0x063e07c2, 0x12111211, 0x29211c19,
|
0x0ccd0e39, 0x0a3d0aab, 0x18141614, 0x19181412, 0x07c20925, 0x04be063e, 0x1c191d19, 0x3629211c,
|
0x0aab0ccd, 0x09250a3d, 0x11101010, 0x1c191814, 0x063e07c2, 0x039b04be, 0x14121512, 0x47362921,
|
0x0a3d0aab, 0x07c20925, 0x19181b18, 0x211c1918, 0x04be063e, 0x02d0039b, 0x211c241f, 0x5b473629,
|
0x10001000, 0x10001000, 0x12111111, 0x10101010, 0x0e390f0f, 0x0aab0ccd, 0x18141814, 0x18141211,
|
0x10001000, 0x0f0f1000, 0x1c19231e, 0x11101010, 0x0ccd0e39, 0x0a3d0aab, 0x29212f29, 0x19181412,
|
0x10001000, 0x0e390f0f, 0x14121312, 0x12111010, 0x0aab0ccd, 0x09250a3d, 0x19181b16, 0x1c191814,
|
0x0f0f1000, 0x0ccd0e39, 0x211c2c23, 0x14121110, 0x0a3d0aab, 0x07c20925, 0x36294136, 0x211c1918,
|
0x0e390f0f, 0x0aab0ccd, 0x18141615, 0x18141211, 0x09250a3d, 0x063e07c2, 0x1c191f19, 0x29211c19,
|
0x0ccd0e39, 0x0a3d0aab, 0x29213629, 0x19181412, 0x07c20925, 0x04be063e, 0x47365846, 0x3629211c,
|
0x0aab0ccd, 0x09250a3d, 0x19181918, 0x1c191814, 0x063e07c2, 0x039b04be, 0x211c241d, 0x47362921,
|
0x0a3d0aab, 0x07c20925, 0x3629412f, 0x211c1918, 0x04be063e, 0x02d0039b, 0x5b477358, 0x5b473629,
|
0x10101010, 0x18151211, 0x10101010, 0x18141211, 0x10101010, 0x19161311, 0x11101010, 0x19181412,
|
0x12111010, 0x1d191614, 0x12111010, 0x1c191814, 0x15121010, 0x241f1b18, 0x14121110, 0x211c1918,
|
0x18141111, 0x2f29231e, 0x18141211, 0x29211c19, 0x1b161312, 0x41362c23, 0x19181412, 0x3629211c,
|
0x1f191615, 0x58463629, 0x1c191814, 0x47362921, 0x241d1918, 0x7358412f, 0x211c1918, 0x5b473629,
|
0x10101010, 0x18151211, 0x10101010, 0x18141211, 0x10101010, 0x19161311, 0x11101010, 0x19181412,
|
0x12111010, 0x1d191614, 0x12111010, 0x1c191814, 0x15121010, 0x241f1b18, 0x14121110, 0x211c1918,
|
0x18141111, 0x2f29231e, 0x18141211, 0x29211c19, 0x1b161312, 0x41362c23, 0x19181412, 0x3629211c,
|
0x1f191615, 0x58463629, 0x1c191814, 0x47362921, 0x241d1918, 0x7358412f, 0x211c1918, 0x5b473629,
|
0x10101010, 0x18151211, 0x10101010, 0x18141211, 0x10101010, 0x19161311, 0x11101010, 0x19181412,
|
0x12111010, 0x1d191614, 0x12111010, 0x1c191814, 0x15121010, 0x241f1b18, 0x14121110, 0x211c1918,
|
0x18141111, 0x2f29231e, 0x18141211, 0x29211c19, 0x1b161312, 0x41362c23, 0x19181412, 0x3629211c,
|
0x1f191615, 0x58463629, 0x1c191814, 0x47362921, 0x241d1918, 0x7358412f, 0x211c1918, 0x5b473629,
|
0x10001000, 0x10001000, 0x10001000, 0x10001000, 0x10101010, 0x10101010,
|
};
|
|
hal_h265e_dbg_func("enter\n");
|
|
memcpy(®->scaling_list_reg[0], vepu580_h265_scl_tab, sizeof(vepu580_h265_scl_tab));
|
|
hal_h265e_dbg_func("leave\n");
|
}
|
static void vepu580_h265_global_cfg_set(H265eV580HalContext *ctx, H265eV580RegSet *regs)
|
{
|
MppEncHwCfg *hw = &ctx->cfg->hw;
|
RK_U32 i;
|
hevc_vepu580_rc_klut *rc_regs = ®s->reg_rc_klut;
|
hevc_vepu580_wgt *reg_wgt = ®s->reg_wgt;
|
vepu580_rdo_cfg *reg_rdo = ®s->reg_rdo;
|
vepu580_h265_sobel_cfg(reg_wgt);
|
vepu580_h265_rdo_cfg(reg_rdo);
|
vepu580_h265_scl_cfg(reg_rdo);
|
|
memcpy(®_wgt->iprd_wgt_qp_hevc_0_51[0], lamd_satd_qp, sizeof(lamd_satd_qp));
|
|
if (ctx->frame_type == INTRA_FRAME) {
|
RK_U8 *thd = (RK_U8 *)&rc_regs->aq_tthd0;
|
RK_S8 *step = (RK_S8 *)&rc_regs->aq_stp0;
|
|
for (i = 0; i < MPP_ARRAY_ELEMS(aq_thd_default); i++) {
|
thd[i] = hw->aq_thrd_i[i];
|
step[i] = hw->aq_step_i[i] & 0x3f;
|
}
|
|
memcpy(®_wgt->rdo_wgta_qp_grpa_0_51[0], lamd_moda_qp, sizeof(lamd_moda_qp));
|
} else {
|
RK_U8 *thd = (RK_U8 *)&rc_regs->aq_tthd0;
|
RK_S8 *step = (RK_S8 *)&rc_regs->aq_stp0;
|
|
for (i = 0; i < MPP_ARRAY_ELEMS(aq_thd_default); i++) {
|
thd[i] = hw->aq_thrd_p[i];
|
step[i] = hw->aq_step_p[i] & 0x3f;
|
}
|
memcpy(®_wgt->rdo_wgta_qp_grpa_0_51[0], lamd_modb_qp, sizeof(lamd_modb_qp));
|
}
|
//to be done
|
rc_regs->madi_cfg.madi_mode = 0;
|
rc_regs->madi_cfg.madi_thd = 25;
|
rc_regs->md_sad_thd.md_sad_thd0 = 20;
|
rc_regs->md_sad_thd.md_sad_thd1 = 30;
|
rc_regs->md_sad_thd.md_sad_thd2 = 40;
|
rc_regs->madi_thd.madi_thd0 = 25;
|
rc_regs->madi_thd.madi_thd1 = 35;
|
rc_regs->madi_thd.madi_thd2 = 45;
|
|
reg_wgt->reg1484_qnt_bias_comb.qnt_bias_i = 171;
|
reg_wgt->reg1484_qnt_bias_comb.qnt_bias_p = 85;
|
|
memcpy(®_wgt->lvl32_intra_CST_THD0, lvl32_intra_cst_thd, sizeof(lvl32_intra_cst_thd));
|
memcpy(®_wgt->lvl16_intra_CST_THD0, lvl16_intra_cst_thd, sizeof(lvl16_intra_cst_thd));
|
memcpy(®_wgt->lvl32_intra_CST_WGT0, lvl32_intra_cst_wgt, sizeof(lvl32_intra_cst_wgt));
|
memcpy(®_wgt->lvl16_intra_CST_WGT0, lvl16_intra_cst_wgt, sizeof(lvl16_intra_cst_wgt));
|
|
reg_wgt->cime_sqi_cfg.cime_sad_mod_sel = 0;
|
reg_wgt->cime_sqi_cfg.cime_sad_use_big_block = 0;
|
reg_wgt->cime_sqi_cfg.cime_pmv_set_zero = 1;
|
reg_wgt->cime_sqi_cfg.cime_pmv_num = 3;
|
reg_wgt->cime_sqi_thd.cime_mvd_th0 = 32;
|
reg_wgt->cime_sqi_thd.cime_mvd_th1 = 80;
|
reg_wgt->cime_sqi_thd.cime_mvd_th2 = 128;
|
reg_wgt->cime_sqi_multi0.cime_multi0 = 16;
|
reg_wgt->cime_sqi_multi0.cime_multi1 = 32;
|
reg_wgt->cime_sqi_multi1.cime_multi2 = 96;
|
reg_wgt->cime_sqi_multi1.cime_multi3 = 96;
|
reg_wgt->rime_sqi_thd.cime_sad_th0 = 48;
|
reg_wgt->rime_sqi_thd.rime_mvd_th0 = 3;
|
reg_wgt->rime_sqi_thd.rime_mvd_th1 = 8;
|
reg_wgt->rime_sqi_multi.rime_multi0 = 16;
|
reg_wgt->rime_sqi_multi.rime_multi1 = 16;
|
reg_wgt->rime_sqi_multi.rime_multi2 = 128;
|
reg_wgt->fme_sqi_thd0.cime_sad_pu16_th = 16;
|
reg_wgt->fme_sqi_thd0.cime_sad_pu32_th = 16;
|
reg_wgt->fme_sqi_thd1.cime_sad_pu64_th = 16;
|
reg_wgt->fme_sqi_thd1.move_lambda = 1;
|
|
|
}
|
|
MPP_RET hal_h265e_v580_deinit(void *hal)
|
{
|
H265eV580HalContext *ctx = (H265eV580HalContext *)hal;
|
RK_U32 i = 0;
|
|
hal_h265e_enter();
|
|
for (i = 0; i < MAX_TILE_NUM; i++) {
|
MPP_FREE(ctx->regs[i]);
|
MPP_FREE(ctx->reg_out[i]);
|
}
|
|
MPP_FREE(ctx->poll_cfgs);
|
MPP_FREE(ctx->input_fmt);
|
hal_bufs_deinit(ctx->dpb_bufs);
|
|
if (ctx->hw_tile_buf[0]) {
|
mpp_buffer_put(ctx->hw_tile_buf[0]);
|
ctx->hw_tile_buf[0] = NULL;
|
}
|
|
if (ctx->hw_tile_buf[1]) {
|
mpp_buffer_put(ctx->hw_tile_buf[1]);
|
ctx->hw_tile_buf[1] = NULL;
|
}
|
|
if (ctx->hw_tile_stream) {
|
mpp_buffer_put(ctx->hw_tile_stream);
|
ctx->hw_tile_stream = NULL;
|
}
|
|
if (ctx->tile_grp) {
|
mpp_buffer_group_put(ctx->tile_grp);
|
ctx->tile_grp = NULL;
|
}
|
|
if (ctx->buf_pass1) {
|
mpp_buffer_put(ctx->buf_pass1);
|
ctx->buf_pass1 = NULL;
|
}
|
|
if (ctx->dev) {
|
mpp_dev_deinit(ctx->dev);
|
ctx->dev = NULL;
|
}
|
|
if (ctx->reg_cfg) {
|
mpp_dev_multi_offset_deinit(ctx->reg_cfg);
|
ctx->reg_cfg = NULL;
|
}
|
|
if (ctx->tune) {
|
vepu580_h265e_tune_deinit(ctx->tune);
|
ctx->tune = NULL;
|
}
|
hal_h265e_leave();
|
return MPP_OK;
|
}
|
|
MPP_RET hal_h265e_v580_init(void *hal, MppEncHalCfg *cfg)
|
{
|
MPP_RET ret = MPP_OK;
|
H265eV580HalContext *ctx = (H265eV580HalContext *)hal;
|
RK_U32 i = 0;
|
H265eV580RegSet *regs = NULL;
|
|
mpp_env_get_u32("hal_h265e_debug", &hal_h265e_debug, 0);
|
|
hal_h265e_enter();
|
|
for (i = 0; i < MAX_TILE_NUM; i++) {
|
ctx->regs[i] = mpp_calloc(H265eV580RegSet, 1);
|
ctx->reg_out[i] = mpp_calloc(H265eV580StatusElem, 1);
|
}
|
|
ctx->input_fmt = mpp_calloc(VepuFmtCfg, 1);
|
ctx->cfg = cfg->cfg;
|
hal_bufs_init(&ctx->dpb_bufs);
|
|
ctx->frame_cnt = 0;
|
ctx->frame_cnt_gen_ready = 0;
|
ctx->enc_mode = RKV_ENC_MODE;
|
cfg->type = VPU_CLIENT_RKVENC;
|
ret = mpp_dev_init(&cfg->dev, cfg->type);
|
if (ret) {
|
mpp_err_f("mpp_dev_init failed. ret: %d\n", ret);
|
goto DONE;
|
}
|
regs = (H265eV580RegSet *)ctx->regs[0];
|
ctx->dev = cfg->dev;
|
ctx->osd_cfg.reg_base = (void *)®s->reg_osd_cfg;
|
ctx->osd_cfg.dev = ctx->dev;
|
ctx->osd_cfg.plt_cfg = &ctx->cfg->plt_cfg;
|
ctx->osd_cfg.osd_data = NULL;
|
ctx->osd_cfg.osd_data2 = NULL;
|
|
mpp_dev_multi_offset_init(&ctx->reg_cfg, 24);
|
ctx->osd_cfg.reg_cfg = ctx->reg_cfg;
|
|
ctx->frame_type = INTRA_FRAME;
|
|
{ /* setup default hardware config */
|
MppEncHwCfg *hw = &cfg->cfg->hw;
|
|
hw->qp_delta_row_i = 2;
|
hw->qp_delta_row = 2;
|
|
memcpy(hw->aq_thrd_i, aq_thd_default, sizeof(hw->aq_thrd_i));
|
memcpy(hw->aq_thrd_p, aq_thd_default, sizeof(hw->aq_thrd_p));
|
memcpy(hw->aq_step_i, aq_qp_dealt_default, sizeof(hw->aq_step_i));
|
memcpy(hw->aq_step_p, aq_qp_dealt_default, sizeof(hw->aq_step_p));
|
}
|
|
ctx->tune = vepu580_h265e_tune_init(ctx);
|
|
{
|
// check parall tile ability
|
const MppServiceCmdCap *cap = mpp_get_mpp_service_cmd_cap();
|
|
ctx->tile_parall_en = cap->send_cmd > MPP_CMD_SET_SESSION_FD;
|
}
|
|
ctx->poll_slice_max = 8;
|
ctx->poll_cfg_size = (sizeof(ctx->poll_cfgs) + sizeof(RK_S32) * ctx->poll_slice_max) * 2;
|
ctx->poll_cfgs = mpp_malloc_size(MppDevPollCfg, ctx->poll_cfg_size);
|
|
if (NULL == ctx->poll_cfgs) {
|
ret = MPP_ERR_MALLOC;
|
mpp_err_f("init poll cfg buffer failed\n");
|
goto DONE;
|
}
|
ctx->output_cb = cfg->output_cb;
|
cfg->cap_recn_out = 1;
|
DONE:
|
if (ret)
|
hal_h265e_v580_deinit(hal);
|
|
hal_h265e_leave();
|
return ret;
|
}
|
static MPP_RET hal_h265e_vepu580_prepare(void *hal)
|
{
|
H265eV580HalContext *ctx = (H265eV580HalContext *)hal;
|
MppEncPrepCfg *prep = &ctx->cfg->prep;
|
|
hal_h265e_dbg_func("enter %p\n", hal);
|
|
if (prep->change & (MPP_ENC_PREP_CFG_CHANGE_INPUT | MPP_ENC_PREP_CFG_CHANGE_FORMAT)) {
|
RK_S32 i;
|
|
// pre-alloc required buffers to reduce first frame delay
|
vepu580_h265_setup_hal_bufs(ctx);
|
for (i = 0; i < ctx->max_buf_cnt; i++)
|
hal_bufs_get_buf(ctx->dpb_bufs, i);
|
|
prep->change = 0;
|
}
|
|
hal_h265e_dbg_func("leave %p\n", hal);
|
|
return MPP_OK;
|
}
|
|
static MPP_RET
|
vepu580_h265_set_patch_info(MppDevRegOffCfgs *cfgs, H265eSyntax_new *syn,
|
Vepu541Fmt input_fmt, HalEncTask *task)
|
{
|
MppFrameFormat fmt = mpp_frame_get_fmt(task->frame);
|
RK_U32 hor_stride = syn->pp.hor_stride;
|
RK_U32 ver_stride = syn->pp.ver_stride ? syn->pp.ver_stride : syn->pp.pic_height;
|
RK_U32 frame_size = hor_stride * ver_stride;
|
RK_U32 u_offset = 0, v_offset = 0;
|
MPP_RET ret = MPP_OK;
|
|
if (task->rc_task->frm.use_pass1)
|
fmt = MPP_FMT_YUV420SP;
|
|
if (MPP_FRAME_FMT_IS_FBC(fmt)) {
|
u_offset = mpp_frame_get_fbc_offset(task->frame);
|
v_offset = 0;
|
} else {
|
switch (input_fmt) {
|
case VEPU541_FMT_YUV420P: {
|
u_offset = frame_size;
|
v_offset = frame_size * 5 / 4;
|
} break;
|
case VEPU541_FMT_YUV420SP:
|
case VEPU541_FMT_YUV422SP: {
|
u_offset = frame_size;
|
v_offset = frame_size;
|
} break;
|
case VEPU541_FMT_YUV422P: {
|
u_offset = frame_size;
|
v_offset = frame_size * 3 / 2;
|
} break;
|
case VEPU541_FMT_YUYV422:
|
case VEPU541_FMT_UYVY422: {
|
u_offset = 0;
|
v_offset = 0;
|
} break;
|
case VEPU580_FMT_YUV444SP : {
|
u_offset = hor_stride * ver_stride;
|
v_offset = hor_stride * ver_stride;
|
} break;
|
case VEPU580_FMT_YUV444P : {
|
u_offset = hor_stride * ver_stride;
|
v_offset = hor_stride * ver_stride * 2;
|
} break;
|
case VEPU541_FMT_BGR565:
|
case VEPU541_FMT_BGR888:
|
case VEPU541_FMT_BGRA8888: {
|
u_offset = 0;
|
v_offset = 0;
|
} break;
|
default: {
|
hal_h265e_err("unknown color space: %d\n", input_fmt);
|
u_offset = frame_size;
|
v_offset = frame_size * 5 / 4;
|
}
|
}
|
}
|
|
/* input cb addr */
|
ret = mpp_dev_multi_offset_update(cfgs, 161, u_offset);
|
if (ret)
|
mpp_err_f("set input cb addr offset failed %d\n", ret);
|
|
/* input cr addr */
|
ret = mpp_dev_multi_offset_update(cfgs, 162, v_offset);
|
if (ret)
|
mpp_err_f("set input cr addr offset failed %d\n", ret);
|
|
return ret;
|
}
|
|
static MPP_RET vepu580_h265_set_roi_regs(H265eV580HalContext *ctx, hevc_vepu580_base *regs)
|
{
|
/* memset register on start so do not clear registers again here */
|
if (ctx->roi_data) {
|
/* roi setup */
|
MppEncROICfg2 *cfg = ( MppEncROICfg2 *)ctx->roi_data;
|
|
regs->reg0192_enc_pic.roi_en = 1;
|
regs->reg0178_roi_addr = mpp_buffer_get_fd(cfg->base_cfg_buf);
|
if (cfg->roi_qp_en) {
|
regs->reg0179_roi_qp_addr = mpp_buffer_get_fd(cfg->qp_cfg_buf);
|
regs->reg0228_roi_en.roi_qp_en = 1;
|
}
|
|
if (cfg->roi_amv_en) {
|
regs->reg0180_roi_amv_addr = mpp_buffer_get_fd(cfg->amv_cfg_buf);
|
regs->reg0228_roi_en.roi_amv_en = 1;
|
}
|
|
if (cfg->roi_mv_en) {
|
regs->reg0181_roi_mv_addr = mpp_buffer_get_fd(cfg->mv_cfg_buf);
|
regs->reg0228_roi_en.roi_mv_en = 1;
|
}
|
}
|
|
return MPP_OK;
|
}
|
|
static MPP_RET vepu580_h265_set_rc_regs(H265eV580HalContext *ctx, H265eV580RegSet *regs, HalEncTask *task)
|
{
|
H265eSyntax_new *syn = (H265eSyntax_new *)task->syntax.data;
|
EncRcTaskInfo *rc_cfg = &task->rc_task->info;
|
hevc_vepu580_base *reg_base = ®s->reg_base;
|
hevc_vepu580_rc_klut *reg_rc = ®s->reg_rc_klut;
|
MppEncCfgSet *cfg = ctx->cfg;
|
MppEncRcCfg *rc = &cfg->rc;
|
MppEncHwCfg *hw = &cfg->hw;
|
MppEncCodecCfg *codec = &cfg->codec;
|
MppEncH265Cfg *h265 = &codec->h265;
|
RK_S32 mb_wd64, mb_h64;
|
mb_wd64 = (syn->pp.pic_width + 63) / 64;
|
mb_h64 = (syn->pp.pic_height + 63) / 64;
|
|
RK_U32 ctu_target_bits_mul_16 = (rc_cfg->bit_target << 4) / (mb_wd64 * mb_h64);
|
RK_U32 ctu_target_bits;
|
RK_S32 negative_bits_thd, positive_bits_thd;
|
|
if (rc->rc_mode == MPP_ENC_RC_MODE_FIXQP) {
|
reg_base->reg0192_enc_pic.pic_qp = rc_cfg->quality_target;
|
reg_base->reg0240_synt_sli1.sli_qp = rc_cfg->quality_target;
|
|
reg_base->reg213_rc_qp.rc_max_qp = rc_cfg->quality_target;
|
reg_base->reg213_rc_qp.rc_min_qp = rc_cfg->quality_target;
|
} else {
|
if (ctu_target_bits_mul_16 >= 0x100000) {
|
ctu_target_bits_mul_16 = 0x50000;
|
}
|
ctu_target_bits = (ctu_target_bits_mul_16 * mb_wd64) >> 4;
|
negative_bits_thd = 0 - 5 * ctu_target_bits / 16;
|
positive_bits_thd = 5 * ctu_target_bits / 16;
|
|
reg_base->reg0192_enc_pic.pic_qp = rc_cfg->quality_target;
|
reg_base->reg0240_synt_sli1.sli_qp = rc_cfg->quality_target;
|
reg_base->reg212_rc_cfg.rc_en = 1;
|
reg_base->reg212_rc_cfg.aq_en = 1;
|
reg_base->reg212_rc_cfg.aq_mode = 1;
|
reg_base->reg212_rc_cfg.rc_ctu_num = mb_wd64;
|
reg_base->reg213_rc_qp.rc_qp_range = (ctx->frame_type == INTRA_FRAME) ?
|
hw->qp_delta_row_i : hw->qp_delta_row;
|
reg_base->reg213_rc_qp.rc_max_qp = rc_cfg->quality_max;
|
reg_base->reg213_rc_qp.rc_min_qp = rc_cfg->quality_min;
|
reg_base->reg214_rc_tgt.ctu_ebit = ctu_target_bits_mul_16;
|
|
reg_rc->rc_dthd_0_8[0] = 2 * negative_bits_thd;
|
reg_rc->rc_dthd_0_8[1] = negative_bits_thd;
|
reg_rc->rc_dthd_0_8[2] = positive_bits_thd;
|
reg_rc->rc_dthd_0_8[3] = 2 * positive_bits_thd;
|
reg_rc->rc_dthd_0_8[4] = 0x7FFFFFFF;
|
reg_rc->rc_dthd_0_8[5] = 0x7FFFFFFF;
|
reg_rc->rc_dthd_0_8[6] = 0x7FFFFFFF;
|
reg_rc->rc_dthd_0_8[7] = 0x7FFFFFFF;
|
reg_rc->rc_dthd_0_8[8] = 0x7FFFFFFF;
|
|
reg_rc->rc_adj0.qp_adj0 = -2;
|
reg_rc->rc_adj0.qp_adj1 = -1;
|
reg_rc->rc_adj0.qp_adj2 = 0;
|
reg_rc->rc_adj0.qp_adj3 = 1;
|
reg_rc->rc_adj0.qp_adj4 = 2;
|
reg_rc->rc_adj1.qp_adj5 = 0;
|
reg_rc->rc_adj1.qp_adj6 = 0;
|
reg_rc->rc_adj1.qp_adj7 = 0;
|
reg_rc->rc_adj1.qp_adj8 = 0;
|
|
reg_rc->roi_qthd0.qpmin_area0 = h265->qpmin_map[0] > 0 ? h265->qpmin_map[0] : rc_cfg->quality_min;
|
reg_rc->roi_qthd0.qpmax_area0 = h265->qpmax_map[0] > 0 ? h265->qpmax_map[0] : rc_cfg->quality_max;
|
reg_rc->roi_qthd0.qpmin_area1 = h265->qpmin_map[1] > 0 ? h265->qpmin_map[1] : rc_cfg->quality_min;
|
reg_rc->roi_qthd0.qpmax_area1 = h265->qpmax_map[1] > 0 ? h265->qpmax_map[1] : rc_cfg->quality_max;
|
reg_rc->roi_qthd0.qpmin_area2 = h265->qpmin_map[2] > 0 ? h265->qpmin_map[2] : rc_cfg->quality_min;;
|
reg_rc->roi_qthd1.qpmax_area2 = h265->qpmax_map[2] > 0 ? h265->qpmax_map[2] : rc_cfg->quality_max;
|
reg_rc->roi_qthd1.qpmin_area3 = h265->qpmin_map[3] > 0 ? h265->qpmin_map[3] : rc_cfg->quality_min;;
|
reg_rc->roi_qthd1.qpmax_area3 = h265->qpmax_map[3] > 0 ? h265->qpmax_map[3] : rc_cfg->quality_max;
|
reg_rc->roi_qthd1.qpmin_area4 = h265->qpmin_map[4] > 0 ? h265->qpmin_map[4] : rc_cfg->quality_min;;
|
reg_rc->roi_qthd1.qpmax_area4 = h265->qpmax_map[4] > 0 ? h265->qpmax_map[4] : rc_cfg->quality_max;
|
reg_rc->roi_qthd2.qpmin_area5 = h265->qpmin_map[5] > 0 ? h265->qpmin_map[5] : rc_cfg->quality_min;;
|
reg_rc->roi_qthd2.qpmax_area5 = h265->qpmax_map[5] > 0 ? h265->qpmax_map[5] : rc_cfg->quality_max;
|
reg_rc->roi_qthd2.qpmin_area6 = h265->qpmin_map[6] > 0 ? h265->qpmin_map[6] : rc_cfg->quality_min;;
|
reg_rc->roi_qthd2.qpmax_area6 = h265->qpmax_map[6] > 0 ? h265->qpmax_map[6] : rc_cfg->quality_max;
|
reg_rc->roi_qthd2.qpmin_area7 = h265->qpmin_map[7] > 0 ? h265->qpmin_map[7] : rc_cfg->quality_min;;
|
reg_rc->roi_qthd3.qpmax_area7 = h265->qpmax_map[7] > 0 ? h265->qpmax_map[7] : rc_cfg->quality_max;
|
reg_rc->roi_qthd3.qpmap_mode = h265->qpmap_mode;
|
}
|
return MPP_OK;
|
}
|
|
static MPP_RET vepu580_h265_set_pp_regs(H265eV580RegSet *regs, VepuFmtCfg *fmt,
|
MppEncPrepCfg *prep_cfg, HalEncTask *task)
|
{
|
hevc_vepu580_control_cfg *reg_ctl = ®s->reg_ctl;
|
hevc_vepu580_base *reg_base = ®s->reg_base;
|
RK_S32 stridey = 0;
|
RK_S32 stridec = 0;
|
|
reg_ctl->reg0012_dtrns_map.src_bus_edin = fmt->src_endian;
|
reg_base->reg0198_src_fmt.src_cfmt = fmt->format;
|
reg_base->reg0198_src_fmt.alpha_swap = fmt->alpha_swap;
|
reg_base->reg0198_src_fmt.rbuv_swap = fmt->rbuv_swap;
|
reg_base->reg0198_src_fmt.src_range = fmt->src_range;
|
reg_base->reg0198_src_fmt.out_fmt = 1;
|
reg_base->reg0203_src_proc.src_mirr = prep_cfg->mirroring > 0;
|
reg_base->reg0203_src_proc.src_rot = prep_cfg->rotation;
|
|
if (MPP_FRAME_FMT_IS_FBC(prep_cfg->format)) {
|
stridey = mpp_frame_get_fbc_hdr_stride(task->frame);
|
if (!stridey)
|
stridey = MPP_ALIGN(prep_cfg->width, 16);
|
} else if (prep_cfg->hor_stride) {
|
stridey = prep_cfg->hor_stride;
|
} else {
|
if (fmt->format == VEPU541_FMT_BGRA8888 )
|
stridey = prep_cfg->width * 4;
|
else if (fmt->format == VEPU541_FMT_BGR888 )
|
stridey = prep_cfg->width * 3;
|
else if (fmt->format == VEPU541_FMT_BGR565 ||
|
fmt->format == VEPU541_FMT_YUYV422 ||
|
fmt->format == VEPU541_FMT_UYVY422)
|
stridey = prep_cfg->width * 2;
|
else
|
stridey = prep_cfg->width;
|
}
|
|
switch (fmt->format) {
|
case VEPU580_FMT_YUV444SP : {
|
stridec = stridey * 2;
|
} break;
|
case VEPU541_FMT_YUV422SP :
|
case VEPU541_FMT_YUV420SP :
|
case VEPU580_FMT_YUV444P : {
|
stridec = stridey;
|
} break;
|
default : {
|
stridec = stridey / 2;
|
} break;
|
}
|
|
if (reg_base->reg0198_src_fmt.src_cfmt < VEPU541_FMT_NONE) {
|
reg_base->reg0199_src_udfy.csc_wgt_r2y = 66;
|
reg_base->reg0199_src_udfy.csc_wgt_g2y = 129;
|
reg_base->reg0199_src_udfy.csc_wgt_b2y = 25;
|
|
reg_base->reg0200_src_udfu.csc_wgt_r2u = -38;
|
reg_base->reg0200_src_udfu.csc_wgt_g2u = -74;
|
reg_base->reg0200_src_udfu.csc_wgt_b2u = 112;
|
|
reg_base->reg0201_src_udfv.csc_wgt_r2v = 112;
|
reg_base->reg0201_src_udfv.csc_wgt_g2v = -94;
|
reg_base->reg0201_src_udfv.csc_wgt_b2v = -18;
|
|
reg_base->reg0202_src_udfo.csc_ofst_y = 16;
|
reg_base->reg0202_src_udfo.csc_ofst_u = 128;
|
reg_base->reg0202_src_udfo.csc_ofst_v = 128;
|
}
|
|
reg_base->reg0205_src_strd0.src_strd0 = stridey;
|
reg_base->reg0206_src_strd1.src_strd1 = stridec;
|
|
return MPP_OK;
|
}
|
|
static void vepu580_h265_set_slice_regs(H265eSyntax_new *syn, hevc_vepu580_base *regs)
|
{
|
regs->reg0237_synt_sps.smpl_adpt_ofst_e = syn->pp.sample_adaptive_offset_enabled_flag;//slice->m_sps->m_bUseSAO;
|
regs->reg0237_synt_sps.num_st_ref_pic = syn->pp.num_short_term_ref_pic_sets;
|
regs->reg0237_synt_sps.num_lt_ref_pic = syn->pp.num_long_term_ref_pics_sps;
|
regs->reg0237_synt_sps.lt_ref_pic_prsnt = syn->pp.long_term_ref_pics_present_flag;
|
regs->reg0237_synt_sps.tmpl_mvp_e = syn->pp.sps_temporal_mvp_enabled_flag;
|
regs->reg0237_synt_sps.log2_max_poc_lsb = syn->pp.log2_max_pic_order_cnt_lsb_minus4;
|
regs->reg0237_synt_sps.strg_intra_smth = syn->pp.strong_intra_smoothing_enabled_flag;
|
|
regs->reg0238_synt_pps.dpdnt_sli_seg_en = syn->pp.dependent_slice_segments_enabled_flag;
|
regs->reg0238_synt_pps.out_flg_prsnt_flg = syn->pp.output_flag_present_flag;
|
regs->reg0238_synt_pps.num_extr_sli_hdr = syn->pp.num_extra_slice_header_bits;
|
regs->reg0238_synt_pps.sgn_dat_hid_en = syn->pp.sign_data_hiding_enabled_flag;
|
regs->reg0238_synt_pps.cbc_init_prsnt_flg = syn->pp.cabac_init_present_flag;
|
regs->reg0238_synt_pps.pic_init_qp = syn->pp.init_qp_minus26 + 26;
|
regs->reg0238_synt_pps.cu_qp_dlt_en = syn->pp.cu_qp_delta_enabled_flag;
|
regs->reg0238_synt_pps.chrm_qp_ofst_prsn = syn->pp.pps_slice_chroma_qp_offsets_present_flag;
|
regs->reg0238_synt_pps.lp_fltr_acrs_sli = syn->pp.pps_loop_filter_across_slices_enabled_flag;
|
regs->reg0238_synt_pps.dblk_fltr_ovrd_en = syn->pp.deblocking_filter_override_enabled_flag;
|
regs->reg0238_synt_pps.lst_mdfy_prsnt_flg = syn->pp.lists_modification_present_flag;
|
regs->reg0238_synt_pps.sli_seg_hdr_extn = syn->pp.slice_segment_header_extension_present_flag;
|
regs->reg0238_synt_pps.cu_qp_dlt_depth = syn->pp.diff_cu_qp_delta_depth;
|
regs->reg0238_synt_pps.lpf_fltr_acrs_til = syn->pp.loop_filter_across_tiles_enabled_flag;
|
|
regs->reg0239_synt_sli0.cbc_init_flg = syn->sp.cbc_init_flg;
|
regs->reg0239_synt_sli0.mvd_l1_zero_flg = syn->sp.mvd_l1_zero_flg;
|
regs->reg0239_synt_sli0.mrg_up_flg = syn->sp.merge_up_flag;
|
regs->reg0239_synt_sli0.mrg_lft_flg = syn->sp.merge_left_flag;
|
regs->reg0239_synt_sli0.ref_pic_lst_mdf_l0 = syn->sp.ref_pic_lst_mdf_l0;
|
|
regs->reg0239_synt_sli0.num_refidx_l1_act = syn->sp.num_refidx_l1_act;
|
regs->reg0239_synt_sli0.num_refidx_l0_act = syn->sp.num_refidx_l0_act;
|
|
regs->reg0239_synt_sli0.num_refidx_act_ovrd = syn->sp.num_refidx_act_ovrd;
|
|
regs->reg0239_synt_sli0.sli_sao_chrm_flg = syn->sp.sli_sao_chrm_flg;
|
regs->reg0239_synt_sli0.sli_sao_luma_flg = syn->sp.sli_sao_luma_flg;
|
regs->reg0239_synt_sli0.sli_tmprl_mvp_e = syn->sp.sli_tmprl_mvp_en;
|
regs->reg0192_enc_pic.num_pic_tot_cur = syn->sp.tot_poc_num;
|
|
regs->reg0239_synt_sli0.pic_out_flg = syn->sp.pic_out_flg;
|
regs->reg0239_synt_sli0.sli_type = syn->sp.slice_type;
|
regs->reg0239_synt_sli0.sli_rsrv_flg = syn->sp.slice_rsrv_flg;
|
regs->reg0239_synt_sli0.dpdnt_sli_seg_flg = syn->sp.dpdnt_sli_seg_flg;
|
regs->reg0239_synt_sli0.sli_pps_id = syn->sp.sli_pps_id;
|
regs->reg0239_synt_sli0.no_out_pri_pic = syn->sp.no_out_pri_pic;
|
|
|
regs->reg0240_synt_sli1.sp_tc_ofst_div2 = syn->sp.sli_tc_ofst_div2;;
|
regs->reg0240_synt_sli1.sp_beta_ofst_div2 = syn->sp.sli_beta_ofst_div2;
|
regs->reg0240_synt_sli1.sli_lp_fltr_acrs_sli = syn->sp.sli_lp_fltr_acrs_sli;
|
regs->reg0240_synt_sli1.sp_dblk_fltr_dis = syn->sp.sli_dblk_fltr_dis;
|
regs->reg0240_synt_sli1.dblk_fltr_ovrd_flg = syn->sp.dblk_fltr_ovrd_flg;
|
regs->reg0240_synt_sli1.sli_cb_qp_ofst = syn->sp.sli_cb_qp_ofst;
|
regs->reg0240_synt_sli1.max_mrg_cnd = syn->sp.max_mrg_cnd;
|
|
regs->reg0240_synt_sli1.col_ref_idx = syn->sp.col_ref_idx;
|
regs->reg0240_synt_sli1.col_frm_l0_flg = syn->sp.col_frm_l0_flg;
|
regs->reg0241_synt_sli2.sli_poc_lsb = syn->sp.sli_poc_lsb;
|
regs->reg0241_synt_sli2.sli_hdr_ext_len = syn->sp.sli_hdr_ext_len;
|
|
}
|
|
static void vepu580_h265_set_ref_regs(H265eSyntax_new *syn, hevc_vepu580_base *regs)
|
{
|
regs->reg0242_synt_refm0.st_ref_pic_flg = syn->sp.st_ref_pic_flg;
|
regs->reg0242_synt_refm0.poc_lsb_lt0 = syn->sp.poc_lsb_lt0;
|
regs->reg0242_synt_refm0.num_lt_pic = syn->sp.num_lt_pic;
|
|
regs->reg0243_synt_refm1.dlt_poc_msb_prsnt0 = syn->sp.dlt_poc_msb_prsnt0;
|
regs->reg0243_synt_refm1.dlt_poc_msb_cycl0 = syn->sp.dlt_poc_msb_cycl0;
|
regs->reg0243_synt_refm1.used_by_lt_flg0 = syn->sp.used_by_lt_flg0;
|
regs->reg0243_synt_refm1.used_by_lt_flg1 = syn->sp.used_by_lt_flg1;
|
regs->reg0243_synt_refm1.used_by_lt_flg2 = syn->sp.used_by_lt_flg2;
|
regs->reg0243_synt_refm1.dlt_poc_msb_prsnt0 = syn->sp.dlt_poc_msb_prsnt0;
|
regs->reg0243_synt_refm1.dlt_poc_msb_cycl0 = syn->sp.dlt_poc_msb_cycl0;
|
regs->reg0243_synt_refm1.dlt_poc_msb_prsnt1 = syn->sp.dlt_poc_msb_prsnt1;
|
regs->reg0243_synt_refm1.num_negative_pics = syn->sp.num_neg_pic;
|
regs->reg0243_synt_refm1.num_pos_pic = syn->sp.num_pos_pic;
|
|
regs->reg0243_synt_refm1.used_by_s0_flg = syn->sp.used_by_s0_flg;
|
regs->reg0244_synt_refm2.dlt_poc_s0_m10 = syn->sp.dlt_poc_s0_m10;
|
regs->reg0244_synt_refm2.dlt_poc_s0_m11 = syn->sp.dlt_poc_s0_m11;
|
regs->reg0245_synt_refm3.dlt_poc_s0_m12 = syn->sp.dlt_poc_s0_m12;
|
regs->reg0245_synt_refm3.dlt_poc_s0_m13 = syn->sp.dlt_poc_s0_m13;
|
|
regs->reg0246_synt_long_refm0.poc_lsb_lt1 = syn->sp.poc_lsb_lt1;
|
regs->reg0247_synt_long_refm1.dlt_poc_msb_cycl1 = syn->sp.dlt_poc_msb_cycl1;
|
regs->reg0246_synt_long_refm0.poc_lsb_lt2 = syn->sp.poc_lsb_lt2;
|
regs->reg0243_synt_refm1.dlt_poc_msb_prsnt2 = syn->sp.dlt_poc_msb_prsnt2;
|
regs->reg0247_synt_long_refm1.dlt_poc_msb_cycl2 = syn->sp.dlt_poc_msb_cycl2;
|
regs->reg0240_synt_sli1.lst_entry_l0 = syn->sp.lst_entry_l0;
|
regs->reg0239_synt_sli0.ref_pic_lst_mdf_l0 = syn->sp.ref_pic_lst_mdf_l0;
|
|
return;
|
}
|
|
static MPP_RET hal_h265e_v580_send_regs(MppDev dev, H265eV580RegSet *hw_regs, H265eV580StatusElem *reg_out)
|
{
|
RK_U32 *regs = (RK_U32*)hw_regs;
|
MppDevRegWrCfg cfg;
|
MppDevRegRdCfg cfg1;
|
MPP_RET ret = MPP_OK;
|
RK_U32 i;
|
|
cfg.reg = (RK_U32*)&hw_regs->reg_ctl;
|
cfg.size = sizeof(hevc_vepu580_control_cfg);
|
cfg.offset = VEPU580_CTL_OFFSET;
|
|
ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &cfg);
|
if (ret) {
|
mpp_err_f("set register write failed %d\n", ret);
|
goto FAILE;
|
}
|
|
if (hal_h265e_debug & HAL_H265E_DBG_CTL_REGS) {
|
regs = (RK_U32*)&hw_regs->reg_ctl;
|
for (i = 0; i < sizeof(hevc_vepu580_control_cfg) / 4; i++) {
|
hal_h265e_dbg_ctl("ctl reg[%04x]: 0%08x\n", i * 4, regs[i]);
|
}
|
}
|
|
cfg.reg = &hw_regs->reg_base;
|
cfg.size = sizeof(hevc_vepu580_base);
|
cfg.offset = VEPU580_BASE_OFFSET;
|
|
ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &cfg);
|
if (ret) {
|
mpp_err_f("set register write failed %d\n", ret);
|
goto FAILE;
|
}
|
|
if (hal_h265e_debug & HAL_H265E_DBG_REGS) {
|
regs = (RK_U32*)(&hw_regs->reg_base);
|
for (i = 0; i < 32; i++) {
|
hal_h265e_dbg_regs("hw add cfg reg[%04x]: 0%08x\n", i * 4, regs[i]);
|
}
|
regs += 32;
|
for (i = 0; i < (sizeof(hevc_vepu580_base) - 128) / 4; i++) {
|
hal_h265e_dbg_regs("set reg[%04x]: 0%08x\n", i * 4, regs[i]);
|
}
|
}
|
|
cfg.reg = &hw_regs->reg_rc_klut;
|
cfg.size = sizeof(hevc_vepu580_rc_klut);
|
cfg.offset = VEPU580_RCKULT_OFFSET;
|
|
ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &cfg);
|
|
if (hal_h265e_debug & HAL_H265E_DBG_RCKUT_REGS) {
|
regs = (RK_U32*)&hw_regs->reg_rc_klut;
|
for (i = 0; i < sizeof(hevc_vepu580_rc_klut) / 4; i++) {
|
hal_h265e_dbg_rckut("set reg[%04x]: 0%08x\n", i * 4, regs[i]);
|
}
|
}
|
|
if (ret) {
|
mpp_err_f("set rc kult write failed %d\n", ret);
|
goto FAILE;
|
}
|
|
cfg.reg = &hw_regs->reg_wgt;
|
cfg.size = sizeof(hevc_vepu580_wgt);
|
cfg.offset = VEPU580_WEG_OFFSET;
|
|
ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &cfg);
|
if (ret) {
|
mpp_err_f("set register write failed %d\n", ret);
|
goto FAILE;
|
}
|
|
if (hal_h265e_debug & HAL_H265E_DBG_WGT_REGS) {
|
regs = (RK_U32*)&hw_regs->reg_wgt;
|
for (i = 0; i < sizeof(hevc_vepu580_wgt) / 4; i++) {
|
hal_h265e_dbg_wgt("set reg[%04x]: 0%08x\n", i * 4, regs[i]);
|
}
|
}
|
|
cfg.reg = &hw_regs->reg_rdo;
|
cfg.size = sizeof(vepu580_rdo_cfg);
|
cfg.offset = VEPU580_RDOCFG_OFFSET;
|
|
ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &cfg);
|
if (ret) {
|
mpp_err_f("set register write failed %d\n", ret);
|
goto FAILE;
|
}
|
|
cfg.reg = &hw_regs->reg_osd_cfg;
|
cfg.size = sizeof(vepu580_osd_cfg);
|
cfg.offset = VEPU580_OSD_OFFSET;
|
|
ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &cfg);
|
if (ret) {
|
mpp_err_f("set register write failed %d\n", ret);
|
goto FAILE;
|
}
|
|
cfg1.reg = ®_out->hw_status;
|
cfg1.size = sizeof(RK_U32);
|
cfg1.offset = VEPU580_REG_BASE_HW_STATUS;
|
|
ret = mpp_dev_ioctl(dev, MPP_DEV_REG_RD, &cfg1);
|
if (ret) {
|
mpp_err_f("set register read failed %d\n", ret);
|
goto FAILE;
|
}
|
|
cfg1.reg = ®_out->st;
|
cfg1.size = sizeof(H265eV580StatusElem) - 4;
|
cfg1.offset = VEPU580_STATUS_OFFSET;
|
|
ret = mpp_dev_ioctl(dev, MPP_DEV_REG_RD, &cfg1);
|
if (ret) {
|
mpp_err_f("set register read failed %d\n", ret);
|
goto FAILE;
|
}
|
FAILE:
|
return ret;
|
}
|
|
static void vepu580_h265_set_me_regs(H265eV580HalContext *ctx, H265eSyntax_new *syn, hevc_vepu580_base *regs)
|
{
|
|
RK_U32 cime_w = 11, cime_h = 7;
|
RK_S32 merangx = (cime_w + 1) * 32;
|
RK_S32 merangy = (cime_h + 1) * 32;
|
RK_S32 pic_wd64 = MPP_ALIGN(syn->pp.pic_width, 64) >> 6;
|
|
if (merangx > 384) {
|
merangx = 384;
|
}
|
if (merangy > 320) {
|
merangy = 320;
|
}
|
|
if (syn->pp.pic_width < merangx + 60 || syn->pp.pic_width <= 352) {
|
if (merangx > syn->pp.pic_width ) {
|
merangx = syn->pp.pic_width;
|
}
|
merangx = merangx / 4 * 2;
|
}
|
|
if (syn->pp.pic_height < merangy + 60 || syn->pp.pic_height <= 288) {
|
if (merangy > syn->pp.pic_height) {
|
merangy = syn->pp.pic_height;
|
}
|
merangy = merangy / 4 * 2;
|
}
|
|
{
|
RK_S32 merange_x = merangx / 2;
|
RK_S32 merange_y = merangy / 2;
|
RK_S32 mxneg = ((-(merange_x << 2)) >> 2) / 4;
|
RK_S32 myneg = ((-(merange_y << 2)) >> 2) / 4;
|
RK_S32 mxpos = (((merange_x << 2) - 4) >> 2) / 4;
|
RK_S32 mypos = (((merange_y << 2) - 4) >> 2) / 4;
|
|
mxneg = MPP_MIN(abs(mxneg), mxpos) * 4;
|
myneg = MPP_MIN(abs(myneg), mypos) * 4;
|
|
merangx = mxneg * 2;
|
merangy = myneg * 2;
|
}
|
regs->reg0220_me_rnge.cme_srch_h = merangx / 32;
|
regs->reg0220_me_rnge.cme_srch_v = merangy / 32;
|
|
regs->reg0220_me_rnge.rme_srch_h = 7;
|
regs->reg0220_me_rnge.rme_srch_v = 5;
|
regs->reg0220_me_rnge.dlt_frm_num = 0x1;
|
|
regs->reg0221_me_cfg.pmv_mdst_h = 5;
|
regs->reg0221_me_cfg.pmv_mdst_v = 5;
|
regs->reg0221_me_cfg.mv_limit = 0;
|
regs->reg0221_me_cfg.pmv_num = 2;
|
|
//regs->reg0221_me_cfg.rme_dis = 0;
|
// regs->reg0221_me_cfg.rme_dis = 2;
|
|
|
|
if (syn->pp.sps_temporal_mvp_enabled_flag &&
|
(ctx->frame_type != INTRA_FRAME)) {
|
if (ctx->last_frame_type == INTRA_FRAME) {
|
regs->reg0221_me_cfg.colmv_load = 0;
|
} else {
|
regs->reg0221_me_cfg.colmv_load = 1;
|
}
|
regs->reg0221_me_cfg.colmv_stor = 1;
|
}
|
|
if (syn->pp.pic_width > 2688) {
|
regs->reg0222_me_cach.cme_rama_h = 12;
|
} else if (syn->pp.pic_width > 2048) {
|
regs->reg0222_me_cach.cme_rama_h = 16;
|
} else {
|
regs->reg0222_me_cach.cme_rama_h = 20;
|
}
|
|
{
|
RK_S32 swin_scope_wd16 = (regs->reg0220_me_rnge.cme_srch_h + 3 + 1) / 4 * 2 + 1;
|
RK_S32 tmpMin = (regs->reg0220_me_rnge.cme_srch_v + 3) / 4 * 2 + 1;
|
if (regs->reg0222_me_cach.cme_rama_h / 4 < tmpMin) {
|
tmpMin = regs->reg0222_me_cach.cme_rama_h / 4;
|
}
|
regs->reg0222_me_cach.cme_rama_max =
|
(pic_wd64 * (tmpMin - 1)) + ((pic_wd64 >= swin_scope_wd16) ? swin_scope_wd16 : pic_wd64 * 2);
|
}
|
regs->reg0222_me_cach.cach_l2_tag = 0x0;
|
|
pic_wd64 = pic_wd64 << 6;
|
|
if (pic_wd64 <= 512)
|
regs->reg0222_me_cach.cach_l2_tag = 0x0;
|
else if (pic_wd64 <= 1024)
|
regs->reg0222_me_cach.cach_l2_tag = 0x1;
|
else if (pic_wd64 <= 2048)
|
regs->reg0222_me_cach.cach_l2_tag = 0x2;
|
else if (pic_wd64 <= 4096)
|
regs->reg0222_me_cach.cach_l2_tag = 0x3;
|
|
}
|
|
void vepu580_h265_set_hw_address(H265eV580HalContext *ctx, hevc_vepu580_base *regs, HalEncTask *task)
|
{
|
HalEncTask *enc_task = task;
|
HalBuf *recon_buf, *ref_buf;
|
MppBuffer md_info_buf = enc_task->md_info;
|
H265eSyntax_new *syn = (H265eSyntax_new *)enc_task->syntax.data;
|
|
hal_h265e_enter();
|
|
regs->reg0160_adr_src0 = mpp_buffer_get_fd(enc_task->input);
|
regs->reg0161_adr_src1 = regs->reg0160_adr_src0;
|
regs->reg0162_adr_src2 = regs->reg0160_adr_src0;
|
|
recon_buf = hal_bufs_get_buf(ctx->dpb_bufs, syn->sp.recon_pic.slot_idx);
|
ref_buf = hal_bufs_get_buf(ctx->dpb_bufs, syn->sp.ref_pic.slot_idx);
|
|
if (!syn->sp.non_reference_flag) {
|
regs->reg0163_rfpw_h_addr = mpp_buffer_get_fd(recon_buf->buf[0]);
|
regs->reg0164_rfpw_b_addr = regs->reg0163_rfpw_h_addr;
|
|
mpp_dev_multi_offset_update(ctx->reg_cfg, 164, ctx->fbc_header_len);
|
}
|
regs->reg0165_rfpr_h_addr = mpp_buffer_get_fd(ref_buf->buf[0]);
|
regs->reg0166_rfpr_b_addr = regs->reg0165_rfpr_h_addr;
|
regs->reg0167_cmvw_addr = mpp_buffer_get_fd(recon_buf->buf[2]);
|
regs->reg0168_cmvr_addr = mpp_buffer_get_fd(ref_buf->buf[2]);
|
regs->reg0169_dspw_addr = mpp_buffer_get_fd(recon_buf->buf[1]);
|
regs->reg0170_dspr_addr = mpp_buffer_get_fd(ref_buf->buf[1]);
|
|
mpp_dev_multi_offset_update(ctx->reg_cfg, 166, ctx->fbc_header_len);
|
|
if (syn->pp.tiles_enabled_flag) {
|
if (NULL == ctx->tile_grp)
|
mpp_buffer_group_get_internal(&ctx->tile_grp, MPP_BUFFER_TYPE_ION);
|
|
mpp_assert(ctx->tile_grp);
|
|
if (NULL == ctx->hw_tile_buf[0]) {
|
mpp_buffer_get(ctx->tile_grp, &ctx->hw_tile_buf[0], TILE_BUF_SIZE);
|
}
|
|
if (NULL == ctx->hw_tile_buf[1]) {
|
mpp_buffer_get(ctx->tile_grp, &ctx->hw_tile_buf[1], TILE_BUF_SIZE);
|
}
|
|
if (NULL == ctx->hw_tile_stream) {
|
mpp_buffer_get(ctx->tile_grp, &ctx->hw_tile_stream, ctx->frame_size / 2);
|
}
|
|
regs->reg0176_lpfw_addr = mpp_buffer_get_fd(ctx->hw_tile_buf[0]);
|
regs->reg0177_lpfr_addr = mpp_buffer_get_fd(ctx->hw_tile_buf[1]);
|
}
|
|
if (md_info_buf) {
|
regs->reg0192_enc_pic.mei_stor = 1;
|
regs->reg0171_meiw_addr = mpp_buffer_get_fd(md_info_buf);
|
} else {
|
regs->reg0192_enc_pic.mei_stor = 0;
|
regs->reg0171_meiw_addr = 0;
|
}
|
|
regs->reg0172_bsbt_addr = mpp_buffer_get_fd(enc_task->output);
|
/* TODO: stream size relative with syntax */
|
regs->reg0173_bsbb_addr = regs->reg0172_bsbt_addr;
|
regs->reg0174_bsbr_addr = regs->reg0172_bsbt_addr;
|
regs->reg0175_adr_bsbs = regs->reg0172_bsbt_addr;
|
|
mpp_dev_multi_offset_update(ctx->reg_cfg, 175, mpp_packet_get_length(task->packet));
|
mpp_dev_multi_offset_update(ctx->reg_cfg, 172, mpp_buffer_get_size(enc_task->output));
|
}
|
|
static MPP_RET vepu580_h265e_save_pass1_patch(H265eV580RegSet *regs, H265eV580HalContext *ctx,
|
RK_S32 tiles_enabled_flag)
|
{
|
hevc_vepu580_base *reg_base = ®s->reg_base;
|
RK_S32 width = ctx->cfg->prep.width;
|
RK_S32 height = ctx->cfg->prep.height;
|
RK_S32 width_align = MPP_ALIGN(width, 64);
|
RK_S32 height_align = MPP_ALIGN(height, 16);
|
|
if (NULL == ctx->buf_pass1) {
|
mpp_buffer_get(NULL, &ctx->buf_pass1, width_align * height_align * 3 / 2);
|
if (!ctx->buf_pass1) {
|
mpp_err("buf_pass1 malloc fail, debreath invaild");
|
return MPP_NOK;
|
}
|
}
|
|
reg_base->reg0192_enc_pic.cur_frm_ref = 1;
|
reg_base->reg0163_rfpw_h_addr = mpp_buffer_get_fd(ctx->buf_pass1);
|
reg_base->reg0164_rfpw_b_addr = reg_base->reg0163_rfpw_h_addr;
|
reg_base->reg0192_enc_pic.rec_fbc_dis = 1;
|
|
if (tiles_enabled_flag)
|
reg_base->reg0238_synt_pps.lpf_fltr_acrs_til = 0;
|
|
mpp_dev_multi_offset_update(ctx->reg_cfg, 164, width_align * height);
|
|
return MPP_OK;
|
}
|
|
static MPP_RET vepu580_h265e_use_pass1_patch(H265eV580RegSet *regs, H265eV580HalContext *ctx)
|
{
|
hevc_vepu580_control_cfg *reg_ctl = ®s->reg_ctl;
|
hevc_vepu580_base *reg_base = ®s->reg_base;
|
RK_U32 hor_stride = MPP_ALIGN(ctx->cfg->prep.width, 64);
|
RK_U32 ver_stride = MPP_ALIGN(ctx->cfg->prep.height, 16);
|
RK_U32 frame_size = hor_stride * ver_stride;
|
VepuFmtCfg *fmt = (VepuFmtCfg *)ctx->input_fmt;
|
MPP_RET ret = MPP_OK;
|
|
reg_ctl->reg0012_dtrns_map.src_bus_edin = fmt->src_endian;
|
reg_base->reg0198_src_fmt.src_cfmt = VEPU541_FMT_YUV420SP;
|
reg_base->reg0198_src_fmt.out_fmt = 1;
|
reg_base->reg0203_src_proc.afbcd_en = 0;
|
reg_base->reg0205_src_strd0.src_strd0 = hor_stride;
|
reg_base->reg0206_src_strd1.src_strd1 = hor_stride;
|
reg_base->reg0160_adr_src0 = mpp_buffer_get_fd(ctx->buf_pass1);
|
reg_base->reg0161_adr_src1 = reg_base->reg0160_adr_src0;
|
reg_base->reg0162_adr_src2 = reg_base->reg0160_adr_src0;
|
|
/* input cb addr */
|
ret = mpp_dev_multi_offset_update(ctx->reg_cfg, 161, frame_size);
|
if (ret)
|
mpp_err_f("set input cb addr offset failed %d\n", ret);
|
|
/* input cr addr */
|
ret = mpp_dev_multi_offset_update(ctx->reg_cfg, 162, frame_size);
|
if (ret)
|
mpp_err_f("set input cr addr offset failed %d\n", ret);
|
|
return MPP_OK;
|
}
|
|
static void setup_vepu580_split(H265eV580RegSet *regs, MppEncSliceSplit *cfg)
|
{
|
hal_h265e_dbg_func("enter\n");
|
|
switch (cfg->split_mode) {
|
case MPP_ENC_SPLIT_NONE : {
|
regs->reg_base.reg0216_sli_splt.sli_splt = 0;
|
regs->reg_base.reg0216_sli_splt.sli_splt_mode = 0;
|
regs->reg_base.reg0216_sli_splt.sli_splt_cpst = 0;
|
regs->reg_base.reg0216_sli_splt.sli_max_num_m1 = 0;
|
regs->reg_base.reg0216_sli_splt.sli_flsh = 0;
|
regs->reg_base.reg0218_sli_cnum.sli_splt_cnum_m1 = 0;
|
|
regs->reg_base.reg0217_sli_byte.sli_splt_byte = 0;
|
regs->reg_base.reg0192_enc_pic.slen_fifo = 0;
|
} break;
|
case MPP_ENC_SPLIT_BY_BYTE : {
|
regs->reg_base.reg0216_sli_splt.sli_splt = 1;
|
regs->reg_base.reg0216_sli_splt.sli_splt_mode = 0;
|
regs->reg_base.reg0216_sli_splt.sli_splt_cpst = 0;
|
regs->reg_base.reg0216_sli_splt.sli_max_num_m1 = 500;
|
regs->reg_base.reg0216_sli_splt.sli_flsh = 1;
|
regs->reg_base.reg0218_sli_cnum.sli_splt_cnum_m1 = 0;
|
|
regs->reg_base.reg0217_sli_byte.sli_splt_byte = cfg->split_arg;
|
regs->reg_base.reg0192_enc_pic.slen_fifo = cfg->split_out ? 1 : 0;
|
} break;
|
case MPP_ENC_SPLIT_BY_CTU : {
|
regs->reg_base.reg0216_sli_splt.sli_splt = 1;
|
regs->reg_base.reg0216_sli_splt.sli_splt_mode = 1;
|
regs->reg_base.reg0216_sli_splt.sli_splt_cpst = 0;
|
regs->reg_base.reg0216_sli_splt.sli_max_num_m1 = 500;
|
regs->reg_base.reg0216_sli_splt.sli_flsh = 1;
|
regs->reg_base.reg0218_sli_cnum.sli_splt_cnum_m1 = cfg->split_arg - 1;
|
|
regs->reg_base.reg0217_sli_byte.sli_splt_byte = 0;
|
regs->reg_base.reg0192_enc_pic.slen_fifo = cfg->split_out ? 1 : 0;
|
} break;
|
default : {
|
mpp_log_f("invalide slice split mode %d\n", cfg->split_mode);
|
} break;
|
}
|
|
cfg->change = 0;
|
|
hal_h265e_dbg_func("leave\n");
|
}
|
|
MPP_RET hal_h265e_v580_gen_regs(void *hal, HalEncTask *task)
|
{
|
H265eV580HalContext *ctx = (H265eV580HalContext *)hal;
|
HalEncTask *enc_task = task;
|
EncRcTask *rc_task = enc_task->rc_task;
|
EncFrmStatus *frm = &rc_task->frm;
|
H265eSyntax_new *syn = (H265eSyntax_new *)enc_task->syntax.data;
|
H265eV580RegSet *regs = (H265eV580RegSet *)ctx->regs[0];
|
RK_U32 pic_width_align8, pic_height_align8;
|
RK_S32 pic_wd64, pic_h64;
|
VepuFmtCfg *fmt = (VepuFmtCfg *)ctx->input_fmt;
|
hevc_vepu580_control_cfg *reg_ctl = ®s->reg_ctl;
|
hevc_vepu580_base *reg_base = ®s->reg_base;
|
hevc_vepu580_rc_klut *reg_klut = ®s->reg_rc_klut;
|
|
hal_h265e_enter();
|
pic_width_align8 = (syn->pp.pic_width + 7) & (~7);
|
pic_height_align8 = (syn->pp.pic_height + 7) & (~7);
|
pic_wd64 = (syn->pp.pic_width + 63) / 64;
|
pic_h64 = (syn->pp.pic_height + 63) / 64;
|
|
hal_h265e_dbg_simple("frame %d | type %d | start gen regs",
|
ctx->frame_cnt, ctx->frame_type);
|
|
memset(regs, 0, sizeof(H265eV580RegSet));
|
|
reg_ctl->reg0004_enc_strt.lkt_num = 0;
|
reg_ctl->reg0004_enc_strt.vepu_cmd = ctx->enc_mode;
|
reg_ctl->reg0005_enc_clr.safe_clr = 0x0;
|
reg_ctl->reg0005_enc_clr.force_clr = 0x0;
|
|
reg_ctl->reg0008_int_en.enc_done_en = 1;
|
reg_ctl->reg0008_int_en.lkt_node_done_en = 1;
|
reg_ctl->reg0008_int_en.sclr_done_en = 1;
|
reg_ctl->reg0008_int_en.slc_done_en = 1;
|
reg_ctl->reg0008_int_en.bsf_oflw_en = 1;
|
reg_ctl->reg0008_int_en.brsp_otsd_en = 1;
|
reg_ctl->reg0008_int_en.wbus_err_en = 1;
|
reg_ctl->reg0008_int_en.rbus_err_en = 1;
|
reg_ctl->reg0008_int_en.wdg_en = 1;
|
reg_ctl->reg0008_int_en.lkt_err_int_en = 0;
|
|
reg_ctl->reg0012_dtrns_map.lpfw_bus_ordr = 0x0;
|
reg_ctl->reg0012_dtrns_map.cmvw_bus_ordr = 0x0;
|
reg_ctl->reg0012_dtrns_map.dspw_bus_ordr = 0x0;
|
reg_ctl->reg0012_dtrns_map.rfpw_bus_ordr = 0x0;
|
reg_ctl->reg0012_dtrns_map.src_bus_edin = 0x0;
|
reg_ctl->reg0012_dtrns_map.meiw_bus_edin = 0x0;
|
reg_ctl->reg0012_dtrns_map.bsw_bus_edin = 0x7;
|
reg_ctl->reg0012_dtrns_map.lktr_bus_edin = 0x0;
|
reg_ctl->reg0012_dtrns_map.roir_bus_edin = 0x0;
|
reg_ctl->reg0012_dtrns_map.lktw_bus_edin = 0x0;
|
reg_ctl->reg0012_dtrns_map.afbc_bsize = 0x1;
|
reg_ctl->reg0012_dtrns_map.ebufw_bus_ordr = 0x0;
|
|
reg_ctl->reg0013_dtrns_cfg.dspr_otsd = (ctx->frame_type == INTER_P_FRAME);
|
reg_ctl->reg0013_dtrns_cfg.axi_brsp_cke = 0x0;
|
reg_ctl->reg0014_enc_wdg.vs_load_thd = 0x1fffff;
|
reg_ctl->reg0014_enc_wdg.rfp_load_thd = 0xff;
|
|
reg_ctl->reg0021_func_en.cke = 1;
|
reg_ctl->reg0021_func_en.resetn_hw_en = 1;
|
reg_ctl->reg0021_func_en.enc_done_tmvp_en = 1;
|
|
reg_base->reg0196_enc_rsl.pic_wd8_m1 = pic_width_align8 / 8 - 1;
|
reg_base->reg0197_src_fill.pic_wfill = (syn->pp.pic_width & 0x7)
|
? (8 - (syn->pp.pic_width & 0x7)) : 0;
|
reg_base->reg0196_enc_rsl.pic_hd8_m1 = pic_height_align8 / 8 - 1;
|
reg_base->reg0197_src_fill.pic_hfill = (syn->pp.pic_height & 0x7)
|
? (8 - (syn->pp.pic_height & 0x7)) : 0;
|
|
reg_base->reg0192_enc_pic.enc_stnd = 1; //H265
|
reg_base->reg0192_enc_pic.cur_frm_ref = !syn->sp.non_reference_flag; //current frame will be refered
|
reg_base->reg0192_enc_pic.bs_scp = 1;
|
reg_base->reg0192_enc_pic.log2_ctu_num = ceil(log2((double)pic_wd64 * pic_h64));
|
|
reg_base->reg0203_src_proc.src_mirr = 0;
|
reg_base->reg0203_src_proc.src_rot = 0;
|
reg_base->reg0203_src_proc.txa_en = 1;
|
reg_base->reg0203_src_proc.afbcd_en = (MPP_FRAME_FMT_IS_FBC(syn->pp.mpp_format)) ? 1 : 0;
|
|
reg_klut->klut_ofst.chrm_klut_ofst = (ctx->frame_type == INTRA_FRAME) ? 0 : 3;
|
memcpy(®_klut->klut_wgt0, &klut_weight[0], sizeof(klut_weight));
|
|
vepu580_h265_set_me_regs(ctx, syn, reg_base);
|
|
reg_base->reg0232_rdo_cfg.chrm_spcl = 1;
|
reg_base->reg0232_rdo_cfg.cu_inter_e = 0x06db;
|
reg_base->reg0232_rdo_cfg.cu_intra_e = 0xf;
|
|
if (syn->pp.num_long_term_ref_pics_sps) {
|
reg_base->reg0232_rdo_cfg.ltm_col = 0;
|
reg_base->reg0232_rdo_cfg.ltm_idx0l0 = 1;
|
} else {
|
reg_base->reg0232_rdo_cfg.ltm_col = 0;
|
reg_base->reg0232_rdo_cfg.ltm_idx0l0 = 0;
|
}
|
|
reg_base->reg0232_rdo_cfg.ccwa_e = 1;
|
reg_base->reg0232_rdo_cfg.scl_lst_sel = syn->pp.scaling_list_enabled_flag;
|
{
|
RK_U32 i_nal_type = 0;
|
|
/* TODO: extend syn->frame_coding_type definition */
|
if (ctx->frame_type == INTRA_FRAME) {
|
/* reset ref pictures */
|
i_nal_type = NAL_IDR_W_RADL;
|
} else if (ctx->frame_type == INTER_P_FRAME ) {
|
i_nal_type = NAL_TRAIL_R;
|
} else {
|
i_nal_type = NAL_TRAIL_R;
|
}
|
reg_base->reg0236_synt_nal.nal_unit_type = i_nal_type;
|
}
|
|
vepu580_h265_set_hw_address(ctx, reg_base, task);
|
vepu580_h265_set_pp_regs(regs, fmt, &ctx->cfg->prep, task);
|
vepu580_h265_set_rc_regs(ctx, regs, task);
|
vepu580_h265_set_slice_regs(syn, reg_base);
|
vepu580_h265_set_ref_regs(syn, reg_base);
|
|
vepu580_set_osd(&ctx->osd_cfg);
|
/* ROI configure */
|
vepu580_h265_set_roi_regs(ctx, reg_base);
|
|
/*paramet cfg*/
|
vepu580_h265_global_cfg_set(ctx, regs);
|
|
vepu580_h265e_tune_reg_patch(ctx->tune);
|
setup_vepu580_split(regs, &ctx->cfg->split);
|
/* two pass register patch */
|
if (frm->save_pass1)
|
vepu580_h265e_save_pass1_patch(regs, ctx, syn->pp.tiles_enabled_flag);
|
|
if (frm->use_pass1)
|
vepu580_h265e_use_pass1_patch(regs, ctx);
|
|
ctx->frame_num++;
|
|
hal_h265e_leave();
|
return MPP_OK;
|
}
|
|
void hal_h265e_v580_set_uniform_tile(hevc_vepu580_base *regs, H265eSyntax_new *syn, RK_U32 index)
|
{
|
if (syn->pp.tiles_enabled_flag) {
|
RK_S32 mb_w = MPP_ALIGN(syn->pp.pic_width, 64) / 64;
|
RK_S32 mb_h = MPP_ALIGN(syn->pp.pic_height, 64) / 64;
|
RK_S32 tile_width = (index + 1) * mb_w / (syn->pp.num_tile_columns_minus1 + 1) -
|
index * mb_w / (syn->pp.num_tile_columns_minus1 + 1);
|
|
if (index > 0) {
|
RK_U32 tmp = regs->reg0177_lpfr_addr;
|
regs->reg0177_lpfr_addr = regs->reg0176_lpfw_addr;
|
regs->reg0176_lpfw_addr = tmp;
|
|
regs->reg0193_dual_core.dchs_txid = index;
|
regs->reg0193_dual_core.dchs_rxid = index - 1;
|
regs->reg0193_dual_core.dchs_txe = 1;
|
regs->reg0193_dual_core.dchs_rxe = 1;
|
} else {
|
regs->reg0193_dual_core.dchs_txid = index;
|
regs->reg0193_dual_core.dchs_rxid = 0;
|
regs->reg0193_dual_core.dchs_txe = 1;
|
regs->reg0193_dual_core.dchs_rxe = 0;
|
}
|
/* dual core runtime offset should set to 2 to avoid data access conflict */
|
regs->reg0193_dual_core.dchs_ofst = 2;
|
|
if (index == syn->pp.num_tile_columns_minus1) {
|
tile_width = mb_w - index * mb_w / (syn->pp.num_tile_columns_minus1 + 1);
|
regs->reg0193_dual_core.dchs_txid = 0;
|
regs->reg0193_dual_core.dchs_txe = 0;
|
}
|
regs->reg0252_tile_cfg.tile_w_m1 = tile_width - 1;
|
regs->reg0252_tile_cfg.tile_h_m1 = mb_h - 1;
|
regs->reg212_rc_cfg.rc_ctu_num = tile_width;
|
regs->reg0252_tile_cfg.tile_en = syn->pp.tiles_enabled_flag;
|
regs->reg0253_tile_pos.tile_x = (index * mb_w / (syn->pp.num_tile_columns_minus1 + 1));
|
regs->reg0253_tile_pos.tile_y = 0;
|
|
hal_h265e_dbg_detail("tile_x %d, rc_ctu_num %d, tile_width_m1 %d",
|
regs->reg0253_tile_pos.tile_x, regs->reg212_rc_cfg.rc_ctu_num,
|
regs->reg0252_tile_cfg.tile_w_m1);
|
}
|
}
|
|
MPP_RET hal_h265e_v580_start(void *hal, HalEncTask *enc_task)
|
{
|
MPP_RET ret = MPP_OK;
|
H265eV580HalContext *ctx = (H265eV580HalContext *)hal;
|
RK_U32 k = 0;
|
H265eSyntax_new *syn = (H265eSyntax_new *)enc_task->syntax.data;
|
RK_U32 tile_num = (syn->pp.num_tile_columns_minus1 + 1) * (syn->pp.num_tile_rows_minus1 + 1);
|
hal_h265e_enter();
|
RK_U32 stream_len = 0;
|
VepuFmtCfg *fmt = (VepuFmtCfg *)ctx->input_fmt;
|
|
ctx->tile_num = tile_num;
|
|
if (enc_task->flags.err) {
|
hal_h265e_err("enc_task->flags.err %08x, return e arly",
|
enc_task->flags.err);
|
return MPP_NOK;
|
}
|
|
if (tile_num > MAX_TILE_NUM) {
|
mpp_log("tile_num big then support %d, max %d", tile_num, MAX_TILE_NUM);
|
return MPP_NOK;
|
}
|
|
for (k = 0; k < tile_num; k++) {
|
H265eV580RegSet *hw_regs = (H265eV580RegSet *)ctx->regs[k];
|
hevc_vepu580_base *reg_base = &hw_regs->reg_base;
|
H265eV580StatusElem *reg_out = (H265eV580StatusElem *)ctx->reg_out[k];
|
|
if (k)
|
memcpy(hw_regs, ctx->regs[0], sizeof(*hw_regs));
|
|
vepu580_h265_set_me_ram(syn, &hw_regs->reg_base, k);
|
|
/* set input info */
|
vepu580_h265_set_patch_info(ctx->reg_cfg, syn, (Vepu541Fmt)fmt->format, enc_task);
|
if (tile_num > 1)
|
hal_h265e_v580_set_uniform_tile(&hw_regs->reg_base, syn, k);
|
|
if (k) {
|
RK_U32 offset = 0;
|
|
if (!ctx->tile_parall_en) {
|
offset = mpp_packet_get_length(enc_task->packet);
|
offset += stream_len;
|
|
reg_base->reg0173_bsbb_addr = mpp_buffer_get_fd(enc_task->output);
|
|
mpp_dev_multi_offset_update(ctx->reg_cfg, 175, offset);
|
mpp_dev_multi_offset_update(ctx->reg_cfg, 172, mpp_buffer_get_size(enc_task->output));
|
} else {
|
reg_base->reg0172_bsbt_addr = mpp_buffer_get_fd(ctx->hw_tile_stream);
|
/* TODO: stream size relative with syntax */
|
reg_base->reg0173_bsbb_addr = reg_base->reg0172_bsbt_addr;
|
reg_base->reg0174_bsbr_addr = reg_base->reg0172_bsbt_addr;
|
reg_base->reg0175_adr_bsbs = reg_base->reg0172_bsbt_addr;
|
mpp_dev_multi_offset_update(ctx->reg_cfg, 175, 0);
|
mpp_dev_multi_offset_update(ctx->reg_cfg, 172, mpp_buffer_get_size(ctx->hw_tile_stream));
|
}
|
|
offset = ctx->fbc_header_len;
|
|
mpp_dev_multi_offset_update(ctx->reg_cfg, 166, offset);
|
mpp_dev_multi_offset_update(ctx->reg_cfg, 164, offset);
|
|
if (enc_task->rc_task->frm.save_pass1)
|
vepu580_h265e_save_pass1_patch(hw_regs, ctx, syn->pp.tiles_enabled_flag);
|
|
if (enc_task->rc_task->frm.use_pass1)
|
vepu580_h265e_use_pass1_patch(hw_regs, ctx);
|
}
|
hal_h265e_v580_send_regs(ctx->dev, hw_regs, reg_out);
|
|
mpp_dev_ioctl(ctx->dev, MPP_DEV_REG_OFFS, ctx->reg_cfg);
|
|
if (k < tile_num - 1) {
|
if (!ctx->tile_parall_en) {
|
vepu580_h265_fbk *fb = &ctx->feedback;
|
|
ret = mpp_dev_ioctl(ctx->dev, MPP_DEV_CMD_SEND, NULL);
|
if (ret) {
|
mpp_err_f("send cmd failed %d\n", ret);
|
}
|
|
ret = mpp_dev_ioctl(ctx->dev, MPP_DEV_CMD_POLL, NULL);
|
if (ret) {
|
mpp_err_f("poll cmd failed %d\n", ret);
|
ret = MPP_ERR_VPUHW;
|
}
|
stream_len += reg_out->st.bs_lgth_l32;
|
fb->qp_sum += reg_out->st.qp_sum;
|
fb->out_strm_size += reg_out->st.bs_lgth_l32;
|
fb->sse_sum += (RK_S64)(reg_out->st.sse_h32 << 16) +
|
((reg_out->st.st_sse_bsl.sse_l16 >> 16) & 0xffff);
|
fb->st_madi += reg_out->st.madi;
|
fb->st_madp += reg_out->st.madp;
|
fb->st_mb_num += reg_out->st.st_bnum_b16.num_b16;
|
fb->st_ctu_num += reg_out->st.st_bnum_cme.num_ctu;
|
} else
|
mpp_dev_ioctl(ctx->dev, MPP_DEV_DELIMIT, NULL);
|
}
|
}
|
|
ret = mpp_dev_ioctl(ctx->dev, MPP_DEV_CMD_SEND, NULL);
|
if (ret) {
|
mpp_err_f("send cmd failed %d\n", ret);
|
}
|
hal_h265e_leave();
|
return ret;
|
}
|
|
static MPP_RET vepu580_h265_set_feedback(H265eV580HalContext *ctx, HalEncTask *enc_task, RK_U32 index)
|
{
|
EncRcTaskInfo *hal_rc_ret = (EncRcTaskInfo *)&enc_task->rc_task->info;
|
vepu580_h265_fbk *fb = &ctx->feedback;
|
MppEncCfgSet *cfg = ctx->cfg;
|
RK_S32 mb64_num = ((cfg->prep.width + 63) / 64) * ((cfg->prep.height + 63) / 64);
|
RK_S32 mb8_num = (mb64_num << 6);
|
RK_S32 mb4_num = (mb8_num << 2);
|
|
hal_h265e_enter();
|
H265eV580StatusElem *elem = (H265eV580StatusElem *)ctx->reg_out[index];
|
RK_U32 hw_status = elem->hw_status;
|
|
fb->qp_sum += elem->st.qp_sum;
|
|
fb->out_strm_size += elem->st.bs_lgth_l32;
|
|
fb->sse_sum += (RK_S64)(elem->st.sse_h32 << 16) +
|
((elem->st.st_sse_bsl.sse_l16 >> 16) & 0xffff);
|
|
fb->hw_status = hw_status;
|
hal_h265e_dbg_detail("hw_status: 0x%08x", hw_status);
|
if (hw_status & RKV_ENC_INT_LINKTABLE_FINISH)
|
hal_h265e_err("RKV_ENC_INT_LINKTABLE_FINISH");
|
|
if (hw_status & RKV_ENC_INT_ONE_FRAME_FINISH)
|
hal_h265e_dbg_detail("RKV_ENC_INT_ONE_FRAME_FINISH");
|
|
if (hw_status & RKV_ENC_INT_ONE_SLICE_FINISH)
|
hal_h265e_dbg_detail("RKV_ENC_INT_ONE_SLICE_FINISH");
|
|
if (hw_status & RKV_ENC_INT_SAFE_CLEAR_FINISH)
|
hal_h265e_err("RKV_ENC_INT_SAFE_CLEAR_FINISH");
|
|
if (hw_status & RKV_ENC_INT_BIT_STREAM_OVERFLOW)
|
hal_h265e_err("RKV_ENC_INT_BIT_STREAM_OVERFLOW");
|
|
if (hw_status & RKV_ENC_INT_BUS_WRITE_FULL)
|
hal_h265e_err("RKV_ENC_INT_BUS_WRITE_FULL");
|
|
if (hw_status & RKV_ENC_INT_BUS_WRITE_ERROR)
|
hal_h265e_err("RKV_ENC_INT_BUS_WRITE_ERROR");
|
|
if (hw_status & RKV_ENC_INT_BUS_READ_ERROR)
|
hal_h265e_err("RKV_ENC_INT_BUS_READ_ERROR");
|
|
if (hw_status & RKV_ENC_INT_TIMEOUT_ERROR)
|
hal_h265e_err("RKV_ENC_INT_TIMEOUT_ERROR");
|
|
fb->st_madi += elem->st.madi;
|
fb->st_madp += elem->st.madp;
|
fb->st_mb_num += elem->st.st_bnum_b16.num_b16;
|
fb->st_ctu_num += elem->st.st_bnum_cme.num_ctu;
|
|
fb->st_lvl64_inter_num += elem->st.st_pnum_p64.pnum_p64;
|
fb->st_lvl32_inter_num += elem->st.st_pnum_p32.pnum_p32;
|
fb->st_lvl32_intra_num += elem->st.st_pnum_i32.pnum_i32;
|
fb->st_lvl16_inter_num += elem->st.st_pnum_p16.pnum_p16;
|
fb->st_lvl16_intra_num += elem->st.st_pnum_i16.pnum_i16;
|
fb->st_lvl8_inter_num += elem->st.st_pnum_p8.pnum_p8;
|
fb->st_lvl8_intra_num += elem->st.st_pnum_i8.pnum_i8;
|
fb->st_lvl4_intra_num += elem->st.st_pnum_i4.pnum_i4;
|
memcpy(&fb->st_cu_num_qp[0], &elem->st.st_b8_qp0, 52 * sizeof(RK_U32));
|
|
if (index == (ctx->tile_num - 1)) {
|
hal_rc_ret->bit_real += fb->out_strm_size * 8;
|
|
if (fb->st_mb_num) {
|
fb->st_madi = fb->st_madi / fb->st_mb_num;
|
} else {
|
fb->st_madi = 0;
|
}
|
if (fb->st_ctu_num) {
|
fb->st_madp = fb->st_madp / fb->st_ctu_num;
|
} else {
|
fb->st_madp = 0;
|
}
|
|
if (mb4_num > 0)
|
hal_rc_ret->iblk4_prop = ((((fb->st_lvl4_intra_num + fb->st_lvl8_intra_num) << 2) +
|
(fb->st_lvl16_intra_num << 4) +
|
(fb->st_lvl32_intra_num << 6)) << 8) / mb4_num;
|
|
if (mb64_num > 0) {
|
/*
|
hal_cfg[k].inter_lv8_prop = ((fb->st_lvl8_inter_num + (fb->st_lvl16_inter_num << 2) +
|
(fb->st_lvl32_inter_num << 4) +
|
(fb->st_lvl64_inter_num << 6)) << 8) / mb8_num;*/
|
|
hal_rc_ret->quality_real = fb->qp_sum / mb8_num;
|
// hal_cfg[k].sse = fb->sse_sum / mb64_num;
|
}
|
|
hal_rc_ret->madi += fb->st_madi;
|
hal_rc_ret->madp += fb->st_madp;
|
}
|
hal_h265e_leave();
|
return MPP_OK;
|
}
|
|
void save_to_file(char *name, void *ptr, size_t size)
|
{
|
FILE *fp = fopen(name, "w+b");
|
if (fp) {
|
fwrite(ptr, 1, size, fp);
|
fclose(fp);
|
} else
|
mpp_err("create file %s failed\n", name);
|
}
|
|
void dump_files(H265eV580HalContext *ctx, HalEncTask *enc_task)
|
{
|
H265eSyntax_new *syn = (H265eSyntax_new *)enc_task->syntax.data;
|
HalBuf *hal_buf = hal_bufs_get_buf(ctx->dpb_bufs, syn->sp.ref_pic.slot_idx);
|
size_t buf_size = mpp_buffer_get_size(hal_buf->buf[0]);
|
size_t dws_size = mpp_buffer_get_size(hal_buf->buf[1]);
|
void *ptr = mpp_buffer_get_ptr(hal_buf->buf[0]);
|
void *dws_ptr = mpp_buffer_get_ptr(hal_buf->buf[1]);
|
RK_U32 frm_num = ctx->frame_num;
|
RK_S32 pid = getpid();
|
char name[128];
|
size_t name_len = sizeof(name) - 1;
|
|
snprintf(name, name_len, "/data/refr_fbd_%d_frm%d.bin", pid, frm_num);
|
save_to_file(name, ptr + ctx->fbc_header_len, buf_size - ctx->fbc_header_len);
|
|
snprintf(name, name_len, "/data/refr_fbh_%d_frm%d.bin", pid, frm_num);
|
save_to_file(name, ptr, ctx->fbc_header_len);
|
|
snprintf(name, name_len, "/data/refr_dsp_%d_frm%d.bin", pid, frm_num);
|
save_to_file(name, dws_ptr, dws_size);
|
|
hal_buf = hal_bufs_get_buf(ctx->dpb_bufs, syn->sp.recon_pic.slot_idx);
|
buf_size = mpp_buffer_get_size(hal_buf->buf[0]);
|
dws_size = mpp_buffer_get_size(hal_buf->buf[1]);
|
ptr = mpp_buffer_get_ptr(hal_buf->buf[0]);
|
dws_ptr = mpp_buffer_get_ptr(hal_buf->buf[1]);
|
|
snprintf(name, name_len, "/data/recn_fbd_%d_frm%d.bin", pid, frm_num);
|
save_to_file(name, ptr + ctx->fbc_header_len, buf_size - ctx->fbc_header_len);
|
|
snprintf(name, name_len, "/data/recn_fbh_%d_frm%d.bin", pid, frm_num);
|
save_to_file(name, ptr, ctx->fbc_header_len);
|
|
snprintf(name, name_len, "/data/recn_dsp_%d_frm%d.bin", pid, frm_num);
|
save_to_file(name, dws_ptr, dws_size);
|
}
|
|
MPP_RET hal_h265e_v580_wait(void *hal, HalEncTask *task)
|
{
|
MPP_RET ret = MPP_OK;
|
H265eV580HalContext *ctx = (H265eV580HalContext *)hal;
|
HalEncTask *enc_task = task;
|
H265eV580StatusElem *elem = (H265eV580StatusElem *)ctx->reg_out;
|
hal_h265e_enter();
|
|
if (enc_task->flags.err) {
|
hal_h265e_err("enc_task->flags.err %08x, return early",
|
enc_task->flags.err);
|
return MPP_NOK;
|
}
|
|
if (ctx->cfg->split.split_out) {
|
EncOutParam param;
|
RK_U32 slice_len = 0;
|
RK_U32 slice_last = 0;
|
RK_U32 finish_cnt = 0;
|
RK_U32 tile1_offset = 0;
|
RK_U32 stream_len = 0;
|
RK_U32 offset = mpp_packet_get_length(enc_task->packet);
|
void* ptr = mpp_packet_get_pos(enc_task->packet);
|
MppDevPollCfg *poll_cfg = (MppDevPollCfg *)((char *)ctx->poll_cfgs);
|
|
param.task = task;
|
param.base = mpp_packet_get_data(task->packet);
|
|
do {
|
RK_S32 i = 0;
|
poll_cfg->poll_type = 0;
|
poll_cfg->poll_ret = 0;
|
poll_cfg->count_max = ctx->poll_slice_max;
|
poll_cfg->count_ret = 0;
|
|
ret = mpp_dev_ioctl(ctx->dev, MPP_DEV_CMD_POLL, poll_cfg);
|
|
for (i = 0; i < poll_cfg->count_ret; i++) {
|
slice_last = poll_cfg->slice_info[i].last;
|
slice_len = poll_cfg->slice_info[i].length;
|
param.length = slice_len;
|
|
if (finish_cnt > 0) {
|
void *tile1_ptr = mpp_buffer_get_ptr(ctx->hw_tile_stream);
|
|
memcpy(ptr + stream_len + offset, tile1_ptr + tile1_offset, slice_len);
|
tile1_offset += slice_len;
|
}
|
|
if (slice_last) {
|
finish_cnt++;
|
if (ctx->tile_parall_en) {
|
if (finish_cnt + 1 > ctx->tile_num) {
|
ctx->output_cb->cmd = ENC_OUTPUT_FINISH;
|
}
|
}
|
} else
|
ctx->output_cb->cmd = ENC_OUTPUT_SLICE;
|
|
stream_len += slice_len;
|
mpp_callback(ctx->output_cb, ¶m);
|
}
|
|
if (ctx->tile_parall_en) {
|
if (finish_cnt + 1 > ctx->tile_num) {
|
break;
|
}
|
} else if (slice_last) {
|
break;
|
}
|
} while (1);
|
} else {
|
RK_U32 i = 0;
|
if (ctx->tile_parall_en) {
|
for (i = 0; i < ctx->tile_num; i ++)
|
ret = mpp_dev_ioctl(ctx->dev, MPP_DEV_CMD_POLL, NULL);
|
} else {
|
ret = mpp_dev_ioctl(ctx->dev, MPP_DEV_CMD_POLL, NULL);
|
}
|
|
for (i = 0; i < MAX_TILE_NUM; i++) {
|
RK_U32 hw_status = ((H265eV580StatusElem *)ctx->reg_out[i])->hw_status;
|
|
if (ctx->tile_dump_err &&
|
(hw_status & (RKV_ENC_INT_BUS_WRITE_ERROR | RKV_ENC_INT_BUS_READ_ERROR))) {
|
dump_files(ctx, enc_task);
|
break;
|
}
|
}
|
|
if (ret)
|
mpp_err_f("poll cmd failed %d status %d \n", ret, elem->hw_status);
|
}
|
|
hal_h265e_leave();
|
return ret;
|
}
|
|
MPP_RET hal_h265e_v580_get_task(void *hal, HalEncTask *task)
|
{
|
H265eV580HalContext *ctx = (H265eV580HalContext *)hal;
|
MppFrame frame = task->frame;
|
EncFrmStatus *frm_status = &task->rc_task->frm;
|
|
hal_h265e_enter();
|
|
if (vepu580_h265_setup_hal_bufs(ctx)) {
|
hal_h265e_err("vepu541_h265_allocate_buffers failed, free buffers and return\n");
|
task->flags.err |= HAL_ENC_TASK_ERR_ALLOC;
|
return MPP_ERR_MALLOC;
|
}
|
|
if (!frm_status->reencode)
|
ctx->last_frame_type = ctx->frame_type;
|
|
if (frm_status->is_intra) {
|
ctx->frame_type = INTRA_FRAME;
|
} else {
|
ctx->frame_type = INTER_P_FRAME;
|
}
|
if (!frm_status->reencode && mpp_frame_has_meta(task->frame)) {
|
MppMeta meta = mpp_frame_get_meta(frame);
|
|
mpp_meta_get_ptr_d(meta, KEY_ROI_DATA2, (void **)&ctx->roi_data, NULL);
|
mpp_meta_get_ptr_d(meta, KEY_OSD_DATA, (void **)&ctx->osd_cfg.osd_data, NULL);
|
mpp_meta_get_ptr_d(meta, KEY_OSD_DATA2, (void **)&ctx->osd_cfg.osd_data2, NULL);
|
}
|
memset(&ctx->feedback, 0, sizeof(vepu580_h265_fbk));
|
task->part_first = 1;
|
task->part_last = 0;
|
|
mpp_dev_multi_offset_reset(ctx->reg_cfg);
|
|
hal_h265e_leave();
|
return MPP_OK;
|
}
|
|
MPP_RET hal_h265e_v580_ret_task(void *hal, HalEncTask *task)
|
{
|
H265eV580HalContext *ctx = (H265eV580HalContext *)hal;
|
HalEncTask *enc_task = task;
|
vepu580_h265_fbk *fb = &ctx->feedback;
|
|
hal_h265e_enter();
|
|
if (ctx->tile_parall_en) {
|
RK_U32 i = 0, stream_len = 0;;
|
RK_U32 offset = mpp_packet_get_length(enc_task->packet);
|
void* ptr = mpp_packet_get_pos(enc_task->packet);
|
|
for (i = 0; i < ctx->tile_num; i ++) {
|
vepu580_h265_set_feedback(ctx, enc_task, i);
|
if (!ctx->cfg->split.split_out) {
|
if (i) { //copy tile 1 stream
|
RK_U32 len = fb->out_strm_size - stream_len;
|
void *tile1_ptr = mpp_buffer_get_ptr(ctx->hw_tile_stream);
|
memcpy(ptr + stream_len + offset, tile1_ptr, len);
|
}
|
stream_len = fb->out_strm_size;
|
}
|
}
|
} else {
|
vepu580_h265_set_feedback(ctx, enc_task, ctx->tile_num - 1);
|
}
|
|
enc_task->hw_length = fb->out_strm_size;
|
enc_task->length += fb->out_strm_size;
|
|
vepu580_h265e_tune_stat_update(ctx->tune);
|
|
hal_h265e_dbg_detail("output stream size %d\n", fb->out_strm_size);
|
|
hal_h265e_leave();
|
return MPP_OK;
|
}
|
|
const MppEncHalApi hal_h265e_vepu580 = {
|
"hal_h265e_v580",
|
MPP_VIDEO_CodingHEVC,
|
sizeof(H265eV580HalContext),
|
0,
|
hal_h265e_v580_init,
|
hal_h265e_v580_deinit,
|
hal_h265e_vepu580_prepare,
|
hal_h265e_v580_get_task,
|
hal_h265e_v580_gen_regs,
|
hal_h265e_v580_start,
|
hal_h265e_v580_wait,
|
NULL,
|
NULL,
|
hal_h265e_v580_ret_task,
|
};
|