1*437bfbebSnyanmisaka /* SPDX-License-Identifier: Apache-2.0 OR MIT */
2*437bfbebSnyanmisaka /*
3*437bfbebSnyanmisaka * Copyright (c) 2024 Rockchip Electronics Co., Ltd.
4*437bfbebSnyanmisaka */
5*437bfbebSnyanmisaka
6*437bfbebSnyanmisaka #define MODULE_TAG "hal_h264d_vdpu383"
7*437bfbebSnyanmisaka
8*437bfbebSnyanmisaka #include <string.h>
9*437bfbebSnyanmisaka
10*437bfbebSnyanmisaka #include "mpp_env.h"
11*437bfbebSnyanmisaka #include "mpp_mem.h"
12*437bfbebSnyanmisaka #include "mpp_common.h"
13*437bfbebSnyanmisaka #include "mpp_bitput.h"
14*437bfbebSnyanmisaka #include "mpp_buffer_impl.h"
15*437bfbebSnyanmisaka
16*437bfbebSnyanmisaka #include "hal_h264d_global.h"
17*437bfbebSnyanmisaka #include "hal_h264d_vdpu383.h"
18*437bfbebSnyanmisaka #include "vdpu383_h264d.h"
19*437bfbebSnyanmisaka #include "mpp_dec_cb_param.h"
20*437bfbebSnyanmisaka
21*437bfbebSnyanmisaka /* Number registers for the decoder */
22*437bfbebSnyanmisaka #define DEC_VDPU383_REGISTERS 276
23*437bfbebSnyanmisaka
24*437bfbebSnyanmisaka #define VDPU383_CABAC_TAB_SIZE (928*4 + 128) /* bytes */
25*437bfbebSnyanmisaka #define VDPU383_SPSPPS_SIZE (168 + 128) /* bytes */
26*437bfbebSnyanmisaka #define VDPU383_RPS_SIZE (128 + 128 + 128) /* bytes */
27*437bfbebSnyanmisaka #define VDPU383_SCALING_LIST_SIZE (6*16+2*64 + 128) /* bytes */
28*437bfbebSnyanmisaka #define VDPU383_ERROR_INFO_SIZE (256*144*4) /* bytes */
29*437bfbebSnyanmisaka #define H264_CTU_SIZE 16
30*437bfbebSnyanmisaka
31*437bfbebSnyanmisaka #define VDPU383_CABAC_TAB_ALIGNED_SIZE (MPP_ALIGN(VDPU383_CABAC_TAB_SIZE, SZ_4K))
32*437bfbebSnyanmisaka #define VDPU383_ERROR_INFO_ALIGNED_SIZE (0)
33*437bfbebSnyanmisaka #define VDPU383_SPSPPS_ALIGNED_SIZE (MPP_ALIGN(VDPU383_SPSPPS_SIZE, SZ_4K))
34*437bfbebSnyanmisaka #define VDPU383_RPS_ALIGNED_SIZE (MPP_ALIGN(VDPU383_RPS_SIZE, SZ_4K))
35*437bfbebSnyanmisaka #define VDPU383_SCALING_LIST_ALIGNED_SIZE (MPP_ALIGN(VDPU383_SCALING_LIST_SIZE, SZ_4K))
36*437bfbebSnyanmisaka #define VDPU383_STREAM_INFO_SET_SIZE (VDPU383_SPSPPS_ALIGNED_SIZE + \
37*437bfbebSnyanmisaka VDPU383_RPS_ALIGNED_SIZE + \
38*437bfbebSnyanmisaka VDPU383_SCALING_LIST_ALIGNED_SIZE)
39*437bfbebSnyanmisaka
40*437bfbebSnyanmisaka #define VDPU383_CABAC_TAB_OFFSET (0)
41*437bfbebSnyanmisaka #define VDPU383_ERROR_INFO_OFFSET (VDPU383_CABAC_TAB_OFFSET + VDPU383_CABAC_TAB_ALIGNED_SIZE)
42*437bfbebSnyanmisaka #define VDPU383_STREAM_INFO_OFFSET_BASE (VDPU383_ERROR_INFO_OFFSET + VDPU383_ERROR_INFO_ALIGNED_SIZE)
43*437bfbebSnyanmisaka #define VDPU383_SPSPPS_OFFSET(pos) (VDPU383_STREAM_INFO_OFFSET_BASE + (VDPU383_STREAM_INFO_SET_SIZE * pos))
44*437bfbebSnyanmisaka #define VDPU383_RPS_OFFSET(pos) (VDPU383_SPSPPS_OFFSET(pos) + VDPU383_SPSPPS_ALIGNED_SIZE)
45*437bfbebSnyanmisaka #define VDPU383_SCALING_LIST_OFFSET(pos) (VDPU383_RPS_OFFSET(pos) + VDPU383_RPS_ALIGNED_SIZE)
46*437bfbebSnyanmisaka #define VDPU383_INFO_BUFFER_SIZE(cnt) (VDPU383_STREAM_INFO_OFFSET_BASE + (VDPU383_STREAM_INFO_SET_SIZE * cnt))
47*437bfbebSnyanmisaka
48*437bfbebSnyanmisaka #define VDPU383_SPS_PPS_LEN (MPP_ALIGN(1338, 128) / 8) // byte, 1338 bit
49*437bfbebSnyanmisaka
50*437bfbebSnyanmisaka #define SET_REF_INFO(regs, index, field, value)\
51*437bfbebSnyanmisaka do{ \
52*437bfbebSnyanmisaka switch(index){\
53*437bfbebSnyanmisaka case 0: regs.reg99.ref0_##field = value; break;\
54*437bfbebSnyanmisaka case 1: regs.reg99.ref1_##field = value; break;\
55*437bfbebSnyanmisaka case 2: regs.reg99.ref2_##field = value; break;\
56*437bfbebSnyanmisaka case 3: regs.reg99.ref3_##field = value; break;\
57*437bfbebSnyanmisaka case 4: regs.reg100.ref4_##field = value; break;\
58*437bfbebSnyanmisaka case 5: regs.reg100.ref5_##field = value; break;\
59*437bfbebSnyanmisaka case 6: regs.reg100.ref6_##field = value; break;\
60*437bfbebSnyanmisaka case 7: regs.reg100.ref7_##field = value; break;\
61*437bfbebSnyanmisaka case 8: regs.reg101.ref8_##field = value; break;\
62*437bfbebSnyanmisaka case 9: regs.reg101.ref9_##field = value; break;\
63*437bfbebSnyanmisaka case 10: regs.reg101.ref10_##field = value; break;\
64*437bfbebSnyanmisaka case 11: regs.reg101.ref11_##field = value; break;\
65*437bfbebSnyanmisaka case 12: regs.reg102.ref12_##field = value; break;\
66*437bfbebSnyanmisaka case 13: regs.reg102.ref13_##field = value; break;\
67*437bfbebSnyanmisaka case 14: regs.reg102.ref14_##field = value; break;\
68*437bfbebSnyanmisaka case 15: regs.reg102.ref15_##field = value; break;\
69*437bfbebSnyanmisaka default: break;}\
70*437bfbebSnyanmisaka }while(0)
71*437bfbebSnyanmisaka
72*437bfbebSnyanmisaka #define VDPU383_FAST_REG_SET_CNT 3
73*437bfbebSnyanmisaka
74*437bfbebSnyanmisaka typedef struct h264d_rkv_buf_t {
75*437bfbebSnyanmisaka RK_U32 valid;
76*437bfbebSnyanmisaka Vdpu383H264dRegSet *regs;
77*437bfbebSnyanmisaka } H264dRkvBuf_t;
78*437bfbebSnyanmisaka
79*437bfbebSnyanmisaka typedef struct Vdpu383H264dRegCtx_t {
80*437bfbebSnyanmisaka RK_U8 spspps[VDPU383_SPS_PPS_LEN];
81*437bfbebSnyanmisaka RK_U8 rps[VDPU383_RPS_SIZE];
82*437bfbebSnyanmisaka RK_U8 sclst[VDPU383_SCALING_LIST_SIZE];
83*437bfbebSnyanmisaka
84*437bfbebSnyanmisaka MppBuffer bufs;
85*437bfbebSnyanmisaka RK_S32 bufs_fd;
86*437bfbebSnyanmisaka void *bufs_ptr;
87*437bfbebSnyanmisaka RK_U32 offset_cabac;
88*437bfbebSnyanmisaka RK_U32 offset_errinfo;
89*437bfbebSnyanmisaka RK_U32 offset_spspps[VDPU383_FAST_REG_SET_CNT];
90*437bfbebSnyanmisaka RK_U32 offset_rps[VDPU383_FAST_REG_SET_CNT];
91*437bfbebSnyanmisaka RK_U32 offset_sclst[VDPU383_FAST_REG_SET_CNT];
92*437bfbebSnyanmisaka
93*437bfbebSnyanmisaka H264dRkvBuf_t reg_buf[VDPU383_FAST_REG_SET_CNT];
94*437bfbebSnyanmisaka
95*437bfbebSnyanmisaka RK_U32 spspps_offset;
96*437bfbebSnyanmisaka RK_U32 rps_offset;
97*437bfbebSnyanmisaka RK_U32 sclst_offset;
98*437bfbebSnyanmisaka
99*437bfbebSnyanmisaka RK_S32 width;
100*437bfbebSnyanmisaka RK_S32 height;
101*437bfbebSnyanmisaka /* rcb buffers info */
102*437bfbebSnyanmisaka RK_U32 bit_depth;
103*437bfbebSnyanmisaka RK_U32 mbaff;
104*437bfbebSnyanmisaka RK_U32 chroma_format_idc;
105*437bfbebSnyanmisaka
106*437bfbebSnyanmisaka RK_S32 rcb_buf_size;
107*437bfbebSnyanmisaka Vdpu383RcbInfo rcb_info[RCB_BUF_COUNT];
108*437bfbebSnyanmisaka MppBuffer rcb_buf[VDPU383_FAST_REG_SET_CNT];
109*437bfbebSnyanmisaka
110*437bfbebSnyanmisaka Vdpu383H264dRegSet *regs;
111*437bfbebSnyanmisaka HalBufs origin_bufs;
112*437bfbebSnyanmisaka } Vdpu383H264dRegCtx;
113*437bfbebSnyanmisaka
114*437bfbebSnyanmisaka MPP_RET vdpu383_h264d_deinit(void *hal);
rkv_ver_align(RK_U32 val)115*437bfbebSnyanmisaka static RK_U32 rkv_ver_align(RK_U32 val)
116*437bfbebSnyanmisaka {
117*437bfbebSnyanmisaka return MPP_ALIGN(val, 16);
118*437bfbebSnyanmisaka }
119*437bfbebSnyanmisaka
rkv_len_align(RK_U32 val)120*437bfbebSnyanmisaka static RK_U32 rkv_len_align(RK_U32 val)
121*437bfbebSnyanmisaka {
122*437bfbebSnyanmisaka return (2 * MPP_ALIGN(val, 16));
123*437bfbebSnyanmisaka }
124*437bfbebSnyanmisaka
rkv_len_align_422(RK_U32 val)125*437bfbebSnyanmisaka static RK_U32 rkv_len_align_422(RK_U32 val)
126*437bfbebSnyanmisaka {
127*437bfbebSnyanmisaka return ((5 * MPP_ALIGN(val, 16)) / 2);
128*437bfbebSnyanmisaka }
129*437bfbebSnyanmisaka
vdpu383_setup_scale_origin_bufs(H264dHalCtx_t * p_hal,MppFrame mframe)130*437bfbebSnyanmisaka static MPP_RET vdpu383_setup_scale_origin_bufs(H264dHalCtx_t *p_hal, MppFrame mframe)
131*437bfbebSnyanmisaka {
132*437bfbebSnyanmisaka Vdpu383H264dRegCtx *ctx = (Vdpu383H264dRegCtx *)p_hal->reg_ctx;
133*437bfbebSnyanmisaka /* for 8K FrameBuf scale mode */
134*437bfbebSnyanmisaka size_t origin_buf_size = 0;
135*437bfbebSnyanmisaka
136*437bfbebSnyanmisaka origin_buf_size = mpp_frame_get_buf_size(mframe);
137*437bfbebSnyanmisaka
138*437bfbebSnyanmisaka if (!origin_buf_size) {
139*437bfbebSnyanmisaka mpp_err_f("origin_bufs get buf size failed\n");
140*437bfbebSnyanmisaka return MPP_NOK;
141*437bfbebSnyanmisaka }
142*437bfbebSnyanmisaka if (ctx->origin_bufs) {
143*437bfbebSnyanmisaka hal_bufs_deinit(ctx->origin_bufs);
144*437bfbebSnyanmisaka ctx->origin_bufs = NULL;
145*437bfbebSnyanmisaka }
146*437bfbebSnyanmisaka hal_bufs_init(&ctx->origin_bufs);
147*437bfbebSnyanmisaka if (!ctx->origin_bufs) {
148*437bfbebSnyanmisaka mpp_err_f("origin_bufs init fail\n");
149*437bfbebSnyanmisaka return MPP_ERR_NOMEM;
150*437bfbebSnyanmisaka }
151*437bfbebSnyanmisaka hal_bufs_setup(ctx->origin_bufs, 16, 1, &origin_buf_size);
152*437bfbebSnyanmisaka
153*437bfbebSnyanmisaka return MPP_OK;
154*437bfbebSnyanmisaka }
155*437bfbebSnyanmisaka
prepare_spspps(H264dHalCtx_t * p_hal,RK_U64 * data,RK_U32 len)156*437bfbebSnyanmisaka static MPP_RET prepare_spspps(H264dHalCtx_t *p_hal, RK_U64 *data, RK_U32 len)
157*437bfbebSnyanmisaka {
158*437bfbebSnyanmisaka RK_S32 i = 0;
159*437bfbebSnyanmisaka RK_S32 is_long_term = 0, voidx = 0;
160*437bfbebSnyanmisaka DXVA_PicParams_H264_MVC *pp = p_hal->pp;
161*437bfbebSnyanmisaka RK_U32 tmp = 0;
162*437bfbebSnyanmisaka BitputCtx_t bp;
163*437bfbebSnyanmisaka
164*437bfbebSnyanmisaka mpp_set_bitput_ctx(&bp, data, len);
165*437bfbebSnyanmisaka
166*437bfbebSnyanmisaka if (!p_hal->fast_mode && !pp->spspps_update) {
167*437bfbebSnyanmisaka bp.index = 2;
168*437bfbebSnyanmisaka bp.bitpos = 24;
169*437bfbebSnyanmisaka bp.bvalue = bp.pbuf[bp.index] & 0xFFFFFF;
170*437bfbebSnyanmisaka } else {
171*437bfbebSnyanmisaka RK_U32 pic_width, pic_height;
172*437bfbebSnyanmisaka
173*437bfbebSnyanmisaka //!< sps syntax
174*437bfbebSnyanmisaka pic_width = 16 * (pp->wFrameWidthInMbsMinus1 + 1);
175*437bfbebSnyanmisaka pic_height = 16 * (pp->wFrameHeightInMbsMinus1 + 1);
176*437bfbebSnyanmisaka pic_height *= (2 - pp->frame_mbs_only_flag);
177*437bfbebSnyanmisaka pic_height /= (1 + pp->field_pic_flag);
178*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->seq_parameter_set_id, 4);
179*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->profile_idc, 8);
180*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->constraint_set3_flag, 1);
181*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->chroma_format_idc, 2);
182*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->bit_depth_luma_minus8, 3);
183*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->bit_depth_chroma_minus8, 3);
184*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 1); // set 0
185*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->log2_max_frame_num_minus4, 4);
186*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->num_ref_frames, 5);
187*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->pic_order_cnt_type, 2);
188*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->log2_max_pic_order_cnt_lsb_minus4, 4);
189*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->delta_pic_order_always_zero_flag, 1);
190*437bfbebSnyanmisaka mpp_put_bits(&bp, pic_width, 16);
191*437bfbebSnyanmisaka mpp_put_bits(&bp, pic_height, 16);
192*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->frame_mbs_only_flag, 1);
193*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->MbaffFrameFlag, 1);
194*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->direct_8x8_inference_flag, 1);
195*437bfbebSnyanmisaka /* multi-view */
196*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->mvc_extension_enable, 1);
197*437bfbebSnyanmisaka if (pp->mvc_extension_enable) {
198*437bfbebSnyanmisaka mpp_put_bits(&bp, (pp->num_views_minus1 + 1), 2);
199*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->view_id[0], 10);
200*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->view_id[1], 10);
201*437bfbebSnyanmisaka } else {
202*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 22);
203*437bfbebSnyanmisaka }
204*437bfbebSnyanmisaka // hw_fifo_align_bits(&bp, 128);
205*437bfbebSnyanmisaka //!< pps syntax
206*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->pps_pic_parameter_set_id, 8);
207*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->pps_seq_parameter_set_id, 5);
208*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->entropy_coding_mode_flag, 1);
209*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->pic_order_present_flag, 1);
210*437bfbebSnyanmisaka
211*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->num_ref_idx_l0_active_minus1, 5);
212*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->num_ref_idx_l1_active_minus1, 5);
213*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->weighted_pred_flag, 1);
214*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->weighted_bipred_idc, 2);
215*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->pic_init_qp_minus26, 7);
216*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->pic_init_qs_minus26, 6);
217*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->chroma_qp_index_offset, 5);
218*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->deblocking_filter_control_present_flag, 1);
219*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->constrained_intra_pred_flag, 1);
220*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->redundant_pic_cnt_present_flag, 1);
221*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->transform_8x8_mode_flag, 1);
222*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->second_chroma_qp_index_offset, 5);
223*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->scaleing_list_enable_flag, 1);
224*437bfbebSnyanmisaka }
225*437bfbebSnyanmisaka
226*437bfbebSnyanmisaka //!< set dpb
227*437bfbebSnyanmisaka for (i = 0; i < 16; i++) {
228*437bfbebSnyanmisaka is_long_term = (pp->RefFrameList[i].bPicEntry != 0xff) ? pp->RefFrameList[i].AssociatedFlag : 0;
229*437bfbebSnyanmisaka tmp |= (RK_U32)(is_long_term & 0x1) << i;
230*437bfbebSnyanmisaka }
231*437bfbebSnyanmisaka for (i = 0; i < 16; i++) {
232*437bfbebSnyanmisaka voidx = (pp->RefFrameList[i].bPicEntry != 0xff) ? pp->RefPicLayerIdList[i] : 0;
233*437bfbebSnyanmisaka tmp |= (RK_U32)(voidx & 0x1) << (i + 16);
234*437bfbebSnyanmisaka }
235*437bfbebSnyanmisaka mpp_put_bits(&bp, tmp, 32);
236*437bfbebSnyanmisaka /* set current frame */
237*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->field_pic_flag, 1);
238*437bfbebSnyanmisaka mpp_put_bits(&bp, (pp->field_pic_flag && pp->CurrPic.AssociatedFlag), 1);
239*437bfbebSnyanmisaka
240*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->CurrFieldOrderCnt[0], 32);
241*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->CurrFieldOrderCnt[1], 32);
242*437bfbebSnyanmisaka
243*437bfbebSnyanmisaka /* refer poc */
244*437bfbebSnyanmisaka for (i = 0; i < 16; i++) {
245*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->FieldOrderCntList[i][0], 32);
246*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->FieldOrderCntList[i][1], 32);
247*437bfbebSnyanmisaka }
248*437bfbebSnyanmisaka
249*437bfbebSnyanmisaka tmp = 0;
250*437bfbebSnyanmisaka for (i = 0; i < 16; i++) {
251*437bfbebSnyanmisaka RK_U32 field_flag = (pp->RefPicFiledFlags >> i) & 0x01;
252*437bfbebSnyanmisaka
253*437bfbebSnyanmisaka tmp |= field_flag << i;
254*437bfbebSnyanmisaka }
255*437bfbebSnyanmisaka for (i = 0; i < 16; i++) {
256*437bfbebSnyanmisaka RK_U32 top_used = (pp->UsedForReferenceFlags >> (2 * i + 0)) & 0x01;
257*437bfbebSnyanmisaka
258*437bfbebSnyanmisaka tmp |= top_used << (i + 16);
259*437bfbebSnyanmisaka }
260*437bfbebSnyanmisaka mpp_put_bits(&bp, tmp, 32);
261*437bfbebSnyanmisaka
262*437bfbebSnyanmisaka tmp = 0;
263*437bfbebSnyanmisaka for (i = 0; i < 16; i++) {
264*437bfbebSnyanmisaka RK_U32 bot_used = (pp->UsedForReferenceFlags >> (2 * i + 1)) & 0x01;
265*437bfbebSnyanmisaka
266*437bfbebSnyanmisaka tmp |= bot_used << i;
267*437bfbebSnyanmisaka }
268*437bfbebSnyanmisaka for (i = 0; i < 16; i++) {
269*437bfbebSnyanmisaka RK_U32 ref_colmv_used = (pp->RefPicColmvUsedFlags >> i) & 0x01;
270*437bfbebSnyanmisaka
271*437bfbebSnyanmisaka tmp |= ref_colmv_used << (i + 16);
272*437bfbebSnyanmisaka }
273*437bfbebSnyanmisaka mpp_put_bits(&bp, tmp, 32);
274*437bfbebSnyanmisaka mpp_put_align(&bp, 64, 0);//128
275*437bfbebSnyanmisaka
276*437bfbebSnyanmisaka #ifdef DUMP_VDPU383_DATAS
277*437bfbebSnyanmisaka {
278*437bfbebSnyanmisaka char *cur_fname = "global_cfg.dat";
279*437bfbebSnyanmisaka memset(dump_cur_fname_path, 0, sizeof(dump_cur_fname_path));
280*437bfbebSnyanmisaka sprintf(dump_cur_fname_path, "%s/%s", dump_cur_dir, cur_fname);
281*437bfbebSnyanmisaka dump_data_to_file(dump_cur_fname_path, (void *)bp.pbuf, 64 * bp.index + bp.bitpos, 64, 0);
282*437bfbebSnyanmisaka }
283*437bfbebSnyanmisaka #endif
284*437bfbebSnyanmisaka
285*437bfbebSnyanmisaka return MPP_OK;
286*437bfbebSnyanmisaka }
287*437bfbebSnyanmisaka
prepare_framerps(H264dHalCtx_t * p_hal,RK_U64 * data,RK_U32 len)288*437bfbebSnyanmisaka static MPP_RET prepare_framerps(H264dHalCtx_t *p_hal, RK_U64 *data, RK_U32 len)
289*437bfbebSnyanmisaka {
290*437bfbebSnyanmisaka RK_S32 i = 0, j = 0;
291*437bfbebSnyanmisaka RK_S32 dpb_idx = 0, voidx = 0;
292*437bfbebSnyanmisaka RK_S32 dpb_valid = 0, bottom_flag = 0;
293*437bfbebSnyanmisaka RK_U32 max_frame_num = 0;
294*437bfbebSnyanmisaka RK_U16 frame_num_wrap = 0;
295*437bfbebSnyanmisaka RK_U32 tmp = 0;
296*437bfbebSnyanmisaka
297*437bfbebSnyanmisaka BitputCtx_t bp;
298*437bfbebSnyanmisaka DXVA_PicParams_H264_MVC *pp = p_hal->pp;
299*437bfbebSnyanmisaka
300*437bfbebSnyanmisaka mpp_set_bitput_ctx(&bp, data, len);
301*437bfbebSnyanmisaka
302*437bfbebSnyanmisaka max_frame_num = 1 << (pp->log2_max_frame_num_minus4 + 4);
303*437bfbebSnyanmisaka for (i = 0; i < 16; i++) {
304*437bfbebSnyanmisaka if ((pp->NonExistingFrameFlags >> i) & 0x01) {
305*437bfbebSnyanmisaka frame_num_wrap = 0;
306*437bfbebSnyanmisaka } else {
307*437bfbebSnyanmisaka if (pp->RefFrameList[i].AssociatedFlag) {
308*437bfbebSnyanmisaka frame_num_wrap = pp->FrameNumList[i];
309*437bfbebSnyanmisaka } else {
310*437bfbebSnyanmisaka frame_num_wrap = (pp->FrameNumList[i] > pp->frame_num) ?
311*437bfbebSnyanmisaka (pp->FrameNumList[i] - max_frame_num) : pp->FrameNumList[i];
312*437bfbebSnyanmisaka }
313*437bfbebSnyanmisaka }
314*437bfbebSnyanmisaka mpp_put_bits(&bp, frame_num_wrap, 16);
315*437bfbebSnyanmisaka }
316*437bfbebSnyanmisaka
317*437bfbebSnyanmisaka tmp = 0;
318*437bfbebSnyanmisaka for (i = 0; i < 16; i++) {
319*437bfbebSnyanmisaka tmp |= (RK_U32)pp->RefPicLayerIdList[i] << (i + 16);
320*437bfbebSnyanmisaka }
321*437bfbebSnyanmisaka mpp_put_bits(&bp, tmp, 32);
322*437bfbebSnyanmisaka
323*437bfbebSnyanmisaka for (i = 0; i < 32; i++) {
324*437bfbebSnyanmisaka tmp = 0;
325*437bfbebSnyanmisaka dpb_valid = (p_hal->slice_long[0].RefPicList[0][i].bPicEntry == 0xff) ? 0 : 1;
326*437bfbebSnyanmisaka dpb_idx = dpb_valid ? p_hal->slice_long[0].RefPicList[0][i].Index7Bits : 0;
327*437bfbebSnyanmisaka bottom_flag = dpb_valid ? p_hal->slice_long[0].RefPicList[0][i].AssociatedFlag : 0;
328*437bfbebSnyanmisaka voidx = dpb_valid ? pp->RefPicLayerIdList[dpb_idx] : 0;
329*437bfbebSnyanmisaka
330*437bfbebSnyanmisaka tmp |= (RK_U32)(dpb_idx | (dpb_valid << 4)) & 0x1f;
331*437bfbebSnyanmisaka tmp |= (RK_U32)(bottom_flag & 0x1) << 5;
332*437bfbebSnyanmisaka if (dpb_valid)
333*437bfbebSnyanmisaka tmp |= (RK_U32)(voidx & 0x1) << 6;
334*437bfbebSnyanmisaka mpp_put_bits(&bp, tmp, 7);
335*437bfbebSnyanmisaka }
336*437bfbebSnyanmisaka
337*437bfbebSnyanmisaka for (j = 1; j < 3; j++) {
338*437bfbebSnyanmisaka for (i = 0; i < 32; i++) {
339*437bfbebSnyanmisaka tmp = 0;
340*437bfbebSnyanmisaka dpb_valid = (p_hal->slice_long[0].RefPicList[j][i].bPicEntry == 0xff) ? 0 : 1;
341*437bfbebSnyanmisaka dpb_idx = dpb_valid ? p_hal->slice_long[0].RefPicList[j][i].Index7Bits : 0;
342*437bfbebSnyanmisaka bottom_flag = dpb_valid ? p_hal->slice_long[0].RefPicList[j][i].AssociatedFlag : 0;
343*437bfbebSnyanmisaka voidx = dpb_valid ? pp->RefPicLayerIdList[dpb_idx] : 0;
344*437bfbebSnyanmisaka tmp |= (RK_U32)(dpb_idx | (dpb_valid << 4)) & 0x1f;
345*437bfbebSnyanmisaka tmp |= (RK_U32)(bottom_flag & 0x1) << 5;
346*437bfbebSnyanmisaka if (dpb_valid)
347*437bfbebSnyanmisaka tmp |= (RK_U32)(voidx & 0x1) << 6;
348*437bfbebSnyanmisaka mpp_put_bits(&bp, tmp, 7);
349*437bfbebSnyanmisaka }
350*437bfbebSnyanmisaka }
351*437bfbebSnyanmisaka
352*437bfbebSnyanmisaka mpp_put_align(&bp, 128, 0);
353*437bfbebSnyanmisaka
354*437bfbebSnyanmisaka #ifdef DUMP_VDPU383_DATAS
355*437bfbebSnyanmisaka {
356*437bfbebSnyanmisaka char *cur_fname = "rps.dat";
357*437bfbebSnyanmisaka memset(dump_cur_fname_path, 0, sizeof(dump_cur_fname_path));
358*437bfbebSnyanmisaka sprintf(dump_cur_fname_path, "%s/%s", dump_cur_dir, cur_fname);
359*437bfbebSnyanmisaka dump_data_to_file(dump_cur_fname_path, (void *)bp.pbuf, 64 * bp.index + bp.bitpos, 64, 0);
360*437bfbebSnyanmisaka }
361*437bfbebSnyanmisaka #endif
362*437bfbebSnyanmisaka
363*437bfbebSnyanmisaka return MPP_OK;
364*437bfbebSnyanmisaka }
365*437bfbebSnyanmisaka
prepare_scanlist(H264dHalCtx_t * p_hal,RK_U8 * data,RK_U32 len)366*437bfbebSnyanmisaka static MPP_RET prepare_scanlist(H264dHalCtx_t *p_hal, RK_U8 *data, RK_U32 len)
367*437bfbebSnyanmisaka {
368*437bfbebSnyanmisaka RK_U32 i = 0, j = 0, n = 0;
369*437bfbebSnyanmisaka
370*437bfbebSnyanmisaka if (!p_hal->pp->scaleing_list_enable_flag)
371*437bfbebSnyanmisaka return MPP_OK;
372*437bfbebSnyanmisaka
373*437bfbebSnyanmisaka for (i = 0; i < 6; i++) { //4x4, 6 lists
374*437bfbebSnyanmisaka /* dump by block4x4, vectial direction */
375*437bfbebSnyanmisaka for (j = 0; j < 4; j++) {
376*437bfbebSnyanmisaka data[n++] = p_hal->qm->bScalingLists4x4[i][j * 4 + 0];
377*437bfbebSnyanmisaka data[n++] = p_hal->qm->bScalingLists4x4[i][j * 4 + 1];
378*437bfbebSnyanmisaka data[n++] = p_hal->qm->bScalingLists4x4[i][j * 4 + 2];
379*437bfbebSnyanmisaka data[n++] = p_hal->qm->bScalingLists4x4[i][j * 4 + 3];
380*437bfbebSnyanmisaka }
381*437bfbebSnyanmisaka }
382*437bfbebSnyanmisaka
383*437bfbebSnyanmisaka for (i = 0; i < 2; i++) { //8x8, 2 lists
384*437bfbebSnyanmisaka RK_U32 blk4_x = 0, blk4_y = 0;
385*437bfbebSnyanmisaka
386*437bfbebSnyanmisaka /* dump by block4x4, vectial direction */
387*437bfbebSnyanmisaka for (blk4_y = 0; blk4_y < 8; blk4_y += 4) {
388*437bfbebSnyanmisaka for (blk4_x = 0; blk4_x < 8; blk4_x += 4) {
389*437bfbebSnyanmisaka RK_U32 pos = blk4_y * 8 + blk4_x;
390*437bfbebSnyanmisaka
391*437bfbebSnyanmisaka for (j = 0; j < 4; j++) {
392*437bfbebSnyanmisaka data[n++] = p_hal->qm->bScalingLists8x8[i][pos + j * 8 + 0];
393*437bfbebSnyanmisaka data[n++] = p_hal->qm->bScalingLists8x8[i][pos + j * 8 + 1];
394*437bfbebSnyanmisaka data[n++] = p_hal->qm->bScalingLists8x8[i][pos + j * 8 + 2];
395*437bfbebSnyanmisaka data[n++] = p_hal->qm->bScalingLists8x8[i][pos + j * 8 + 3];
396*437bfbebSnyanmisaka }
397*437bfbebSnyanmisaka }
398*437bfbebSnyanmisaka }
399*437bfbebSnyanmisaka }
400*437bfbebSnyanmisaka
401*437bfbebSnyanmisaka mpp_assert(n <= len);
402*437bfbebSnyanmisaka
403*437bfbebSnyanmisaka #ifdef DUMP_VDPU383_DATAS
404*437bfbebSnyanmisaka {
405*437bfbebSnyanmisaka char *cur_fname = "scanlist.dat";
406*437bfbebSnyanmisaka memset(dump_cur_fname_path, 0, sizeof(dump_cur_fname_path));
407*437bfbebSnyanmisaka sprintf(dump_cur_fname_path, "%s/%s", dump_cur_dir, cur_fname);
408*437bfbebSnyanmisaka dump_data_to_file(dump_cur_fname_path, (void *)data, 8 * n, 128, 0);
409*437bfbebSnyanmisaka }
410*437bfbebSnyanmisaka #endif
411*437bfbebSnyanmisaka
412*437bfbebSnyanmisaka return MPP_OK;
413*437bfbebSnyanmisaka }
414*437bfbebSnyanmisaka
set_registers(H264dHalCtx_t * p_hal,Vdpu383H264dRegSet * regs,HalTaskInfo * task)415*437bfbebSnyanmisaka static MPP_RET set_registers(H264dHalCtx_t *p_hal, Vdpu383H264dRegSet *regs, HalTaskInfo *task)
416*437bfbebSnyanmisaka {
417*437bfbebSnyanmisaka DXVA_PicParams_H264_MVC *pp = p_hal->pp;
418*437bfbebSnyanmisaka HalBuf *mv_buf = NULL;
419*437bfbebSnyanmisaka HalBuf *origin_buf = NULL;
420*437bfbebSnyanmisaka Vdpu383H264dRegCtx *ctx = (Vdpu383H264dRegCtx *)p_hal->reg_ctx;
421*437bfbebSnyanmisaka
422*437bfbebSnyanmisaka // memset(regs, 0, sizeof(Vdpu383H264dRegSet));
423*437bfbebSnyanmisaka regs->h264d_paras.reg66_stream_len = p_hal->strm_len;
424*437bfbebSnyanmisaka
425*437bfbebSnyanmisaka //!< caculate the yuv_frame_size
426*437bfbebSnyanmisaka {
427*437bfbebSnyanmisaka MppFrame mframe = NULL;
428*437bfbebSnyanmisaka RK_U32 hor_virstride = 0;
429*437bfbebSnyanmisaka RK_U32 ver_virstride = 0;
430*437bfbebSnyanmisaka RK_U32 y_virstride = 0;
431*437bfbebSnyanmisaka RK_U32 uv_virstride = 0;
432*437bfbebSnyanmisaka
433*437bfbebSnyanmisaka mpp_buf_slot_get_prop(p_hal->frame_slots, pp->CurrPic.Index7Bits, SLOT_FRAME_PTR, &mframe);
434*437bfbebSnyanmisaka hor_virstride = mpp_frame_get_hor_stride(mframe);
435*437bfbebSnyanmisaka ver_virstride = mpp_frame_get_ver_stride(mframe);
436*437bfbebSnyanmisaka y_virstride = hor_virstride * ver_virstride;
437*437bfbebSnyanmisaka uv_virstride = hor_virstride * ver_virstride / 2;
438*437bfbebSnyanmisaka
439*437bfbebSnyanmisaka if (MPP_FRAME_FMT_IS_FBC(mpp_frame_get_fmt(mframe))) {
440*437bfbebSnyanmisaka RK_U32 fbc_hdr_stride = mpp_frame_get_fbc_hdr_stride(mframe);
441*437bfbebSnyanmisaka RK_U32 fbd_offset;
442*437bfbebSnyanmisaka
443*437bfbebSnyanmisaka fbd_offset = fbc_hdr_stride * MPP_ALIGN(ver_virstride, 64) / 16;
444*437bfbebSnyanmisaka
445*437bfbebSnyanmisaka regs->ctrl_regs.reg9.fbc_e = 1;
446*437bfbebSnyanmisaka regs->h264d_paras.reg68_hor_virstride = fbc_hdr_stride / 64;
447*437bfbebSnyanmisaka regs->h264d_addrs.reg193_fbc_payload_offset = fbd_offset;
448*437bfbebSnyanmisaka } else if (MPP_FRAME_FMT_IS_TILE(mpp_frame_get_fmt(mframe))) {
449*437bfbebSnyanmisaka regs->ctrl_regs.reg9.tile_e = 1;
450*437bfbebSnyanmisaka regs->h264d_paras.reg68_hor_virstride = hor_virstride * 6 / 16;
451*437bfbebSnyanmisaka regs->h264d_paras.reg70_y_virstride = (y_virstride + uv_virstride) / 16;
452*437bfbebSnyanmisaka } else {
453*437bfbebSnyanmisaka regs->ctrl_regs.reg9.fbc_e = 0;
454*437bfbebSnyanmisaka regs->h264d_paras.reg68_hor_virstride = hor_virstride / 16;
455*437bfbebSnyanmisaka regs->h264d_paras.reg69_raster_uv_hor_virstride = hor_virstride / 16;
456*437bfbebSnyanmisaka regs->h264d_paras.reg70_y_virstride = y_virstride / 16;
457*437bfbebSnyanmisaka }
458*437bfbebSnyanmisaka }
459*437bfbebSnyanmisaka //!< set current
460*437bfbebSnyanmisaka {
461*437bfbebSnyanmisaka MppBuffer mbuffer = NULL;
462*437bfbebSnyanmisaka RK_S32 fd = -1;
463*437bfbebSnyanmisaka
464*437bfbebSnyanmisaka mpp_buf_slot_get_prop(p_hal->frame_slots, pp->CurrPic.Index7Bits, SLOT_BUFFER, &mbuffer);
465*437bfbebSnyanmisaka fd = mpp_buffer_get_fd(mbuffer);
466*437bfbebSnyanmisaka regs->h264d_addrs.reg168_decout_base = fd;
467*437bfbebSnyanmisaka regs->h264d_addrs.reg192_payload_st_cur_base = fd;
468*437bfbebSnyanmisaka
469*437bfbebSnyanmisaka //colmv_cur_base
470*437bfbebSnyanmisaka mv_buf = hal_bufs_get_buf(p_hal->cmv_bufs, pp->CurrPic.Index7Bits);
471*437bfbebSnyanmisaka regs->h264d_addrs.reg216_colmv_cur_base = mpp_buffer_get_fd(mv_buf->buf[0]);
472*437bfbebSnyanmisaka regs->h264d_addrs.reg169_error_ref_base = fd;
473*437bfbebSnyanmisaka }
474*437bfbebSnyanmisaka //!< set reference
475*437bfbebSnyanmisaka {
476*437bfbebSnyanmisaka RK_S32 i = 0;
477*437bfbebSnyanmisaka RK_S32 fd = -1;
478*437bfbebSnyanmisaka RK_S32 ref_index = -1;
479*437bfbebSnyanmisaka RK_S32 near_index = -1;
480*437bfbebSnyanmisaka MppBuffer mbuffer = NULL;
481*437bfbebSnyanmisaka RK_U32 min_frame_num = 0;
482*437bfbebSnyanmisaka MppFrame mframe = NULL;
483*437bfbebSnyanmisaka
484*437bfbebSnyanmisaka for (i = 0; i < 15; i++) {
485*437bfbebSnyanmisaka if (pp->RefFrameList[i].bPicEntry != 0xff) {
486*437bfbebSnyanmisaka ref_index = pp->RefFrameList[i].Index7Bits;
487*437bfbebSnyanmisaka near_index = pp->RefFrameList[i].Index7Bits;
488*437bfbebSnyanmisaka } else {
489*437bfbebSnyanmisaka ref_index = (near_index < 0) ? pp->CurrPic.Index7Bits : near_index;
490*437bfbebSnyanmisaka }
491*437bfbebSnyanmisaka /* mark 3 to differ from current frame */
492*437bfbebSnyanmisaka mpp_buf_slot_get_prop(p_hal->frame_slots, ref_index, SLOT_BUFFER, &mbuffer);
493*437bfbebSnyanmisaka mpp_buf_slot_get_prop(p_hal->frame_slots, ref_index, SLOT_FRAME_PTR, &mframe);
494*437bfbebSnyanmisaka if (ctx->origin_bufs && mpp_frame_get_thumbnail_en(mframe) == MPP_FRAME_THUMBNAIL_ONLY) {
495*437bfbebSnyanmisaka origin_buf = hal_bufs_get_buf(ctx->origin_bufs, ref_index);
496*437bfbebSnyanmisaka mbuffer = origin_buf->buf[0];
497*437bfbebSnyanmisaka }
498*437bfbebSnyanmisaka
499*437bfbebSnyanmisaka if (pp->FrameNumList[i] < pp->frame_num &&
500*437bfbebSnyanmisaka pp->FrameNumList[i] > min_frame_num &&
501*437bfbebSnyanmisaka (!mpp_frame_get_errinfo(mframe))) {
502*437bfbebSnyanmisaka min_frame_num = pp->FrameNumList[i];
503*437bfbebSnyanmisaka regs->h264d_addrs.reg169_error_ref_base = mpp_buffer_get_fd(mbuffer);
504*437bfbebSnyanmisaka }
505*437bfbebSnyanmisaka
506*437bfbebSnyanmisaka fd = mpp_buffer_get_fd(mbuffer);
507*437bfbebSnyanmisaka regs->h264d_addrs.reg170_185_ref_base[i] = fd;
508*437bfbebSnyanmisaka regs->h264d_addrs.reg195_210_payload_st_ref_base[i] = fd;
509*437bfbebSnyanmisaka mv_buf = hal_bufs_get_buf(p_hal->cmv_bufs, ref_index);
510*437bfbebSnyanmisaka regs->h264d_addrs.reg217_232_colmv_ref_base[i] = mpp_buffer_get_fd(mv_buf->buf[0]);
511*437bfbebSnyanmisaka }
512*437bfbebSnyanmisaka
513*437bfbebSnyanmisaka if (pp->RefFrameList[15].bPicEntry != 0xff) {
514*437bfbebSnyanmisaka ref_index = pp->RefFrameList[15].Index7Bits;
515*437bfbebSnyanmisaka } else {
516*437bfbebSnyanmisaka ref_index = (near_index < 0) ? pp->CurrPic.Index7Bits : near_index;
517*437bfbebSnyanmisaka }
518*437bfbebSnyanmisaka
519*437bfbebSnyanmisaka mpp_buf_slot_get_prop(p_hal->frame_slots, ref_index, SLOT_BUFFER, &mbuffer);
520*437bfbebSnyanmisaka fd = mpp_buffer_get_fd(mbuffer);
521*437bfbebSnyanmisaka if (mpp_frame_get_thumbnail_en(mframe) == 2) {
522*437bfbebSnyanmisaka origin_buf = hal_bufs_get_buf(ctx->origin_bufs, ref_index);
523*437bfbebSnyanmisaka fd = mpp_buffer_get_fd(origin_buf->buf[0]);
524*437bfbebSnyanmisaka }
525*437bfbebSnyanmisaka regs->h264d_addrs.reg170_185_ref_base[15] = fd;
526*437bfbebSnyanmisaka regs->h264d_addrs.reg195_210_payload_st_ref_base[15] = fd;
527*437bfbebSnyanmisaka mv_buf = hal_bufs_get_buf(p_hal->cmv_bufs, ref_index);
528*437bfbebSnyanmisaka regs->h264d_addrs.reg217_232_colmv_ref_base[15] = mpp_buffer_get_fd(mv_buf->buf[0]);
529*437bfbebSnyanmisaka }
530*437bfbebSnyanmisaka {
531*437bfbebSnyanmisaka MppBuffer mbuffer = NULL;
532*437bfbebSnyanmisaka Vdpu383H264dRegCtx *reg_ctx = (Vdpu383H264dRegCtx *)p_hal->reg_ctx;
533*437bfbebSnyanmisaka
534*437bfbebSnyanmisaka mpp_buf_slot_get_prop(p_hal->packet_slots, task->dec.input, SLOT_BUFFER, &mbuffer);
535*437bfbebSnyanmisaka regs->common_addr.reg128_strm_base = mpp_buffer_get_fd(mbuffer);
536*437bfbebSnyanmisaka // regs->h264d_paras.reg65_strm_start_bit = 2 * 8;
537*437bfbebSnyanmisaka #ifdef DUMP_VDPU383_DATAS
538*437bfbebSnyanmisaka {
539*437bfbebSnyanmisaka char *cur_fname = "stream_in.dat";
540*437bfbebSnyanmisaka memset(dump_cur_fname_path, 0, sizeof(dump_cur_fname_path));
541*437bfbebSnyanmisaka sprintf(dump_cur_fname_path, "%s/%s", dump_cur_dir, cur_fname);
542*437bfbebSnyanmisaka dump_data_to_file(dump_cur_fname_path, (void *)mpp_buffer_get_ptr(mbuffer),
543*437bfbebSnyanmisaka 8 * p_hal->strm_len, 128, 0);
544*437bfbebSnyanmisaka }
545*437bfbebSnyanmisaka #endif
546*437bfbebSnyanmisaka
547*437bfbebSnyanmisaka regs->common_addr.reg130_cabactbl_base = reg_ctx->bufs_fd;
548*437bfbebSnyanmisaka mpp_dev_set_reg_offset(p_hal->dev, 130, reg_ctx->offset_cabac);
549*437bfbebSnyanmisaka }
550*437bfbebSnyanmisaka
551*437bfbebSnyanmisaka {
552*437bfbebSnyanmisaka //scale down config
553*437bfbebSnyanmisaka MppFrame mframe = NULL;
554*437bfbebSnyanmisaka MppBuffer mbuffer = NULL;
555*437bfbebSnyanmisaka RK_S32 fd = -1;
556*437bfbebSnyanmisaka MppFrameThumbnailMode thumbnail_mode;
557*437bfbebSnyanmisaka
558*437bfbebSnyanmisaka mpp_buf_slot_get_prop(p_hal->frame_slots, pp->CurrPic.Index7Bits, SLOT_BUFFER, &mbuffer);
559*437bfbebSnyanmisaka mpp_buf_slot_get_prop(p_hal->frame_slots, pp->CurrPic.Index7Bits,
560*437bfbebSnyanmisaka SLOT_FRAME_PTR, &mframe);
561*437bfbebSnyanmisaka fd = mpp_buffer_get_fd(mbuffer);
562*437bfbebSnyanmisaka thumbnail_mode = mpp_frame_get_thumbnail_en(mframe);
563*437bfbebSnyanmisaka switch (thumbnail_mode) {
564*437bfbebSnyanmisaka case MPP_FRAME_THUMBNAIL_ONLY:
565*437bfbebSnyanmisaka regs->common_addr.reg133_scale_down_base = fd;
566*437bfbebSnyanmisaka origin_buf = hal_bufs_get_buf(ctx->origin_bufs, pp->CurrPic.Index7Bits);
567*437bfbebSnyanmisaka fd = mpp_buffer_get_fd(origin_buf->buf[0]);
568*437bfbebSnyanmisaka regs->h264d_addrs.reg168_decout_base = fd;
569*437bfbebSnyanmisaka regs->h264d_addrs.reg192_payload_st_cur_base = fd;
570*437bfbebSnyanmisaka regs->h264d_addrs.reg169_error_ref_base = fd;
571*437bfbebSnyanmisaka vdpu383_setup_down_scale(mframe, p_hal->dev, ®s->ctrl_regs, (void*)®s->h264d_paras);
572*437bfbebSnyanmisaka break;
573*437bfbebSnyanmisaka case MPP_FRAME_THUMBNAIL_MIXED:
574*437bfbebSnyanmisaka regs->common_addr.reg133_scale_down_base = fd;
575*437bfbebSnyanmisaka vdpu383_setup_down_scale(mframe, p_hal->dev, ®s->ctrl_regs, (void*)®s->h264d_paras);
576*437bfbebSnyanmisaka break;
577*437bfbebSnyanmisaka case MPP_FRAME_THUMBNAIL_NONE:
578*437bfbebSnyanmisaka default:
579*437bfbebSnyanmisaka regs->ctrl_regs.reg9.scale_down_en = 0;
580*437bfbebSnyanmisaka break;
581*437bfbebSnyanmisaka }
582*437bfbebSnyanmisaka }
583*437bfbebSnyanmisaka
584*437bfbebSnyanmisaka return MPP_OK;
585*437bfbebSnyanmisaka }
586*437bfbebSnyanmisaka
init_ctrl_regs(Vdpu383H264dRegSet * regs)587*437bfbebSnyanmisaka static MPP_RET init_ctrl_regs(Vdpu383H264dRegSet *regs)
588*437bfbebSnyanmisaka {
589*437bfbebSnyanmisaka Vdpu383CtrlReg *ctrl_regs = ®s->ctrl_regs;
590*437bfbebSnyanmisaka
591*437bfbebSnyanmisaka ctrl_regs->reg8_dec_mode = 1; //!< h264
592*437bfbebSnyanmisaka ctrl_regs->reg9.buf_empty_en = 0;
593*437bfbebSnyanmisaka
594*437bfbebSnyanmisaka ctrl_regs->reg10.strmd_auto_gating_e = 1;
595*437bfbebSnyanmisaka ctrl_regs->reg10.inter_auto_gating_e = 1;
596*437bfbebSnyanmisaka ctrl_regs->reg10.intra_auto_gating_e = 1;
597*437bfbebSnyanmisaka ctrl_regs->reg10.transd_auto_gating_e = 1;
598*437bfbebSnyanmisaka ctrl_regs->reg10.recon_auto_gating_e = 1;
599*437bfbebSnyanmisaka ctrl_regs->reg10.filterd_auto_gating_e = 1;
600*437bfbebSnyanmisaka ctrl_regs->reg10.bus_auto_gating_e = 1;
601*437bfbebSnyanmisaka ctrl_regs->reg10.ctrl_auto_gating_e = 1;
602*437bfbebSnyanmisaka ctrl_regs->reg10.rcb_auto_gating_e = 1;
603*437bfbebSnyanmisaka ctrl_regs->reg10.err_prc_auto_gating_e = 1;
604*437bfbebSnyanmisaka
605*437bfbebSnyanmisaka ctrl_regs->reg13_core_timeout_threshold = 0xffffff;
606*437bfbebSnyanmisaka
607*437bfbebSnyanmisaka ctrl_regs->reg16.error_proc_disable = 1;
608*437bfbebSnyanmisaka ctrl_regs->reg16.error_spread_disable = 0;
609*437bfbebSnyanmisaka ctrl_regs->reg16.roi_error_ctu_cal_en = 0;
610*437bfbebSnyanmisaka
611*437bfbebSnyanmisaka ctrl_regs->reg20_cabac_error_en_lowbits = 0xfffedfff;
612*437bfbebSnyanmisaka ctrl_regs->reg21_cabac_error_en_highbits = 0x0ffbf9ff;
613*437bfbebSnyanmisaka
614*437bfbebSnyanmisaka /* performance */
615*437bfbebSnyanmisaka ctrl_regs->reg28.axi_perf_work_e = 1;
616*437bfbebSnyanmisaka ctrl_regs->reg28.axi_cnt_type = 1;
617*437bfbebSnyanmisaka ctrl_regs->reg28.rd_latency_id = 11;
618*437bfbebSnyanmisaka
619*437bfbebSnyanmisaka ctrl_regs->reg29.addr_align_type = 2;
620*437bfbebSnyanmisaka ctrl_regs->reg29.ar_cnt_id_type = 0;
621*437bfbebSnyanmisaka ctrl_regs->reg29.aw_cnt_id_type = 0;
622*437bfbebSnyanmisaka ctrl_regs->reg29.ar_count_id = 0xa;
623*437bfbebSnyanmisaka ctrl_regs->reg29.aw_count_id = 0;
624*437bfbebSnyanmisaka ctrl_regs->reg29.rd_band_width_mode = 0;
625*437bfbebSnyanmisaka
626*437bfbebSnyanmisaka return MPP_OK;
627*437bfbebSnyanmisaka }
628*437bfbebSnyanmisaka
vdpu383_h264d_init(void * hal,MppHalCfg * cfg)629*437bfbebSnyanmisaka MPP_RET vdpu383_h264d_init(void *hal, MppHalCfg *cfg)
630*437bfbebSnyanmisaka {
631*437bfbebSnyanmisaka MPP_RET ret = MPP_ERR_UNKNOW;
632*437bfbebSnyanmisaka H264dHalCtx_t *p_hal = (H264dHalCtx_t *)hal;
633*437bfbebSnyanmisaka
634*437bfbebSnyanmisaka INP_CHECK(ret, NULL == p_hal);
635*437bfbebSnyanmisaka (void) cfg;
636*437bfbebSnyanmisaka
637*437bfbebSnyanmisaka MEM_CHECK(ret, p_hal->reg_ctx = mpp_calloc_size(void, sizeof(Vdpu383H264dRegCtx)));
638*437bfbebSnyanmisaka Vdpu383H264dRegCtx *reg_ctx = (Vdpu383H264dRegCtx *)p_hal->reg_ctx;
639*437bfbebSnyanmisaka RK_U32 max_cnt = p_hal->fast_mode ? VDPU383_FAST_REG_SET_CNT : 1;
640*437bfbebSnyanmisaka RK_U32 i = 0;
641*437bfbebSnyanmisaka
642*437bfbebSnyanmisaka //!< malloc buffers
643*437bfbebSnyanmisaka FUN_CHECK(ret = mpp_buffer_get(p_hal->buf_group, ®_ctx->bufs,
644*437bfbebSnyanmisaka VDPU383_INFO_BUFFER_SIZE(max_cnt)));
645*437bfbebSnyanmisaka reg_ctx->bufs_fd = mpp_buffer_get_fd(reg_ctx->bufs);
646*437bfbebSnyanmisaka reg_ctx->bufs_ptr = mpp_buffer_get_ptr(reg_ctx->bufs);
647*437bfbebSnyanmisaka reg_ctx->offset_cabac = VDPU383_CABAC_TAB_OFFSET;
648*437bfbebSnyanmisaka reg_ctx->offset_errinfo = VDPU383_ERROR_INFO_OFFSET;
649*437bfbebSnyanmisaka for (i = 0; i < max_cnt; i++) {
650*437bfbebSnyanmisaka reg_ctx->reg_buf[i].regs = mpp_calloc(Vdpu383H264dRegSet, 1);
651*437bfbebSnyanmisaka init_ctrl_regs(reg_ctx->reg_buf[i].regs);
652*437bfbebSnyanmisaka reg_ctx->offset_spspps[i] = VDPU383_SPSPPS_OFFSET(i);
653*437bfbebSnyanmisaka reg_ctx->offset_rps[i] = VDPU383_RPS_OFFSET(i);
654*437bfbebSnyanmisaka reg_ctx->offset_sclst[i] = VDPU383_SCALING_LIST_OFFSET(i);
655*437bfbebSnyanmisaka }
656*437bfbebSnyanmisaka
657*437bfbebSnyanmisaka mpp_buffer_attach_dev(reg_ctx->bufs, p_hal->dev);
658*437bfbebSnyanmisaka
659*437bfbebSnyanmisaka if (!p_hal->fast_mode) {
660*437bfbebSnyanmisaka reg_ctx->regs = reg_ctx->reg_buf[0].regs;
661*437bfbebSnyanmisaka reg_ctx->spspps_offset = reg_ctx->offset_spspps[0];
662*437bfbebSnyanmisaka reg_ctx->rps_offset = reg_ctx->offset_rps[0];
663*437bfbebSnyanmisaka reg_ctx->sclst_offset = reg_ctx->offset_sclst[0];
664*437bfbebSnyanmisaka }
665*437bfbebSnyanmisaka
666*437bfbebSnyanmisaka //!< copy cabac table bytes
667*437bfbebSnyanmisaka memcpy((char *)reg_ctx->bufs_ptr + reg_ctx->offset_cabac,
668*437bfbebSnyanmisaka (void *)h264_cabac_table, sizeof(h264_cabac_table));
669*437bfbebSnyanmisaka
670*437bfbebSnyanmisaka mpp_slots_set_prop(p_hal->frame_slots, SLOTS_HOR_ALIGN, mpp_align_128_odd_plus_64);
671*437bfbebSnyanmisaka mpp_slots_set_prop(p_hal->frame_slots, SLOTS_VER_ALIGN, rkv_ver_align);
672*437bfbebSnyanmisaka mpp_slots_set_prop(p_hal->frame_slots, SLOTS_LEN_ALIGN, rkv_len_align);
673*437bfbebSnyanmisaka
674*437bfbebSnyanmisaka if (cfg->hal_fbc_adj_cfg) {
675*437bfbebSnyanmisaka cfg->hal_fbc_adj_cfg->func = vdpu383_afbc_align_calc;
676*437bfbebSnyanmisaka cfg->hal_fbc_adj_cfg->expand = 16;
677*437bfbebSnyanmisaka }
678*437bfbebSnyanmisaka
679*437bfbebSnyanmisaka __RETURN:
680*437bfbebSnyanmisaka return MPP_OK;
681*437bfbebSnyanmisaka __FAILED:
682*437bfbebSnyanmisaka vdpu383_h264d_deinit(hal);
683*437bfbebSnyanmisaka
684*437bfbebSnyanmisaka return ret;
685*437bfbebSnyanmisaka }
686*437bfbebSnyanmisaka
vdpu383_h264d_deinit(void * hal)687*437bfbebSnyanmisaka MPP_RET vdpu383_h264d_deinit(void *hal)
688*437bfbebSnyanmisaka {
689*437bfbebSnyanmisaka H264dHalCtx_t *p_hal = (H264dHalCtx_t *)hal;
690*437bfbebSnyanmisaka Vdpu383H264dRegCtx *reg_ctx = (Vdpu383H264dRegCtx *)p_hal->reg_ctx;
691*437bfbebSnyanmisaka
692*437bfbebSnyanmisaka RK_U32 i = 0;
693*437bfbebSnyanmisaka RK_U32 loop = p_hal->fast_mode ? MPP_ARRAY_ELEMS(reg_ctx->reg_buf) : 1;
694*437bfbebSnyanmisaka
695*437bfbebSnyanmisaka if (reg_ctx->bufs) {
696*437bfbebSnyanmisaka mpp_buffer_put(reg_ctx->bufs);
697*437bfbebSnyanmisaka reg_ctx->bufs = NULL;
698*437bfbebSnyanmisaka }
699*437bfbebSnyanmisaka
700*437bfbebSnyanmisaka for (i = 0; i < loop; i++)
701*437bfbebSnyanmisaka MPP_FREE(reg_ctx->reg_buf[i].regs);
702*437bfbebSnyanmisaka
703*437bfbebSnyanmisaka loop = p_hal->fast_mode ? MPP_ARRAY_ELEMS(reg_ctx->rcb_buf) : 1;
704*437bfbebSnyanmisaka for (i = 0; i < loop; i++) {
705*437bfbebSnyanmisaka if (reg_ctx->rcb_buf[i]) {
706*437bfbebSnyanmisaka mpp_buffer_put(reg_ctx->rcb_buf[i]);
707*437bfbebSnyanmisaka reg_ctx->rcb_buf[i] = NULL;
708*437bfbebSnyanmisaka }
709*437bfbebSnyanmisaka }
710*437bfbebSnyanmisaka
711*437bfbebSnyanmisaka if (p_hal->cmv_bufs) {
712*437bfbebSnyanmisaka hal_bufs_deinit(p_hal->cmv_bufs);
713*437bfbebSnyanmisaka p_hal->cmv_bufs = NULL;
714*437bfbebSnyanmisaka }
715*437bfbebSnyanmisaka
716*437bfbebSnyanmisaka if (reg_ctx->origin_bufs) {
717*437bfbebSnyanmisaka hal_bufs_deinit(reg_ctx->origin_bufs);
718*437bfbebSnyanmisaka reg_ctx->origin_bufs = NULL;
719*437bfbebSnyanmisaka }
720*437bfbebSnyanmisaka
721*437bfbebSnyanmisaka MPP_FREE(p_hal->reg_ctx);
722*437bfbebSnyanmisaka
723*437bfbebSnyanmisaka return MPP_OK;
724*437bfbebSnyanmisaka }
725*437bfbebSnyanmisaka
h264d_refine_rcb_size(H264dHalCtx_t * p_hal,Vdpu383RcbInfo * rcb_info,RK_S32 width,RK_S32 height)726*437bfbebSnyanmisaka static void h264d_refine_rcb_size(H264dHalCtx_t *p_hal, Vdpu383RcbInfo *rcb_info,
727*437bfbebSnyanmisaka RK_S32 width, RK_S32 height)
728*437bfbebSnyanmisaka {
729*437bfbebSnyanmisaka RK_U32 rcb_bits = 0;
730*437bfbebSnyanmisaka RK_U32 mbaff = p_hal->pp->MbaffFrameFlag;
731*437bfbebSnyanmisaka RK_U32 bit_depth = p_hal->pp->bit_depth_luma_minus8 + 8;
732*437bfbebSnyanmisaka RK_U32 chroma_format_idc = p_hal->pp->chroma_format_idc;
733*437bfbebSnyanmisaka RK_U32 row_uv_para = 1; // for yuv420/yuv422
734*437bfbebSnyanmisaka RK_U32 filterd_row_append = 8192;
735*437bfbebSnyanmisaka
736*437bfbebSnyanmisaka // vdpu383 h264d support yuv400/yuv420/yuv422
737*437bfbebSnyanmisaka if (chroma_format_idc == 0)
738*437bfbebSnyanmisaka row_uv_para = 0;
739*437bfbebSnyanmisaka
740*437bfbebSnyanmisaka width = MPP_ALIGN(width, H264_CTU_SIZE);
741*437bfbebSnyanmisaka height = MPP_ALIGN(height, H264_CTU_SIZE);
742*437bfbebSnyanmisaka /* RCB_STRMD_ROW && RCB_STRMD_TILE_ROW*/
743*437bfbebSnyanmisaka if (width > 4096)
744*437bfbebSnyanmisaka rcb_bits = ((width + 15) / 16) * 154 * (mbaff ? 2 : 1);
745*437bfbebSnyanmisaka else
746*437bfbebSnyanmisaka rcb_bits = 0;
747*437bfbebSnyanmisaka rcb_info[RCB_STRMD_ROW].size = MPP_RCB_BYTES(rcb_bits);
748*437bfbebSnyanmisaka rcb_info[RCB_STRMD_TILE_ROW].size = MPP_RCB_BYTES(rcb_bits);
749*437bfbebSnyanmisaka /* RCB_INTER_ROW && RCB_INTER_TILE_ROW*/
750*437bfbebSnyanmisaka rcb_bits = ((width + 3) / 4) * 92 * (mbaff ? 2 : 1);
751*437bfbebSnyanmisaka rcb_info[RCB_INTER_ROW].size = MPP_RCB_BYTES(rcb_bits);
752*437bfbebSnyanmisaka rcb_info[RCB_INTER_TILE_ROW].size = MPP_RCB_BYTES(rcb_bits);
753*437bfbebSnyanmisaka /* RCB_INTRA_ROW && RCB_INTRA_TILE_ROW*/
754*437bfbebSnyanmisaka rcb_bits = MPP_ALIGN(width, 512) * (bit_depth + 2) * (mbaff ? 2 : 1);
755*437bfbebSnyanmisaka if (chroma_format_idc == 1 || chroma_format_idc == 2)
756*437bfbebSnyanmisaka rcb_bits = rcb_bits * 5 / 2; //TODO:
757*437bfbebSnyanmisaka
758*437bfbebSnyanmisaka rcb_info[RCB_INTRA_ROW].size = MPP_RCB_BYTES(rcb_bits);
759*437bfbebSnyanmisaka rcb_info[RCB_INTRA_TILE_ROW].size = 0;
760*437bfbebSnyanmisaka /* RCB_FILTERD_ROW && RCB_FILTERD_PROTECT_ROW*/
761*437bfbebSnyanmisaka // save space mode : half for RCB_FILTERD_ROW, half for RCB_FILTERD_PROTECT_ROW
762*437bfbebSnyanmisaka rcb_bits = width * 17 * ((6 + 3 * row_uv_para) * (mbaff ? 2 : 1) + 2 * row_uv_para + 1.5);
763*437bfbebSnyanmisaka if (width > 4096)
764*437bfbebSnyanmisaka filterd_row_append = 27648;
765*437bfbebSnyanmisaka rcb_info[RCB_FILTERD_ROW].size = filterd_row_append + MPP_RCB_BYTES(rcb_bits / 2);
766*437bfbebSnyanmisaka rcb_info[RCB_FILTERD_PROTECT_ROW].size = filterd_row_append + MPP_RCB_BYTES(rcb_bits / 2);
767*437bfbebSnyanmisaka
768*437bfbebSnyanmisaka rcb_info[RCB_FILTERD_TILE_ROW].size = 0;
769*437bfbebSnyanmisaka /* RCB_FILTERD_TILE_COL */
770*437bfbebSnyanmisaka rcb_info[RCB_FILTERD_TILE_COL].size = 0;
771*437bfbebSnyanmisaka
772*437bfbebSnyanmisaka }
773*437bfbebSnyanmisaka
hal_h264d_rcb_info_update(void * hal)774*437bfbebSnyanmisaka static void hal_h264d_rcb_info_update(void *hal)
775*437bfbebSnyanmisaka {
776*437bfbebSnyanmisaka H264dHalCtx_t *p_hal = (H264dHalCtx_t*)hal;
777*437bfbebSnyanmisaka RK_U32 mbaff = p_hal->pp->MbaffFrameFlag;
778*437bfbebSnyanmisaka RK_U32 bit_depth = p_hal->pp->bit_depth_luma_minus8 + 8;
779*437bfbebSnyanmisaka RK_U32 chroma_format_idc = p_hal->pp->chroma_format_idc;
780*437bfbebSnyanmisaka Vdpu383H264dRegCtx *ctx = (Vdpu383H264dRegCtx *)p_hal->reg_ctx;
781*437bfbebSnyanmisaka RK_S32 width = MPP_ALIGN((p_hal->pp->wFrameWidthInMbsMinus1 + 1) << 4, 64);
782*437bfbebSnyanmisaka RK_S32 height = MPP_ALIGN((p_hal->pp->wFrameHeightInMbsMinus1 + 1) << 4, 64);
783*437bfbebSnyanmisaka
784*437bfbebSnyanmisaka if ( ctx->bit_depth != bit_depth ||
785*437bfbebSnyanmisaka ctx->chroma_format_idc != chroma_format_idc ||
786*437bfbebSnyanmisaka ctx->mbaff != mbaff ||
787*437bfbebSnyanmisaka ctx->width != width ||
788*437bfbebSnyanmisaka ctx->height != height) {
789*437bfbebSnyanmisaka RK_U32 i;
790*437bfbebSnyanmisaka RK_U32 loop = p_hal->fast_mode ? MPP_ARRAY_ELEMS(ctx->reg_buf) : 1;
791*437bfbebSnyanmisaka
792*437bfbebSnyanmisaka ctx->rcb_buf_size = vdpu383_get_rcb_buf_size(ctx->rcb_info, width, height);
793*437bfbebSnyanmisaka h264d_refine_rcb_size(hal, ctx->rcb_info, width, height);
794*437bfbebSnyanmisaka for (i = 0; i < loop; i++) {
795*437bfbebSnyanmisaka MppBuffer rcb_buf = ctx->rcb_buf[i];
796*437bfbebSnyanmisaka
797*437bfbebSnyanmisaka if (rcb_buf) {
798*437bfbebSnyanmisaka mpp_buffer_put(rcb_buf);
799*437bfbebSnyanmisaka ctx->rcb_buf[i] = NULL;
800*437bfbebSnyanmisaka }
801*437bfbebSnyanmisaka mpp_buffer_get(p_hal->buf_group, &rcb_buf, ctx->rcb_buf_size);
802*437bfbebSnyanmisaka ctx->rcb_buf[i] = rcb_buf;
803*437bfbebSnyanmisaka }
804*437bfbebSnyanmisaka ctx->bit_depth = bit_depth;
805*437bfbebSnyanmisaka ctx->width = width;
806*437bfbebSnyanmisaka ctx->height = height;
807*437bfbebSnyanmisaka ctx->mbaff = mbaff;
808*437bfbebSnyanmisaka ctx->chroma_format_idc = chroma_format_idc;
809*437bfbebSnyanmisaka }
810*437bfbebSnyanmisaka }
811*437bfbebSnyanmisaka
vdpu383_h264d_gen_regs(void * hal,HalTaskInfo * task)812*437bfbebSnyanmisaka MPP_RET vdpu383_h264d_gen_regs(void *hal, HalTaskInfo *task)
813*437bfbebSnyanmisaka {
814*437bfbebSnyanmisaka MPP_RET ret = MPP_ERR_UNKNOW;
815*437bfbebSnyanmisaka H264dHalCtx_t *p_hal = (H264dHalCtx_t *)hal;
816*437bfbebSnyanmisaka RK_S32 width = MPP_ALIGN((p_hal->pp->wFrameWidthInMbsMinus1 + 1) << 4, 64);
817*437bfbebSnyanmisaka RK_S32 height = MPP_ALIGN((p_hal->pp->wFrameHeightInMbsMinus1 + 1) << 4, 64);
818*437bfbebSnyanmisaka Vdpu383H264dRegCtx *ctx = (Vdpu383H264dRegCtx *)p_hal->reg_ctx;
819*437bfbebSnyanmisaka Vdpu383H264dRegSet *regs = ctx->regs;
820*437bfbebSnyanmisaka MppFrame mframe;
821*437bfbebSnyanmisaka RK_S32 mv_size = MPP_ALIGN(width, 64) * MPP_ALIGN(height, 16); // 16 byte unit
822*437bfbebSnyanmisaka
823*437bfbebSnyanmisaka INP_CHECK(ret, NULL == p_hal);
824*437bfbebSnyanmisaka
825*437bfbebSnyanmisaka if (task->dec.flags.parse_err ||
826*437bfbebSnyanmisaka (task->dec.flags.ref_err && !p_hal->cfg->base.disable_error)) {
827*437bfbebSnyanmisaka goto __RETURN;
828*437bfbebSnyanmisaka }
829*437bfbebSnyanmisaka
830*437bfbebSnyanmisaka /* if is field mode is enabled enlarge colmv buffer and disable colmv compression */
831*437bfbebSnyanmisaka if (!p_hal->pp->frame_mbs_only_flag)
832*437bfbebSnyanmisaka mv_size *= 2;
833*437bfbebSnyanmisaka
834*437bfbebSnyanmisaka if (p_hal->cmv_bufs == NULL || p_hal->mv_size < mv_size) {
835*437bfbebSnyanmisaka size_t size = mv_size;
836*437bfbebSnyanmisaka
837*437bfbebSnyanmisaka if (p_hal->cmv_bufs) {
838*437bfbebSnyanmisaka hal_bufs_deinit(p_hal->cmv_bufs);
839*437bfbebSnyanmisaka p_hal->cmv_bufs = NULL;
840*437bfbebSnyanmisaka }
841*437bfbebSnyanmisaka
842*437bfbebSnyanmisaka hal_bufs_init(&p_hal->cmv_bufs);
843*437bfbebSnyanmisaka if (p_hal->cmv_bufs == NULL) {
844*437bfbebSnyanmisaka mpp_err_f("colmv bufs init fail");
845*437bfbebSnyanmisaka goto __RETURN;
846*437bfbebSnyanmisaka }
847*437bfbebSnyanmisaka p_hal->mv_size = mv_size;
848*437bfbebSnyanmisaka p_hal->mv_count = mpp_buf_slot_get_count(p_hal->frame_slots);
849*437bfbebSnyanmisaka hal_bufs_setup(p_hal->cmv_bufs, p_hal->mv_count, 1, &size);
850*437bfbebSnyanmisaka }
851*437bfbebSnyanmisaka
852*437bfbebSnyanmisaka mpp_buf_slot_get_prop(p_hal->frame_slots, p_hal->pp->CurrPic.Index7Bits, SLOT_FRAME_PTR, &mframe);
853*437bfbebSnyanmisaka if (mpp_frame_get_thumbnail_en(mframe) == MPP_FRAME_THUMBNAIL_ONLY &&
854*437bfbebSnyanmisaka ctx->origin_bufs == NULL) {
855*437bfbebSnyanmisaka vdpu383_setup_scale_origin_bufs(p_hal, mframe);
856*437bfbebSnyanmisaka }
857*437bfbebSnyanmisaka
858*437bfbebSnyanmisaka if (p_hal->fast_mode) {
859*437bfbebSnyanmisaka RK_U32 i = 0;
860*437bfbebSnyanmisaka for (i = 0; i < MPP_ARRAY_ELEMS(ctx->reg_buf); i++) {
861*437bfbebSnyanmisaka if (!ctx->reg_buf[i].valid) {
862*437bfbebSnyanmisaka task->dec.reg_index = i;
863*437bfbebSnyanmisaka regs = ctx->reg_buf[i].regs;
864*437bfbebSnyanmisaka
865*437bfbebSnyanmisaka ctx->spspps_offset = ctx->offset_spspps[i];
866*437bfbebSnyanmisaka ctx->rps_offset = ctx->offset_rps[i];
867*437bfbebSnyanmisaka ctx->sclst_offset = ctx->offset_sclst[i];
868*437bfbebSnyanmisaka ctx->reg_buf[i].valid = 1;
869*437bfbebSnyanmisaka break;
870*437bfbebSnyanmisaka }
871*437bfbebSnyanmisaka }
872*437bfbebSnyanmisaka }
873*437bfbebSnyanmisaka
874*437bfbebSnyanmisaka #ifdef DUMP_VDPU383_DATAS
875*437bfbebSnyanmisaka {
876*437bfbebSnyanmisaka memset(dump_cur_dir, 0, sizeof(dump_cur_dir));
877*437bfbebSnyanmisaka sprintf(dump_cur_dir, "avc/Frame%04d", dump_cur_frame);
878*437bfbebSnyanmisaka if (access(dump_cur_dir, 0)) {
879*437bfbebSnyanmisaka if (mkdir(dump_cur_dir))
880*437bfbebSnyanmisaka mpp_err_f("error: mkdir %s\n", dump_cur_dir);
881*437bfbebSnyanmisaka }
882*437bfbebSnyanmisaka dump_cur_frame++;
883*437bfbebSnyanmisaka }
884*437bfbebSnyanmisaka #endif
885*437bfbebSnyanmisaka
886*437bfbebSnyanmisaka prepare_spspps(p_hal, (RK_U64 *)&ctx->spspps, sizeof(ctx->spspps) / 8);
887*437bfbebSnyanmisaka prepare_framerps(p_hal, (RK_U64 *)&ctx->rps, sizeof(ctx->rps) / 8);
888*437bfbebSnyanmisaka prepare_scanlist(p_hal, ctx->sclst, sizeof(ctx->sclst));
889*437bfbebSnyanmisaka set_registers(p_hal, regs, task);
890*437bfbebSnyanmisaka
891*437bfbebSnyanmisaka //!< copy spspps datas
892*437bfbebSnyanmisaka memcpy((char *)ctx->bufs_ptr + ctx->spspps_offset, (char *)ctx->spspps, sizeof(ctx->spspps));
893*437bfbebSnyanmisaka
894*437bfbebSnyanmisaka regs->common_addr.reg131_gbl_base = ctx->bufs_fd;
895*437bfbebSnyanmisaka regs->h264d_paras.reg67_global_len = VDPU383_SPS_PPS_LEN / 16; // 128 bit as unit
896*437bfbebSnyanmisaka mpp_dev_set_reg_offset(p_hal->dev, 131, ctx->spspps_offset);
897*437bfbebSnyanmisaka
898*437bfbebSnyanmisaka memcpy((char *)ctx->bufs_ptr + ctx->rps_offset, (void *)ctx->rps, sizeof(ctx->rps));
899*437bfbebSnyanmisaka regs->common_addr.reg129_rps_base = ctx->bufs_fd;
900*437bfbebSnyanmisaka mpp_dev_set_reg_offset(p_hal->dev, 129, ctx->rps_offset);
901*437bfbebSnyanmisaka
902*437bfbebSnyanmisaka if (p_hal->pp->scaleing_list_enable_flag) {
903*437bfbebSnyanmisaka memcpy((char *)ctx->bufs_ptr + ctx->sclst_offset, (void *)ctx->sclst, sizeof(ctx->sclst));
904*437bfbebSnyanmisaka regs->common_addr.reg132_scanlist_addr = ctx->bufs_fd;
905*437bfbebSnyanmisaka mpp_dev_set_reg_offset(p_hal->dev, 132, ctx->sclst_offset);
906*437bfbebSnyanmisaka } else {
907*437bfbebSnyanmisaka regs->common_addr.reg132_scanlist_addr = 0;
908*437bfbebSnyanmisaka }
909*437bfbebSnyanmisaka
910*437bfbebSnyanmisaka hal_h264d_rcb_info_update(p_hal);
911*437bfbebSnyanmisaka vdpu383_setup_rcb(®s->common_addr, p_hal->dev, p_hal->fast_mode ?
912*437bfbebSnyanmisaka ctx->rcb_buf[task->dec.reg_index] : ctx->rcb_buf[0],
913*437bfbebSnyanmisaka ctx->rcb_info);
914*437bfbebSnyanmisaka vdpu383_setup_statistic(®s->ctrl_regs);
915*437bfbebSnyanmisaka mpp_buffer_sync_end(ctx->bufs);
916*437bfbebSnyanmisaka
917*437bfbebSnyanmisaka __RETURN:
918*437bfbebSnyanmisaka return ret = MPP_OK;
919*437bfbebSnyanmisaka }
920*437bfbebSnyanmisaka
vdpu383_h264d_start(void * hal,HalTaskInfo * task)921*437bfbebSnyanmisaka MPP_RET vdpu383_h264d_start(void *hal, HalTaskInfo *task)
922*437bfbebSnyanmisaka {
923*437bfbebSnyanmisaka MPP_RET ret = MPP_ERR_UNKNOW;
924*437bfbebSnyanmisaka H264dHalCtx_t *p_hal = (H264dHalCtx_t *)hal;
925*437bfbebSnyanmisaka INP_CHECK(ret, NULL == p_hal);
926*437bfbebSnyanmisaka
927*437bfbebSnyanmisaka if (task->dec.flags.parse_err ||
928*437bfbebSnyanmisaka (task->dec.flags.ref_err && !p_hal->cfg->base.disable_error)) {
929*437bfbebSnyanmisaka goto __RETURN;
930*437bfbebSnyanmisaka }
931*437bfbebSnyanmisaka
932*437bfbebSnyanmisaka Vdpu383H264dRegCtx *reg_ctx = (Vdpu383H264dRegCtx *)p_hal->reg_ctx;
933*437bfbebSnyanmisaka Vdpu383H264dRegSet *regs = p_hal->fast_mode ?
934*437bfbebSnyanmisaka reg_ctx->reg_buf[task->dec.reg_index].regs :
935*437bfbebSnyanmisaka reg_ctx->regs;
936*437bfbebSnyanmisaka MppDev dev = p_hal->dev;
937*437bfbebSnyanmisaka
938*437bfbebSnyanmisaka do {
939*437bfbebSnyanmisaka MppDevRegWrCfg wr_cfg;
940*437bfbebSnyanmisaka MppDevRegRdCfg rd_cfg;
941*437bfbebSnyanmisaka
942*437bfbebSnyanmisaka wr_cfg.reg = ®s->ctrl_regs;
943*437bfbebSnyanmisaka wr_cfg.size = sizeof(regs->ctrl_regs);
944*437bfbebSnyanmisaka wr_cfg.offset = OFFSET_CTRL_REGS;
945*437bfbebSnyanmisaka ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &wr_cfg);
946*437bfbebSnyanmisaka if (ret) {
947*437bfbebSnyanmisaka mpp_err_f("set register write failed %d\n", ret);
948*437bfbebSnyanmisaka break;
949*437bfbebSnyanmisaka }
950*437bfbebSnyanmisaka
951*437bfbebSnyanmisaka wr_cfg.reg = ®s->common_addr;
952*437bfbebSnyanmisaka wr_cfg.size = sizeof(regs->common_addr);
953*437bfbebSnyanmisaka wr_cfg.offset = OFFSET_COMMON_ADDR_REGS;
954*437bfbebSnyanmisaka ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &wr_cfg);
955*437bfbebSnyanmisaka if (ret) {
956*437bfbebSnyanmisaka mpp_err_f("set register write failed %d\n", ret);
957*437bfbebSnyanmisaka break;
958*437bfbebSnyanmisaka }
959*437bfbebSnyanmisaka
960*437bfbebSnyanmisaka wr_cfg.reg = ®s->h264d_paras;
961*437bfbebSnyanmisaka wr_cfg.size = sizeof(regs->h264d_paras);
962*437bfbebSnyanmisaka wr_cfg.offset = OFFSET_CODEC_PARAS_REGS;
963*437bfbebSnyanmisaka ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &wr_cfg);
964*437bfbebSnyanmisaka if (ret) {
965*437bfbebSnyanmisaka mpp_err_f("set register write failed %d\n", ret);
966*437bfbebSnyanmisaka break;
967*437bfbebSnyanmisaka }
968*437bfbebSnyanmisaka
969*437bfbebSnyanmisaka wr_cfg.reg = ®s->h264d_addrs;
970*437bfbebSnyanmisaka wr_cfg.size = sizeof(regs->h264d_addrs);
971*437bfbebSnyanmisaka wr_cfg.offset = OFFSET_CODEC_ADDR_REGS;
972*437bfbebSnyanmisaka ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &wr_cfg);
973*437bfbebSnyanmisaka if (ret) {
974*437bfbebSnyanmisaka mpp_err_f("set register write failed %d\n", ret);
975*437bfbebSnyanmisaka break;
976*437bfbebSnyanmisaka }
977*437bfbebSnyanmisaka
978*437bfbebSnyanmisaka rd_cfg.reg = ®s->ctrl_regs.reg15;
979*437bfbebSnyanmisaka rd_cfg.size = sizeof(regs->ctrl_regs.reg15);
980*437bfbebSnyanmisaka rd_cfg.offset = OFFSET_INTERRUPT_REGS;
981*437bfbebSnyanmisaka ret = mpp_dev_ioctl(dev, MPP_DEV_REG_RD, &rd_cfg);
982*437bfbebSnyanmisaka if (ret) {
983*437bfbebSnyanmisaka mpp_err_f("set register read failed %d\n", ret);
984*437bfbebSnyanmisaka break;
985*437bfbebSnyanmisaka }
986*437bfbebSnyanmisaka
987*437bfbebSnyanmisaka /* rcb info for sram */
988*437bfbebSnyanmisaka vdpu383_set_rcbinfo(dev, (Vdpu383RcbInfo*)reg_ctx->rcb_info);
989*437bfbebSnyanmisaka
990*437bfbebSnyanmisaka /* send request to hardware */
991*437bfbebSnyanmisaka ret = mpp_dev_ioctl(dev, MPP_DEV_CMD_SEND, NULL);
992*437bfbebSnyanmisaka if (ret) {
993*437bfbebSnyanmisaka mpp_err_f("send cmd failed %d\n", ret);
994*437bfbebSnyanmisaka break;
995*437bfbebSnyanmisaka }
996*437bfbebSnyanmisaka } while (0);
997*437bfbebSnyanmisaka
998*437bfbebSnyanmisaka __RETURN:
999*437bfbebSnyanmisaka return ret = MPP_OK;
1000*437bfbebSnyanmisaka }
1001*437bfbebSnyanmisaka
vdpu383_h264d_wait(void * hal,HalTaskInfo * task)1002*437bfbebSnyanmisaka MPP_RET vdpu383_h264d_wait(void *hal, HalTaskInfo *task)
1003*437bfbebSnyanmisaka {
1004*437bfbebSnyanmisaka MPP_RET ret = MPP_ERR_UNKNOW;
1005*437bfbebSnyanmisaka H264dHalCtx_t *p_hal = (H264dHalCtx_t *)hal;
1006*437bfbebSnyanmisaka
1007*437bfbebSnyanmisaka INP_CHECK(ret, NULL == p_hal);
1008*437bfbebSnyanmisaka Vdpu383H264dRegCtx *reg_ctx = (Vdpu383H264dRegCtx *)p_hal->reg_ctx;
1009*437bfbebSnyanmisaka Vdpu383H264dRegSet *p_regs = p_hal->fast_mode ?
1010*437bfbebSnyanmisaka reg_ctx->reg_buf[task->dec.reg_index].regs :
1011*437bfbebSnyanmisaka reg_ctx->regs;
1012*437bfbebSnyanmisaka
1013*437bfbebSnyanmisaka if (task->dec.flags.parse_err ||
1014*437bfbebSnyanmisaka (task->dec.flags.ref_err && !p_hal->cfg->base.disable_error)) {
1015*437bfbebSnyanmisaka goto __SKIP_HARD;
1016*437bfbebSnyanmisaka }
1017*437bfbebSnyanmisaka
1018*437bfbebSnyanmisaka ret = mpp_dev_ioctl(p_hal->dev, MPP_DEV_CMD_POLL, NULL);
1019*437bfbebSnyanmisaka if (ret)
1020*437bfbebSnyanmisaka mpp_err_f("poll cmd failed %d\n", ret);
1021*437bfbebSnyanmisaka
1022*437bfbebSnyanmisaka __SKIP_HARD:
1023*437bfbebSnyanmisaka if (p_hal->dec_cb) {
1024*437bfbebSnyanmisaka DecCbHalDone param;
1025*437bfbebSnyanmisaka
1026*437bfbebSnyanmisaka param.task = (void *)&task->dec;
1027*437bfbebSnyanmisaka param.regs = (RK_U32 *)p_regs;
1028*437bfbebSnyanmisaka
1029*437bfbebSnyanmisaka if ((!p_regs->ctrl_regs.reg15.rkvdec_frame_rdy_sta) ||
1030*437bfbebSnyanmisaka p_regs->ctrl_regs.reg15.rkvdec_strm_error_sta ||
1031*437bfbebSnyanmisaka p_regs->ctrl_regs.reg15.rkvdec_core_timeout_sta ||
1032*437bfbebSnyanmisaka p_regs->ctrl_regs.reg15.rkvdec_ip_timeout_sta ||
1033*437bfbebSnyanmisaka p_regs->ctrl_regs.reg15.rkvdec_bus_error_sta ||
1034*437bfbebSnyanmisaka p_regs->ctrl_regs.reg15.rkvdec_buffer_empty_sta ||
1035*437bfbebSnyanmisaka p_regs->ctrl_regs.reg15.rkvdec_colmv_ref_error_sta)
1036*437bfbebSnyanmisaka param.hard_err = 1;
1037*437bfbebSnyanmisaka else
1038*437bfbebSnyanmisaka param.hard_err = 0;
1039*437bfbebSnyanmisaka
1040*437bfbebSnyanmisaka mpp_callback(p_hal->dec_cb, ¶m);
1041*437bfbebSnyanmisaka }
1042*437bfbebSnyanmisaka memset(&p_regs->ctrl_regs.reg19, 0, sizeof(RK_U32));
1043*437bfbebSnyanmisaka if (p_hal->fast_mode) {
1044*437bfbebSnyanmisaka reg_ctx->reg_buf[task->dec.reg_index].valid = 0;
1045*437bfbebSnyanmisaka }
1046*437bfbebSnyanmisaka
1047*437bfbebSnyanmisaka (void)task;
1048*437bfbebSnyanmisaka __RETURN:
1049*437bfbebSnyanmisaka return ret = MPP_OK;
1050*437bfbebSnyanmisaka }
1051*437bfbebSnyanmisaka
vdpu383_h264d_reset(void * hal)1052*437bfbebSnyanmisaka MPP_RET vdpu383_h264d_reset(void *hal)
1053*437bfbebSnyanmisaka {
1054*437bfbebSnyanmisaka MPP_RET ret = MPP_ERR_UNKNOW;
1055*437bfbebSnyanmisaka H264dHalCtx_t *p_hal = (H264dHalCtx_t *)hal;
1056*437bfbebSnyanmisaka
1057*437bfbebSnyanmisaka INP_CHECK(ret, NULL == p_hal);
1058*437bfbebSnyanmisaka
1059*437bfbebSnyanmisaka
1060*437bfbebSnyanmisaka __RETURN:
1061*437bfbebSnyanmisaka return ret = MPP_OK;
1062*437bfbebSnyanmisaka }
1063*437bfbebSnyanmisaka
vdpu383_h264d_flush(void * hal)1064*437bfbebSnyanmisaka MPP_RET vdpu383_h264d_flush(void *hal)
1065*437bfbebSnyanmisaka {
1066*437bfbebSnyanmisaka MPP_RET ret = MPP_ERR_UNKNOW;
1067*437bfbebSnyanmisaka H264dHalCtx_t *p_hal = (H264dHalCtx_t *)hal;
1068*437bfbebSnyanmisaka
1069*437bfbebSnyanmisaka INP_CHECK(ret, NULL == p_hal);
1070*437bfbebSnyanmisaka
1071*437bfbebSnyanmisaka __RETURN:
1072*437bfbebSnyanmisaka return ret = MPP_OK;
1073*437bfbebSnyanmisaka }
1074*437bfbebSnyanmisaka
vdpu383_h264d_control(void * hal,MpiCmd cmd_type,void * param)1075*437bfbebSnyanmisaka MPP_RET vdpu383_h264d_control(void *hal, MpiCmd cmd_type, void *param)
1076*437bfbebSnyanmisaka {
1077*437bfbebSnyanmisaka MPP_RET ret = MPP_ERR_UNKNOW;
1078*437bfbebSnyanmisaka H264dHalCtx_t *p_hal = (H264dHalCtx_t *)hal;
1079*437bfbebSnyanmisaka
1080*437bfbebSnyanmisaka INP_CHECK(ret, NULL == p_hal);
1081*437bfbebSnyanmisaka
1082*437bfbebSnyanmisaka switch ((MpiCmd)cmd_type) {
1083*437bfbebSnyanmisaka case MPP_DEC_SET_FRAME_INFO: {
1084*437bfbebSnyanmisaka MppFrameFormat fmt = mpp_frame_get_fmt((MppFrame)param);
1085*437bfbebSnyanmisaka RK_U32 imgwidth = mpp_frame_get_width((MppFrame)param);
1086*437bfbebSnyanmisaka RK_U32 imgheight = mpp_frame_get_height((MppFrame)param);
1087*437bfbebSnyanmisaka
1088*437bfbebSnyanmisaka mpp_log("control info: fmt %d, w %d, h %d\n", fmt, imgwidth, imgheight);
1089*437bfbebSnyanmisaka if (fmt == MPP_FMT_YUV422SP) {
1090*437bfbebSnyanmisaka mpp_slots_set_prop(p_hal->frame_slots, SLOTS_LEN_ALIGN, rkv_len_align_422);
1091*437bfbebSnyanmisaka }
1092*437bfbebSnyanmisaka if (MPP_FRAME_FMT_IS_FBC(fmt)) {
1093*437bfbebSnyanmisaka vdpu383_afbc_align_calc(p_hal->frame_slots, (MppFrame)param, 16);
1094*437bfbebSnyanmisaka } else if (imgwidth > 1920 || imgheight > 1088) {
1095*437bfbebSnyanmisaka mpp_slots_set_prop(p_hal->frame_slots, SLOTS_HOR_ALIGN, mpp_align_128_odd_plus_64);
1096*437bfbebSnyanmisaka }
1097*437bfbebSnyanmisaka } break;
1098*437bfbebSnyanmisaka case MPP_DEC_GET_THUMBNAIL_FRAME_INFO: {
1099*437bfbebSnyanmisaka vdpu383_update_thumbnail_frame_info((MppFrame)param);
1100*437bfbebSnyanmisaka } break;
1101*437bfbebSnyanmisaka case MPP_DEC_SET_OUTPUT_FORMAT: {
1102*437bfbebSnyanmisaka } break;
1103*437bfbebSnyanmisaka default : {
1104*437bfbebSnyanmisaka } break;
1105*437bfbebSnyanmisaka }
1106*437bfbebSnyanmisaka
1107*437bfbebSnyanmisaka __RETURN:
1108*437bfbebSnyanmisaka return ret = MPP_OK;
1109*437bfbebSnyanmisaka }
1110*437bfbebSnyanmisaka
1111*437bfbebSnyanmisaka const MppHalApi hal_h264d_vdpu383 = {
1112*437bfbebSnyanmisaka .name = "h264d_vdpu383",
1113*437bfbebSnyanmisaka .type = MPP_CTX_DEC,
1114*437bfbebSnyanmisaka .coding = MPP_VIDEO_CodingAVC,
1115*437bfbebSnyanmisaka .ctx_size = sizeof(Vdpu383H264dRegCtx),
1116*437bfbebSnyanmisaka .flag = 0,
1117*437bfbebSnyanmisaka .init = vdpu383_h264d_init,
1118*437bfbebSnyanmisaka .deinit = vdpu383_h264d_deinit,
1119*437bfbebSnyanmisaka .reg_gen = vdpu383_h264d_gen_regs,
1120*437bfbebSnyanmisaka .start = vdpu383_h264d_start,
1121*437bfbebSnyanmisaka .wait = vdpu383_h264d_wait,
1122*437bfbebSnyanmisaka .reset = vdpu383_h264d_reset,
1123*437bfbebSnyanmisaka .flush = vdpu383_h264d_flush,
1124*437bfbebSnyanmisaka .control = vdpu383_h264d_control,
1125*437bfbebSnyanmisaka };
1126