xref: /rockchip-linux_mpp/mpp/hal/rkdec/h264d/hal_h264d_vdpu384a.c (revision 437bfbeb9567cca9cd9080e3f6954aa9d6a94f18)
1*437bfbebSnyanmisaka /* SPDX-License-Identifier: Apache-2.0 OR MIT */
2*437bfbebSnyanmisaka /*
3*437bfbebSnyanmisaka  * Copyright (c) 2024 Rockchip Electronics Co., Ltd.
4*437bfbebSnyanmisaka  */
5*437bfbebSnyanmisaka 
6*437bfbebSnyanmisaka #define MODULE_TAG "hal_h264d_vdpu384a"
7*437bfbebSnyanmisaka 
8*437bfbebSnyanmisaka #include <string.h>
9*437bfbebSnyanmisaka 
10*437bfbebSnyanmisaka #include "mpp_env.h"
11*437bfbebSnyanmisaka #include "mpp_mem.h"
12*437bfbebSnyanmisaka #include "mpp_common.h"
13*437bfbebSnyanmisaka #include "mpp_bitput.h"
14*437bfbebSnyanmisaka #include "mpp_buffer_impl.h"
15*437bfbebSnyanmisaka 
16*437bfbebSnyanmisaka #include "hal_h264d_global.h"
17*437bfbebSnyanmisaka #include "hal_h264d_vdpu384a.h"
18*437bfbebSnyanmisaka #include "vdpu384a_h264d.h"
19*437bfbebSnyanmisaka #include "mpp_dec_cb_param.h"
20*437bfbebSnyanmisaka 
21*437bfbebSnyanmisaka /* Number registers for the decoder */
22*437bfbebSnyanmisaka #define DEC_VDPU384A_REGISTERS       276
23*437bfbebSnyanmisaka 
24*437bfbebSnyanmisaka #define VDPU384A_SPSPPS_SIZE         (MPP_ALIGN(2266 + 64, 128) / 8) /* byte, 2266 bit + Reserve 64 */
25*437bfbebSnyanmisaka #define VDPU384A_SCALING_LIST_SIZE   (6*16+2*64 + 128)   /* bytes */
26*437bfbebSnyanmisaka #define VDPU384A_ERROR_INFO_SIZE     (256*144*4)         /* bytes */
27*437bfbebSnyanmisaka #define H264_CTU_SIZE               16
28*437bfbebSnyanmisaka 
29*437bfbebSnyanmisaka #define VDPU384A_ERROR_INFO_ALIGNED_SIZE     (0)
30*437bfbebSnyanmisaka #define VDPU384A_SPSPPS_ALIGNED_SIZE         (MPP_ALIGN(VDPU384A_SPSPPS_SIZE, SZ_4K))
31*437bfbebSnyanmisaka #define VDPU384A_SCALING_LIST_ALIGNED_SIZE   (MPP_ALIGN(VDPU384A_SCALING_LIST_SIZE, SZ_4K))
32*437bfbebSnyanmisaka #define VDPU384A_STREAM_INFO_SET_SIZE        (VDPU384A_SPSPPS_ALIGNED_SIZE + \
33*437bfbebSnyanmisaka                                              VDPU384A_SCALING_LIST_ALIGNED_SIZE)
34*437bfbebSnyanmisaka 
35*437bfbebSnyanmisaka #define VDPU384A_ERROR_INFO_OFFSET           (0)
36*437bfbebSnyanmisaka #define VDPU384A_STREAM_INFO_OFFSET_BASE     (VDPU384A_ERROR_INFO_OFFSET + VDPU384A_ERROR_INFO_ALIGNED_SIZE)
37*437bfbebSnyanmisaka #define VDPU384A_SPSPPS_OFFSET(pos)          (VDPU384A_STREAM_INFO_OFFSET_BASE + (VDPU384A_STREAM_INFO_SET_SIZE * pos))
38*437bfbebSnyanmisaka #define VDPU384A_SCALING_LIST_OFFSET(pos)    (VDPU384A_SPSPPS_OFFSET(pos) + VDPU384A_SPSPPS_ALIGNED_SIZE)
39*437bfbebSnyanmisaka #define VDPU384A_INFO_BUFFER_SIZE(cnt)       (VDPU384A_STREAM_INFO_OFFSET_BASE + (VDPU384A_STREAM_INFO_SET_SIZE * cnt))
40*437bfbebSnyanmisaka 
41*437bfbebSnyanmisaka #define SET_REF_INFO(regs, index, field, value)\
42*437bfbebSnyanmisaka     do{ \
43*437bfbebSnyanmisaka         switch(index){\
44*437bfbebSnyanmisaka         case 0: regs.reg99.ref0_##field = value; break;\
45*437bfbebSnyanmisaka         case 1: regs.reg99.ref1_##field = value; break;\
46*437bfbebSnyanmisaka         case 2: regs.reg99.ref2_##field = value; break;\
47*437bfbebSnyanmisaka         case 3: regs.reg99.ref3_##field = value; break;\
48*437bfbebSnyanmisaka         case 4: regs.reg100.ref4_##field = value; break;\
49*437bfbebSnyanmisaka         case 5: regs.reg100.ref5_##field = value; break;\
50*437bfbebSnyanmisaka         case 6: regs.reg100.ref6_##field = value; break;\
51*437bfbebSnyanmisaka         case 7: regs.reg100.ref7_##field = value; break;\
52*437bfbebSnyanmisaka         case 8: regs.reg101.ref8_##field = value; break;\
53*437bfbebSnyanmisaka         case 9: regs.reg101.ref9_##field = value; break;\
54*437bfbebSnyanmisaka         case 10: regs.reg101.ref10_##field = value; break;\
55*437bfbebSnyanmisaka         case 11: regs.reg101.ref11_##field = value; break;\
56*437bfbebSnyanmisaka         case 12: regs.reg102.ref12_##field = value; break;\
57*437bfbebSnyanmisaka         case 13: regs.reg102.ref13_##field = value; break;\
58*437bfbebSnyanmisaka         case 14: regs.reg102.ref14_##field = value; break;\
59*437bfbebSnyanmisaka         case 15: regs.reg102.ref15_##field = value; break;\
60*437bfbebSnyanmisaka         default: break;}\
61*437bfbebSnyanmisaka     }while(0)
62*437bfbebSnyanmisaka 
63*437bfbebSnyanmisaka #define VDPU384A_FAST_REG_SET_CNT    3
64*437bfbebSnyanmisaka 
65*437bfbebSnyanmisaka typedef struct h264d_rkv_buf_t {
66*437bfbebSnyanmisaka     RK_U32              valid;
67*437bfbebSnyanmisaka     Vdpu384aH264dRegSet  *regs;
68*437bfbebSnyanmisaka } H264dRkvBuf_t;
69*437bfbebSnyanmisaka 
70*437bfbebSnyanmisaka typedef struct Vdpu384aH264dRegCtx_t {
71*437bfbebSnyanmisaka     RK_U8               spspps[VDPU384A_SPSPPS_SIZE];
72*437bfbebSnyanmisaka     RK_U8               sclst[VDPU384A_SCALING_LIST_SIZE];
73*437bfbebSnyanmisaka 
74*437bfbebSnyanmisaka     MppBuffer           bufs;
75*437bfbebSnyanmisaka     RK_S32              bufs_fd;
76*437bfbebSnyanmisaka     void                *bufs_ptr;
77*437bfbebSnyanmisaka     RK_U32              offset_errinfo;
78*437bfbebSnyanmisaka     RK_U32              offset_spspps[VDPU384A_FAST_REG_SET_CNT];
79*437bfbebSnyanmisaka     RK_U32              offset_sclst[VDPU384A_FAST_REG_SET_CNT];
80*437bfbebSnyanmisaka 
81*437bfbebSnyanmisaka     H264dRkvBuf_t       reg_buf[VDPU384A_FAST_REG_SET_CNT];
82*437bfbebSnyanmisaka 
83*437bfbebSnyanmisaka     RK_U32              spspps_offset;
84*437bfbebSnyanmisaka     RK_U32              sclst_offset;
85*437bfbebSnyanmisaka 
86*437bfbebSnyanmisaka     RK_S32              width;
87*437bfbebSnyanmisaka     RK_S32              height;
88*437bfbebSnyanmisaka     /* rcb buffers info */
89*437bfbebSnyanmisaka     RK_U32              bit_depth;
90*437bfbebSnyanmisaka     RK_U32              mbaff;
91*437bfbebSnyanmisaka     RK_U32              chroma_format_idc;
92*437bfbebSnyanmisaka 
93*437bfbebSnyanmisaka     RK_S32              rcb_buf_size;
94*437bfbebSnyanmisaka     Vdpu384aRcbInfo      rcb_info[RCB_BUF_COUNT];
95*437bfbebSnyanmisaka     MppBuffer           rcb_buf[VDPU384A_FAST_REG_SET_CNT];
96*437bfbebSnyanmisaka 
97*437bfbebSnyanmisaka     Vdpu384aH264dRegSet  *regs;
98*437bfbebSnyanmisaka     HalBufs             origin_bufs;
99*437bfbebSnyanmisaka } Vdpu384aH264dRegCtx;
100*437bfbebSnyanmisaka 
101*437bfbebSnyanmisaka MPP_RET vdpu384a_h264d_deinit(void *hal);
rkv_ver_align(RK_U32 val)102*437bfbebSnyanmisaka static RK_U32 rkv_ver_align(RK_U32 val)
103*437bfbebSnyanmisaka {
104*437bfbebSnyanmisaka     return MPP_ALIGN(val, 16);
105*437bfbebSnyanmisaka }
106*437bfbebSnyanmisaka 
rkv_len_align(RK_U32 val)107*437bfbebSnyanmisaka static RK_U32 rkv_len_align(RK_U32 val)
108*437bfbebSnyanmisaka {
109*437bfbebSnyanmisaka     return (MPP_ALIGN(val, 16) * 3 / 2);
110*437bfbebSnyanmisaka }
111*437bfbebSnyanmisaka 
rkv_len_align_422(RK_U32 val)112*437bfbebSnyanmisaka static RK_U32 rkv_len_align_422(RK_U32 val)
113*437bfbebSnyanmisaka {
114*437bfbebSnyanmisaka     return ((5 * MPP_ALIGN(val, 16)) / 2);
115*437bfbebSnyanmisaka }
116*437bfbebSnyanmisaka 
vdpu384a_setup_scale_origin_bufs(H264dHalCtx_t * p_hal,MppFrame mframe)117*437bfbebSnyanmisaka static MPP_RET vdpu384a_setup_scale_origin_bufs(H264dHalCtx_t *p_hal, MppFrame mframe)
118*437bfbebSnyanmisaka {
119*437bfbebSnyanmisaka     Vdpu384aH264dRegCtx *ctx = (Vdpu384aH264dRegCtx *)p_hal->reg_ctx;
120*437bfbebSnyanmisaka     /* for 8K FrameBuf scale mode */
121*437bfbebSnyanmisaka     size_t origin_buf_size = 0;
122*437bfbebSnyanmisaka 
123*437bfbebSnyanmisaka     origin_buf_size = mpp_frame_get_buf_size(mframe);
124*437bfbebSnyanmisaka 
125*437bfbebSnyanmisaka     if (!origin_buf_size) {
126*437bfbebSnyanmisaka         mpp_err_f("origin_bufs get buf size failed\n");
127*437bfbebSnyanmisaka         return MPP_NOK;
128*437bfbebSnyanmisaka     }
129*437bfbebSnyanmisaka     if (ctx->origin_bufs) {
130*437bfbebSnyanmisaka         hal_bufs_deinit(ctx->origin_bufs);
131*437bfbebSnyanmisaka         ctx->origin_bufs = NULL;
132*437bfbebSnyanmisaka     }
133*437bfbebSnyanmisaka     hal_bufs_init(&ctx->origin_bufs);
134*437bfbebSnyanmisaka     if (!ctx->origin_bufs) {
135*437bfbebSnyanmisaka         mpp_err_f("origin_bufs init fail\n");
136*437bfbebSnyanmisaka         return MPP_ERR_NOMEM;
137*437bfbebSnyanmisaka     }
138*437bfbebSnyanmisaka     hal_bufs_setup(ctx->origin_bufs, 16, 1, &origin_buf_size);
139*437bfbebSnyanmisaka 
140*437bfbebSnyanmisaka     return MPP_OK;
141*437bfbebSnyanmisaka }
142*437bfbebSnyanmisaka 
prepare_spspps(H264dHalCtx_t * p_hal,RK_U64 * data,RK_U32 len)143*437bfbebSnyanmisaka static MPP_RET prepare_spspps(H264dHalCtx_t *p_hal, RK_U64 *data, RK_U32 len)
144*437bfbebSnyanmisaka {
145*437bfbebSnyanmisaka     RK_S32 i = 0, j = 0;
146*437bfbebSnyanmisaka     RK_S32 is_long_term = 0, voidx = 0;
147*437bfbebSnyanmisaka     DXVA_PicParams_H264_MVC *pp = p_hal->pp;
148*437bfbebSnyanmisaka     RK_U32 tmp = 0;
149*437bfbebSnyanmisaka     BitputCtx_t bp;
150*437bfbebSnyanmisaka 
151*437bfbebSnyanmisaka     mpp_set_bitput_ctx(&bp, data, len);
152*437bfbebSnyanmisaka 
153*437bfbebSnyanmisaka     if (!p_hal->fast_mode && !pp->spspps_update) {
154*437bfbebSnyanmisaka         bp.index = 2;
155*437bfbebSnyanmisaka         bp.bitpos = 24;
156*437bfbebSnyanmisaka         bp.bvalue = bp.pbuf[bp.index] & 0xFFFFFF;
157*437bfbebSnyanmisaka     } else {
158*437bfbebSnyanmisaka         RK_U32 pic_width, pic_height;
159*437bfbebSnyanmisaka 
160*437bfbebSnyanmisaka         //!< sps syntax
161*437bfbebSnyanmisaka         pic_width   = 16 * (pp->wFrameWidthInMbsMinus1 + 1);
162*437bfbebSnyanmisaka         pic_height  = 16 * (pp->wFrameHeightInMbsMinus1 + 1);
163*437bfbebSnyanmisaka         pic_height *= (2 - pp->frame_mbs_only_flag);
164*437bfbebSnyanmisaka         pic_height /= (1 + pp->field_pic_flag);
165*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->seq_parameter_set_id, 4);
166*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->profile_idc, 8);
167*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->constraint_set3_flag, 1);
168*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->chroma_format_idc, 2);
169*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->bit_depth_luma_minus8, 3);
170*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->bit_depth_chroma_minus8, 3);
171*437bfbebSnyanmisaka         mpp_put_bits(&bp, 0, 1); // set 0
172*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->log2_max_frame_num_minus4, 4);
173*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->num_ref_frames, 5);
174*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->pic_order_cnt_type, 2);
175*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->log2_max_pic_order_cnt_lsb_minus4, 4);
176*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->delta_pic_order_always_zero_flag, 1);
177*437bfbebSnyanmisaka         mpp_put_bits(&bp, pic_width, 16);
178*437bfbebSnyanmisaka         mpp_put_bits(&bp, pic_height, 16);
179*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->frame_mbs_only_flag, 1);
180*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->MbaffFrameFlag, 1);
181*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->direct_8x8_inference_flag, 1);
182*437bfbebSnyanmisaka         /* multi-view */
183*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->mvc_extension_enable, 1);
184*437bfbebSnyanmisaka         if (pp->mvc_extension_enable) {
185*437bfbebSnyanmisaka             mpp_put_bits(&bp, (pp->num_views_minus1 + 1), 2);
186*437bfbebSnyanmisaka             mpp_put_bits(&bp, pp->view_id[0], 10);
187*437bfbebSnyanmisaka             mpp_put_bits(&bp, pp->view_id[1], 10);
188*437bfbebSnyanmisaka         } else {
189*437bfbebSnyanmisaka             mpp_put_bits(&bp, 0, 22);
190*437bfbebSnyanmisaka         }
191*437bfbebSnyanmisaka         // hw_fifo_align_bits(&bp, 128);
192*437bfbebSnyanmisaka         //!< pps syntax
193*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->pps_pic_parameter_set_id, 8);
194*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->pps_seq_parameter_set_id, 5);
195*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->entropy_coding_mode_flag, 1);
196*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->pic_order_present_flag, 1);
197*437bfbebSnyanmisaka 
198*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->num_ref_idx_l0_active_minus1, 5);
199*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->num_ref_idx_l1_active_minus1, 5);
200*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->weighted_pred_flag, 1);
201*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->weighted_bipred_idc, 2);
202*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->pic_init_qp_minus26, 7);
203*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->pic_init_qs_minus26, 6);
204*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->chroma_qp_index_offset, 5);
205*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->deblocking_filter_control_present_flag, 1);
206*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->constrained_intra_pred_flag, 1);
207*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->redundant_pic_cnt_present_flag, 1);
208*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->transform_8x8_mode_flag, 1);
209*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->second_chroma_qp_index_offset, 5);
210*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->scaleing_list_enable_flag, 1);
211*437bfbebSnyanmisaka     }
212*437bfbebSnyanmisaka 
213*437bfbebSnyanmisaka     //!< set dpb
214*437bfbebSnyanmisaka     for (i = 0; i < 16; i++) {
215*437bfbebSnyanmisaka         is_long_term = (pp->RefFrameList[i].bPicEntry != 0xff) ? pp->RefFrameList[i].AssociatedFlag : 0;
216*437bfbebSnyanmisaka         tmp |= (RK_U32)(is_long_term & 0x1) << i;
217*437bfbebSnyanmisaka     }
218*437bfbebSnyanmisaka     for (i = 0; i < 16; i++) {
219*437bfbebSnyanmisaka         voidx = (pp->RefFrameList[i].bPicEntry != 0xff) ? pp->RefPicLayerIdList[i] : 0;
220*437bfbebSnyanmisaka         tmp |= (RK_U32)(voidx & 0x1) << (i + 16);
221*437bfbebSnyanmisaka     }
222*437bfbebSnyanmisaka     mpp_put_bits(&bp, tmp, 32);
223*437bfbebSnyanmisaka     /* set current frame */
224*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->field_pic_flag, 1);
225*437bfbebSnyanmisaka     mpp_put_bits(&bp, (pp->field_pic_flag && pp->CurrPic.AssociatedFlag), 1);
226*437bfbebSnyanmisaka 
227*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->CurrFieldOrderCnt[0], 32);
228*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->CurrFieldOrderCnt[1], 32);
229*437bfbebSnyanmisaka 
230*437bfbebSnyanmisaka     /* refer poc */
231*437bfbebSnyanmisaka     for (i = 0; i < 16; i++) {
232*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->FieldOrderCntList[i][0], 32);
233*437bfbebSnyanmisaka         mpp_put_bits(&bp, pp->FieldOrderCntList[i][1], 32);
234*437bfbebSnyanmisaka     }
235*437bfbebSnyanmisaka 
236*437bfbebSnyanmisaka     tmp = 0;
237*437bfbebSnyanmisaka     for (i = 0; i < 16; i++)
238*437bfbebSnyanmisaka         tmp |= ((pp->RefPicFiledFlags >> i) & 0x01) << i;
239*437bfbebSnyanmisaka     for (i = 0; i < 16; i++)
240*437bfbebSnyanmisaka         tmp |= ((pp->UsedForReferenceFlags >> (2 * i + 0)) & 0x01) << (i + 16);
241*437bfbebSnyanmisaka     mpp_put_bits(&bp, tmp, 32);
242*437bfbebSnyanmisaka 
243*437bfbebSnyanmisaka     tmp = 0;
244*437bfbebSnyanmisaka     for (i = 0; i < 16; i++)
245*437bfbebSnyanmisaka         tmp |= ((pp->UsedForReferenceFlags >> (2 * i + 1)) & 0x01) << i;
246*437bfbebSnyanmisaka     for (i = 0; i < 16; i++)
247*437bfbebSnyanmisaka         tmp |= ((pp->RefPicColmvUsedFlags >> i) & 0x01) << (i + 16);
248*437bfbebSnyanmisaka     mpp_put_bits(&bp, tmp, 32);
249*437bfbebSnyanmisaka 
250*437bfbebSnyanmisaka     /* rps */
251*437bfbebSnyanmisaka     {
252*437bfbebSnyanmisaka         RK_S32 dpb_idx = 0;
253*437bfbebSnyanmisaka         RK_S32 dpb_valid = 0, bottom_flag = 0;
254*437bfbebSnyanmisaka         RK_U32 max_frame_num = 0;
255*437bfbebSnyanmisaka         RK_U16 frame_num_wrap = 0;
256*437bfbebSnyanmisaka 
257*437bfbebSnyanmisaka         max_frame_num = 1 << (pp->log2_max_frame_num_minus4 + 4);
258*437bfbebSnyanmisaka         for (i = 0; i < 16; i++) {
259*437bfbebSnyanmisaka             if ((pp->NonExistingFrameFlags >> i) & 0x01) {
260*437bfbebSnyanmisaka                 frame_num_wrap = 0;
261*437bfbebSnyanmisaka             } else {
262*437bfbebSnyanmisaka                 if (pp->RefFrameList[i].AssociatedFlag) {
263*437bfbebSnyanmisaka                     frame_num_wrap = pp->FrameNumList[i];
264*437bfbebSnyanmisaka                 } else {
265*437bfbebSnyanmisaka                     frame_num_wrap = (pp->FrameNumList[i] > pp->frame_num) ?
266*437bfbebSnyanmisaka                                      (pp->FrameNumList[i] - max_frame_num) : pp->FrameNumList[i];
267*437bfbebSnyanmisaka                 }
268*437bfbebSnyanmisaka             }
269*437bfbebSnyanmisaka             mpp_put_bits(&bp, frame_num_wrap, 16);
270*437bfbebSnyanmisaka         }
271*437bfbebSnyanmisaka 
272*437bfbebSnyanmisaka         /* dbp_idx_p_l0_32x7bit + dbp_idx_b_l0_32x7bit + dbp_idx_b_l1_32x7bit */
273*437bfbebSnyanmisaka         for (j = 0; j < 3; j++) {
274*437bfbebSnyanmisaka             for (i = 0; i < 32; i++) {
275*437bfbebSnyanmisaka                 tmp = 0;
276*437bfbebSnyanmisaka                 dpb_valid = (p_hal->slice_long[0].RefPicList[j][i].bPicEntry == 0xff) ? 0 : 1;
277*437bfbebSnyanmisaka                 dpb_idx = dpb_valid ? p_hal->slice_long[0].RefPicList[j][i].Index7Bits : 0;
278*437bfbebSnyanmisaka                 bottom_flag = dpb_valid ? p_hal->slice_long[0].RefPicList[j][i].AssociatedFlag : 0;
279*437bfbebSnyanmisaka                 voidx = dpb_valid ? pp->RefPicLayerIdList[dpb_idx] : 0;
280*437bfbebSnyanmisaka                 tmp |= (RK_U32)(dpb_idx | (dpb_valid << 4)) & 0x1f;
281*437bfbebSnyanmisaka                 tmp |= (RK_U32)(bottom_flag & 0x1) << 5;
282*437bfbebSnyanmisaka                 if (dpb_valid)
283*437bfbebSnyanmisaka                     tmp |= (RK_U32)(voidx & 0x1) << 6;
284*437bfbebSnyanmisaka                 mpp_put_bits(&bp, tmp, 7);
285*437bfbebSnyanmisaka             }
286*437bfbebSnyanmisaka         }
287*437bfbebSnyanmisaka     }
288*437bfbebSnyanmisaka     mpp_put_align(&bp, 64, 0);//128
289*437bfbebSnyanmisaka 
290*437bfbebSnyanmisaka #ifdef DUMP_VDPU384A_DATAS
291*437bfbebSnyanmisaka     {
292*437bfbebSnyanmisaka         char *cur_fname = "global_cfg.dat";
293*437bfbebSnyanmisaka         memset(dump_cur_fname_path, 0, sizeof(dump_cur_fname_path));
294*437bfbebSnyanmisaka         sprintf(dump_cur_fname_path, "%s/%s", dump_cur_dir, cur_fname);
295*437bfbebSnyanmisaka         dump_data_to_file(dump_cur_fname_path, (void *)bp.pbuf, 64 * bp.index + bp.bitpos, 128, 0);
296*437bfbebSnyanmisaka     }
297*437bfbebSnyanmisaka #endif
298*437bfbebSnyanmisaka 
299*437bfbebSnyanmisaka     return MPP_OK;
300*437bfbebSnyanmisaka }
301*437bfbebSnyanmisaka 
prepare_scanlist(H264dHalCtx_t * p_hal,RK_U8 * data,RK_U32 len)302*437bfbebSnyanmisaka static MPP_RET prepare_scanlist(H264dHalCtx_t *p_hal, RK_U8 *data, RK_U32 len)
303*437bfbebSnyanmisaka {
304*437bfbebSnyanmisaka     RK_U32 i = 0, j = 0, n = 0;
305*437bfbebSnyanmisaka 
306*437bfbebSnyanmisaka     if (!p_hal->pp->scaleing_list_enable_flag)
307*437bfbebSnyanmisaka         return MPP_OK;
308*437bfbebSnyanmisaka 
309*437bfbebSnyanmisaka     for (i = 0; i < 6; i++) { //4x4, 6 lists
310*437bfbebSnyanmisaka         /* dump by block4x4, vectial direction */
311*437bfbebSnyanmisaka         for (j = 0; j < 4; j++) {
312*437bfbebSnyanmisaka             data[n++] = p_hal->qm->bScalingLists4x4[i][j * 4 + 0];
313*437bfbebSnyanmisaka             data[n++] = p_hal->qm->bScalingLists4x4[i][j * 4 + 1];
314*437bfbebSnyanmisaka             data[n++] = p_hal->qm->bScalingLists4x4[i][j * 4 + 2];
315*437bfbebSnyanmisaka             data[n++] = p_hal->qm->bScalingLists4x4[i][j * 4 + 3];
316*437bfbebSnyanmisaka         }
317*437bfbebSnyanmisaka     }
318*437bfbebSnyanmisaka 
319*437bfbebSnyanmisaka     for (i = 0; i < 2; i++) { //8x8, 2 lists
320*437bfbebSnyanmisaka         RK_U32 blk4_x = 0, blk4_y = 0;
321*437bfbebSnyanmisaka 
322*437bfbebSnyanmisaka         /* dump by block4x4, vectial direction */
323*437bfbebSnyanmisaka         for (blk4_y = 0; blk4_y < 8; blk4_y += 4) {
324*437bfbebSnyanmisaka             for (blk4_x = 0; blk4_x < 8; blk4_x += 4) {
325*437bfbebSnyanmisaka                 RK_U32 pos = blk4_y * 8 + blk4_x;
326*437bfbebSnyanmisaka 
327*437bfbebSnyanmisaka                 for (j = 0; j < 4; j++) {
328*437bfbebSnyanmisaka                     data[n++] = p_hal->qm->bScalingLists8x8[i][pos + j * 8 + 0];
329*437bfbebSnyanmisaka                     data[n++] = p_hal->qm->bScalingLists8x8[i][pos + j * 8 + 1];
330*437bfbebSnyanmisaka                     data[n++] = p_hal->qm->bScalingLists8x8[i][pos + j * 8 + 2];
331*437bfbebSnyanmisaka                     data[n++] = p_hal->qm->bScalingLists8x8[i][pos + j * 8 + 3];
332*437bfbebSnyanmisaka                 }
333*437bfbebSnyanmisaka             }
334*437bfbebSnyanmisaka         }
335*437bfbebSnyanmisaka     }
336*437bfbebSnyanmisaka 
337*437bfbebSnyanmisaka     mpp_assert(n <= len);
338*437bfbebSnyanmisaka 
339*437bfbebSnyanmisaka #ifdef DUMP_VDPU384A_DATAS
340*437bfbebSnyanmisaka     {
341*437bfbebSnyanmisaka         char *cur_fname = "scanlist.dat";
342*437bfbebSnyanmisaka         memset(dump_cur_fname_path, 0, sizeof(dump_cur_fname_path));
343*437bfbebSnyanmisaka         sprintf(dump_cur_fname_path, "%s/%s", dump_cur_dir, cur_fname);
344*437bfbebSnyanmisaka         dump_data_to_file(dump_cur_fname_path, (void *)data, 8 * n, 128, 0);
345*437bfbebSnyanmisaka     }
346*437bfbebSnyanmisaka #endif
347*437bfbebSnyanmisaka 
348*437bfbebSnyanmisaka     return MPP_OK;
349*437bfbebSnyanmisaka }
350*437bfbebSnyanmisaka 
set_registers(H264dHalCtx_t * p_hal,Vdpu384aH264dRegSet * regs,HalTaskInfo * task)351*437bfbebSnyanmisaka static MPP_RET set_registers(H264dHalCtx_t *p_hal, Vdpu384aH264dRegSet *regs, HalTaskInfo *task)
352*437bfbebSnyanmisaka {
353*437bfbebSnyanmisaka     DXVA_PicParams_H264_MVC *pp = p_hal->pp;
354*437bfbebSnyanmisaka     HalBuf *mv_buf = NULL;
355*437bfbebSnyanmisaka     HalBuf *origin_buf = NULL;
356*437bfbebSnyanmisaka     Vdpu384aH264dRegCtx *ctx = (Vdpu384aH264dRegCtx *)p_hal->reg_ctx;
357*437bfbebSnyanmisaka 
358*437bfbebSnyanmisaka     // memset(regs, 0, sizeof(Vdpu384aH264dRegSet));
359*437bfbebSnyanmisaka     regs->h264d_paras.reg66_stream_len = p_hal->strm_len;
360*437bfbebSnyanmisaka 
361*437bfbebSnyanmisaka     //!< caculate the yuv_frame_size
362*437bfbebSnyanmisaka     {
363*437bfbebSnyanmisaka         MppFrame mframe = NULL;
364*437bfbebSnyanmisaka         RK_U32 hor_virstride = 0;
365*437bfbebSnyanmisaka         RK_U32 ver_virstride = 0;
366*437bfbebSnyanmisaka         RK_U32 y_virstride = 0;
367*437bfbebSnyanmisaka         RK_U32 uv_virstride = 0;
368*437bfbebSnyanmisaka 
369*437bfbebSnyanmisaka         mpp_buf_slot_get_prop(p_hal->frame_slots, pp->CurrPic.Index7Bits, SLOT_FRAME_PTR, &mframe);
370*437bfbebSnyanmisaka         hor_virstride = mpp_frame_get_hor_stride(mframe);
371*437bfbebSnyanmisaka         ver_virstride = mpp_frame_get_ver_stride(mframe);
372*437bfbebSnyanmisaka         y_virstride = hor_virstride * ver_virstride;
373*437bfbebSnyanmisaka         uv_virstride = hor_virstride * ver_virstride / 2;
374*437bfbebSnyanmisaka 
375*437bfbebSnyanmisaka         if (MPP_FRAME_FMT_IS_FBC(mpp_frame_get_fmt(mframe))) {
376*437bfbebSnyanmisaka             RK_U32 fbc_hdr_stride = mpp_frame_get_fbc_hdr_stride(mframe);
377*437bfbebSnyanmisaka             RK_U32 fbd_offset;
378*437bfbebSnyanmisaka 
379*437bfbebSnyanmisaka             fbd_offset = fbc_hdr_stride * MPP_ALIGN(ver_virstride, 64) / 16;
380*437bfbebSnyanmisaka 
381*437bfbebSnyanmisaka             regs->ctrl_regs.reg9.dpb_data_sel = 0;
382*437bfbebSnyanmisaka             regs->ctrl_regs.reg9.dpb_output_dis = 0;
383*437bfbebSnyanmisaka             regs->ctrl_regs.reg9.pp_m_output_mode = 0;
384*437bfbebSnyanmisaka 
385*437bfbebSnyanmisaka             regs->h264d_paras.reg68_dpb_hor_virstride = fbc_hdr_stride / 64;
386*437bfbebSnyanmisaka             regs->h264d_addrs.reg193_dpb_fbc64x4_payload_offset = fbd_offset;
387*437bfbebSnyanmisaka             regs->h264d_paras.reg80_error_ref_hor_virstride = regs->h264d_paras.reg68_dpb_hor_virstride;
388*437bfbebSnyanmisaka         } else if (MPP_FRAME_FMT_IS_TILE(mpp_frame_get_fmt(mframe))) {
389*437bfbebSnyanmisaka             regs->ctrl_regs.reg9.dpb_data_sel = 1;
390*437bfbebSnyanmisaka             regs->ctrl_regs.reg9.dpb_output_dis = 1;
391*437bfbebSnyanmisaka             regs->ctrl_regs.reg9.pp_m_output_mode = 2;
392*437bfbebSnyanmisaka 
393*437bfbebSnyanmisaka             regs->h264d_paras.reg77_pp_m_hor_stride = hor_virstride * 6 / 16;
394*437bfbebSnyanmisaka             regs->h264d_paras.reg79_pp_m_y_virstride = (y_virstride + uv_virstride) / 16;
395*437bfbebSnyanmisaka             regs->h264d_paras.reg80_error_ref_hor_virstride = regs->h264d_paras.reg77_pp_m_hor_stride;
396*437bfbebSnyanmisaka         } else {
397*437bfbebSnyanmisaka             regs->ctrl_regs.reg9.dpb_data_sel = 1;
398*437bfbebSnyanmisaka             regs->ctrl_regs.reg9.dpb_output_dis = 1;
399*437bfbebSnyanmisaka             regs->ctrl_regs.reg9.pp_m_output_mode = 1;
400*437bfbebSnyanmisaka 
401*437bfbebSnyanmisaka             regs->h264d_paras.reg77_pp_m_hor_stride = hor_virstride / 16;
402*437bfbebSnyanmisaka             regs->h264d_paras.reg78_pp_m_uv_hor_stride = hor_virstride / 16;
403*437bfbebSnyanmisaka             regs->h264d_paras.reg79_pp_m_y_virstride = y_virstride / 16;
404*437bfbebSnyanmisaka             regs->h264d_paras.reg80_error_ref_hor_virstride = regs->h264d_paras.reg77_pp_m_hor_stride;
405*437bfbebSnyanmisaka         }
406*437bfbebSnyanmisaka         regs->h264d_paras.reg81_error_ref_raster_uv_hor_virstride = regs->h264d_paras.reg78_pp_m_uv_hor_stride;
407*437bfbebSnyanmisaka         regs->h264d_paras.reg82_error_ref_virstride = regs->h264d_paras.reg79_pp_m_y_virstride;
408*437bfbebSnyanmisaka     }
409*437bfbebSnyanmisaka     //!< set current
410*437bfbebSnyanmisaka     {
411*437bfbebSnyanmisaka         MppBuffer mbuffer = NULL;
412*437bfbebSnyanmisaka         RK_S32 fd = -1;
413*437bfbebSnyanmisaka 
414*437bfbebSnyanmisaka         mpp_buf_slot_get_prop(p_hal->frame_slots, pp->CurrPic.Index7Bits, SLOT_BUFFER, &mbuffer);
415*437bfbebSnyanmisaka         fd = mpp_buffer_get_fd(mbuffer);
416*437bfbebSnyanmisaka         /* output rkfbc64 */
417*437bfbebSnyanmisaka         // regs->h264d_addrs.reg168_dpb_decout_base = fd;
418*437bfbebSnyanmisaka         /* output raster/tile4x4 */
419*437bfbebSnyanmisaka         regs->common_addr.reg135_pp_m_decout_base = fd;
420*437bfbebSnyanmisaka         regs->h264d_addrs.reg192_dpb_payload64x4_st_cur_base = fd;
421*437bfbebSnyanmisaka 
422*437bfbebSnyanmisaka         //colmv_cur_base
423*437bfbebSnyanmisaka         mv_buf = hal_bufs_get_buf(p_hal->cmv_bufs, pp->CurrPic.Index7Bits);
424*437bfbebSnyanmisaka         regs->h264d_addrs.reg216_colmv_cur_base = mpp_buffer_get_fd(mv_buf->buf[0]);
425*437bfbebSnyanmisaka         regs->h264d_addrs.reg169_error_ref_base = fd;
426*437bfbebSnyanmisaka     }
427*437bfbebSnyanmisaka     //!< set reference
428*437bfbebSnyanmisaka     {
429*437bfbebSnyanmisaka         RK_S32 i = 0;
430*437bfbebSnyanmisaka         RK_S32 fd = -1;
431*437bfbebSnyanmisaka         RK_S32 ref_index = -1;
432*437bfbebSnyanmisaka         RK_S32 near_index = -1;
433*437bfbebSnyanmisaka         MppBuffer mbuffer = NULL;
434*437bfbebSnyanmisaka         RK_U32 min_frame_num  = 0;
435*437bfbebSnyanmisaka         MppFrame mframe = NULL;
436*437bfbebSnyanmisaka 
437*437bfbebSnyanmisaka         for (i = 0; i < 15; i++) {
438*437bfbebSnyanmisaka             if (pp->RefFrameList[i].bPicEntry != 0xff) {
439*437bfbebSnyanmisaka                 ref_index = pp->RefFrameList[i].Index7Bits;
440*437bfbebSnyanmisaka                 near_index = pp->RefFrameList[i].Index7Bits;
441*437bfbebSnyanmisaka             } else {
442*437bfbebSnyanmisaka                 ref_index = (near_index < 0) ? pp->CurrPic.Index7Bits : near_index;
443*437bfbebSnyanmisaka             }
444*437bfbebSnyanmisaka             /* mark 3 to differ from current frame */
445*437bfbebSnyanmisaka             mpp_buf_slot_get_prop(p_hal->frame_slots, ref_index, SLOT_BUFFER, &mbuffer);
446*437bfbebSnyanmisaka             mpp_buf_slot_get_prop(p_hal->frame_slots, ref_index, SLOT_FRAME_PTR, &mframe);
447*437bfbebSnyanmisaka             if (ctx->origin_bufs && mpp_frame_get_thumbnail_en(mframe) == MPP_FRAME_THUMBNAIL_ONLY) {
448*437bfbebSnyanmisaka                 origin_buf = hal_bufs_get_buf(ctx->origin_bufs, ref_index);
449*437bfbebSnyanmisaka                 mbuffer = origin_buf->buf[0];
450*437bfbebSnyanmisaka             }
451*437bfbebSnyanmisaka 
452*437bfbebSnyanmisaka             if (pp->FrameNumList[i] < pp->frame_num &&
453*437bfbebSnyanmisaka                 pp->FrameNumList[i] > min_frame_num &&
454*437bfbebSnyanmisaka                 (!mpp_frame_get_errinfo(mframe))) {
455*437bfbebSnyanmisaka                 min_frame_num = pp->FrameNumList[i];
456*437bfbebSnyanmisaka                 regs->h264d_addrs.reg169_error_ref_base = mpp_buffer_get_fd(mbuffer);
457*437bfbebSnyanmisaka             }
458*437bfbebSnyanmisaka 
459*437bfbebSnyanmisaka             fd = mpp_buffer_get_fd(mbuffer);
460*437bfbebSnyanmisaka             regs->h264d_addrs.reg170_185_ref_base[i] = fd;
461*437bfbebSnyanmisaka             regs->h264d_addrs.reg195_210_payload_st_ref_base[i] = fd;
462*437bfbebSnyanmisaka             mv_buf = hal_bufs_get_buf(p_hal->cmv_bufs, ref_index);
463*437bfbebSnyanmisaka             regs->h264d_addrs.reg217_232_colmv_ref_base[i] = mpp_buffer_get_fd(mv_buf->buf[0]);
464*437bfbebSnyanmisaka         }
465*437bfbebSnyanmisaka 
466*437bfbebSnyanmisaka         if (pp->RefFrameList[15].bPicEntry != 0xff) {
467*437bfbebSnyanmisaka             ref_index = pp->RefFrameList[15].Index7Bits;
468*437bfbebSnyanmisaka         } else {
469*437bfbebSnyanmisaka             ref_index = (near_index < 0) ? pp->CurrPic.Index7Bits : near_index;
470*437bfbebSnyanmisaka         }
471*437bfbebSnyanmisaka 
472*437bfbebSnyanmisaka         mpp_buf_slot_get_prop(p_hal->frame_slots, ref_index, SLOT_BUFFER, &mbuffer);
473*437bfbebSnyanmisaka         fd = mpp_buffer_get_fd(mbuffer);
474*437bfbebSnyanmisaka         if (mpp_frame_get_thumbnail_en(mframe) == 2) {
475*437bfbebSnyanmisaka             origin_buf = hal_bufs_get_buf(ctx->origin_bufs, ref_index);
476*437bfbebSnyanmisaka             fd = mpp_buffer_get_fd(origin_buf->buf[0]);
477*437bfbebSnyanmisaka         }
478*437bfbebSnyanmisaka         regs->h264d_addrs.reg170_185_ref_base[15] = fd;
479*437bfbebSnyanmisaka         regs->h264d_addrs.reg195_210_payload_st_ref_base[15] = fd;
480*437bfbebSnyanmisaka         mv_buf = hal_bufs_get_buf(p_hal->cmv_bufs, ref_index);
481*437bfbebSnyanmisaka         regs->h264d_addrs.reg217_232_colmv_ref_base[15] = mpp_buffer_get_fd(mv_buf->buf[0]);
482*437bfbebSnyanmisaka     }
483*437bfbebSnyanmisaka     {
484*437bfbebSnyanmisaka         MppBuffer mbuffer = NULL;
485*437bfbebSnyanmisaka 
486*437bfbebSnyanmisaka         mpp_buf_slot_get_prop(p_hal->packet_slots, task->dec.input, SLOT_BUFFER, &mbuffer);
487*437bfbebSnyanmisaka         regs->common_addr.reg128_strm_base = mpp_buffer_get_fd(mbuffer);
488*437bfbebSnyanmisaka         regs->common_addr.reg129_stream_buf_st_base = mpp_buffer_get_fd(mbuffer);
489*437bfbebSnyanmisaka         regs->common_addr.reg130_stream_buf_end_base = mpp_buffer_get_fd(mbuffer);
490*437bfbebSnyanmisaka         mpp_dev_set_reg_offset(p_hal->dev, 130, mpp_buffer_get_size(mbuffer));
491*437bfbebSnyanmisaka         // regs->h264d_paras.reg65_strm_start_bit = 2 * 8;
492*437bfbebSnyanmisaka #ifdef DUMP_VDPU384A_DATAS
493*437bfbebSnyanmisaka         {
494*437bfbebSnyanmisaka             char *cur_fname = "stream_in.dat";
495*437bfbebSnyanmisaka             memset(dump_cur_fname_path, 0, sizeof(dump_cur_fname_path));
496*437bfbebSnyanmisaka             sprintf(dump_cur_fname_path, "%s/%s", dump_cur_dir, cur_fname);
497*437bfbebSnyanmisaka             dump_data_to_file(dump_cur_fname_path, (void *)mpp_buffer_get_ptr(mbuffer),
498*437bfbebSnyanmisaka                               8 * p_hal->strm_len, 128, 0);
499*437bfbebSnyanmisaka         }
500*437bfbebSnyanmisaka #endif
501*437bfbebSnyanmisaka     }
502*437bfbebSnyanmisaka 
503*437bfbebSnyanmisaka     {
504*437bfbebSnyanmisaka         //scale down config
505*437bfbebSnyanmisaka         MppFrame mframe = NULL;
506*437bfbebSnyanmisaka         MppBuffer mbuffer = NULL;
507*437bfbebSnyanmisaka         RK_S32 fd = -1;
508*437bfbebSnyanmisaka         MppFrameThumbnailMode thumbnail_mode;
509*437bfbebSnyanmisaka 
510*437bfbebSnyanmisaka         mpp_buf_slot_get_prop(p_hal->frame_slots, pp->CurrPic.Index7Bits, SLOT_BUFFER, &mbuffer);
511*437bfbebSnyanmisaka         mpp_buf_slot_get_prop(p_hal->frame_slots, pp->CurrPic.Index7Bits,
512*437bfbebSnyanmisaka                               SLOT_FRAME_PTR, &mframe);
513*437bfbebSnyanmisaka         fd = mpp_buffer_get_fd(mbuffer);
514*437bfbebSnyanmisaka         thumbnail_mode = mpp_frame_get_thumbnail_en(mframe);
515*437bfbebSnyanmisaka         switch (thumbnail_mode) {
516*437bfbebSnyanmisaka         case MPP_FRAME_THUMBNAIL_ONLY:
517*437bfbebSnyanmisaka             regs->common_addr.reg133_scale_down_base = fd;
518*437bfbebSnyanmisaka             origin_buf = hal_bufs_get_buf(ctx->origin_bufs, pp->CurrPic.Index7Bits);
519*437bfbebSnyanmisaka             fd = mpp_buffer_get_fd(origin_buf->buf[0]);
520*437bfbebSnyanmisaka             /* output rkfbc64 */
521*437bfbebSnyanmisaka             // regs->h264d_addrs.reg168_dpb_decout_base = fd;
522*437bfbebSnyanmisaka             /* output raster/tile4x4 */
523*437bfbebSnyanmisaka             regs->common_addr.reg135_pp_m_decout_base = fd;
524*437bfbebSnyanmisaka             regs->h264d_addrs.reg192_dpb_payload64x4_st_cur_base = fd;
525*437bfbebSnyanmisaka             regs->h264d_addrs.reg169_error_ref_base = fd;
526*437bfbebSnyanmisaka             vdpu384a_setup_down_scale(mframe, p_hal->dev, &regs->ctrl_regs, (void*)&regs->h264d_paras);
527*437bfbebSnyanmisaka             break;
528*437bfbebSnyanmisaka         case MPP_FRAME_THUMBNAIL_MIXED:
529*437bfbebSnyanmisaka             regs->common_addr.reg133_scale_down_base = fd;
530*437bfbebSnyanmisaka             vdpu384a_setup_down_scale(mframe, p_hal->dev, &regs->ctrl_regs, (void*)&regs->h264d_paras);
531*437bfbebSnyanmisaka             break;
532*437bfbebSnyanmisaka         case MPP_FRAME_THUMBNAIL_NONE:
533*437bfbebSnyanmisaka         default:
534*437bfbebSnyanmisaka             regs->ctrl_regs.reg9.scale_down_en = 0;
535*437bfbebSnyanmisaka             break;
536*437bfbebSnyanmisaka         }
537*437bfbebSnyanmisaka     }
538*437bfbebSnyanmisaka 
539*437bfbebSnyanmisaka     return MPP_OK;
540*437bfbebSnyanmisaka }
541*437bfbebSnyanmisaka 
init_ctrl_regs(Vdpu384aH264dRegSet * regs)542*437bfbebSnyanmisaka static MPP_RET init_ctrl_regs(Vdpu384aH264dRegSet *regs)
543*437bfbebSnyanmisaka {
544*437bfbebSnyanmisaka     Vdpu384aCtrlReg *ctrl_regs = &regs->ctrl_regs;
545*437bfbebSnyanmisaka 
546*437bfbebSnyanmisaka     ctrl_regs->reg8_dec_mode = 1;  //!< h264
547*437bfbebSnyanmisaka     ctrl_regs->reg9.low_latency_en = 0;
548*437bfbebSnyanmisaka 
549*437bfbebSnyanmisaka     ctrl_regs->reg10.strmd_auto_gating_e      = 1;
550*437bfbebSnyanmisaka     ctrl_regs->reg10.inter_auto_gating_e      = 1;
551*437bfbebSnyanmisaka     ctrl_regs->reg10.intra_auto_gating_e      = 1;
552*437bfbebSnyanmisaka     ctrl_regs->reg10.transd_auto_gating_e     = 1;
553*437bfbebSnyanmisaka     ctrl_regs->reg10.recon_auto_gating_e      = 1;
554*437bfbebSnyanmisaka     ctrl_regs->reg10.filterd_auto_gating_e    = 1;
555*437bfbebSnyanmisaka     ctrl_regs->reg10.bus_auto_gating_e        = 1;
556*437bfbebSnyanmisaka     ctrl_regs->reg10.ctrl_auto_gating_e       = 1;
557*437bfbebSnyanmisaka     ctrl_regs->reg10.rcb_auto_gating_e        = 1;
558*437bfbebSnyanmisaka     ctrl_regs->reg10.err_prc_auto_gating_e    = 1;
559*437bfbebSnyanmisaka 
560*437bfbebSnyanmisaka     ctrl_regs->reg11.rd_outstanding = 32;
561*437bfbebSnyanmisaka     ctrl_regs->reg11.wr_outstanding = 250;
562*437bfbebSnyanmisaka 
563*437bfbebSnyanmisaka     ctrl_regs->reg13_core_timeout_threshold = 0xffffff;
564*437bfbebSnyanmisaka 
565*437bfbebSnyanmisaka     ctrl_regs->reg16.error_proc_disable = 1;
566*437bfbebSnyanmisaka     ctrl_regs->reg16.error_spread_disable = 0;
567*437bfbebSnyanmisaka     ctrl_regs->reg16.roi_error_ctu_cal_en = 0;
568*437bfbebSnyanmisaka 
569*437bfbebSnyanmisaka     ctrl_regs->reg20_cabac_error_en_lowbits = 0xfffedfff;
570*437bfbebSnyanmisaka     ctrl_regs->reg21_cabac_error_en_highbits = 0x0ffbf9ff;
571*437bfbebSnyanmisaka 
572*437bfbebSnyanmisaka     /* performance */
573*437bfbebSnyanmisaka     ctrl_regs->reg28.axi_perf_work_e = 1;
574*437bfbebSnyanmisaka     ctrl_regs->reg28.axi_cnt_type = 1;
575*437bfbebSnyanmisaka     ctrl_regs->reg28.rd_latency_id = 11;
576*437bfbebSnyanmisaka 
577*437bfbebSnyanmisaka     ctrl_regs->reg29.addr_align_type = 2;
578*437bfbebSnyanmisaka     ctrl_regs->reg29.ar_cnt_id_type = 0;
579*437bfbebSnyanmisaka     ctrl_regs->reg29.aw_cnt_id_type = 0;
580*437bfbebSnyanmisaka     ctrl_regs->reg29.ar_count_id = 0xa;
581*437bfbebSnyanmisaka     ctrl_regs->reg29.aw_count_id = 0;
582*437bfbebSnyanmisaka     ctrl_regs->reg29.rd_band_width_mode = 0;
583*437bfbebSnyanmisaka 
584*437bfbebSnyanmisaka     return MPP_OK;
585*437bfbebSnyanmisaka }
586*437bfbebSnyanmisaka 
vdpu384a_h264d_init(void * hal,MppHalCfg * cfg)587*437bfbebSnyanmisaka MPP_RET vdpu384a_h264d_init(void *hal, MppHalCfg *cfg)
588*437bfbebSnyanmisaka {
589*437bfbebSnyanmisaka     MPP_RET ret = MPP_ERR_UNKNOW;
590*437bfbebSnyanmisaka     H264dHalCtx_t *p_hal = (H264dHalCtx_t *)hal;
591*437bfbebSnyanmisaka 
592*437bfbebSnyanmisaka     INP_CHECK(ret, NULL == p_hal);
593*437bfbebSnyanmisaka     (void) cfg;
594*437bfbebSnyanmisaka 
595*437bfbebSnyanmisaka     MEM_CHECK(ret, p_hal->reg_ctx = mpp_calloc_size(void, sizeof(Vdpu384aH264dRegCtx)));
596*437bfbebSnyanmisaka     Vdpu384aH264dRegCtx *reg_ctx = (Vdpu384aH264dRegCtx *)p_hal->reg_ctx;
597*437bfbebSnyanmisaka     RK_U32 max_cnt = p_hal->fast_mode ? VDPU384A_FAST_REG_SET_CNT : 1;
598*437bfbebSnyanmisaka     RK_U32 i = 0;
599*437bfbebSnyanmisaka 
600*437bfbebSnyanmisaka     //!< malloc buffers
601*437bfbebSnyanmisaka     FUN_CHECK(ret = mpp_buffer_get(p_hal->buf_group, &reg_ctx->bufs,
602*437bfbebSnyanmisaka                                    VDPU384A_INFO_BUFFER_SIZE(max_cnt)));
603*437bfbebSnyanmisaka     reg_ctx->bufs_fd = mpp_buffer_get_fd(reg_ctx->bufs);
604*437bfbebSnyanmisaka     reg_ctx->bufs_ptr = mpp_buffer_get_ptr(reg_ctx->bufs);
605*437bfbebSnyanmisaka     reg_ctx->offset_errinfo = VDPU384A_ERROR_INFO_OFFSET;
606*437bfbebSnyanmisaka     for (i = 0; i < max_cnt; i++) {
607*437bfbebSnyanmisaka         reg_ctx->reg_buf[i].regs = mpp_calloc(Vdpu384aH264dRegSet, 1);
608*437bfbebSnyanmisaka         init_ctrl_regs(reg_ctx->reg_buf[i].regs);
609*437bfbebSnyanmisaka         reg_ctx->offset_spspps[i] = VDPU384A_SPSPPS_OFFSET(i);
610*437bfbebSnyanmisaka         reg_ctx->offset_sclst[i] = VDPU384A_SCALING_LIST_OFFSET(i);
611*437bfbebSnyanmisaka     }
612*437bfbebSnyanmisaka 
613*437bfbebSnyanmisaka     mpp_buffer_attach_dev(reg_ctx->bufs, p_hal->dev);
614*437bfbebSnyanmisaka 
615*437bfbebSnyanmisaka     if (!p_hal->fast_mode) {
616*437bfbebSnyanmisaka         reg_ctx->regs = reg_ctx->reg_buf[0].regs;
617*437bfbebSnyanmisaka         reg_ctx->spspps_offset = reg_ctx->offset_spspps[0];
618*437bfbebSnyanmisaka         reg_ctx->sclst_offset = reg_ctx->offset_sclst[0];
619*437bfbebSnyanmisaka     }
620*437bfbebSnyanmisaka 
621*437bfbebSnyanmisaka     mpp_slots_set_prop(p_hal->frame_slots, SLOTS_HOR_ALIGN, mpp_align_128_odd_plus_64);
622*437bfbebSnyanmisaka     mpp_slots_set_prop(p_hal->frame_slots, SLOTS_VER_ALIGN, rkv_ver_align);
623*437bfbebSnyanmisaka     mpp_slots_set_prop(p_hal->frame_slots, SLOTS_LEN_ALIGN, rkv_len_align);
624*437bfbebSnyanmisaka 
625*437bfbebSnyanmisaka     if (cfg->hal_fbc_adj_cfg) {
626*437bfbebSnyanmisaka         cfg->hal_fbc_adj_cfg->func = vdpu384a_afbc_align_calc;
627*437bfbebSnyanmisaka         cfg->hal_fbc_adj_cfg->expand = 16;
628*437bfbebSnyanmisaka     }
629*437bfbebSnyanmisaka 
630*437bfbebSnyanmisaka __RETURN:
631*437bfbebSnyanmisaka     return MPP_OK;
632*437bfbebSnyanmisaka __FAILED:
633*437bfbebSnyanmisaka     vdpu384a_h264d_deinit(hal);
634*437bfbebSnyanmisaka 
635*437bfbebSnyanmisaka     return ret;
636*437bfbebSnyanmisaka }
637*437bfbebSnyanmisaka 
vdpu384a_h264d_deinit(void * hal)638*437bfbebSnyanmisaka MPP_RET vdpu384a_h264d_deinit(void *hal)
639*437bfbebSnyanmisaka {
640*437bfbebSnyanmisaka     H264dHalCtx_t *p_hal = (H264dHalCtx_t *)hal;
641*437bfbebSnyanmisaka     Vdpu384aH264dRegCtx *reg_ctx = (Vdpu384aH264dRegCtx *)p_hal->reg_ctx;
642*437bfbebSnyanmisaka 
643*437bfbebSnyanmisaka     RK_U32 i = 0;
644*437bfbebSnyanmisaka     RK_U32 loop = p_hal->fast_mode ? MPP_ARRAY_ELEMS(reg_ctx->reg_buf) : 1;
645*437bfbebSnyanmisaka 
646*437bfbebSnyanmisaka     if (reg_ctx->bufs) {
647*437bfbebSnyanmisaka         mpp_buffer_put(reg_ctx->bufs);
648*437bfbebSnyanmisaka         reg_ctx->bufs = NULL;
649*437bfbebSnyanmisaka     }
650*437bfbebSnyanmisaka 
651*437bfbebSnyanmisaka     for (i = 0; i < loop; i++)
652*437bfbebSnyanmisaka         MPP_FREE(reg_ctx->reg_buf[i].regs);
653*437bfbebSnyanmisaka 
654*437bfbebSnyanmisaka     loop = p_hal->fast_mode ? MPP_ARRAY_ELEMS(reg_ctx->rcb_buf) : 1;
655*437bfbebSnyanmisaka     for (i = 0; i < loop; i++) {
656*437bfbebSnyanmisaka         if (reg_ctx->rcb_buf[i]) {
657*437bfbebSnyanmisaka             mpp_buffer_put(reg_ctx->rcb_buf[i]);
658*437bfbebSnyanmisaka             reg_ctx->rcb_buf[i] = NULL;
659*437bfbebSnyanmisaka         }
660*437bfbebSnyanmisaka     }
661*437bfbebSnyanmisaka 
662*437bfbebSnyanmisaka     if (p_hal->cmv_bufs) {
663*437bfbebSnyanmisaka         hal_bufs_deinit(p_hal->cmv_bufs);
664*437bfbebSnyanmisaka         p_hal->cmv_bufs = NULL;
665*437bfbebSnyanmisaka     }
666*437bfbebSnyanmisaka 
667*437bfbebSnyanmisaka     if (reg_ctx->origin_bufs) {
668*437bfbebSnyanmisaka         hal_bufs_deinit(reg_ctx->origin_bufs);
669*437bfbebSnyanmisaka         reg_ctx->origin_bufs = NULL;
670*437bfbebSnyanmisaka     }
671*437bfbebSnyanmisaka 
672*437bfbebSnyanmisaka     MPP_FREE(p_hal->reg_ctx);
673*437bfbebSnyanmisaka 
674*437bfbebSnyanmisaka     return MPP_OK;
675*437bfbebSnyanmisaka }
676*437bfbebSnyanmisaka 
h264d_refine_rcb_size(H264dHalCtx_t * p_hal,Vdpu384aRcbInfo * rcb_info,RK_S32 width,RK_S32 height)677*437bfbebSnyanmisaka static void h264d_refine_rcb_size(H264dHalCtx_t *p_hal, Vdpu384aRcbInfo *rcb_info,
678*437bfbebSnyanmisaka                                   RK_S32 width, RK_S32 height)
679*437bfbebSnyanmisaka {
680*437bfbebSnyanmisaka     RK_U32 rcb_bits = 0;
681*437bfbebSnyanmisaka     RK_U32 mbaff = p_hal->pp->MbaffFrameFlag;
682*437bfbebSnyanmisaka     RK_U32 bit_depth = p_hal->pp->bit_depth_luma_minus8 + 8;
683*437bfbebSnyanmisaka     RK_U32 chroma_format_idc = p_hal->pp->chroma_format_idc;
684*437bfbebSnyanmisaka     RK_U32 row_uv_para = 1; // for yuv420/yuv422
685*437bfbebSnyanmisaka     RK_U32 filterd_row_append = 8192;
686*437bfbebSnyanmisaka 
687*437bfbebSnyanmisaka     // vdpu384a h264d support yuv400/yuv420/yuv422
688*437bfbebSnyanmisaka     if (chroma_format_idc == 0)
689*437bfbebSnyanmisaka         row_uv_para = 0;
690*437bfbebSnyanmisaka 
691*437bfbebSnyanmisaka     width = MPP_ALIGN(width, H264_CTU_SIZE);
692*437bfbebSnyanmisaka     height = MPP_ALIGN(height, H264_CTU_SIZE);
693*437bfbebSnyanmisaka     /* RCB_STRMD_ROW && RCB_STRMD_TILE_ROW*/
694*437bfbebSnyanmisaka     if (width > 4096)
695*437bfbebSnyanmisaka         rcb_bits = ((width + 15) / 16) * 158 * (mbaff ? 2 : 1);
696*437bfbebSnyanmisaka     else
697*437bfbebSnyanmisaka         rcb_bits = 0;
698*437bfbebSnyanmisaka     rcb_info[RCB_STRMD_ROW].size = MPP_RCB_BYTES(rcb_bits);
699*437bfbebSnyanmisaka     rcb_info[RCB_STRMD_TILE_ROW].size = MPP_RCB_BYTES(rcb_bits);
700*437bfbebSnyanmisaka     /* RCB_INTER_ROW && RCB_INTER_TILE_ROW*/
701*437bfbebSnyanmisaka     rcb_bits = ((width + 3) / 4) * 92 * (mbaff ? 2 : 1);
702*437bfbebSnyanmisaka     rcb_info[RCB_INTER_ROW].size = MPP_RCB_BYTES(rcb_bits);
703*437bfbebSnyanmisaka     rcb_info[RCB_INTER_TILE_ROW].size = MPP_RCB_BYTES(rcb_bits);
704*437bfbebSnyanmisaka     /* RCB_INTRA_ROW && RCB_INTRA_TILE_ROW*/
705*437bfbebSnyanmisaka     rcb_bits = MPP_ALIGN(width, 512) * (bit_depth + 2) * (mbaff ? 2 : 1);
706*437bfbebSnyanmisaka     if (chroma_format_idc == 1 || chroma_format_idc == 2)
707*437bfbebSnyanmisaka         rcb_bits = rcb_bits * 5 / 2; //TODO:
708*437bfbebSnyanmisaka 
709*437bfbebSnyanmisaka     rcb_info[RCB_INTRA_ROW].size = MPP_RCB_BYTES(rcb_bits);
710*437bfbebSnyanmisaka     rcb_info[RCB_INTRA_TILE_ROW].size = 0;
711*437bfbebSnyanmisaka     /* RCB_FILTERD_ROW && RCB_FILTERD_PROTECT_ROW*/
712*437bfbebSnyanmisaka     // save space mode : half for RCB_FILTERD_ROW, half for RCB_FILTERD_PROTECT_ROW
713*437bfbebSnyanmisaka     rcb_bits = width * 13 * ((6 + 3 * row_uv_para) * (mbaff ? 2 : 1) + 2 * row_uv_para + 1.5);
714*437bfbebSnyanmisaka     if (width > 4096)
715*437bfbebSnyanmisaka         filterd_row_append = 27648;
716*437bfbebSnyanmisaka     rcb_info[RCB_FILTERD_ROW].size = filterd_row_append + MPP_RCB_BYTES(rcb_bits / 2);
717*437bfbebSnyanmisaka     rcb_info[RCB_FILTERD_PROTECT_ROW].size = filterd_row_append + MPP_RCB_BYTES(rcb_bits / 2);
718*437bfbebSnyanmisaka 
719*437bfbebSnyanmisaka     rcb_info[RCB_FILTERD_TILE_ROW].size = 0;
720*437bfbebSnyanmisaka     /* RCB_FILTERD_TILE_COL */
721*437bfbebSnyanmisaka     rcb_info[RCB_FILTERD_TILE_COL].size = 0;
722*437bfbebSnyanmisaka 
723*437bfbebSnyanmisaka }
724*437bfbebSnyanmisaka 
hal_h264d_rcb_info_update(void * hal)725*437bfbebSnyanmisaka static void hal_h264d_rcb_info_update(void *hal)
726*437bfbebSnyanmisaka {
727*437bfbebSnyanmisaka     H264dHalCtx_t *p_hal = (H264dHalCtx_t*)hal;
728*437bfbebSnyanmisaka     RK_U32 mbaff = p_hal->pp->MbaffFrameFlag;
729*437bfbebSnyanmisaka     RK_U32 bit_depth = p_hal->pp->bit_depth_luma_minus8 + 8;
730*437bfbebSnyanmisaka     RK_U32 chroma_format_idc = p_hal->pp->chroma_format_idc;
731*437bfbebSnyanmisaka     Vdpu384aH264dRegCtx *ctx = (Vdpu384aH264dRegCtx *)p_hal->reg_ctx;
732*437bfbebSnyanmisaka     RK_S32 width = MPP_ALIGN((p_hal->pp->wFrameWidthInMbsMinus1 + 1) << 4, 64);
733*437bfbebSnyanmisaka     RK_S32 height = MPP_ALIGN((p_hal->pp->wFrameHeightInMbsMinus1 + 1) << 4, 64);
734*437bfbebSnyanmisaka 
735*437bfbebSnyanmisaka     if ( ctx->bit_depth != bit_depth ||
736*437bfbebSnyanmisaka          ctx->chroma_format_idc != chroma_format_idc ||
737*437bfbebSnyanmisaka          ctx->mbaff != mbaff ||
738*437bfbebSnyanmisaka          ctx->width != width ||
739*437bfbebSnyanmisaka          ctx->height != height) {
740*437bfbebSnyanmisaka         RK_U32 i;
741*437bfbebSnyanmisaka         RK_U32 loop = p_hal->fast_mode ? MPP_ARRAY_ELEMS(ctx->reg_buf) : 1;
742*437bfbebSnyanmisaka 
743*437bfbebSnyanmisaka         ctx->rcb_buf_size = vdpu384a_get_rcb_buf_size(ctx->rcb_info, width, height);
744*437bfbebSnyanmisaka         h264d_refine_rcb_size(hal, ctx->rcb_info, width, height);
745*437bfbebSnyanmisaka         /* vdpu384a_check_rcb_buf_size(ctx->rcb_info, width, height); */
746*437bfbebSnyanmisaka         for (i = 0; i < loop; i++) {
747*437bfbebSnyanmisaka             MppBuffer rcb_buf = ctx->rcb_buf[i];
748*437bfbebSnyanmisaka 
749*437bfbebSnyanmisaka             if (rcb_buf) {
750*437bfbebSnyanmisaka                 mpp_buffer_put(rcb_buf);
751*437bfbebSnyanmisaka                 ctx->rcb_buf[i] = NULL;
752*437bfbebSnyanmisaka             }
753*437bfbebSnyanmisaka             mpp_buffer_get(p_hal->buf_group, &rcb_buf, ctx->rcb_buf_size);
754*437bfbebSnyanmisaka             ctx->rcb_buf[i] = rcb_buf;
755*437bfbebSnyanmisaka         }
756*437bfbebSnyanmisaka         ctx->bit_depth      = bit_depth;
757*437bfbebSnyanmisaka         ctx->width          = width;
758*437bfbebSnyanmisaka         ctx->height         = height;
759*437bfbebSnyanmisaka         ctx->mbaff          = mbaff;
760*437bfbebSnyanmisaka         ctx->chroma_format_idc = chroma_format_idc;
761*437bfbebSnyanmisaka     }
762*437bfbebSnyanmisaka }
763*437bfbebSnyanmisaka 
vdpu384a_h264d_gen_regs(void * hal,HalTaskInfo * task)764*437bfbebSnyanmisaka MPP_RET vdpu384a_h264d_gen_regs(void *hal, HalTaskInfo *task)
765*437bfbebSnyanmisaka {
766*437bfbebSnyanmisaka     MPP_RET ret = MPP_ERR_UNKNOW;
767*437bfbebSnyanmisaka     H264dHalCtx_t *p_hal = (H264dHalCtx_t *)hal;
768*437bfbebSnyanmisaka     RK_S32 width = MPP_ALIGN((p_hal->pp->wFrameWidthInMbsMinus1 + 1) << 4, 64);
769*437bfbebSnyanmisaka     RK_S32 height = MPP_ALIGN((p_hal->pp->wFrameHeightInMbsMinus1 + 1) << 4, 64);
770*437bfbebSnyanmisaka     Vdpu384aH264dRegCtx *ctx = (Vdpu384aH264dRegCtx *)p_hal->reg_ctx;
771*437bfbebSnyanmisaka     Vdpu384aH264dRegSet *regs = ctx->regs;
772*437bfbebSnyanmisaka     MppFrame mframe;
773*437bfbebSnyanmisaka     RK_S32 mv_size = MPP_ALIGN(width, 64) * MPP_ALIGN(height, 16); // 16 byte unit
774*437bfbebSnyanmisaka 
775*437bfbebSnyanmisaka     INP_CHECK(ret, NULL == p_hal);
776*437bfbebSnyanmisaka 
777*437bfbebSnyanmisaka     if (task->dec.flags.parse_err ||
778*437bfbebSnyanmisaka         (task->dec.flags.ref_err && !p_hal->cfg->base.disable_error)) {
779*437bfbebSnyanmisaka         goto __RETURN;
780*437bfbebSnyanmisaka     }
781*437bfbebSnyanmisaka 
782*437bfbebSnyanmisaka     /* if is field mode is enabled enlarge colmv buffer and disable colmv compression */
783*437bfbebSnyanmisaka     if (!p_hal->pp->frame_mbs_only_flag)
784*437bfbebSnyanmisaka         mv_size *= 2;
785*437bfbebSnyanmisaka 
786*437bfbebSnyanmisaka     if (p_hal->cmv_bufs == NULL || p_hal->mv_size < mv_size) {
787*437bfbebSnyanmisaka         size_t size = mv_size;
788*437bfbebSnyanmisaka 
789*437bfbebSnyanmisaka         if (p_hal->cmv_bufs) {
790*437bfbebSnyanmisaka             hal_bufs_deinit(p_hal->cmv_bufs);
791*437bfbebSnyanmisaka             p_hal->cmv_bufs = NULL;
792*437bfbebSnyanmisaka         }
793*437bfbebSnyanmisaka 
794*437bfbebSnyanmisaka         hal_bufs_init(&p_hal->cmv_bufs);
795*437bfbebSnyanmisaka         if (p_hal->cmv_bufs == NULL) {
796*437bfbebSnyanmisaka             mpp_err_f("colmv bufs init fail");
797*437bfbebSnyanmisaka             goto __RETURN;
798*437bfbebSnyanmisaka         }
799*437bfbebSnyanmisaka         p_hal->mv_size = mv_size;
800*437bfbebSnyanmisaka         p_hal->mv_count = mpp_buf_slot_get_count(p_hal->frame_slots);
801*437bfbebSnyanmisaka         hal_bufs_setup(p_hal->cmv_bufs, p_hal->mv_count, 1, &size);
802*437bfbebSnyanmisaka     }
803*437bfbebSnyanmisaka 
804*437bfbebSnyanmisaka     mpp_buf_slot_get_prop(p_hal->frame_slots, p_hal->pp->CurrPic.Index7Bits, SLOT_FRAME_PTR, &mframe);
805*437bfbebSnyanmisaka     if (mpp_frame_get_thumbnail_en(mframe) == MPP_FRAME_THUMBNAIL_ONLY &&
806*437bfbebSnyanmisaka         ctx->origin_bufs == NULL) {
807*437bfbebSnyanmisaka         vdpu384a_setup_scale_origin_bufs(p_hal, mframe);
808*437bfbebSnyanmisaka     }
809*437bfbebSnyanmisaka 
810*437bfbebSnyanmisaka     if (p_hal->fast_mode) {
811*437bfbebSnyanmisaka         RK_U32 i = 0;
812*437bfbebSnyanmisaka         for (i = 0; i <  MPP_ARRAY_ELEMS(ctx->reg_buf); i++) {
813*437bfbebSnyanmisaka             if (!ctx->reg_buf[i].valid) {
814*437bfbebSnyanmisaka                 task->dec.reg_index = i;
815*437bfbebSnyanmisaka                 regs = ctx->reg_buf[i].regs;
816*437bfbebSnyanmisaka 
817*437bfbebSnyanmisaka                 ctx->spspps_offset = ctx->offset_spspps[i];
818*437bfbebSnyanmisaka                 ctx->sclst_offset = ctx->offset_sclst[i];
819*437bfbebSnyanmisaka                 ctx->reg_buf[i].valid = 1;
820*437bfbebSnyanmisaka                 break;
821*437bfbebSnyanmisaka             }
822*437bfbebSnyanmisaka         }
823*437bfbebSnyanmisaka     }
824*437bfbebSnyanmisaka 
825*437bfbebSnyanmisaka #ifdef DUMP_VDPU384A_DATAS
826*437bfbebSnyanmisaka     {
827*437bfbebSnyanmisaka         memset(dump_cur_dir, 0, sizeof(dump_cur_dir));
828*437bfbebSnyanmisaka         sprintf(dump_cur_dir, "avc/Frame%04d", dump_cur_frame);
829*437bfbebSnyanmisaka         if (access(dump_cur_dir, 0)) {
830*437bfbebSnyanmisaka             if (mkdir(dump_cur_dir))
831*437bfbebSnyanmisaka                 mpp_err_f("error: mkdir %s\n", dump_cur_dir);
832*437bfbebSnyanmisaka         }
833*437bfbebSnyanmisaka         dump_cur_frame++;
834*437bfbebSnyanmisaka     }
835*437bfbebSnyanmisaka #endif
836*437bfbebSnyanmisaka 
837*437bfbebSnyanmisaka     prepare_spspps(p_hal, (RK_U64 *)&ctx->spspps, sizeof(ctx->spspps) / 8);
838*437bfbebSnyanmisaka     prepare_scanlist(p_hal, ctx->sclst, sizeof(ctx->sclst));
839*437bfbebSnyanmisaka     set_registers(p_hal, regs, task);
840*437bfbebSnyanmisaka 
841*437bfbebSnyanmisaka     //!< copy spspps datas
842*437bfbebSnyanmisaka     memcpy((char *)ctx->bufs_ptr + ctx->spspps_offset, (char *)ctx->spspps, sizeof(ctx->spspps));
843*437bfbebSnyanmisaka 
844*437bfbebSnyanmisaka     regs->common_addr.reg131_gbl_base = ctx->bufs_fd;
845*437bfbebSnyanmisaka     regs->h264d_paras.reg67_global_len = VDPU384A_SPSPPS_SIZE / 16; // 128 bit as unit
846*437bfbebSnyanmisaka     mpp_dev_set_reg_offset(p_hal->dev, 131, ctx->spspps_offset);
847*437bfbebSnyanmisaka 
848*437bfbebSnyanmisaka     if (p_hal->pp->scaleing_list_enable_flag) {
849*437bfbebSnyanmisaka         memcpy((char *)ctx->bufs_ptr + ctx->sclst_offset, (void *)ctx->sclst, sizeof(ctx->sclst));
850*437bfbebSnyanmisaka         regs->common_addr.reg132_scanlist_addr = ctx->bufs_fd;
851*437bfbebSnyanmisaka         mpp_dev_set_reg_offset(p_hal->dev, 132, ctx->sclst_offset);
852*437bfbebSnyanmisaka     } else {
853*437bfbebSnyanmisaka         regs->common_addr.reg132_scanlist_addr = 0;
854*437bfbebSnyanmisaka     }
855*437bfbebSnyanmisaka 
856*437bfbebSnyanmisaka     hal_h264d_rcb_info_update(p_hal);
857*437bfbebSnyanmisaka     vdpu384a_setup_rcb(&regs->common_addr, p_hal->dev, p_hal->fast_mode ?
858*437bfbebSnyanmisaka                        ctx->rcb_buf[task->dec.reg_index] : ctx->rcb_buf[0],
859*437bfbebSnyanmisaka                        ctx->rcb_info);
860*437bfbebSnyanmisaka     vdpu384a_setup_statistic(&regs->ctrl_regs);
861*437bfbebSnyanmisaka     mpp_buffer_sync_end(ctx->bufs);
862*437bfbebSnyanmisaka 
863*437bfbebSnyanmisaka __RETURN:
864*437bfbebSnyanmisaka     return ret = MPP_OK;
865*437bfbebSnyanmisaka }
866*437bfbebSnyanmisaka 
vdpu384a_h264d_start(void * hal,HalTaskInfo * task)867*437bfbebSnyanmisaka MPP_RET vdpu384a_h264d_start(void *hal, HalTaskInfo *task)
868*437bfbebSnyanmisaka {
869*437bfbebSnyanmisaka     MPP_RET ret = MPP_ERR_UNKNOW;
870*437bfbebSnyanmisaka     H264dHalCtx_t *p_hal = (H264dHalCtx_t *)hal;
871*437bfbebSnyanmisaka     INP_CHECK(ret, NULL == p_hal);
872*437bfbebSnyanmisaka 
873*437bfbebSnyanmisaka     if (task->dec.flags.parse_err ||
874*437bfbebSnyanmisaka         (task->dec.flags.ref_err && !p_hal->cfg->base.disable_error)) {
875*437bfbebSnyanmisaka         goto __RETURN;
876*437bfbebSnyanmisaka     }
877*437bfbebSnyanmisaka 
878*437bfbebSnyanmisaka     Vdpu384aH264dRegCtx *reg_ctx = (Vdpu384aH264dRegCtx *)p_hal->reg_ctx;
879*437bfbebSnyanmisaka     Vdpu384aH264dRegSet *regs = p_hal->fast_mode ?
880*437bfbebSnyanmisaka                                 reg_ctx->reg_buf[task->dec.reg_index].regs :
881*437bfbebSnyanmisaka                                 reg_ctx->regs;
882*437bfbebSnyanmisaka     MppDev dev = p_hal->dev;
883*437bfbebSnyanmisaka 
884*437bfbebSnyanmisaka     do {
885*437bfbebSnyanmisaka         MppDevRegWrCfg wr_cfg;
886*437bfbebSnyanmisaka         MppDevRegRdCfg rd_cfg;
887*437bfbebSnyanmisaka 
888*437bfbebSnyanmisaka         wr_cfg.reg = &regs->ctrl_regs;
889*437bfbebSnyanmisaka         wr_cfg.size = sizeof(regs->ctrl_regs);
890*437bfbebSnyanmisaka         wr_cfg.offset = OFFSET_CTRL_REGS;
891*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &wr_cfg);
892*437bfbebSnyanmisaka         if (ret) {
893*437bfbebSnyanmisaka             mpp_err_f("set register write failed %d\n", ret);
894*437bfbebSnyanmisaka             break;
895*437bfbebSnyanmisaka         }
896*437bfbebSnyanmisaka 
897*437bfbebSnyanmisaka         wr_cfg.reg = &regs->common_addr;
898*437bfbebSnyanmisaka         wr_cfg.size = sizeof(regs->common_addr);
899*437bfbebSnyanmisaka         wr_cfg.offset = OFFSET_COMMON_ADDR_REGS;
900*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &wr_cfg);
901*437bfbebSnyanmisaka         if (ret) {
902*437bfbebSnyanmisaka             mpp_err_f("set register write failed %d\n", ret);
903*437bfbebSnyanmisaka             break;
904*437bfbebSnyanmisaka         }
905*437bfbebSnyanmisaka 
906*437bfbebSnyanmisaka         wr_cfg.reg = &regs->h264d_paras;
907*437bfbebSnyanmisaka         wr_cfg.size = sizeof(regs->h264d_paras);
908*437bfbebSnyanmisaka         wr_cfg.offset = OFFSET_CODEC_PARAS_REGS;
909*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &wr_cfg);
910*437bfbebSnyanmisaka         if (ret) {
911*437bfbebSnyanmisaka             mpp_err_f("set register write failed %d\n", ret);
912*437bfbebSnyanmisaka             break;
913*437bfbebSnyanmisaka         }
914*437bfbebSnyanmisaka 
915*437bfbebSnyanmisaka         wr_cfg.reg = &regs->h264d_addrs;
916*437bfbebSnyanmisaka         wr_cfg.size = sizeof(regs->h264d_addrs);
917*437bfbebSnyanmisaka         wr_cfg.offset = OFFSET_CODEC_ADDR_REGS;
918*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &wr_cfg);
919*437bfbebSnyanmisaka         if (ret) {
920*437bfbebSnyanmisaka             mpp_err_f("set register write failed %d\n", ret);
921*437bfbebSnyanmisaka             break;
922*437bfbebSnyanmisaka         }
923*437bfbebSnyanmisaka 
924*437bfbebSnyanmisaka         rd_cfg.reg = &regs->ctrl_regs.reg15;
925*437bfbebSnyanmisaka         rd_cfg.size = sizeof(regs->ctrl_regs.reg15);
926*437bfbebSnyanmisaka         rd_cfg.offset = OFFSET_INTERRUPT_REGS;
927*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(dev, MPP_DEV_REG_RD, &rd_cfg);
928*437bfbebSnyanmisaka         if (ret) {
929*437bfbebSnyanmisaka             mpp_err_f("set register read failed %d\n", ret);
930*437bfbebSnyanmisaka             break;
931*437bfbebSnyanmisaka         }
932*437bfbebSnyanmisaka 
933*437bfbebSnyanmisaka         /* rcb info for sram */
934*437bfbebSnyanmisaka         vdpu384a_set_rcbinfo(dev, (Vdpu384aRcbInfo*)reg_ctx->rcb_info);
935*437bfbebSnyanmisaka 
936*437bfbebSnyanmisaka         /* send request to hardware */
937*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(dev, MPP_DEV_CMD_SEND, NULL);
938*437bfbebSnyanmisaka         if (ret) {
939*437bfbebSnyanmisaka             mpp_err_f("send cmd failed %d\n", ret);
940*437bfbebSnyanmisaka             break;
941*437bfbebSnyanmisaka         }
942*437bfbebSnyanmisaka     } while (0);
943*437bfbebSnyanmisaka 
944*437bfbebSnyanmisaka __RETURN:
945*437bfbebSnyanmisaka     return ret = MPP_OK;
946*437bfbebSnyanmisaka }
947*437bfbebSnyanmisaka 
vdpu384a_h264d_wait(void * hal,HalTaskInfo * task)948*437bfbebSnyanmisaka MPP_RET vdpu384a_h264d_wait(void *hal, HalTaskInfo *task)
949*437bfbebSnyanmisaka {
950*437bfbebSnyanmisaka     MPP_RET ret = MPP_ERR_UNKNOW;
951*437bfbebSnyanmisaka     H264dHalCtx_t *p_hal = (H264dHalCtx_t *)hal;
952*437bfbebSnyanmisaka 
953*437bfbebSnyanmisaka     INP_CHECK(ret, NULL == p_hal);
954*437bfbebSnyanmisaka     Vdpu384aH264dRegCtx *reg_ctx = (Vdpu384aH264dRegCtx *)p_hal->reg_ctx;
955*437bfbebSnyanmisaka     Vdpu384aH264dRegSet *p_regs = p_hal->fast_mode ?
956*437bfbebSnyanmisaka                                   reg_ctx->reg_buf[task->dec.reg_index].regs :
957*437bfbebSnyanmisaka                                   reg_ctx->regs;
958*437bfbebSnyanmisaka 
959*437bfbebSnyanmisaka     if (task->dec.flags.parse_err ||
960*437bfbebSnyanmisaka         (task->dec.flags.ref_err && !p_hal->cfg->base.disable_error)) {
961*437bfbebSnyanmisaka         goto __SKIP_HARD;
962*437bfbebSnyanmisaka     }
963*437bfbebSnyanmisaka 
964*437bfbebSnyanmisaka     ret = mpp_dev_ioctl(p_hal->dev, MPP_DEV_CMD_POLL, NULL);
965*437bfbebSnyanmisaka     if (ret)
966*437bfbebSnyanmisaka         mpp_err_f("poll cmd failed %d\n", ret);
967*437bfbebSnyanmisaka 
968*437bfbebSnyanmisaka __SKIP_HARD:
969*437bfbebSnyanmisaka     if (p_hal->dec_cb) {
970*437bfbebSnyanmisaka         DecCbHalDone param;
971*437bfbebSnyanmisaka 
972*437bfbebSnyanmisaka         param.task = (void *)&task->dec;
973*437bfbebSnyanmisaka         param.regs = (RK_U32 *)p_regs;
974*437bfbebSnyanmisaka 
975*437bfbebSnyanmisaka         if ((!p_regs->ctrl_regs.reg15.rkvdec_frame_rdy_sta) ||
976*437bfbebSnyanmisaka             p_regs->ctrl_regs.reg15.rkvdec_strm_error_sta ||
977*437bfbebSnyanmisaka             p_regs->ctrl_regs.reg15.rkvdec_core_timeout_sta ||
978*437bfbebSnyanmisaka             p_regs->ctrl_regs.reg15.rkvdec_ip_timeout_sta ||
979*437bfbebSnyanmisaka             p_regs->ctrl_regs.reg15.rkvdec_bus_error_sta ||
980*437bfbebSnyanmisaka             p_regs->ctrl_regs.reg15.rkvdec_buffer_empty_sta ||
981*437bfbebSnyanmisaka             p_regs->ctrl_regs.reg15.rkvdec_colmv_ref_error_sta)
982*437bfbebSnyanmisaka             param.hard_err = 1;
983*437bfbebSnyanmisaka         else
984*437bfbebSnyanmisaka             param.hard_err = 0;
985*437bfbebSnyanmisaka 
986*437bfbebSnyanmisaka         mpp_callback(p_hal->dec_cb, &param);
987*437bfbebSnyanmisaka     }
988*437bfbebSnyanmisaka     memset(&p_regs->ctrl_regs.reg19, 0, sizeof(RK_U32));
989*437bfbebSnyanmisaka     if (p_hal->fast_mode) {
990*437bfbebSnyanmisaka         reg_ctx->reg_buf[task->dec.reg_index].valid = 0;
991*437bfbebSnyanmisaka     }
992*437bfbebSnyanmisaka 
993*437bfbebSnyanmisaka     (void)task;
994*437bfbebSnyanmisaka __RETURN:
995*437bfbebSnyanmisaka     return ret = MPP_OK;
996*437bfbebSnyanmisaka }
997*437bfbebSnyanmisaka 
vdpu384a_h264d_reset(void * hal)998*437bfbebSnyanmisaka MPP_RET vdpu384a_h264d_reset(void *hal)
999*437bfbebSnyanmisaka {
1000*437bfbebSnyanmisaka     MPP_RET ret = MPP_ERR_UNKNOW;
1001*437bfbebSnyanmisaka     H264dHalCtx_t *p_hal = (H264dHalCtx_t *)hal;
1002*437bfbebSnyanmisaka 
1003*437bfbebSnyanmisaka     INP_CHECK(ret, NULL == p_hal);
1004*437bfbebSnyanmisaka 
1005*437bfbebSnyanmisaka 
1006*437bfbebSnyanmisaka __RETURN:
1007*437bfbebSnyanmisaka     return ret = MPP_OK;
1008*437bfbebSnyanmisaka }
1009*437bfbebSnyanmisaka 
vdpu384a_h264d_flush(void * hal)1010*437bfbebSnyanmisaka MPP_RET vdpu384a_h264d_flush(void *hal)
1011*437bfbebSnyanmisaka {
1012*437bfbebSnyanmisaka     MPP_RET ret = MPP_ERR_UNKNOW;
1013*437bfbebSnyanmisaka     H264dHalCtx_t *p_hal = (H264dHalCtx_t *)hal;
1014*437bfbebSnyanmisaka 
1015*437bfbebSnyanmisaka     INP_CHECK(ret, NULL == p_hal);
1016*437bfbebSnyanmisaka 
1017*437bfbebSnyanmisaka __RETURN:
1018*437bfbebSnyanmisaka     return ret = MPP_OK;
1019*437bfbebSnyanmisaka }
1020*437bfbebSnyanmisaka 
vdpu384a_h264d_control(void * hal,MpiCmd cmd_type,void * param)1021*437bfbebSnyanmisaka MPP_RET vdpu384a_h264d_control(void *hal, MpiCmd cmd_type, void *param)
1022*437bfbebSnyanmisaka {
1023*437bfbebSnyanmisaka     MPP_RET ret = MPP_ERR_UNKNOW;
1024*437bfbebSnyanmisaka     H264dHalCtx_t *p_hal = (H264dHalCtx_t *)hal;
1025*437bfbebSnyanmisaka 
1026*437bfbebSnyanmisaka     INP_CHECK(ret, NULL == p_hal);
1027*437bfbebSnyanmisaka 
1028*437bfbebSnyanmisaka     switch ((MpiCmd)cmd_type) {
1029*437bfbebSnyanmisaka     case MPP_DEC_SET_FRAME_INFO: {
1030*437bfbebSnyanmisaka         MppFrameFormat fmt = mpp_frame_get_fmt((MppFrame)param);
1031*437bfbebSnyanmisaka         RK_U32 imgwidth = mpp_frame_get_width((MppFrame)param);
1032*437bfbebSnyanmisaka         RK_U32 imgheight = mpp_frame_get_height((MppFrame)param);
1033*437bfbebSnyanmisaka 
1034*437bfbebSnyanmisaka         mpp_log("control info: fmt %d, w %d, h %d\n", fmt, imgwidth, imgheight);
1035*437bfbebSnyanmisaka         if (fmt == MPP_FMT_YUV422SP) {
1036*437bfbebSnyanmisaka             mpp_slots_set_prop(p_hal->frame_slots, SLOTS_LEN_ALIGN, rkv_len_align_422);
1037*437bfbebSnyanmisaka         }
1038*437bfbebSnyanmisaka         if (MPP_FRAME_FMT_IS_FBC(fmt)) {
1039*437bfbebSnyanmisaka             vdpu384a_afbc_align_calc(p_hal->frame_slots, (MppFrame)param, 16);
1040*437bfbebSnyanmisaka         } else if (imgwidth > 1920 || imgheight > 1088) {
1041*437bfbebSnyanmisaka             mpp_slots_set_prop(p_hal->frame_slots, SLOTS_HOR_ALIGN, mpp_align_128_odd_plus_64);
1042*437bfbebSnyanmisaka         }
1043*437bfbebSnyanmisaka     } break;
1044*437bfbebSnyanmisaka     case MPP_DEC_GET_THUMBNAIL_FRAME_INFO: {
1045*437bfbebSnyanmisaka         vdpu384a_update_thumbnail_frame_info((MppFrame)param);
1046*437bfbebSnyanmisaka     } break;
1047*437bfbebSnyanmisaka     case MPP_DEC_SET_OUTPUT_FORMAT: {
1048*437bfbebSnyanmisaka     } break;
1049*437bfbebSnyanmisaka     default : {
1050*437bfbebSnyanmisaka     } break;
1051*437bfbebSnyanmisaka     }
1052*437bfbebSnyanmisaka 
1053*437bfbebSnyanmisaka __RETURN:
1054*437bfbebSnyanmisaka     return ret = MPP_OK;
1055*437bfbebSnyanmisaka }
1056*437bfbebSnyanmisaka 
1057*437bfbebSnyanmisaka const MppHalApi hal_h264d_vdpu384a = {
1058*437bfbebSnyanmisaka     .name     = "h264d_vdpu384a",
1059*437bfbebSnyanmisaka     .type     = MPP_CTX_DEC,
1060*437bfbebSnyanmisaka     .coding   = MPP_VIDEO_CodingAVC,
1061*437bfbebSnyanmisaka     .ctx_size = sizeof(Vdpu384aH264dRegCtx),
1062*437bfbebSnyanmisaka     .flag     = 0,
1063*437bfbebSnyanmisaka     .init     = vdpu384a_h264d_init,
1064*437bfbebSnyanmisaka     .deinit   = vdpu384a_h264d_deinit,
1065*437bfbebSnyanmisaka     .reg_gen  = vdpu384a_h264d_gen_regs,
1066*437bfbebSnyanmisaka     .start    = vdpu384a_h264d_start,
1067*437bfbebSnyanmisaka     .wait     = vdpu384a_h264d_wait,
1068*437bfbebSnyanmisaka     .reset    = vdpu384a_h264d_reset,
1069*437bfbebSnyanmisaka     .flush    = vdpu384a_h264d_flush,
1070*437bfbebSnyanmisaka     .control  = vdpu384a_h264d_control,
1071*437bfbebSnyanmisaka };
1072