xref: /rockchip-linux_mpp/mpp/hal/rkdec/h265d/hal_h265d_vdpu384a.c (revision 437bfbeb9567cca9cd9080e3f6954aa9d6a94f18)
1*437bfbebSnyanmisaka /* SPDX-License-Identifier: Apache-2.0 OR MIT */
2*437bfbebSnyanmisaka /*
3*437bfbebSnyanmisaka  * Copyright (c) 2024 Rockchip Electronics Co., Ltd.
4*437bfbebSnyanmisaka  */
5*437bfbebSnyanmisaka 
6*437bfbebSnyanmisaka #define MODULE_TAG "hal_h265d_vdpu384a"
7*437bfbebSnyanmisaka 
8*437bfbebSnyanmisaka #include <stdio.h>
9*437bfbebSnyanmisaka #include <string.h>
10*437bfbebSnyanmisaka #include <unistd.h>
11*437bfbebSnyanmisaka #include <stdarg.h>
12*437bfbebSnyanmisaka #include <inttypes.h>
13*437bfbebSnyanmisaka #include <ctype.h>
14*437bfbebSnyanmisaka #include <sys/stat.h>
15*437bfbebSnyanmisaka #include <sys/types.h>
16*437bfbebSnyanmisaka 
17*437bfbebSnyanmisaka #include "mpp_env.h"
18*437bfbebSnyanmisaka #include "mpp_mem.h"
19*437bfbebSnyanmisaka #include "mpp_bitread.h"
20*437bfbebSnyanmisaka #include "mpp_bitput.h"
21*437bfbebSnyanmisaka #include "mpp_buffer_impl.h"
22*437bfbebSnyanmisaka 
23*437bfbebSnyanmisaka #include "h265d_syntax.h"
24*437bfbebSnyanmisaka #include "hal_h265d_debug.h"
25*437bfbebSnyanmisaka #include "hal_h265d_ctx.h"
26*437bfbebSnyanmisaka #include "hal_h265d_com.h"
27*437bfbebSnyanmisaka #include "hal_h265d_vdpu384a.h"
28*437bfbebSnyanmisaka #include "vdpu384a_h265d.h"
29*437bfbebSnyanmisaka #include "vdpu384a_com.h"
30*437bfbebSnyanmisaka 
31*437bfbebSnyanmisaka #define PPS_SIZE                (112 * 64)//(96x64)
32*437bfbebSnyanmisaka 
33*437bfbebSnyanmisaka #define FMT 4
34*437bfbebSnyanmisaka #define CTU 3
35*437bfbebSnyanmisaka 
36*437bfbebSnyanmisaka typedef struct {
37*437bfbebSnyanmisaka     RK_U32 a;
38*437bfbebSnyanmisaka     RK_U32 b;
39*437bfbebSnyanmisaka } FilterdColBufRatio;
40*437bfbebSnyanmisaka 
41*437bfbebSnyanmisaka #define SPSPPS_ALIGNED_SIZE             (MPP_ALIGN(2181 + 64, 128) / 8) // byte, 2181 bit + Reserve 64
42*437bfbebSnyanmisaka #define SCALIST_ALIGNED_SIZE            (MPP_ALIGN(81 * 1360, SZ_4K))
43*437bfbebSnyanmisaka #define INFO_BUFFER_SIZE                (SPSPPS_ALIGNED_SIZE + SCALIST_ALIGNED_SIZE)
44*437bfbebSnyanmisaka #define ALL_BUFFER_SIZE(cnt)            (INFO_BUFFER_SIZE *cnt)
45*437bfbebSnyanmisaka 
46*437bfbebSnyanmisaka #define SPSPPS_OFFSET(pos)              (INFO_BUFFER_SIZE * pos)
47*437bfbebSnyanmisaka #define SCALIST_OFFSET(pos)             (SPSPPS_OFFSET(pos) + SPSPPS_ALIGNED_SIZE)
48*437bfbebSnyanmisaka 
49*437bfbebSnyanmisaka #define pocdistance(a, b)               (((a) > (b)) ? ((a) - (b)) : ((b) - (a)))
50*437bfbebSnyanmisaka 
rkv_len_align_422(RK_U32 val)51*437bfbebSnyanmisaka static RK_U32 rkv_len_align_422(RK_U32 val)
52*437bfbebSnyanmisaka {
53*437bfbebSnyanmisaka     return (2 * MPP_ALIGN(val, 16));
54*437bfbebSnyanmisaka }
55*437bfbebSnyanmisaka 
rkv_len_align_444(RK_U32 val)56*437bfbebSnyanmisaka static RK_U32 rkv_len_align_444(RK_U32 val)
57*437bfbebSnyanmisaka {
58*437bfbebSnyanmisaka     return (3 * MPP_ALIGN(val, 16));
59*437bfbebSnyanmisaka }
60*437bfbebSnyanmisaka 
vdpu384a_setup_scale_origin_bufs(HalH265dCtx * ctx,MppFrame mframe)61*437bfbebSnyanmisaka static MPP_RET vdpu384a_setup_scale_origin_bufs(HalH265dCtx *ctx, MppFrame mframe)
62*437bfbebSnyanmisaka {
63*437bfbebSnyanmisaka     /* for 8K FrameBuf scale mode */
64*437bfbebSnyanmisaka     size_t origin_buf_size = 0;
65*437bfbebSnyanmisaka 
66*437bfbebSnyanmisaka     origin_buf_size = mpp_frame_get_buf_size(mframe);
67*437bfbebSnyanmisaka 
68*437bfbebSnyanmisaka     if (!origin_buf_size) {
69*437bfbebSnyanmisaka         mpp_err_f("origin_bufs get buf size failed\n");
70*437bfbebSnyanmisaka         return MPP_NOK;
71*437bfbebSnyanmisaka     }
72*437bfbebSnyanmisaka 
73*437bfbebSnyanmisaka     if (ctx->origin_bufs) {
74*437bfbebSnyanmisaka         hal_bufs_deinit(ctx->origin_bufs);
75*437bfbebSnyanmisaka         ctx->origin_bufs = NULL;
76*437bfbebSnyanmisaka     }
77*437bfbebSnyanmisaka     hal_bufs_init(&ctx->origin_bufs);
78*437bfbebSnyanmisaka     if (!ctx->origin_bufs) {
79*437bfbebSnyanmisaka         mpp_err_f("origin_bufs init fail\n");
80*437bfbebSnyanmisaka         return MPP_ERR_NOMEM;
81*437bfbebSnyanmisaka     }
82*437bfbebSnyanmisaka 
83*437bfbebSnyanmisaka     hal_bufs_setup(ctx->origin_bufs, 16, 1, &origin_buf_size);
84*437bfbebSnyanmisaka 
85*437bfbebSnyanmisaka     return MPP_OK;
86*437bfbebSnyanmisaka }
87*437bfbebSnyanmisaka 
hal_h265d_vdpu384a_init(void * hal,MppHalCfg * cfg)88*437bfbebSnyanmisaka static MPP_RET hal_h265d_vdpu384a_init(void *hal, MppHalCfg *cfg)
89*437bfbebSnyanmisaka {
90*437bfbebSnyanmisaka     RK_S32 ret = 0;
91*437bfbebSnyanmisaka     HalH265dCtx *reg_ctx = (HalH265dCtx *)hal;
92*437bfbebSnyanmisaka 
93*437bfbebSnyanmisaka     mpp_slots_set_prop(reg_ctx->slots, SLOTS_HOR_ALIGN, mpp_align_128_odd_plus_64);
94*437bfbebSnyanmisaka     mpp_slots_set_prop(reg_ctx->slots, SLOTS_VER_ALIGN, hevc_ver_align);
95*437bfbebSnyanmisaka 
96*437bfbebSnyanmisaka     reg_ctx->scaling_qm = mpp_calloc(DXVA_Qmatrix_HEVC, 1);
97*437bfbebSnyanmisaka     if (reg_ctx->scaling_qm == NULL) {
98*437bfbebSnyanmisaka         mpp_err("scaling_org alloc fail");
99*437bfbebSnyanmisaka         return MPP_ERR_MALLOC;
100*437bfbebSnyanmisaka     }
101*437bfbebSnyanmisaka 
102*437bfbebSnyanmisaka     reg_ctx->scaling_rk = mpp_calloc(scalingFactor_t, 1);
103*437bfbebSnyanmisaka     reg_ctx->pps_buf = mpp_calloc(RK_U8, SPSPPS_ALIGNED_SIZE);
104*437bfbebSnyanmisaka 
105*437bfbebSnyanmisaka     if (reg_ctx->scaling_rk == NULL) {
106*437bfbebSnyanmisaka         mpp_err("scaling_rk alloc fail");
107*437bfbebSnyanmisaka         return MPP_ERR_MALLOC;
108*437bfbebSnyanmisaka     }
109*437bfbebSnyanmisaka 
110*437bfbebSnyanmisaka     if (reg_ctx->group == NULL) {
111*437bfbebSnyanmisaka         ret = mpp_buffer_group_get_internal(&reg_ctx->group, MPP_BUFFER_TYPE_ION);
112*437bfbebSnyanmisaka         if (ret) {
113*437bfbebSnyanmisaka             mpp_err("h265d mpp_buffer_group_get failed\n");
114*437bfbebSnyanmisaka             return ret;
115*437bfbebSnyanmisaka         }
116*437bfbebSnyanmisaka     }
117*437bfbebSnyanmisaka 
118*437bfbebSnyanmisaka     {
119*437bfbebSnyanmisaka         RK_U32 i = 0;
120*437bfbebSnyanmisaka         RK_U32 max_cnt = reg_ctx->fast_mode ? MAX_GEN_REG : 1;
121*437bfbebSnyanmisaka 
122*437bfbebSnyanmisaka         //!< malloc buffers
123*437bfbebSnyanmisaka         ret = mpp_buffer_get(reg_ctx->group, &reg_ctx->bufs, ALL_BUFFER_SIZE(max_cnt));
124*437bfbebSnyanmisaka         if (ret) {
125*437bfbebSnyanmisaka             mpp_err("h265d mpp_buffer_get failed\n");
126*437bfbebSnyanmisaka             return ret;
127*437bfbebSnyanmisaka         }
128*437bfbebSnyanmisaka 
129*437bfbebSnyanmisaka         reg_ctx->bufs_fd = mpp_buffer_get_fd(reg_ctx->bufs);
130*437bfbebSnyanmisaka         for (i = 0; i < max_cnt; i++) {
131*437bfbebSnyanmisaka             reg_ctx->g_buf[i].hw_regs = mpp_calloc_size(void, sizeof(Vdpu384aH265dRegSet));
132*437bfbebSnyanmisaka             reg_ctx->offset_spspps[i] = SPSPPS_OFFSET(i);
133*437bfbebSnyanmisaka             reg_ctx->offset_sclst[i] = SCALIST_OFFSET(i);
134*437bfbebSnyanmisaka         }
135*437bfbebSnyanmisaka 
136*437bfbebSnyanmisaka         mpp_buffer_attach_dev(reg_ctx->bufs, reg_ctx->dev);
137*437bfbebSnyanmisaka     }
138*437bfbebSnyanmisaka 
139*437bfbebSnyanmisaka     if (!reg_ctx->fast_mode) {
140*437bfbebSnyanmisaka         reg_ctx->hw_regs = reg_ctx->g_buf[0].hw_regs;
141*437bfbebSnyanmisaka         reg_ctx->spspps_offset = reg_ctx->offset_spspps[0];
142*437bfbebSnyanmisaka         reg_ctx->sclst_offset = reg_ctx->offset_sclst[0];
143*437bfbebSnyanmisaka     }
144*437bfbebSnyanmisaka 
145*437bfbebSnyanmisaka     if (cfg->hal_fbc_adj_cfg) {
146*437bfbebSnyanmisaka         cfg->hal_fbc_adj_cfg->func = vdpu384a_afbc_align_calc;
147*437bfbebSnyanmisaka         cfg->hal_fbc_adj_cfg->expand = 16;
148*437bfbebSnyanmisaka     }
149*437bfbebSnyanmisaka 
150*437bfbebSnyanmisaka     (void) cfg;
151*437bfbebSnyanmisaka     return MPP_OK;
152*437bfbebSnyanmisaka }
153*437bfbebSnyanmisaka 
hal_h265d_vdpu384a_deinit(void * hal)154*437bfbebSnyanmisaka static MPP_RET hal_h265d_vdpu384a_deinit(void *hal)
155*437bfbebSnyanmisaka {
156*437bfbebSnyanmisaka     HalH265dCtx *reg_ctx = (HalH265dCtx *)hal;
157*437bfbebSnyanmisaka     RK_U32 loop = reg_ctx->fast_mode ? MPP_ARRAY_ELEMS(reg_ctx->g_buf) : 1;
158*437bfbebSnyanmisaka     RK_U32 i;
159*437bfbebSnyanmisaka 
160*437bfbebSnyanmisaka     if (reg_ctx->bufs) {
161*437bfbebSnyanmisaka         mpp_buffer_put(reg_ctx->bufs);
162*437bfbebSnyanmisaka         reg_ctx->bufs = NULL;
163*437bfbebSnyanmisaka     }
164*437bfbebSnyanmisaka 
165*437bfbebSnyanmisaka     loop = reg_ctx->fast_mode ? MPP_ARRAY_ELEMS(reg_ctx->rcb_buf) : 1;
166*437bfbebSnyanmisaka     for (i = 0; i < loop; i++) {
167*437bfbebSnyanmisaka         if (reg_ctx->rcb_buf[i]) {
168*437bfbebSnyanmisaka             mpp_buffer_put(reg_ctx->rcb_buf[i]);
169*437bfbebSnyanmisaka             reg_ctx->rcb_buf[i] = NULL;
170*437bfbebSnyanmisaka         }
171*437bfbebSnyanmisaka     }
172*437bfbebSnyanmisaka 
173*437bfbebSnyanmisaka     if (reg_ctx->group) {
174*437bfbebSnyanmisaka         mpp_buffer_group_put(reg_ctx->group);
175*437bfbebSnyanmisaka         reg_ctx->group = NULL;
176*437bfbebSnyanmisaka     }
177*437bfbebSnyanmisaka 
178*437bfbebSnyanmisaka     for (i = 0; i < loop; i++)
179*437bfbebSnyanmisaka         MPP_FREE(reg_ctx->g_buf[i].hw_regs);
180*437bfbebSnyanmisaka 
181*437bfbebSnyanmisaka     MPP_FREE(reg_ctx->scaling_qm);
182*437bfbebSnyanmisaka     MPP_FREE(reg_ctx->scaling_rk);
183*437bfbebSnyanmisaka     MPP_FREE(reg_ctx->pps_buf);
184*437bfbebSnyanmisaka 
185*437bfbebSnyanmisaka     if (reg_ctx->cmv_bufs) {
186*437bfbebSnyanmisaka         hal_bufs_deinit(reg_ctx->cmv_bufs);
187*437bfbebSnyanmisaka         reg_ctx->cmv_bufs = NULL;
188*437bfbebSnyanmisaka     }
189*437bfbebSnyanmisaka 
190*437bfbebSnyanmisaka     if (reg_ctx->origin_bufs) {
191*437bfbebSnyanmisaka         hal_bufs_deinit(reg_ctx->origin_bufs);
192*437bfbebSnyanmisaka         reg_ctx->origin_bufs = NULL;
193*437bfbebSnyanmisaka     }
194*437bfbebSnyanmisaka 
195*437bfbebSnyanmisaka     return MPP_OK;
196*437bfbebSnyanmisaka }
197*437bfbebSnyanmisaka 
198*437bfbebSnyanmisaka #define SCALING_LIST_NUM 6
199*437bfbebSnyanmisaka 
hal_vdpu384a_record_scaling_list(scalingFactor_t * pScalingFactor_out,scalingList_t * pScalingList)200*437bfbebSnyanmisaka void hal_vdpu384a_record_scaling_list(scalingFactor_t *pScalingFactor_out, scalingList_t *pScalingList)
201*437bfbebSnyanmisaka {
202*437bfbebSnyanmisaka     RK_S32 i;
203*437bfbebSnyanmisaka     RK_U32 listId;
204*437bfbebSnyanmisaka     BitputCtx_t bp;
205*437bfbebSnyanmisaka 
206*437bfbebSnyanmisaka     mpp_set_bitput_ctx(&bp, (RK_U64 *)pScalingFactor_out, 170); // 170*64bits
207*437bfbebSnyanmisaka 
208*437bfbebSnyanmisaka     //-------- following make it by hardware needed --------
209*437bfbebSnyanmisaka     //sizeId == 0, block4x4
210*437bfbebSnyanmisaka     for (listId = 0; listId < SCALING_LIST_NUM; listId++) {
211*437bfbebSnyanmisaka         RK_U8 *p_data = pScalingList->sl[0][listId];
212*437bfbebSnyanmisaka         /* dump by block4x4, vectial direction */
213*437bfbebSnyanmisaka         for (i = 0; i < 4; i++) {
214*437bfbebSnyanmisaka             mpp_put_bits(&bp, p_data[i + 0], 8);
215*437bfbebSnyanmisaka             mpp_put_bits(&bp, p_data[i + 4], 8);
216*437bfbebSnyanmisaka             mpp_put_bits(&bp, p_data[i + 8], 8);
217*437bfbebSnyanmisaka             mpp_put_bits(&bp, p_data[i + 12], 8);
218*437bfbebSnyanmisaka         }
219*437bfbebSnyanmisaka     }
220*437bfbebSnyanmisaka     //sizeId == 1, block8x8
221*437bfbebSnyanmisaka     for (listId = 0; listId < SCALING_LIST_NUM; listId++) {
222*437bfbebSnyanmisaka         RK_S32 blk4_x = 0, blk4_y = 0;
223*437bfbebSnyanmisaka         RK_U8 *p_data = pScalingList->sl[1][listId];
224*437bfbebSnyanmisaka 
225*437bfbebSnyanmisaka         /* dump by block4x4, vectial direction */
226*437bfbebSnyanmisaka         for (blk4_x = 0; blk4_x < 8; blk4_x += 4) {
227*437bfbebSnyanmisaka             for (blk4_y = 0; blk4_y < 8; blk4_y += 4) {
228*437bfbebSnyanmisaka                 RK_S32 pos = blk4_y * 8 + blk4_x;
229*437bfbebSnyanmisaka 
230*437bfbebSnyanmisaka                 for (i = 0; i < 4; i++) {
231*437bfbebSnyanmisaka                     mpp_put_bits(&bp, p_data[pos + i + 0], 8);
232*437bfbebSnyanmisaka                     mpp_put_bits(&bp, p_data[pos + i + 8], 8);
233*437bfbebSnyanmisaka                     mpp_put_bits(&bp, p_data[pos + i + 16], 8);
234*437bfbebSnyanmisaka                     mpp_put_bits(&bp, p_data[pos + i + 24], 8);
235*437bfbebSnyanmisaka                 }
236*437bfbebSnyanmisaka             }
237*437bfbebSnyanmisaka         }
238*437bfbebSnyanmisaka     }
239*437bfbebSnyanmisaka     //sizeId == 2, block16x16
240*437bfbebSnyanmisaka     for (listId = 0; listId < SCALING_LIST_NUM; listId++) {
241*437bfbebSnyanmisaka         RK_S32 blk4_x = 0, blk4_y = 0;
242*437bfbebSnyanmisaka         RK_U8 *p_data = pScalingList->sl[2][listId];
243*437bfbebSnyanmisaka 
244*437bfbebSnyanmisaka         /* dump by block4x4, vectial direction */
245*437bfbebSnyanmisaka         for (blk4_x = 0; blk4_x < 8; blk4_x += 4) {
246*437bfbebSnyanmisaka             for (blk4_y = 0; blk4_y < 8; blk4_y += 4) {
247*437bfbebSnyanmisaka                 RK_S32 pos = blk4_y * 8 + blk4_x;
248*437bfbebSnyanmisaka 
249*437bfbebSnyanmisaka                 for (i = 0; i < 4; i++) {
250*437bfbebSnyanmisaka                     mpp_put_bits(&bp, p_data[pos + i + 0], 8);
251*437bfbebSnyanmisaka                     mpp_put_bits(&bp, p_data[pos + i + 8], 8);
252*437bfbebSnyanmisaka                     mpp_put_bits(&bp, p_data[pos + i + 16], 8);
253*437bfbebSnyanmisaka                     mpp_put_bits(&bp, p_data[pos + i + 24], 8);
254*437bfbebSnyanmisaka                 }
255*437bfbebSnyanmisaka             }
256*437bfbebSnyanmisaka         }
257*437bfbebSnyanmisaka     }
258*437bfbebSnyanmisaka     //sizeId == 3, blcok32x32
259*437bfbebSnyanmisaka     for (listId = 0; listId < 6; listId++) {
260*437bfbebSnyanmisaka         RK_S32 blk4_x = 0, blk4_y = 0;
261*437bfbebSnyanmisaka         RK_U8 *p_data = pScalingList->sl[3][listId];
262*437bfbebSnyanmisaka 
263*437bfbebSnyanmisaka         /* dump by block4x4, vectial direction */
264*437bfbebSnyanmisaka         for (blk4_x = 0; blk4_x < 8; blk4_x += 4) {
265*437bfbebSnyanmisaka             for (blk4_y = 0; blk4_y < 8; blk4_y += 4) {
266*437bfbebSnyanmisaka                 RK_S32 pos = blk4_y * 8 + blk4_x;
267*437bfbebSnyanmisaka 
268*437bfbebSnyanmisaka                 for (i = 0; i < 4; i++) {
269*437bfbebSnyanmisaka                     mpp_put_bits(&bp, p_data[pos + i + 0], 8);
270*437bfbebSnyanmisaka                     mpp_put_bits(&bp, p_data[pos + i + 8], 8);
271*437bfbebSnyanmisaka                     mpp_put_bits(&bp, p_data[pos + i + 16], 8);
272*437bfbebSnyanmisaka                     mpp_put_bits(&bp, p_data[pos + i + 24], 8);
273*437bfbebSnyanmisaka                 }
274*437bfbebSnyanmisaka             }
275*437bfbebSnyanmisaka         }
276*437bfbebSnyanmisaka     }
277*437bfbebSnyanmisaka     //sizeId == 0, block4x4, horiztion direction */
278*437bfbebSnyanmisaka     for (listId = 0; listId < SCALING_LIST_NUM; listId++) {
279*437bfbebSnyanmisaka         RK_U8 *p_data = pScalingList->sl[0][listId];
280*437bfbebSnyanmisaka 
281*437bfbebSnyanmisaka         for (i = 0; i < 16; i++)
282*437bfbebSnyanmisaka             mpp_put_bits(&bp, p_data[i], 8);
283*437bfbebSnyanmisaka     }
284*437bfbebSnyanmisaka 
285*437bfbebSnyanmisaka     // dump dc value
286*437bfbebSnyanmisaka     for (i = 0; i < SCALING_LIST_NUM; i++)//sizeId = 2, 16x16
287*437bfbebSnyanmisaka         mpp_put_bits(&bp, pScalingList->sl_dc[0][i], 8);
288*437bfbebSnyanmisaka     for (i = 0; i < SCALING_LIST_NUM; i++) //sizeId = 3, 32x32
289*437bfbebSnyanmisaka         mpp_put_bits(&bp, pScalingList->sl_dc[1][i], 8);
290*437bfbebSnyanmisaka 
291*437bfbebSnyanmisaka     mpp_put_align(&bp, 128, 0);
292*437bfbebSnyanmisaka }
293*437bfbebSnyanmisaka 
hal_h265d_vdpu384a_scalinglist_packet(void * hal,void * ptr,void * dxva)294*437bfbebSnyanmisaka static MPP_RET hal_h265d_vdpu384a_scalinglist_packet(void *hal, void *ptr, void *dxva)
295*437bfbebSnyanmisaka {
296*437bfbebSnyanmisaka     scalingList_t sl;
297*437bfbebSnyanmisaka     RK_U32 i, j, pos;
298*437bfbebSnyanmisaka     h265d_dxva2_picture_context_t *dxva_ctx = (h265d_dxva2_picture_context_t*)dxva;
299*437bfbebSnyanmisaka     HalH265dCtx *reg_ctx = ( HalH265dCtx *)hal;
300*437bfbebSnyanmisaka 
301*437bfbebSnyanmisaka     if (!dxva_ctx->pp.scaling_list_enabled_flag) {
302*437bfbebSnyanmisaka         return MPP_OK;
303*437bfbebSnyanmisaka     }
304*437bfbebSnyanmisaka 
305*437bfbebSnyanmisaka     if (memcmp((void*)&dxva_ctx->qm, reg_ctx->scaling_qm, sizeof(DXVA_Qmatrix_HEVC))) {
306*437bfbebSnyanmisaka         memset(&sl, 0, sizeof(scalingList_t));
307*437bfbebSnyanmisaka 
308*437bfbebSnyanmisaka         for (i = 0; i < 6; i++) {
309*437bfbebSnyanmisaka             for (j = 0; j < 16; j++) {
310*437bfbebSnyanmisaka                 pos = 4 * hal_hevc_diag_scan4x4_y[j] + hal_hevc_diag_scan4x4_x[j];
311*437bfbebSnyanmisaka                 sl.sl[0][i][pos] = dxva_ctx->qm.ucScalingLists0[i][j];
312*437bfbebSnyanmisaka             }
313*437bfbebSnyanmisaka 
314*437bfbebSnyanmisaka             for (j = 0; j < 64; j++) {
315*437bfbebSnyanmisaka                 pos = 8 * hal_hevc_diag_scan8x8_y[j] + hal_hevc_diag_scan8x8_x[j];
316*437bfbebSnyanmisaka                 sl.sl[1][i][pos] =  dxva_ctx->qm.ucScalingLists1[i][j];
317*437bfbebSnyanmisaka                 sl.sl[2][i][pos] =  dxva_ctx->qm.ucScalingLists2[i][j];
318*437bfbebSnyanmisaka 
319*437bfbebSnyanmisaka                 if (i == 0)
320*437bfbebSnyanmisaka                     sl.sl[3][i][pos] =  dxva_ctx->qm.ucScalingLists3[0][j];
321*437bfbebSnyanmisaka                 else if (i == 3)
322*437bfbebSnyanmisaka                     sl.sl[3][i][pos] =  dxva_ctx->qm.ucScalingLists3[1][j];
323*437bfbebSnyanmisaka                 else
324*437bfbebSnyanmisaka                     sl.sl[3][i][pos] =  dxva_ctx->qm.ucScalingLists2[i][j];
325*437bfbebSnyanmisaka             }
326*437bfbebSnyanmisaka 
327*437bfbebSnyanmisaka             sl.sl_dc[0][i] =  dxva_ctx->qm.ucScalingListDCCoefSizeID2[i];
328*437bfbebSnyanmisaka             if (i == 0)
329*437bfbebSnyanmisaka                 sl.sl_dc[1][i] =  dxva_ctx->qm.ucScalingListDCCoefSizeID3[0];
330*437bfbebSnyanmisaka             else if (i == 3)
331*437bfbebSnyanmisaka                 sl.sl_dc[1][i] =  dxva_ctx->qm.ucScalingListDCCoefSizeID3[1];
332*437bfbebSnyanmisaka             else
333*437bfbebSnyanmisaka                 sl.sl_dc[1][i] =  dxva_ctx->qm.ucScalingListDCCoefSizeID2[i];
334*437bfbebSnyanmisaka         }
335*437bfbebSnyanmisaka         hal_vdpu384a_record_scaling_list((scalingFactor_t *)reg_ctx->scaling_rk, &sl);
336*437bfbebSnyanmisaka     }
337*437bfbebSnyanmisaka 
338*437bfbebSnyanmisaka     memcpy(ptr, reg_ctx->scaling_rk, sizeof(scalingFactor_t));
339*437bfbebSnyanmisaka 
340*437bfbebSnyanmisaka     return MPP_OK;
341*437bfbebSnyanmisaka }
342*437bfbebSnyanmisaka 
hal_h265d_v345_output_pps_packet(void * hal,void * dxva)343*437bfbebSnyanmisaka static RK_S32 hal_h265d_v345_output_pps_packet(void *hal, void *dxva)
344*437bfbebSnyanmisaka {
345*437bfbebSnyanmisaka     RK_S32 i;
346*437bfbebSnyanmisaka     RK_U32 log2_min_cb_size;
347*437bfbebSnyanmisaka     RK_S32 width, height;
348*437bfbebSnyanmisaka     HalH265dCtx *reg_ctx = ( HalH265dCtx *)hal;
349*437bfbebSnyanmisaka     Vdpu384aH265dRegSet *hw_reg = (Vdpu384aH265dRegSet*)(reg_ctx->hw_regs);
350*437bfbebSnyanmisaka     h265d_dxva2_picture_context_t *dxva_ctx = (h265d_dxva2_picture_context_t*)dxva;
351*437bfbebSnyanmisaka     BitputCtx_t bp;
352*437bfbebSnyanmisaka 
353*437bfbebSnyanmisaka     if (NULL == reg_ctx || dxva_ctx == NULL) {
354*437bfbebSnyanmisaka         mpp_err("%s:%s:%d reg_ctx or dxva_ctx is NULL",
355*437bfbebSnyanmisaka                 __FILE__, __FUNCTION__, __LINE__);
356*437bfbebSnyanmisaka         return MPP_ERR_NULL_PTR;
357*437bfbebSnyanmisaka     }
358*437bfbebSnyanmisaka 
359*437bfbebSnyanmisaka     // SPS
360*437bfbebSnyanmisaka     {
361*437bfbebSnyanmisaka         void *pps_ptr = mpp_buffer_get_ptr(reg_ctx->bufs) + reg_ctx->spspps_offset;
362*437bfbebSnyanmisaka         RK_U64 *pps_packet = reg_ctx->pps_buf;
363*437bfbebSnyanmisaka 
364*437bfbebSnyanmisaka         if (NULL == pps_ptr) {
365*437bfbebSnyanmisaka             mpp_err("pps_data get ptr error");
366*437bfbebSnyanmisaka             return MPP_ERR_NOMEM;
367*437bfbebSnyanmisaka         }
368*437bfbebSnyanmisaka 
369*437bfbebSnyanmisaka         log2_min_cb_size = dxva_ctx->pp.log2_min_luma_coding_block_size_minus3 + 3;
370*437bfbebSnyanmisaka         width = (dxva_ctx->pp.PicWidthInMinCbsY << log2_min_cb_size);
371*437bfbebSnyanmisaka         height = (dxva_ctx->pp.PicHeightInMinCbsY << log2_min_cb_size);
372*437bfbebSnyanmisaka 
373*437bfbebSnyanmisaka         mpp_set_bitput_ctx(&bp, pps_packet, SPSPPS_ALIGNED_SIZE / 8);
374*437bfbebSnyanmisaka 
375*437bfbebSnyanmisaka         if (dxva_ctx->pp.ps_update_flag) {
376*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.vps_id, 4);
377*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.sps_id, 4);
378*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.chroma_format_idc, 2);
379*437bfbebSnyanmisaka 
380*437bfbebSnyanmisaka             mpp_put_bits(&bp, width, 16);
381*437bfbebSnyanmisaka             mpp_put_bits(&bp, height, 16);
382*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.bit_depth_luma_minus8, 3);
383*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.bit_depth_chroma_minus8, 3);
384*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.log2_max_pic_order_cnt_lsb_minus4 + 4, 5);
385*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.log2_diff_max_min_luma_coding_block_size, 2);
386*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.log2_min_luma_coding_block_size_minus3 + 3, 3);
387*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.log2_min_transform_block_size_minus2 + 2, 3);
388*437bfbebSnyanmisaka 
389*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.log2_diff_max_min_transform_block_size, 2);
390*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.max_transform_hierarchy_depth_inter, 3);
391*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.max_transform_hierarchy_depth_intra, 3);
392*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.scaling_list_enabled_flag, 1);
393*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.amp_enabled_flag, 1);
394*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.sample_adaptive_offset_enabled_flag, 1);
395*437bfbebSnyanmisaka             ///<-zrh comment ^  68 bit above
396*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.pcm_enabled_flag, 1);
397*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.pcm_enabled_flag ? (dxva_ctx->pp.pcm_sample_bit_depth_luma_minus1 + 1) : 0, 4);
398*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.pcm_enabled_flag ? (dxva_ctx->pp.pcm_sample_bit_depth_chroma_minus1 + 1) : 0, 4);
399*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.pcm_loop_filter_disabled_flag, 1);
400*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.log2_diff_max_min_pcm_luma_coding_block_size, 3);
401*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.pcm_enabled_flag ? (dxva_ctx->pp.log2_min_pcm_luma_coding_block_size_minus3 + 3) : 0, 3);
402*437bfbebSnyanmisaka 
403*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.num_short_term_ref_pic_sets, 7);
404*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.long_term_ref_pics_present_flag, 1);
405*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.num_long_term_ref_pics_sps, 6);
406*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.sps_temporal_mvp_enabled_flag, 1);
407*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.strong_intra_smoothing_enabled_flag, 1);
408*437bfbebSnyanmisaka             // SPS extenstion
409*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.transform_skip_rotation_enabled_flag, 1);
410*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.transform_skip_context_enabled_flag, 1);
411*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.strong_intra_smoothing_enabled_flag, 1);
412*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.implicit_rdpcm_enabled_flag, 1);
413*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.explicit_rdpcm_enabled_flag, 1);
414*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.extended_precision_processing_flag, 1);
415*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.intra_smoothing_disabled_flag, 1);
416*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.sps_max_dec_pic_buffering_minus1, 4);
417*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.separate_colour_plane_flag, 1);
418*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.high_precision_offsets_enabled_flag, 1);
419*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.persistent_rice_adaptation_enabled_flag, 1);
420*437bfbebSnyanmisaka 
421*437bfbebSnyanmisaka             /* PPS */
422*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.pps_id, 6);
423*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.sps_id, 4);
424*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.dependent_slice_segments_enabled_flag, 1);
425*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.output_flag_present_flag, 1);
426*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.num_extra_slice_header_bits, 13);
427*437bfbebSnyanmisaka 
428*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.sign_data_hiding_enabled_flag, 1);
429*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.cabac_init_present_flag, 1);
430*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.num_ref_idx_l0_default_active_minus1 + 1, 4);
431*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.num_ref_idx_l1_default_active_minus1 + 1, 4);
432*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.init_qp_minus26, 7);
433*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.constrained_intra_pred_flag, 1);
434*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.transform_skip_enabled_flag, 1);
435*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.cu_qp_delta_enabled_flag, 1);
436*437bfbebSnyanmisaka             mpp_put_bits(&bp, log2_min_cb_size + dxva_ctx->pp.log2_diff_max_min_luma_coding_block_size - dxva_ctx->pp.diff_cu_qp_delta_depth, 3);
437*437bfbebSnyanmisaka 
438*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.pps_cb_qp_offset, 5);
439*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.pps_cr_qp_offset, 5);
440*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.pps_slice_chroma_qp_offsets_present_flag, 1);
441*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.weighted_pred_flag, 1);
442*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.weighted_bipred_flag, 1);
443*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.transquant_bypass_enabled_flag, 1);
444*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.tiles_enabled_flag, 1);
445*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.entropy_coding_sync_enabled_flag, 1);
446*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.pps_loop_filter_across_slices_enabled_flag, 1);
447*437bfbebSnyanmisaka 
448*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.loop_filter_across_tiles_enabled_flag, 1);
449*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.deblocking_filter_override_enabled_flag, 1);
450*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.pps_deblocking_filter_disabled_flag, 1);
451*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.pps_beta_offset_div2, 4);
452*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.pps_tc_offset_div2, 4);
453*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.lists_modification_present_flag, 1);
454*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.log2_parallel_merge_level_minus2 + 2, 3);
455*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.slice_segment_header_extension_present_flag, 1);
456*437bfbebSnyanmisaka             mpp_put_bits(&bp, 0, 3);
457*437bfbebSnyanmisaka 
458*437bfbebSnyanmisaka             // PPS externsion
459*437bfbebSnyanmisaka             if (dxva_ctx->pp.log2_max_transform_skip_block_size > 2) {
460*437bfbebSnyanmisaka                 mpp_put_bits(&bp, dxva_ctx->pp.log2_max_transform_skip_block_size - 2, 2);
461*437bfbebSnyanmisaka             } else {
462*437bfbebSnyanmisaka                 mpp_put_bits(&bp, 0, 2);
463*437bfbebSnyanmisaka             }
464*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.cross_component_prediction_enabled_flag, 1);
465*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.chroma_qp_offset_list_enabled_flag, 1);
466*437bfbebSnyanmisaka 
467*437bfbebSnyanmisaka             RK_S32 log2_min_cu_chroma_qp_delta_size = log2_min_cb_size +
468*437bfbebSnyanmisaka                                                       dxva_ctx->pp.log2_diff_max_min_luma_coding_block_size -
469*437bfbebSnyanmisaka                                                       dxva_ctx->pp.diff_cu_chroma_qp_offset_depth;
470*437bfbebSnyanmisaka             mpp_put_bits(&bp, log2_min_cu_chroma_qp_delta_size, 3);
471*437bfbebSnyanmisaka             for (i = 0; i < 6; i++)
472*437bfbebSnyanmisaka                 mpp_put_bits(&bp, dxva_ctx->pp.cb_qp_offset_list[i], 5);
473*437bfbebSnyanmisaka             for (i = 0; i < 6; i++)
474*437bfbebSnyanmisaka                 mpp_put_bits(&bp, dxva_ctx->pp.cr_qp_offset_list[i], 5);
475*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.chroma_qp_offset_list_len_minus1, 3);
476*437bfbebSnyanmisaka 
477*437bfbebSnyanmisaka             /* mvc0 && mvc1 */
478*437bfbebSnyanmisaka             mpp_put_bits(&bp, 0xffff, 16);
479*437bfbebSnyanmisaka             mpp_put_bits(&bp, 0, 1);
480*437bfbebSnyanmisaka             mpp_put_bits(&bp, 0, 6);
481*437bfbebSnyanmisaka             mpp_put_bits(&bp, 0, 1);
482*437bfbebSnyanmisaka             mpp_put_bits(&bp, 0, 1);
483*437bfbebSnyanmisaka         } else {
484*437bfbebSnyanmisaka             bp.index = 4;
485*437bfbebSnyanmisaka             bp.bitpos = 41;
486*437bfbebSnyanmisaka             bp.bvalue = bp.pbuf[bp.index] & MPP_GENMASK(bp.bitpos - 1, 0);
487*437bfbebSnyanmisaka         }
488*437bfbebSnyanmisaka         /* poc info */
489*437bfbebSnyanmisaka         {
490*437bfbebSnyanmisaka             RK_S32 dpb_valid[15] = {0}, refpic_poc[15] = {0};
491*437bfbebSnyanmisaka 
492*437bfbebSnyanmisaka             for (i = 0; i < (RK_S32)MPP_ARRAY_ELEMS(dxva_ctx->pp.RefPicList); i++) {
493*437bfbebSnyanmisaka                 if (dxva_ctx->pp.RefPicList[i].bPicEntry != 0xff &&
494*437bfbebSnyanmisaka                     dxva_ctx->pp.RefPicList[i].bPicEntry != 0x7f) {
495*437bfbebSnyanmisaka                     dpb_valid[i] = 1;
496*437bfbebSnyanmisaka                     refpic_poc[i] = dxva_ctx->pp.PicOrderCntValList[i];
497*437bfbebSnyanmisaka                 }
498*437bfbebSnyanmisaka             }
499*437bfbebSnyanmisaka 
500*437bfbebSnyanmisaka             mpp_put_bits(&bp, 0, 1);
501*437bfbebSnyanmisaka             mpp_put_bits(&bp, 0, 1);
502*437bfbebSnyanmisaka             mpp_put_bits(&bp, 0, 1);
503*437bfbebSnyanmisaka             mpp_put_bits(&bp, dxva_ctx->pp.current_poc, 32);
504*437bfbebSnyanmisaka 
505*437bfbebSnyanmisaka             for (i = 0; i < 15; i++)
506*437bfbebSnyanmisaka                 mpp_put_bits(&bp, refpic_poc[i], 32);
507*437bfbebSnyanmisaka             mpp_put_bits(&bp, 0, 32);
508*437bfbebSnyanmisaka             for (i = 0; i < 15; i++)
509*437bfbebSnyanmisaka                 mpp_put_bits(&bp, dpb_valid[i], 1);
510*437bfbebSnyanmisaka             mpp_put_bits(&bp, 0, 1);
511*437bfbebSnyanmisaka         }
512*437bfbebSnyanmisaka 
513*437bfbebSnyanmisaka         /* tile info */
514*437bfbebSnyanmisaka         mpp_put_bits(&bp, dxva_ctx->pp.tiles_enabled_flag ? (dxva_ctx->pp.num_tile_columns_minus1 + 1) : 1, 5);
515*437bfbebSnyanmisaka         mpp_put_bits(&bp, dxva_ctx->pp.tiles_enabled_flag ? (dxva_ctx->pp.num_tile_rows_minus1 + 1) : 1, 5);
516*437bfbebSnyanmisaka         {
517*437bfbebSnyanmisaka             /// tiles info begin
518*437bfbebSnyanmisaka             RK_U16 column_width[20];
519*437bfbebSnyanmisaka             RK_U16 row_height[22];
520*437bfbebSnyanmisaka 
521*437bfbebSnyanmisaka             memset(column_width, 0, sizeof(column_width));
522*437bfbebSnyanmisaka             memset(row_height, 0, sizeof(row_height));
523*437bfbebSnyanmisaka 
524*437bfbebSnyanmisaka             if (dxva_ctx->pp.tiles_enabled_flag) {
525*437bfbebSnyanmisaka                 if (dxva_ctx->pp.uniform_spacing_flag == 0) {
526*437bfbebSnyanmisaka                     RK_S32 maxcuwidth = dxva_ctx->pp.log2_diff_max_min_luma_coding_block_size + log2_min_cb_size;
527*437bfbebSnyanmisaka                     RK_S32 ctu_width_in_pic = (width +
528*437bfbebSnyanmisaka                                                (1 << maxcuwidth) - 1) / (1 << maxcuwidth) ;
529*437bfbebSnyanmisaka                     RK_S32 ctu_height_in_pic = (height +
530*437bfbebSnyanmisaka                                                 (1 << maxcuwidth) - 1) / (1 << maxcuwidth) ;
531*437bfbebSnyanmisaka                     RK_S32 sum = 0;
532*437bfbebSnyanmisaka                     for (i = 0; i < dxva_ctx->pp.num_tile_columns_minus1; i++) {
533*437bfbebSnyanmisaka                         column_width[i] = dxva_ctx->pp.column_width_minus1[i] + 1;
534*437bfbebSnyanmisaka                         sum += column_width[i]  ;
535*437bfbebSnyanmisaka                     }
536*437bfbebSnyanmisaka                     column_width[i] = ctu_width_in_pic - sum;
537*437bfbebSnyanmisaka 
538*437bfbebSnyanmisaka                     sum = 0;
539*437bfbebSnyanmisaka                     for (i = 0; i < dxva_ctx->pp.num_tile_rows_minus1; i++) {
540*437bfbebSnyanmisaka                         row_height[i] = dxva_ctx->pp.row_height_minus1[i] + 1;
541*437bfbebSnyanmisaka                         sum += row_height[i];
542*437bfbebSnyanmisaka                     }
543*437bfbebSnyanmisaka                     row_height[i] = ctu_height_in_pic - sum;
544*437bfbebSnyanmisaka                 }  else {
545*437bfbebSnyanmisaka                     RK_S32    pic_in_cts_width = (width +
546*437bfbebSnyanmisaka                                                   (1 << (log2_min_cb_size +
547*437bfbebSnyanmisaka                                                          dxva_ctx->pp.log2_diff_max_min_luma_coding_block_size)) - 1)
548*437bfbebSnyanmisaka                                                  / (1 << (log2_min_cb_size +
549*437bfbebSnyanmisaka                                                           dxva_ctx->pp.log2_diff_max_min_luma_coding_block_size));
550*437bfbebSnyanmisaka                     RK_S32 pic_in_cts_height = (height +
551*437bfbebSnyanmisaka                                                 (1 << (log2_min_cb_size +
552*437bfbebSnyanmisaka                                                        dxva_ctx->pp.log2_diff_max_min_luma_coding_block_size)) - 1)
553*437bfbebSnyanmisaka                                                / (1 << (log2_min_cb_size +
554*437bfbebSnyanmisaka                                                         dxva_ctx->pp.log2_diff_max_min_luma_coding_block_size));
555*437bfbebSnyanmisaka 
556*437bfbebSnyanmisaka                     for (i = 0; i < dxva_ctx->pp.num_tile_columns_minus1 + 1; i++)
557*437bfbebSnyanmisaka                         column_width[i] = ((i + 1) * pic_in_cts_width) / (dxva_ctx->pp.num_tile_columns_minus1 + 1) -
558*437bfbebSnyanmisaka                                           (i * pic_in_cts_width) / (dxva_ctx->pp.num_tile_columns_minus1 + 1);
559*437bfbebSnyanmisaka 
560*437bfbebSnyanmisaka                     for (i = 0; i < dxva_ctx->pp.num_tile_rows_minus1 + 1; i++)
561*437bfbebSnyanmisaka                         row_height[i] = ((i + 1) * pic_in_cts_height) / (dxva_ctx->pp.num_tile_rows_minus1 + 1) -
562*437bfbebSnyanmisaka                                         (i * pic_in_cts_height) / (dxva_ctx->pp.num_tile_rows_minus1 + 1);
563*437bfbebSnyanmisaka                 }
564*437bfbebSnyanmisaka             } else {
565*437bfbebSnyanmisaka                 RK_S32 MaxCUWidth = (1 << (dxva_ctx->pp.log2_diff_max_min_luma_coding_block_size + log2_min_cb_size));
566*437bfbebSnyanmisaka                 column_width[0] = (width  + MaxCUWidth - 1) / MaxCUWidth;
567*437bfbebSnyanmisaka                 row_height[0]   = (height + MaxCUWidth - 1) / MaxCUWidth;
568*437bfbebSnyanmisaka             }
569*437bfbebSnyanmisaka 
570*437bfbebSnyanmisaka             for (i = 0; i < 20; i++)
571*437bfbebSnyanmisaka                 mpp_put_bits(&bp, column_width[i], 12);
572*437bfbebSnyanmisaka 
573*437bfbebSnyanmisaka             for (i = 0; i < 22; i++)
574*437bfbebSnyanmisaka                 mpp_put_bits(&bp, row_height[i], 12);
575*437bfbebSnyanmisaka         }
576*437bfbebSnyanmisaka 
577*437bfbebSnyanmisaka         /* update rps */
578*437bfbebSnyanmisaka         if (dxva_ctx->pp.rps_update_flag) {
579*437bfbebSnyanmisaka             Short_SPS_RPS_HEVC *cur_st_rps_ptr = &dxva_ctx->pp.cur_st_rps;
580*437bfbebSnyanmisaka 
581*437bfbebSnyanmisaka             for (i = 0; i < 32; i ++) {
582*437bfbebSnyanmisaka                 mpp_put_bits(&bp, dxva_ctx->pp.sps_lt_rps[i].lt_ref_pic_poc_lsb, 16);
583*437bfbebSnyanmisaka                 mpp_put_bits(&bp, dxva_ctx->pp.sps_lt_rps[i].used_by_curr_pic_lt_flag, 1);
584*437bfbebSnyanmisaka             }
585*437bfbebSnyanmisaka 
586*437bfbebSnyanmisaka             mpp_put_bits(&bp, cur_st_rps_ptr->num_negative_pics, 4);
587*437bfbebSnyanmisaka             mpp_put_bits(&bp, cur_st_rps_ptr->num_positive_pics, 4);
588*437bfbebSnyanmisaka 
589*437bfbebSnyanmisaka             for (i = 0; i <  cur_st_rps_ptr->num_negative_pics; i++) {
590*437bfbebSnyanmisaka                 mpp_put_bits(&bp, cur_st_rps_ptr->delta_poc_s0[i], 16);
591*437bfbebSnyanmisaka                 mpp_put_bits(&bp, cur_st_rps_ptr->s0_used_flag[i], 1);
592*437bfbebSnyanmisaka             }
593*437bfbebSnyanmisaka 
594*437bfbebSnyanmisaka             for (i = 0; i <  cur_st_rps_ptr->num_positive_pics; i++) {
595*437bfbebSnyanmisaka                 mpp_put_bits(&bp, cur_st_rps_ptr->delta_poc_s1[i], 16);
596*437bfbebSnyanmisaka                 mpp_put_bits(&bp, cur_st_rps_ptr->s1_used_flag[i], 1);
597*437bfbebSnyanmisaka             }
598*437bfbebSnyanmisaka 
599*437bfbebSnyanmisaka             for ( i = cur_st_rps_ptr->num_negative_pics + cur_st_rps_ptr->num_positive_pics; i < 15; i++) {
600*437bfbebSnyanmisaka                 mpp_put_bits(&bp, 0, 16);
601*437bfbebSnyanmisaka                 mpp_put_bits(&bp, 0, 1);
602*437bfbebSnyanmisaka             }
603*437bfbebSnyanmisaka             mpp_put_align(&bp, 64, 0);//128
604*437bfbebSnyanmisaka         }
605*437bfbebSnyanmisaka         memcpy(pps_ptr, reg_ctx->pps_buf, SPSPPS_ALIGNED_SIZE);
606*437bfbebSnyanmisaka     } /* --- end spspps data ------*/
607*437bfbebSnyanmisaka 
608*437bfbebSnyanmisaka     if (dxva_ctx->pp.scaling_list_enabled_flag) {
609*437bfbebSnyanmisaka         RK_U32 addr;
610*437bfbebSnyanmisaka         RK_U8 *ptr_scaling = (RK_U8 *)mpp_buffer_get_ptr(reg_ctx->bufs) + reg_ctx->sclst_offset;
611*437bfbebSnyanmisaka 
612*437bfbebSnyanmisaka         if (dxva_ctx->pp.scaling_list_data_present_flag) {
613*437bfbebSnyanmisaka             addr = (dxva_ctx->pp.pps_id + 16) * 1360;
614*437bfbebSnyanmisaka         } else if (dxva_ctx->pp.scaling_list_enabled_flag) {
615*437bfbebSnyanmisaka             addr = dxva_ctx->pp.sps_id * 1360;
616*437bfbebSnyanmisaka         } else {
617*437bfbebSnyanmisaka             addr = 80 * 1360;
618*437bfbebSnyanmisaka         }
619*437bfbebSnyanmisaka 
620*437bfbebSnyanmisaka         hal_h265d_vdpu384a_scalinglist_packet(hal, ptr_scaling + addr, dxva);
621*437bfbebSnyanmisaka 
622*437bfbebSnyanmisaka         hw_reg->common_addr.reg132_scanlist_addr = reg_ctx->bufs_fd;
623*437bfbebSnyanmisaka         mpp_dev_set_reg_offset(reg_ctx->dev, 132, addr + reg_ctx->sclst_offset);
624*437bfbebSnyanmisaka     }
625*437bfbebSnyanmisaka 
626*437bfbebSnyanmisaka #ifdef dump
627*437bfbebSnyanmisaka     fwrite(pps_ptr, 1, 80 * 64, fp);
628*437bfbebSnyanmisaka     RK_U32 *tmp = (RK_U32 *)pps_ptr;
629*437bfbebSnyanmisaka     for (i = 0; i < 112 / 4; i++) {
630*437bfbebSnyanmisaka         mpp_log("pps[%3d] = 0x%08x\n", i, tmp[i]);
631*437bfbebSnyanmisaka     }
632*437bfbebSnyanmisaka #endif
633*437bfbebSnyanmisaka #ifdef DUMP_VDPU384A_DATAS
634*437bfbebSnyanmisaka     {
635*437bfbebSnyanmisaka         char *cur_fname = "global_cfg.dat";
636*437bfbebSnyanmisaka         memset(dump_cur_fname_path, 0, sizeof(dump_cur_fname_path));
637*437bfbebSnyanmisaka         sprintf(dump_cur_fname_path, "%s/%s", dump_cur_dir, cur_fname);
638*437bfbebSnyanmisaka         dump_data_to_file(dump_cur_fname_path, (void *)bp.pbuf, 18 * 128, 128, 0);
639*437bfbebSnyanmisaka     }
640*437bfbebSnyanmisaka #endif
641*437bfbebSnyanmisaka 
642*437bfbebSnyanmisaka     return 0;
643*437bfbebSnyanmisaka }
644*437bfbebSnyanmisaka 
h265d_refine_rcb_size(Vdpu384aRcbInfo * rcb_info,RK_S32 width,RK_S32 height,void * dxva)645*437bfbebSnyanmisaka static void h265d_refine_rcb_size(Vdpu384aRcbInfo *rcb_info,
646*437bfbebSnyanmisaka                                   RK_S32 width, RK_S32 height, void *dxva)
647*437bfbebSnyanmisaka {
648*437bfbebSnyanmisaka     RK_U32 rcb_bits = 0;
649*437bfbebSnyanmisaka     h265d_dxva2_picture_context_t *dxva_ctx = (h265d_dxva2_picture_context_t*)dxva;
650*437bfbebSnyanmisaka     DXVA_PicParams_HEVC *pp = &dxva_ctx->pp;
651*437bfbebSnyanmisaka     RK_U32 chroma_fmt_idc = pp->chroma_format_idc;//0 400,1 4202 ,422,3 444
652*437bfbebSnyanmisaka     RK_U8 bit_depth = MPP_MAX(pp->bit_depth_luma_minus8, pp->bit_depth_chroma_minus8) + 8;
653*437bfbebSnyanmisaka     RK_U8 ctu_size = 1 << (pp->log2_diff_max_min_luma_coding_block_size + pp->log2_min_luma_coding_block_size_minus3 + 3);
654*437bfbebSnyanmisaka     RK_U32 tile_row_cut_num = pp->num_tile_rows_minus1;
655*437bfbebSnyanmisaka     RK_U32 tile_col_cut_num = pp->num_tile_columns_minus1;
656*437bfbebSnyanmisaka     RK_U32 ext_row_align_size = tile_row_cut_num * 64 * 8;
657*437bfbebSnyanmisaka     RK_U32 ext_col_align_size = tile_col_cut_num * 64 * 8;
658*437bfbebSnyanmisaka     RK_U32 filterd_row_append = 8192;
659*437bfbebSnyanmisaka     RK_U32 row_uv_para = 0;
660*437bfbebSnyanmisaka     RK_U32 col_uv_para = 0;
661*437bfbebSnyanmisaka 
662*437bfbebSnyanmisaka     if (chroma_fmt_idc == 1) {
663*437bfbebSnyanmisaka         row_uv_para = 1;
664*437bfbebSnyanmisaka         col_uv_para = 1;
665*437bfbebSnyanmisaka     } else if (chroma_fmt_idc == 2) {
666*437bfbebSnyanmisaka         row_uv_para = 1;
667*437bfbebSnyanmisaka         col_uv_para = 3;
668*437bfbebSnyanmisaka     } else if (chroma_fmt_idc == 3) {
669*437bfbebSnyanmisaka         row_uv_para = 3;
670*437bfbebSnyanmisaka         col_uv_para = 3;
671*437bfbebSnyanmisaka     }
672*437bfbebSnyanmisaka 
673*437bfbebSnyanmisaka     width = MPP_ALIGN(width, ctu_size);
674*437bfbebSnyanmisaka     height = MPP_ALIGN(height, ctu_size);
675*437bfbebSnyanmisaka     /* RCB_STRMD_ROW && RCB_STRMD_TILE_ROW*/
676*437bfbebSnyanmisaka     rcb_info[RCB_STRMD_ROW].size = 0;
677*437bfbebSnyanmisaka     rcb_info[RCB_STRMD_TILE_ROW].size = 0;
678*437bfbebSnyanmisaka 
679*437bfbebSnyanmisaka     /* RCB_INTER_ROW && RCB_INTER_TILE_ROW*/
680*437bfbebSnyanmisaka     rcb_bits = ((width + 7) / 8) * 174;
681*437bfbebSnyanmisaka     rcb_info[RCB_INTER_ROW].size = MPP_RCB_BYTES(rcb_bits);
682*437bfbebSnyanmisaka     rcb_bits += ext_row_align_size;
683*437bfbebSnyanmisaka     if (tile_row_cut_num)
684*437bfbebSnyanmisaka         rcb_info[RCB_INTER_TILE_ROW].size = MPP_RCB_BYTES(rcb_bits);
685*437bfbebSnyanmisaka     else
686*437bfbebSnyanmisaka         rcb_info[RCB_INTER_TILE_ROW].size = 0;
687*437bfbebSnyanmisaka 
688*437bfbebSnyanmisaka     /* RCB_INTRA_ROW && RCB_INTRA_TILE_ROW*/
689*437bfbebSnyanmisaka     rcb_bits = MPP_ALIGN(width, 512) * (bit_depth + 2);
690*437bfbebSnyanmisaka     rcb_bits = rcb_bits * 4; //TODO:
691*437bfbebSnyanmisaka     rcb_info[RCB_INTRA_ROW].size = MPP_RCB_BYTES(rcb_bits);
692*437bfbebSnyanmisaka     rcb_bits += ext_row_align_size;
693*437bfbebSnyanmisaka     if (tile_row_cut_num)
694*437bfbebSnyanmisaka         rcb_info[RCB_INTRA_TILE_ROW].size = MPP_RCB_BYTES(rcb_bits);
695*437bfbebSnyanmisaka     else
696*437bfbebSnyanmisaka         rcb_info[RCB_INTRA_TILE_ROW].size = 0;
697*437bfbebSnyanmisaka 
698*437bfbebSnyanmisaka     /* RCB_FILTERD_ROW && RCB_FILTERD_TILE_ROW*/
699*437bfbebSnyanmisaka     rcb_bits = (MPP_ALIGN(width, 64) * (1.2 * bit_depth + 0.5) * (8 + 5 * row_uv_para));
700*437bfbebSnyanmisaka     // save space mode : half for RCB_FILTERD_ROW, half for RCB_FILTERD_PROTECT_ROW
701*437bfbebSnyanmisaka     if (width > 4096)
702*437bfbebSnyanmisaka         filterd_row_append = 27648;
703*437bfbebSnyanmisaka     rcb_info[RCB_FILTERD_ROW].size = MPP_RCB_BYTES(rcb_bits / 2) + filterd_row_append;
704*437bfbebSnyanmisaka     rcb_info[RCB_FILTERD_PROTECT_ROW].size = MPP_RCB_BYTES(rcb_bits / 2) + filterd_row_append;
705*437bfbebSnyanmisaka     rcb_bits += ext_row_align_size;
706*437bfbebSnyanmisaka     if (tile_row_cut_num)
707*437bfbebSnyanmisaka         rcb_info[RCB_FILTERD_TILE_ROW].size = MPP_RCB_BYTES(rcb_bits);
708*437bfbebSnyanmisaka     else
709*437bfbebSnyanmisaka         rcb_info[RCB_FILTERD_TILE_ROW].size = 0;
710*437bfbebSnyanmisaka 
711*437bfbebSnyanmisaka     /* RCB_FILTERD_TILE_COL */
712*437bfbebSnyanmisaka     if (tile_col_cut_num) {
713*437bfbebSnyanmisaka         rcb_bits = (MPP_ALIGN(height, 64) * (1.6 * bit_depth + 0.5) * (16.5 + 5.5 * col_uv_para)) + ext_col_align_size;
714*437bfbebSnyanmisaka         rcb_info[RCB_FILTERD_TILE_COL].size = MPP_RCB_BYTES(rcb_bits);
715*437bfbebSnyanmisaka     } else {
716*437bfbebSnyanmisaka         rcb_info[RCB_FILTERD_TILE_COL].size = 0;
717*437bfbebSnyanmisaka     }
718*437bfbebSnyanmisaka 
719*437bfbebSnyanmisaka }
720*437bfbebSnyanmisaka 
hal_h265d_rcb_info_update(void * hal,void * dxva,Vdpu384aH265dRegSet * hw_regs,RK_S32 width,RK_S32 height)721*437bfbebSnyanmisaka static void hal_h265d_rcb_info_update(void *hal,  void *dxva,
722*437bfbebSnyanmisaka                                       Vdpu384aH265dRegSet *hw_regs,
723*437bfbebSnyanmisaka                                       RK_S32 width, RK_S32 height)
724*437bfbebSnyanmisaka {
725*437bfbebSnyanmisaka     HalH265dCtx *reg_ctx = ( HalH265dCtx *)hal;
726*437bfbebSnyanmisaka     h265d_dxva2_picture_context_t *dxva_ctx = (h265d_dxva2_picture_context_t*)dxva;
727*437bfbebSnyanmisaka     DXVA_PicParams_HEVC *pp = &dxva_ctx->pp;
728*437bfbebSnyanmisaka     RK_U32 chroma_fmt_idc = pp->chroma_format_idc;//0 400,1 4202 ,422,3 444
729*437bfbebSnyanmisaka     RK_U8 bit_depth = MPP_MAX(pp->bit_depth_luma_minus8, pp->bit_depth_chroma_minus8) + 8;
730*437bfbebSnyanmisaka     RK_U8 ctu_size = 1 << (pp->log2_diff_max_min_luma_coding_block_size + pp->log2_min_luma_coding_block_size_minus3 + 3);
731*437bfbebSnyanmisaka     RK_U32 num_tiles = pp->num_tile_rows_minus1 + 1;
732*437bfbebSnyanmisaka     (void)hw_regs;
733*437bfbebSnyanmisaka 
734*437bfbebSnyanmisaka     if (reg_ctx->num_row_tiles != num_tiles ||
735*437bfbebSnyanmisaka         reg_ctx->bit_depth != bit_depth ||
736*437bfbebSnyanmisaka         reg_ctx->chroma_fmt_idc != chroma_fmt_idc ||
737*437bfbebSnyanmisaka         reg_ctx->ctu_size !=  ctu_size ||
738*437bfbebSnyanmisaka         reg_ctx->width != width ||
739*437bfbebSnyanmisaka         reg_ctx->height != height) {
740*437bfbebSnyanmisaka         RK_U32 i = 0;
741*437bfbebSnyanmisaka         RK_U32 loop = reg_ctx->fast_mode ? MPP_ARRAY_ELEMS(reg_ctx->g_buf) : 1;
742*437bfbebSnyanmisaka 
743*437bfbebSnyanmisaka         reg_ctx->rcb_buf_size = vdpu384a_get_rcb_buf_size((Vdpu384aRcbInfo *)reg_ctx->rcb_info, width, height);
744*437bfbebSnyanmisaka         h265d_refine_rcb_size((Vdpu384aRcbInfo *)reg_ctx->rcb_info, width, height, dxva_ctx);
745*437bfbebSnyanmisaka         /* vdpu384a_check_rcb_buf_size((Vdpu384aRcbInfo *)reg_ctx->rcb_info, width, height); */
746*437bfbebSnyanmisaka 
747*437bfbebSnyanmisaka         for (i = 0; i < loop; i++) {
748*437bfbebSnyanmisaka             MppBuffer rcb_buf;
749*437bfbebSnyanmisaka 
750*437bfbebSnyanmisaka             if (reg_ctx->rcb_buf[i]) {
751*437bfbebSnyanmisaka                 mpp_buffer_put(reg_ctx->rcb_buf[i]);
752*437bfbebSnyanmisaka                 reg_ctx->rcb_buf[i] = NULL;
753*437bfbebSnyanmisaka             }
754*437bfbebSnyanmisaka             mpp_buffer_get(reg_ctx->group, &rcb_buf, reg_ctx->rcb_buf_size);
755*437bfbebSnyanmisaka             reg_ctx->rcb_buf[i] = rcb_buf;
756*437bfbebSnyanmisaka         }
757*437bfbebSnyanmisaka 
758*437bfbebSnyanmisaka         reg_ctx->num_row_tiles  = num_tiles;
759*437bfbebSnyanmisaka         reg_ctx->bit_depth      = bit_depth;
760*437bfbebSnyanmisaka         reg_ctx->chroma_fmt_idc = chroma_fmt_idc;
761*437bfbebSnyanmisaka         reg_ctx->ctu_size       = ctu_size;
762*437bfbebSnyanmisaka         reg_ctx->width          = width;
763*437bfbebSnyanmisaka         reg_ctx->height         = height;
764*437bfbebSnyanmisaka     }
765*437bfbebSnyanmisaka }
766*437bfbebSnyanmisaka 
calc_mv_size(RK_S32 pic_w,RK_S32 pic_h,RK_S32 ctu_w)767*437bfbebSnyanmisaka static RK_S32 calc_mv_size(RK_S32 pic_w, RK_S32 pic_h, RK_S32 ctu_w)
768*437bfbebSnyanmisaka {
769*437bfbebSnyanmisaka     RK_S32 seg_w = 64 * 16 * 16 / ctu_w; // colmv_block_size = 16, colmv_per_bytes = 16
770*437bfbebSnyanmisaka     RK_S32 seg_cnt_w = MPP_ALIGN(pic_w, seg_w) / seg_w;
771*437bfbebSnyanmisaka     RK_S32 seg_cnt_h = MPP_ALIGN(pic_h, ctu_w) / ctu_w;
772*437bfbebSnyanmisaka     RK_S32 mv_size   = seg_cnt_w * seg_cnt_h * 64 * 16;
773*437bfbebSnyanmisaka 
774*437bfbebSnyanmisaka     return mv_size;
775*437bfbebSnyanmisaka }
776*437bfbebSnyanmisaka 
hal_h265d_vdpu384a_gen_regs(void * hal,HalTaskInfo * syn)777*437bfbebSnyanmisaka static MPP_RET hal_h265d_vdpu384a_gen_regs(void *hal,  HalTaskInfo *syn)
778*437bfbebSnyanmisaka {
779*437bfbebSnyanmisaka     RK_S32 i = 0;
780*437bfbebSnyanmisaka     RK_S32 log2_min_cb_size;
781*437bfbebSnyanmisaka     RK_S32 width, height;
782*437bfbebSnyanmisaka     RK_S32 stride_y, stride_uv, virstrid_y;
783*437bfbebSnyanmisaka     Vdpu384aH265dRegSet *hw_regs;
784*437bfbebSnyanmisaka     RK_S32 ret = MPP_SUCCESS;
785*437bfbebSnyanmisaka     MppBuffer streambuf = NULL;
786*437bfbebSnyanmisaka     RK_S32 aglin_offset = 0;
787*437bfbebSnyanmisaka     RK_S32 valid_ref = -1;
788*437bfbebSnyanmisaka     MppBuffer framebuf = NULL;
789*437bfbebSnyanmisaka     HalBuf *mv_buf = NULL;
790*437bfbebSnyanmisaka     RK_S32 fd = -1;
791*437bfbebSnyanmisaka     RK_U32 mv_size = 0;
792*437bfbebSnyanmisaka     RK_S32 distance = INT_MAX;
793*437bfbebSnyanmisaka     HalH265dCtx *reg_ctx = (HalH265dCtx *)hal;
794*437bfbebSnyanmisaka 
795*437bfbebSnyanmisaka     (void) fd;
796*437bfbebSnyanmisaka     if (syn->dec.flags.parse_err ||
797*437bfbebSnyanmisaka         (syn->dec.flags.ref_err && !reg_ctx->cfg->base.disable_error)) {
798*437bfbebSnyanmisaka         h265h_dbg(H265H_DBG_TASK_ERR, "%s found task error\n", __FUNCTION__);
799*437bfbebSnyanmisaka         return MPP_OK;
800*437bfbebSnyanmisaka     }
801*437bfbebSnyanmisaka 
802*437bfbebSnyanmisaka     h265d_dxva2_picture_context_t *dxva_ctx = (h265d_dxva2_picture_context_t *)syn->dec.syntax.data;
803*437bfbebSnyanmisaka     HalBuf *origin_buf = NULL;
804*437bfbebSnyanmisaka 
805*437bfbebSnyanmisaka     if (reg_ctx ->fast_mode) {
806*437bfbebSnyanmisaka         for (i = 0; i < MAX_GEN_REG; i++) {
807*437bfbebSnyanmisaka             if (!reg_ctx->g_buf[i].use_flag) {
808*437bfbebSnyanmisaka                 syn->dec.reg_index = i;
809*437bfbebSnyanmisaka 
810*437bfbebSnyanmisaka                 reg_ctx->spspps_offset = reg_ctx->offset_spspps[i];
811*437bfbebSnyanmisaka                 reg_ctx->sclst_offset = reg_ctx->offset_sclst[i];
812*437bfbebSnyanmisaka 
813*437bfbebSnyanmisaka                 reg_ctx->hw_regs = reg_ctx->g_buf[i].hw_regs;
814*437bfbebSnyanmisaka                 reg_ctx->g_buf[i].use_flag = 1;
815*437bfbebSnyanmisaka                 break;
816*437bfbebSnyanmisaka             }
817*437bfbebSnyanmisaka         }
818*437bfbebSnyanmisaka         if (i == MAX_GEN_REG) {
819*437bfbebSnyanmisaka             mpp_err("hevc rps buf all used");
820*437bfbebSnyanmisaka             return MPP_ERR_NOMEM;
821*437bfbebSnyanmisaka         }
822*437bfbebSnyanmisaka     }
823*437bfbebSnyanmisaka 
824*437bfbebSnyanmisaka     if (syn->dec.syntax.data == NULL) {
825*437bfbebSnyanmisaka         mpp_err("%s:%s:%d dxva is NULL", __FILE__, __FUNCTION__, __LINE__);
826*437bfbebSnyanmisaka         return MPP_ERR_NULL_PTR;
827*437bfbebSnyanmisaka     }
828*437bfbebSnyanmisaka 
829*437bfbebSnyanmisaka #ifdef DUMP_VDPU384A_DATAS
830*437bfbebSnyanmisaka     {
831*437bfbebSnyanmisaka         memset(dump_cur_dir, 0, sizeof(dump_cur_dir));
832*437bfbebSnyanmisaka         sprintf(dump_cur_dir, "/data/hevc/Frame%04d", dump_cur_frame);
833*437bfbebSnyanmisaka         if (access(dump_cur_dir, 0)) {
834*437bfbebSnyanmisaka             if (mkdir(dump_cur_dir))
835*437bfbebSnyanmisaka                 mpp_err_f("error: mkdir %s\n", dump_cur_dir);
836*437bfbebSnyanmisaka         }
837*437bfbebSnyanmisaka         dump_cur_frame++;
838*437bfbebSnyanmisaka     }
839*437bfbebSnyanmisaka #endif
840*437bfbebSnyanmisaka 
841*437bfbebSnyanmisaka     /* output pps */
842*437bfbebSnyanmisaka     hw_regs = (Vdpu384aH265dRegSet*)reg_ctx->hw_regs;
843*437bfbebSnyanmisaka     memset(hw_regs, 0, sizeof(Vdpu384aH265dRegSet));
844*437bfbebSnyanmisaka 
845*437bfbebSnyanmisaka     if (NULL == reg_ctx->hw_regs) {
846*437bfbebSnyanmisaka         return MPP_ERR_NULL_PTR;
847*437bfbebSnyanmisaka     }
848*437bfbebSnyanmisaka 
849*437bfbebSnyanmisaka 
850*437bfbebSnyanmisaka     log2_min_cb_size = dxva_ctx->pp.log2_min_luma_coding_block_size_minus3 + 3;
851*437bfbebSnyanmisaka     width = (dxva_ctx->pp.PicWidthInMinCbsY << log2_min_cb_size);
852*437bfbebSnyanmisaka     height = (dxva_ctx->pp.PicHeightInMinCbsY << log2_min_cb_size);
853*437bfbebSnyanmisaka     mv_size = calc_mv_size(width, height, 1 << log2_min_cb_size) * 2;
854*437bfbebSnyanmisaka 
855*437bfbebSnyanmisaka     if (reg_ctx->cmv_bufs == NULL || reg_ctx->mv_size < mv_size) {
856*437bfbebSnyanmisaka         size_t size = mv_size;
857*437bfbebSnyanmisaka 
858*437bfbebSnyanmisaka         if (reg_ctx->cmv_bufs) {
859*437bfbebSnyanmisaka             hal_bufs_deinit(reg_ctx->cmv_bufs);
860*437bfbebSnyanmisaka             reg_ctx->cmv_bufs = NULL;
861*437bfbebSnyanmisaka         }
862*437bfbebSnyanmisaka 
863*437bfbebSnyanmisaka         hal_bufs_init(&reg_ctx->cmv_bufs);
864*437bfbebSnyanmisaka         if (reg_ctx->cmv_bufs == NULL) {
865*437bfbebSnyanmisaka             mpp_err_f("colmv bufs init fail");
866*437bfbebSnyanmisaka             return MPP_ERR_NULL_PTR;
867*437bfbebSnyanmisaka         }
868*437bfbebSnyanmisaka 
869*437bfbebSnyanmisaka         reg_ctx->mv_size = mv_size;
870*437bfbebSnyanmisaka         reg_ctx->mv_count = mpp_buf_slot_get_count(reg_ctx->slots);
871*437bfbebSnyanmisaka         hal_bufs_setup(reg_ctx->cmv_bufs, reg_ctx->mv_count, 1, &size);
872*437bfbebSnyanmisaka     }
873*437bfbebSnyanmisaka 
874*437bfbebSnyanmisaka     {
875*437bfbebSnyanmisaka         MppFrame mframe = NULL;
876*437bfbebSnyanmisaka         RK_U32 ver_virstride;
877*437bfbebSnyanmisaka         RK_U32 virstrid_uv;
878*437bfbebSnyanmisaka         MppFrameFormat fmt;
879*437bfbebSnyanmisaka         RK_U32 chroma_fmt_idc = dxva_ctx->pp.chroma_format_idc;
880*437bfbebSnyanmisaka 
881*437bfbebSnyanmisaka         mpp_buf_slot_get_prop(reg_ctx->slots, dxva_ctx->pp.CurrPic.Index7Bits,
882*437bfbebSnyanmisaka                               SLOT_FRAME_PTR, &mframe);
883*437bfbebSnyanmisaka         /* for 8K downscale mode*/
884*437bfbebSnyanmisaka         if (mpp_frame_get_thumbnail_en(mframe) == MPP_FRAME_THUMBNAIL_ONLY &&
885*437bfbebSnyanmisaka             reg_ctx->origin_bufs == NULL) {
886*437bfbebSnyanmisaka             vdpu384a_setup_scale_origin_bufs(reg_ctx, mframe);
887*437bfbebSnyanmisaka         }
888*437bfbebSnyanmisaka 
889*437bfbebSnyanmisaka         fmt = mpp_frame_get_fmt(mframe);
890*437bfbebSnyanmisaka 
891*437bfbebSnyanmisaka         stride_y = mpp_frame_get_hor_stride(mframe);
892*437bfbebSnyanmisaka         ver_virstride = mpp_frame_get_ver_stride(mframe);
893*437bfbebSnyanmisaka         stride_uv = stride_y;
894*437bfbebSnyanmisaka         virstrid_y = ver_virstride * stride_y;
895*437bfbebSnyanmisaka         if (chroma_fmt_idc == 3)
896*437bfbebSnyanmisaka             stride_uv *= 2;
897*437bfbebSnyanmisaka         if (chroma_fmt_idc == 3 || chroma_fmt_idc == 2) {
898*437bfbebSnyanmisaka             virstrid_uv = stride_uv * ver_virstride;
899*437bfbebSnyanmisaka         } else {
900*437bfbebSnyanmisaka             virstrid_uv = stride_uv * ver_virstride / 2;
901*437bfbebSnyanmisaka         }
902*437bfbebSnyanmisaka         if (MPP_FRAME_FMT_IS_FBC(fmt)) {
903*437bfbebSnyanmisaka             RK_U32 fbc_hdr_stride = mpp_frame_get_fbc_hdr_stride(mframe);
904*437bfbebSnyanmisaka             RK_U32 fbd_offset;
905*437bfbebSnyanmisaka 
906*437bfbebSnyanmisaka             hw_regs->ctrl_regs.reg9.dpb_data_sel = 0;
907*437bfbebSnyanmisaka             hw_regs->ctrl_regs.reg9.dpb_output_dis = 0;
908*437bfbebSnyanmisaka             hw_regs->ctrl_regs.reg9.pp_m_output_mode = 0;
909*437bfbebSnyanmisaka 
910*437bfbebSnyanmisaka             hw_regs->h265d_paras.reg68_dpb_hor_virstride = fbc_hdr_stride / 64;
911*437bfbebSnyanmisaka             fbd_offset = fbc_hdr_stride * MPP_ALIGN(ver_virstride, 64) / 16;
912*437bfbebSnyanmisaka             hw_regs->h265d_addrs.reg193_dpb_fbc64x4_payload_offset = fbd_offset;
913*437bfbebSnyanmisaka             hw_regs->h265d_paras.reg80_error_ref_hor_virstride = hw_regs->h265d_paras.reg68_dpb_hor_virstride;
914*437bfbebSnyanmisaka         } else if (MPP_FRAME_FMT_IS_TILE(fmt)) {
915*437bfbebSnyanmisaka             hw_regs->ctrl_regs.reg9.dpb_data_sel = 1;
916*437bfbebSnyanmisaka             hw_regs->ctrl_regs.reg9.dpb_output_dis = 1;
917*437bfbebSnyanmisaka             hw_regs->ctrl_regs.reg9.pp_m_output_mode = 2;
918*437bfbebSnyanmisaka 
919*437bfbebSnyanmisaka             if (chroma_fmt_idc == 0) { //yuv400
920*437bfbebSnyanmisaka                 hw_regs->h265d_paras.reg77_pp_m_hor_stride = stride_y * 4 / 16;
921*437bfbebSnyanmisaka             } else if (chroma_fmt_idc == 2) { //yuv422
922*437bfbebSnyanmisaka                 hw_regs->h265d_paras.reg77_pp_m_hor_stride = stride_y * 8 / 16;
923*437bfbebSnyanmisaka             } else if (chroma_fmt_idc == 3) { //yuv444
924*437bfbebSnyanmisaka                 hw_regs->h265d_paras.reg77_pp_m_hor_stride = stride_y * 12 / 16;
925*437bfbebSnyanmisaka             } else { //yuv420
926*437bfbebSnyanmisaka                 hw_regs->h265d_paras.reg77_pp_m_hor_stride = stride_y * 6 / 16;
927*437bfbebSnyanmisaka             }
928*437bfbebSnyanmisaka             hw_regs->h265d_paras.reg79_pp_m_y_virstride = (virstrid_y + virstrid_uv) / 16;
929*437bfbebSnyanmisaka             hw_regs->h265d_paras.reg80_error_ref_hor_virstride = hw_regs->h265d_paras.reg77_pp_m_hor_stride;
930*437bfbebSnyanmisaka         } else {
931*437bfbebSnyanmisaka             hw_regs->ctrl_regs.reg9.dpb_data_sel = 1;
932*437bfbebSnyanmisaka             hw_regs->ctrl_regs.reg9.dpb_output_dis = 1;
933*437bfbebSnyanmisaka             hw_regs->ctrl_regs.reg9.pp_m_output_mode = 1;
934*437bfbebSnyanmisaka 
935*437bfbebSnyanmisaka             hw_regs->h265d_paras.reg77_pp_m_hor_stride = stride_y >> 4;
936*437bfbebSnyanmisaka             hw_regs->h265d_paras.reg78_pp_m_uv_hor_stride = stride_uv >> 4;
937*437bfbebSnyanmisaka             hw_regs->h265d_paras.reg79_pp_m_y_virstride = virstrid_y >> 4;
938*437bfbebSnyanmisaka             hw_regs->h265d_paras.reg80_error_ref_hor_virstride = hw_regs->h265d_paras.reg77_pp_m_hor_stride;
939*437bfbebSnyanmisaka         }
940*437bfbebSnyanmisaka         hw_regs->h265d_paras.reg81_error_ref_raster_uv_hor_virstride = hw_regs->h265d_paras.reg78_pp_m_uv_hor_stride;
941*437bfbebSnyanmisaka         hw_regs->h265d_paras.reg82_error_ref_virstride = hw_regs->h265d_paras.reg79_pp_m_y_virstride;
942*437bfbebSnyanmisaka     }
943*437bfbebSnyanmisaka     mpp_buf_slot_get_prop(reg_ctx->slots, dxva_ctx->pp.CurrPic.Index7Bits,
944*437bfbebSnyanmisaka                           SLOT_BUFFER, &framebuf);
945*437bfbebSnyanmisaka 
946*437bfbebSnyanmisaka     if (reg_ctx->origin_bufs) {
947*437bfbebSnyanmisaka         origin_buf = hal_bufs_get_buf(reg_ctx->origin_bufs,
948*437bfbebSnyanmisaka                                       dxva_ctx->pp.CurrPic.Index7Bits);
949*437bfbebSnyanmisaka         framebuf = origin_buf->buf[0];
950*437bfbebSnyanmisaka     }
951*437bfbebSnyanmisaka 
952*437bfbebSnyanmisaka     /* output rkfbc64 */
953*437bfbebSnyanmisaka     // hw_regs->h265d_addrs.reg168_dpb_decout_base = mpp_buffer_get_fd(framebuf); //just index need map
954*437bfbebSnyanmisaka     /* output raster/tile4x4 */
955*437bfbebSnyanmisaka     hw_regs->common_addr.reg135_pp_m_decout_base = mpp_buffer_get_fd(framebuf); //just index need map
956*437bfbebSnyanmisaka     hw_regs->h265d_addrs.reg169_error_ref_base = mpp_buffer_get_fd(framebuf);
957*437bfbebSnyanmisaka     /*if out_base is equal to zero it means this frame may error
958*437bfbebSnyanmisaka     we return directly add by csy*/
959*437bfbebSnyanmisaka 
960*437bfbebSnyanmisaka     /* output rkfbc64 */
961*437bfbebSnyanmisaka     // if (!hw_regs->h265d_addrs.reg168_dpb_decout_base)
962*437bfbebSnyanmisaka     //     return 0;
963*437bfbebSnyanmisaka     /* output raster/tile4x4 */
964*437bfbebSnyanmisaka     if (!hw_regs->common_addr.reg135_pp_m_decout_base)
965*437bfbebSnyanmisaka         return 0;
966*437bfbebSnyanmisaka 
967*437bfbebSnyanmisaka     fd =  mpp_buffer_get_fd(framebuf);
968*437bfbebSnyanmisaka     /* output rkfbc64 */
969*437bfbebSnyanmisaka     // hw_regs->h265d_addrs.reg168_dpb_decout_base = fd;
970*437bfbebSnyanmisaka     /* output raster/tile4x4 */
971*437bfbebSnyanmisaka     hw_regs->common_addr.reg135_pp_m_decout_base = fd;
972*437bfbebSnyanmisaka     hw_regs->h265d_addrs.reg192_dpb_payload64x4_st_cur_base = fd;
973*437bfbebSnyanmisaka     mv_buf = hal_bufs_get_buf(reg_ctx->cmv_bufs, dxva_ctx->pp.CurrPic.Index7Bits);
974*437bfbebSnyanmisaka 
975*437bfbebSnyanmisaka     hw_regs->h265d_addrs.reg216_colmv_cur_base = mpp_buffer_get_fd(mv_buf->buf[0]);
976*437bfbebSnyanmisaka #ifdef DUMP_VDPU384A_DATAS
977*437bfbebSnyanmisaka     {
978*437bfbebSnyanmisaka         char *cur_fname = "colmv_cur_frame.dat";
979*437bfbebSnyanmisaka         memset(dump_cur_fname_path, 0, sizeof(dump_cur_fname_path));
980*437bfbebSnyanmisaka         sprintf(dump_cur_fname_path, "%s/%s", dump_cur_dir, cur_fname);
981*437bfbebSnyanmisaka         dump_data_to_file(dump_cur_fname_path, (void *)mpp_buffer_get_ptr(mv_buf->buf[0]),
982*437bfbebSnyanmisaka                           mpp_buffer_get_size(mv_buf->buf[0]), 64, 0);
983*437bfbebSnyanmisaka     }
984*437bfbebSnyanmisaka #endif
985*437bfbebSnyanmisaka 
986*437bfbebSnyanmisaka     mpp_buf_slot_get_prop(reg_ctx->packet_slots, syn->dec.input, SLOT_BUFFER,
987*437bfbebSnyanmisaka                           &streambuf);
988*437bfbebSnyanmisaka     if ( dxva_ctx->bitstream == NULL) {
989*437bfbebSnyanmisaka         dxva_ctx->bitstream = mpp_buffer_get_ptr(streambuf);
990*437bfbebSnyanmisaka     }
991*437bfbebSnyanmisaka 
992*437bfbebSnyanmisaka #ifdef DUMP_VDPU384A_DATAS
993*437bfbebSnyanmisaka     {
994*437bfbebSnyanmisaka         char *cur_fname = "stream_in_128bit.dat";
995*437bfbebSnyanmisaka         memset(dump_cur_fname_path, 0, sizeof(dump_cur_fname_path));
996*437bfbebSnyanmisaka         sprintf(dump_cur_fname_path, "%s/%s", dump_cur_dir, cur_fname);
997*437bfbebSnyanmisaka         dump_data_to_file(dump_cur_fname_path, (void *)mpp_buffer_get_ptr(streambuf),
998*437bfbebSnyanmisaka                           mpp_buffer_get_size(streambuf), 128, 0);
999*437bfbebSnyanmisaka     }
1000*437bfbebSnyanmisaka #endif
1001*437bfbebSnyanmisaka 
1002*437bfbebSnyanmisaka     hw_regs->common_addr.reg128_strm_base = mpp_buffer_get_fd(streambuf);
1003*437bfbebSnyanmisaka     hw_regs->h265d_paras.reg66_stream_len = ((dxva_ctx->bitstream_size + 15) & (~15)) + 64;
1004*437bfbebSnyanmisaka     hw_regs->common_addr.reg129_stream_buf_st_base = mpp_buffer_get_fd(streambuf);
1005*437bfbebSnyanmisaka     hw_regs->common_addr.reg130_stream_buf_end_base = mpp_buffer_get_fd(streambuf);
1006*437bfbebSnyanmisaka     mpp_dev_set_reg_offset(reg_ctx->dev, 130, mpp_buffer_get_size(streambuf));
1007*437bfbebSnyanmisaka     aglin_offset =  hw_regs->h265d_paras.reg66_stream_len - dxva_ctx->bitstream_size;
1008*437bfbebSnyanmisaka     if (aglin_offset > 0)
1009*437bfbebSnyanmisaka         memset((void *)(dxva_ctx->bitstream + dxva_ctx->bitstream_size), 0, aglin_offset);
1010*437bfbebSnyanmisaka 
1011*437bfbebSnyanmisaka     /* common setting */
1012*437bfbebSnyanmisaka     hw_regs->ctrl_regs.reg8_dec_mode = 0; // hevc
1013*437bfbebSnyanmisaka     hw_regs->ctrl_regs.reg9.low_latency_en = 0;
1014*437bfbebSnyanmisaka 
1015*437bfbebSnyanmisaka     hw_regs->ctrl_regs.reg10.strmd_auto_gating_e      = 1;
1016*437bfbebSnyanmisaka     hw_regs->ctrl_regs.reg10.inter_auto_gating_e      = 1;
1017*437bfbebSnyanmisaka     hw_regs->ctrl_regs.reg10.intra_auto_gating_e      = 1;
1018*437bfbebSnyanmisaka     hw_regs->ctrl_regs.reg10.transd_auto_gating_e     = 1;
1019*437bfbebSnyanmisaka     hw_regs->ctrl_regs.reg10.recon_auto_gating_e      = 1;
1020*437bfbebSnyanmisaka     hw_regs->ctrl_regs.reg10.filterd_auto_gating_e    = 1;
1021*437bfbebSnyanmisaka     hw_regs->ctrl_regs.reg10.bus_auto_gating_e        = 1;
1022*437bfbebSnyanmisaka     hw_regs->ctrl_regs.reg10.ctrl_auto_gating_e       = 1;
1023*437bfbebSnyanmisaka     hw_regs->ctrl_regs.reg10.rcb_auto_gating_e        = 1;
1024*437bfbebSnyanmisaka     hw_regs->ctrl_regs.reg10.err_prc_auto_gating_e    = 1;
1025*437bfbebSnyanmisaka 
1026*437bfbebSnyanmisaka     hw_regs->ctrl_regs.reg11.rd_outstanding = 32;
1027*437bfbebSnyanmisaka     hw_regs->ctrl_regs.reg11.wr_outstanding = 250;
1028*437bfbebSnyanmisaka     // hw_regs->ctrl_regs.reg11.dec_timeout_dis = 1;
1029*437bfbebSnyanmisaka 
1030*437bfbebSnyanmisaka     hw_regs->ctrl_regs.reg16.error_proc_disable = 1;
1031*437bfbebSnyanmisaka     hw_regs->ctrl_regs.reg16.error_spread_disable = 0;
1032*437bfbebSnyanmisaka     hw_regs->ctrl_regs.reg16.roi_error_ctu_cal_en = 0;
1033*437bfbebSnyanmisaka 
1034*437bfbebSnyanmisaka     hw_regs->ctrl_regs.reg20_cabac_error_en_lowbits = 0xffffffff;
1035*437bfbebSnyanmisaka     hw_regs->ctrl_regs.reg21_cabac_error_en_highbits = 0x3ff3f9ff;
1036*437bfbebSnyanmisaka 
1037*437bfbebSnyanmisaka     hw_regs->ctrl_regs.reg13_core_timeout_threshold = 0xffff;
1038*437bfbebSnyanmisaka 
1039*437bfbebSnyanmisaka 
1040*437bfbebSnyanmisaka     /* output rkfbc64 */
1041*437bfbebSnyanmisaka     // valid_ref = hw_regs->h265d_addrs.reg168_dpb_decout_base;
1042*437bfbebSnyanmisaka     /* output raster/tile4x4 */
1043*437bfbebSnyanmisaka     valid_ref = hw_regs->common_addr.reg135_pp_m_decout_base;
1044*437bfbebSnyanmisaka     reg_ctx->error_index[syn->dec.reg_index] = dxva_ctx->pp.CurrPic.Index7Bits;
1045*437bfbebSnyanmisaka 
1046*437bfbebSnyanmisaka     hw_regs->h265d_addrs.reg169_error_ref_base = valid_ref;
1047*437bfbebSnyanmisaka     for (i = 0; i < (RK_S32)MPP_ARRAY_ELEMS(dxva_ctx->pp.RefPicList); i++) {
1048*437bfbebSnyanmisaka         if (dxva_ctx->pp.RefPicList[i].bPicEntry != 0xff &&
1049*437bfbebSnyanmisaka             dxva_ctx->pp.RefPicList[i].bPicEntry != 0x7f) {
1050*437bfbebSnyanmisaka 
1051*437bfbebSnyanmisaka             MppFrame mframe = NULL;
1052*437bfbebSnyanmisaka             mpp_buf_slot_get_prop(reg_ctx->slots,
1053*437bfbebSnyanmisaka                                   dxva_ctx->pp.RefPicList[i].Index7Bits,
1054*437bfbebSnyanmisaka                                   SLOT_BUFFER, &framebuf);
1055*437bfbebSnyanmisaka             mpp_buf_slot_get_prop(reg_ctx->slots, dxva_ctx->pp.RefPicList[i].Index7Bits,
1056*437bfbebSnyanmisaka                                   SLOT_FRAME_PTR, &mframe);
1057*437bfbebSnyanmisaka             if (mpp_frame_get_thumbnail_en(mframe) == MPP_FRAME_THUMBNAIL_ONLY) {
1058*437bfbebSnyanmisaka                 origin_buf = hal_bufs_get_buf(reg_ctx->origin_bufs,
1059*437bfbebSnyanmisaka                                               dxva_ctx->pp.RefPicList[i].Index7Bits);
1060*437bfbebSnyanmisaka                 framebuf = origin_buf->buf[0];
1061*437bfbebSnyanmisaka             }
1062*437bfbebSnyanmisaka             if (framebuf != NULL) {
1063*437bfbebSnyanmisaka                 hw_regs->h265d_addrs.reg170_185_ref_base[i] = mpp_buffer_get_fd(framebuf);
1064*437bfbebSnyanmisaka                 hw_regs->h265d_addrs.reg195_210_payload_st_ref_base[i] = mpp_buffer_get_fd(framebuf);
1065*437bfbebSnyanmisaka                 valid_ref = hw_regs->h265d_addrs.reg170_185_ref_base[i];
1066*437bfbebSnyanmisaka                 if ((pocdistance(dxva_ctx->pp.PicOrderCntValList[i], dxva_ctx->pp.current_poc) < distance)
1067*437bfbebSnyanmisaka                     && (!mpp_frame_get_errinfo(mframe))) {
1068*437bfbebSnyanmisaka 
1069*437bfbebSnyanmisaka                     distance = pocdistance(dxva_ctx->pp.PicOrderCntValList[i], dxva_ctx->pp.current_poc);
1070*437bfbebSnyanmisaka                     hw_regs->h265d_addrs.reg169_error_ref_base = hw_regs->h265d_addrs.reg170_185_ref_base[i];
1071*437bfbebSnyanmisaka                     reg_ctx->error_index[syn->dec.reg_index] = dxva_ctx->pp.RefPicList[i].Index7Bits;
1072*437bfbebSnyanmisaka                     hw_regs->ctrl_regs.reg16.error_proc_disable = 1;
1073*437bfbebSnyanmisaka                 }
1074*437bfbebSnyanmisaka             } else {
1075*437bfbebSnyanmisaka                 hw_regs->h265d_addrs.reg170_185_ref_base[i] = valid_ref;
1076*437bfbebSnyanmisaka                 hw_regs->h265d_addrs.reg195_210_payload_st_ref_base[i] = valid_ref;
1077*437bfbebSnyanmisaka             }
1078*437bfbebSnyanmisaka 
1079*437bfbebSnyanmisaka             mv_buf = hal_bufs_get_buf(reg_ctx->cmv_bufs, dxva_ctx->pp.RefPicList[i].Index7Bits);
1080*437bfbebSnyanmisaka             hw_regs->h265d_addrs.reg217_232_colmv_ref_base[i] = mpp_buffer_get_fd(mv_buf->buf[0]);
1081*437bfbebSnyanmisaka         }
1082*437bfbebSnyanmisaka     }
1083*437bfbebSnyanmisaka 
1084*437bfbebSnyanmisaka     if ((reg_ctx->error_index[syn->dec.reg_index] == dxva_ctx->pp.CurrPic.Index7Bits) &&
1085*437bfbebSnyanmisaka         !dxva_ctx->pp.IntraPicFlag) {
1086*437bfbebSnyanmisaka         h265h_dbg(H265H_DBG_TASK_ERR, "current frm may be err, should skip process");
1087*437bfbebSnyanmisaka         syn->dec.flags.ref_err = 1;
1088*437bfbebSnyanmisaka         return MPP_OK;
1089*437bfbebSnyanmisaka     }
1090*437bfbebSnyanmisaka 
1091*437bfbebSnyanmisaka     /* pps */
1092*437bfbebSnyanmisaka     hw_regs->common_addr.reg131_gbl_base = reg_ctx->bufs_fd;
1093*437bfbebSnyanmisaka     hw_regs->h265d_paras.reg67_global_len = SPSPPS_ALIGNED_SIZE / 16;
1094*437bfbebSnyanmisaka 
1095*437bfbebSnyanmisaka     mpp_dev_set_reg_offset(reg_ctx->dev, 131, reg_ctx->spspps_offset);
1096*437bfbebSnyanmisaka 
1097*437bfbebSnyanmisaka     hal_h265d_v345_output_pps_packet(hal, syn->dec.syntax.data);
1098*437bfbebSnyanmisaka 
1099*437bfbebSnyanmisaka     for (i = 0; i < (RK_S32)MPP_ARRAY_ELEMS(dxva_ctx->pp.RefPicList); i++) {
1100*437bfbebSnyanmisaka 
1101*437bfbebSnyanmisaka         if (dxva_ctx->pp.RefPicList[i].bPicEntry != 0xff &&
1102*437bfbebSnyanmisaka             dxva_ctx->pp.RefPicList[i].bPicEntry != 0x7f) {
1103*437bfbebSnyanmisaka             MppFrame mframe = NULL;
1104*437bfbebSnyanmisaka 
1105*437bfbebSnyanmisaka             mpp_buf_slot_get_prop(reg_ctx->slots,
1106*437bfbebSnyanmisaka                                   dxva_ctx->pp.RefPicList[i].Index7Bits,
1107*437bfbebSnyanmisaka                                   SLOT_BUFFER, &framebuf);
1108*437bfbebSnyanmisaka 
1109*437bfbebSnyanmisaka             mpp_buf_slot_get_prop(reg_ctx->slots, dxva_ctx->pp.RefPicList[i].Index7Bits,
1110*437bfbebSnyanmisaka                                   SLOT_FRAME_PTR, &mframe);
1111*437bfbebSnyanmisaka 
1112*437bfbebSnyanmisaka             if (framebuf == NULL || mpp_frame_get_errinfo(mframe)) {
1113*437bfbebSnyanmisaka                 mv_buf = hal_bufs_get_buf(reg_ctx->cmv_bufs, reg_ctx->error_index[syn->dec.reg_index]);
1114*437bfbebSnyanmisaka                 hw_regs->h265d_addrs.reg170_185_ref_base[i] = hw_regs->h265d_addrs.reg169_error_ref_base;
1115*437bfbebSnyanmisaka                 hw_regs->h265d_addrs.reg195_210_payload_st_ref_base[i] = hw_regs->h265d_addrs.reg169_error_ref_base;
1116*437bfbebSnyanmisaka                 hw_regs->h265d_addrs.reg217_232_colmv_ref_base[i] = mpp_buffer_get_fd(mv_buf->buf[0]);
1117*437bfbebSnyanmisaka             }
1118*437bfbebSnyanmisaka         } else {
1119*437bfbebSnyanmisaka             mv_buf = hal_bufs_get_buf(reg_ctx->cmv_bufs, reg_ctx->error_index[syn->dec.reg_index]);
1120*437bfbebSnyanmisaka             hw_regs->h265d_addrs.reg170_185_ref_base[i] = hw_regs->h265d_addrs.reg169_error_ref_base;
1121*437bfbebSnyanmisaka             hw_regs->h265d_addrs.reg195_210_payload_st_ref_base[i] = hw_regs->h265d_addrs.reg169_error_ref_base;
1122*437bfbebSnyanmisaka             hw_regs->h265d_addrs.reg217_232_colmv_ref_base[i] = mpp_buffer_get_fd(mv_buf->buf[0]);
1123*437bfbebSnyanmisaka         }
1124*437bfbebSnyanmisaka     }
1125*437bfbebSnyanmisaka 
1126*437bfbebSnyanmisaka     hal_h265d_rcb_info_update(hal, dxva_ctx, hw_regs, width, height);
1127*437bfbebSnyanmisaka     vdpu384a_setup_rcb(&hw_regs->common_addr, reg_ctx->dev, reg_ctx->fast_mode ?
1128*437bfbebSnyanmisaka                        reg_ctx->rcb_buf[syn->dec.reg_index] : reg_ctx->rcb_buf[0],
1129*437bfbebSnyanmisaka                        (Vdpu384aRcbInfo *)reg_ctx->rcb_info);
1130*437bfbebSnyanmisaka     vdpu384a_setup_statistic(&hw_regs->ctrl_regs);
1131*437bfbebSnyanmisaka     mpp_buffer_sync_end(reg_ctx->bufs);
1132*437bfbebSnyanmisaka 
1133*437bfbebSnyanmisaka     {
1134*437bfbebSnyanmisaka         //scale down config
1135*437bfbebSnyanmisaka         MppFrame mframe = NULL;
1136*437bfbebSnyanmisaka         MppBuffer mbuffer = NULL;
1137*437bfbebSnyanmisaka         MppFrameThumbnailMode thumbnail_mode;
1138*437bfbebSnyanmisaka 
1139*437bfbebSnyanmisaka         mpp_buf_slot_get_prop(reg_ctx->slots, dxva_ctx->pp.CurrPic.Index7Bits,
1140*437bfbebSnyanmisaka                               SLOT_BUFFER, &mbuffer);
1141*437bfbebSnyanmisaka         mpp_buf_slot_get_prop(reg_ctx->slots, dxva_ctx->pp.CurrPic.Index7Bits,
1142*437bfbebSnyanmisaka                               SLOT_FRAME_PTR, &mframe);
1143*437bfbebSnyanmisaka         thumbnail_mode = mpp_frame_get_thumbnail_en(mframe);
1144*437bfbebSnyanmisaka         switch (thumbnail_mode) {
1145*437bfbebSnyanmisaka         case MPP_FRAME_THUMBNAIL_ONLY:
1146*437bfbebSnyanmisaka             hw_regs->common_addr.reg133_scale_down_base = mpp_buffer_get_fd(mbuffer);
1147*437bfbebSnyanmisaka             origin_buf = hal_bufs_get_buf(reg_ctx->origin_bufs, dxva_ctx->pp.CurrPic.Index7Bits);
1148*437bfbebSnyanmisaka             fd = mpp_buffer_get_fd(origin_buf->buf[0]);
1149*437bfbebSnyanmisaka             /* output rkfbc64 */
1150*437bfbebSnyanmisaka             // hw_regs->h265d_addrs.reg168_dpb_decout_base = fd;
1151*437bfbebSnyanmisaka             /* output raster/tile4x4 */
1152*437bfbebSnyanmisaka             hw_regs->common_addr.reg135_pp_m_decout_base = fd;
1153*437bfbebSnyanmisaka             hw_regs->h265d_addrs.reg192_dpb_payload64x4_st_cur_base = fd;
1154*437bfbebSnyanmisaka             hw_regs->h265d_addrs.reg169_error_ref_base = fd;
1155*437bfbebSnyanmisaka             vdpu384a_setup_down_scale(mframe, reg_ctx->dev, &hw_regs->ctrl_regs, (void*)&hw_regs->h265d_paras);
1156*437bfbebSnyanmisaka             break;
1157*437bfbebSnyanmisaka         case MPP_FRAME_THUMBNAIL_MIXED:
1158*437bfbebSnyanmisaka             hw_regs->common_addr.reg133_scale_down_base = mpp_buffer_get_fd(mbuffer);
1159*437bfbebSnyanmisaka             vdpu384a_setup_down_scale(mframe, reg_ctx->dev, &hw_regs->ctrl_regs, (void*)&hw_regs->h265d_paras);
1160*437bfbebSnyanmisaka             break;
1161*437bfbebSnyanmisaka         case MPP_FRAME_THUMBNAIL_NONE:
1162*437bfbebSnyanmisaka         default:
1163*437bfbebSnyanmisaka             hw_regs->ctrl_regs.reg9.scale_down_en = 0;
1164*437bfbebSnyanmisaka             break;
1165*437bfbebSnyanmisaka         }
1166*437bfbebSnyanmisaka     }
1167*437bfbebSnyanmisaka 
1168*437bfbebSnyanmisaka     return ret;
1169*437bfbebSnyanmisaka }
1170*437bfbebSnyanmisaka 
hal_h265d_vdpu384a_start(void * hal,HalTaskInfo * task)1171*437bfbebSnyanmisaka static MPP_RET hal_h265d_vdpu384a_start(void *hal, HalTaskInfo *task)
1172*437bfbebSnyanmisaka {
1173*437bfbebSnyanmisaka     MPP_RET ret = MPP_OK;
1174*437bfbebSnyanmisaka     RK_U8* p = NULL;
1175*437bfbebSnyanmisaka     Vdpu384aH265dRegSet *hw_regs = NULL;
1176*437bfbebSnyanmisaka     HalH265dCtx *reg_ctx = (HalH265dCtx *)hal;
1177*437bfbebSnyanmisaka     RK_S32 index =  task->dec.reg_index;
1178*437bfbebSnyanmisaka 
1179*437bfbebSnyanmisaka     RK_U32 i;
1180*437bfbebSnyanmisaka 
1181*437bfbebSnyanmisaka     if (task->dec.flags.parse_err ||
1182*437bfbebSnyanmisaka         (task->dec.flags.ref_err && !reg_ctx->cfg->base.disable_error)) {
1183*437bfbebSnyanmisaka         h265h_dbg(H265H_DBG_TASK_ERR, "%s found task error\n", __FUNCTION__);
1184*437bfbebSnyanmisaka         return MPP_OK;
1185*437bfbebSnyanmisaka     }
1186*437bfbebSnyanmisaka 
1187*437bfbebSnyanmisaka     if (reg_ctx->fast_mode) {
1188*437bfbebSnyanmisaka         p = (RK_U8*)reg_ctx->g_buf[index].hw_regs;
1189*437bfbebSnyanmisaka         hw_regs = ( Vdpu384aH265dRegSet *)reg_ctx->g_buf[index].hw_regs;
1190*437bfbebSnyanmisaka     } else {
1191*437bfbebSnyanmisaka         p = (RK_U8*)reg_ctx->hw_regs;
1192*437bfbebSnyanmisaka         hw_regs = ( Vdpu384aH265dRegSet *)reg_ctx->hw_regs;
1193*437bfbebSnyanmisaka     }
1194*437bfbebSnyanmisaka 
1195*437bfbebSnyanmisaka     if (hw_regs == NULL) {
1196*437bfbebSnyanmisaka         mpp_err("hal_h265d_start hw_regs is NULL");
1197*437bfbebSnyanmisaka         return MPP_ERR_NULL_PTR;
1198*437bfbebSnyanmisaka     }
1199*437bfbebSnyanmisaka     for (i = 0; i < 68; i++) {
1200*437bfbebSnyanmisaka         h265h_dbg(H265H_DBG_REG, "RK_HEVC_DEC: regs[%02d]=%08X\n",
1201*437bfbebSnyanmisaka                   i, *((RK_U32*)p));
1202*437bfbebSnyanmisaka         //mpp_log("RK_HEVC_DEC: regs[%02d]=%08X\n", i, *((RK_U32*)p));
1203*437bfbebSnyanmisaka         p += 4;
1204*437bfbebSnyanmisaka     }
1205*437bfbebSnyanmisaka 
1206*437bfbebSnyanmisaka     do {
1207*437bfbebSnyanmisaka         MppDevRegWrCfg wr_cfg;
1208*437bfbebSnyanmisaka         MppDevRegRdCfg rd_cfg;
1209*437bfbebSnyanmisaka 
1210*437bfbebSnyanmisaka         wr_cfg.reg = &hw_regs->ctrl_regs;
1211*437bfbebSnyanmisaka         wr_cfg.size = sizeof(hw_regs->ctrl_regs);
1212*437bfbebSnyanmisaka         wr_cfg.offset = OFFSET_CTRL_REGS;
1213*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_REG_WR, &wr_cfg);
1214*437bfbebSnyanmisaka         if (ret) {
1215*437bfbebSnyanmisaka             mpp_err_f("set register read failed %d\n", ret);
1216*437bfbebSnyanmisaka             break;
1217*437bfbebSnyanmisaka         }
1218*437bfbebSnyanmisaka 
1219*437bfbebSnyanmisaka         wr_cfg.reg = &hw_regs->common_addr;
1220*437bfbebSnyanmisaka         wr_cfg.size = sizeof(hw_regs->common_addr);
1221*437bfbebSnyanmisaka         wr_cfg.offset = OFFSET_COMMON_ADDR_REGS;
1222*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_REG_WR, &wr_cfg);
1223*437bfbebSnyanmisaka         if (ret) {
1224*437bfbebSnyanmisaka             mpp_err_f("set register write failed %d\n", ret);
1225*437bfbebSnyanmisaka             break;
1226*437bfbebSnyanmisaka         }
1227*437bfbebSnyanmisaka 
1228*437bfbebSnyanmisaka         wr_cfg.reg = &hw_regs->h265d_paras;
1229*437bfbebSnyanmisaka         wr_cfg.size = sizeof(hw_regs->h265d_paras);
1230*437bfbebSnyanmisaka         wr_cfg.offset = OFFSET_CODEC_PARAS_REGS;
1231*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_REG_WR, &wr_cfg);
1232*437bfbebSnyanmisaka         if (ret) {
1233*437bfbebSnyanmisaka             mpp_err_f("set register write failed %d\n", ret);
1234*437bfbebSnyanmisaka             break;
1235*437bfbebSnyanmisaka         }
1236*437bfbebSnyanmisaka 
1237*437bfbebSnyanmisaka         wr_cfg.reg = &hw_regs->h265d_addrs;
1238*437bfbebSnyanmisaka         wr_cfg.size = sizeof(hw_regs->h265d_addrs);
1239*437bfbebSnyanmisaka         wr_cfg.offset = OFFSET_CODEC_ADDR_REGS;
1240*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_REG_WR, &wr_cfg);
1241*437bfbebSnyanmisaka         if (ret) {
1242*437bfbebSnyanmisaka             mpp_err_f("set register write failed %d\n", ret);
1243*437bfbebSnyanmisaka             break;
1244*437bfbebSnyanmisaka         }
1245*437bfbebSnyanmisaka 
1246*437bfbebSnyanmisaka         rd_cfg.reg = &hw_regs->ctrl_regs.reg15;
1247*437bfbebSnyanmisaka         rd_cfg.size = sizeof(hw_regs->ctrl_regs.reg15);
1248*437bfbebSnyanmisaka         rd_cfg.offset = OFFSET_INTERRUPT_REGS;
1249*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_REG_RD, &rd_cfg);
1250*437bfbebSnyanmisaka         if (ret) {
1251*437bfbebSnyanmisaka             mpp_err_f("set register read failed %d\n", ret);
1252*437bfbebSnyanmisaka             break;
1253*437bfbebSnyanmisaka         }
1254*437bfbebSnyanmisaka 
1255*437bfbebSnyanmisaka         /* rcb info for sram */
1256*437bfbebSnyanmisaka         vdpu384a_set_rcbinfo(reg_ctx->dev, (Vdpu384aRcbInfo*)reg_ctx->rcb_info);
1257*437bfbebSnyanmisaka 
1258*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_CMD_SEND, NULL);
1259*437bfbebSnyanmisaka         if (ret) {
1260*437bfbebSnyanmisaka             mpp_err_f("send cmd failed %d\n", ret);
1261*437bfbebSnyanmisaka             break;
1262*437bfbebSnyanmisaka         }
1263*437bfbebSnyanmisaka     } while (0);
1264*437bfbebSnyanmisaka 
1265*437bfbebSnyanmisaka     return ret;
1266*437bfbebSnyanmisaka }
1267*437bfbebSnyanmisaka 
1268*437bfbebSnyanmisaka 
hal_h265d_vdpu384a_wait(void * hal,HalTaskInfo * task)1269*437bfbebSnyanmisaka static MPP_RET hal_h265d_vdpu384a_wait(void *hal, HalTaskInfo *task)
1270*437bfbebSnyanmisaka {
1271*437bfbebSnyanmisaka     MPP_RET ret = MPP_OK;
1272*437bfbebSnyanmisaka     RK_S32 index =  task->dec.reg_index;
1273*437bfbebSnyanmisaka     HalH265dCtx *reg_ctx = (HalH265dCtx *)hal;
1274*437bfbebSnyanmisaka     RK_U8* p = NULL;
1275*437bfbebSnyanmisaka     Vdpu384aH265dRegSet *hw_regs = NULL;
1276*437bfbebSnyanmisaka     RK_S32 i;
1277*437bfbebSnyanmisaka 
1278*437bfbebSnyanmisaka     if (reg_ctx->fast_mode) {
1279*437bfbebSnyanmisaka         hw_regs = ( Vdpu384aH265dRegSet *)reg_ctx->g_buf[index].hw_regs;
1280*437bfbebSnyanmisaka     } else {
1281*437bfbebSnyanmisaka         hw_regs = ( Vdpu384aH265dRegSet *)reg_ctx->hw_regs;
1282*437bfbebSnyanmisaka     }
1283*437bfbebSnyanmisaka 
1284*437bfbebSnyanmisaka     p = (RK_U8*)hw_regs;
1285*437bfbebSnyanmisaka 
1286*437bfbebSnyanmisaka     if (task->dec.flags.parse_err ||
1287*437bfbebSnyanmisaka         (task->dec.flags.ref_err && !reg_ctx->cfg->base.disable_error)) {
1288*437bfbebSnyanmisaka         h265h_dbg(H265H_DBG_TASK_ERR, "%s found task error\n", __FUNCTION__);
1289*437bfbebSnyanmisaka         goto ERR_PROC;
1290*437bfbebSnyanmisaka     }
1291*437bfbebSnyanmisaka 
1292*437bfbebSnyanmisaka     ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_CMD_POLL, NULL);
1293*437bfbebSnyanmisaka     if (ret)
1294*437bfbebSnyanmisaka         mpp_err_f("poll cmd failed %d\n", ret);
1295*437bfbebSnyanmisaka 
1296*437bfbebSnyanmisaka ERR_PROC:
1297*437bfbebSnyanmisaka     if (task->dec.flags.parse_err ||
1298*437bfbebSnyanmisaka         task->dec.flags.ref_err ||
1299*437bfbebSnyanmisaka         (!hw_regs->ctrl_regs.reg15.rkvdec_frame_rdy_sta) ||
1300*437bfbebSnyanmisaka         hw_regs->ctrl_regs.reg15.rkvdec_strm_error_sta ||
1301*437bfbebSnyanmisaka         hw_regs->ctrl_regs.reg15.rkvdec_core_timeout_sta ||
1302*437bfbebSnyanmisaka         hw_regs->ctrl_regs.reg15.rkvdec_ip_timeout_sta ||
1303*437bfbebSnyanmisaka         hw_regs->ctrl_regs.reg15.rkvdec_bus_error_sta ||
1304*437bfbebSnyanmisaka         hw_regs->ctrl_regs.reg15.rkvdec_buffer_empty_sta ||
1305*437bfbebSnyanmisaka         hw_regs->ctrl_regs.reg15.rkvdec_colmv_ref_error_sta) {
1306*437bfbebSnyanmisaka         if (!reg_ctx->fast_mode) {
1307*437bfbebSnyanmisaka             if (reg_ctx->dec_cb)
1308*437bfbebSnyanmisaka                 mpp_callback(reg_ctx->dec_cb, &task->dec);
1309*437bfbebSnyanmisaka         } else {
1310*437bfbebSnyanmisaka             MppFrame mframe = NULL;
1311*437bfbebSnyanmisaka             mpp_buf_slot_get_prop(reg_ctx->slots, task->dec.output,
1312*437bfbebSnyanmisaka                                   SLOT_FRAME_PTR, &mframe);
1313*437bfbebSnyanmisaka             if (mframe) {
1314*437bfbebSnyanmisaka                 reg_ctx->fast_mode_err_found = 1;
1315*437bfbebSnyanmisaka                 mpp_frame_set_errinfo(mframe, 1);
1316*437bfbebSnyanmisaka             }
1317*437bfbebSnyanmisaka         }
1318*437bfbebSnyanmisaka     } else {
1319*437bfbebSnyanmisaka         if (reg_ctx->fast_mode && reg_ctx->fast_mode_err_found) {
1320*437bfbebSnyanmisaka             for (i = 0; i < (RK_S32)MPP_ARRAY_ELEMS(task->dec.refer); i++) {
1321*437bfbebSnyanmisaka                 if (task->dec.refer[i] >= 0) {
1322*437bfbebSnyanmisaka                     MppFrame frame_ref = NULL;
1323*437bfbebSnyanmisaka 
1324*437bfbebSnyanmisaka                     mpp_buf_slot_get_prop(reg_ctx->slots, task->dec.refer[i],
1325*437bfbebSnyanmisaka                                           SLOT_FRAME_PTR, &frame_ref);
1326*437bfbebSnyanmisaka                     h265h_dbg(H265H_DBG_FAST_ERR, "refer[%d] %d frame %p\n",
1327*437bfbebSnyanmisaka                               i, task->dec.refer[i], frame_ref);
1328*437bfbebSnyanmisaka                     if (frame_ref && mpp_frame_get_errinfo(frame_ref)) {
1329*437bfbebSnyanmisaka                         MppFrame frame_out = NULL;
1330*437bfbebSnyanmisaka                         mpp_buf_slot_get_prop(reg_ctx->slots, task->dec.output,
1331*437bfbebSnyanmisaka                                               SLOT_FRAME_PTR, &frame_out);
1332*437bfbebSnyanmisaka                         mpp_frame_set_errinfo(frame_out, 1);
1333*437bfbebSnyanmisaka                         break;
1334*437bfbebSnyanmisaka                     }
1335*437bfbebSnyanmisaka                 }
1336*437bfbebSnyanmisaka             }
1337*437bfbebSnyanmisaka         }
1338*437bfbebSnyanmisaka     }
1339*437bfbebSnyanmisaka 
1340*437bfbebSnyanmisaka     for (i = 0; i < 68; i++) {
1341*437bfbebSnyanmisaka         if (i == 1) {
1342*437bfbebSnyanmisaka             h265h_dbg(H265H_DBG_REG, "RK_HEVC_DEC: regs[%02d]=%08X\n",
1343*437bfbebSnyanmisaka                       i, *((RK_U32*)p));
1344*437bfbebSnyanmisaka         }
1345*437bfbebSnyanmisaka 
1346*437bfbebSnyanmisaka         if (i == 45) {
1347*437bfbebSnyanmisaka             h265h_dbg(H265H_DBG_REG, "RK_HEVC_DEC: regs[%02d]=%08X\n",
1348*437bfbebSnyanmisaka                       i, *((RK_U32*)p));
1349*437bfbebSnyanmisaka         }
1350*437bfbebSnyanmisaka         p += 4;
1351*437bfbebSnyanmisaka     }
1352*437bfbebSnyanmisaka 
1353*437bfbebSnyanmisaka     if (reg_ctx->fast_mode) {
1354*437bfbebSnyanmisaka         reg_ctx->g_buf[index].use_flag = 0;
1355*437bfbebSnyanmisaka     }
1356*437bfbebSnyanmisaka 
1357*437bfbebSnyanmisaka     return ret;
1358*437bfbebSnyanmisaka }
1359*437bfbebSnyanmisaka 
hal_h265d_vdpu384a_reset(void * hal)1360*437bfbebSnyanmisaka static MPP_RET hal_h265d_vdpu384a_reset(void *hal)
1361*437bfbebSnyanmisaka {
1362*437bfbebSnyanmisaka     MPP_RET ret = MPP_OK;
1363*437bfbebSnyanmisaka     HalH265dCtx *p_hal = (HalH265dCtx *)hal;
1364*437bfbebSnyanmisaka     p_hal->fast_mode_err_found = 0;
1365*437bfbebSnyanmisaka     (void)hal;
1366*437bfbebSnyanmisaka     return ret;
1367*437bfbebSnyanmisaka }
1368*437bfbebSnyanmisaka 
hal_h265d_vdpu384a_flush(void * hal)1369*437bfbebSnyanmisaka static MPP_RET hal_h265d_vdpu384a_flush(void *hal)
1370*437bfbebSnyanmisaka {
1371*437bfbebSnyanmisaka     MPP_RET ret = MPP_OK;
1372*437bfbebSnyanmisaka 
1373*437bfbebSnyanmisaka     (void)hal;
1374*437bfbebSnyanmisaka     return ret;
1375*437bfbebSnyanmisaka }
1376*437bfbebSnyanmisaka 
hal_h265d_vdpu384a_control(void * hal,MpiCmd cmd_type,void * param)1377*437bfbebSnyanmisaka static MPP_RET hal_h265d_vdpu384a_control(void *hal, MpiCmd cmd_type, void *param)
1378*437bfbebSnyanmisaka {
1379*437bfbebSnyanmisaka     MPP_RET ret = MPP_OK;
1380*437bfbebSnyanmisaka     HalH265dCtx *p_hal = (HalH265dCtx *)hal;
1381*437bfbebSnyanmisaka 
1382*437bfbebSnyanmisaka     (void)hal;
1383*437bfbebSnyanmisaka     (void)param;
1384*437bfbebSnyanmisaka     switch ((MpiCmd)cmd_type) {
1385*437bfbebSnyanmisaka     case MPP_DEC_SET_FRAME_INFO: {
1386*437bfbebSnyanmisaka         MppFrame frame = (MppFrame)param;
1387*437bfbebSnyanmisaka         MppFrameFormat fmt = mpp_frame_get_fmt(frame);
1388*437bfbebSnyanmisaka         RK_U32 imgwidth = mpp_frame_get_width((MppFrame)param);
1389*437bfbebSnyanmisaka         RK_U32 imgheight = mpp_frame_get_height((MppFrame)param);
1390*437bfbebSnyanmisaka 
1391*437bfbebSnyanmisaka         if (fmt == MPP_FMT_YUV422SP) {
1392*437bfbebSnyanmisaka             mpp_slots_set_prop(p_hal->slots, SLOTS_LEN_ALIGN, rkv_len_align_422);
1393*437bfbebSnyanmisaka         } else if (fmt == MPP_FMT_YUV444SP) {
1394*437bfbebSnyanmisaka             mpp_slots_set_prop(p_hal->slots, SLOTS_LEN_ALIGN, rkv_len_align_444);
1395*437bfbebSnyanmisaka         }
1396*437bfbebSnyanmisaka         if (MPP_FRAME_FMT_IS_FBC(fmt)) {
1397*437bfbebSnyanmisaka             vdpu384a_afbc_align_calc(p_hal->slots, frame, 16);
1398*437bfbebSnyanmisaka         } else if (imgwidth > 1920 || imgheight > 1088) {
1399*437bfbebSnyanmisaka             mpp_slots_set_prop(p_hal->slots, SLOTS_HOR_ALIGN, mpp_align_128_odd_plus_64);
1400*437bfbebSnyanmisaka         }
1401*437bfbebSnyanmisaka         break;
1402*437bfbebSnyanmisaka     }
1403*437bfbebSnyanmisaka     case MPP_DEC_GET_THUMBNAIL_FRAME_INFO: {
1404*437bfbebSnyanmisaka         vdpu384a_update_thumbnail_frame_info((MppFrame)param);
1405*437bfbebSnyanmisaka     } break;
1406*437bfbebSnyanmisaka     case MPP_DEC_SET_OUTPUT_FORMAT: {
1407*437bfbebSnyanmisaka     } break;
1408*437bfbebSnyanmisaka     default: {
1409*437bfbebSnyanmisaka     } break;
1410*437bfbebSnyanmisaka     }
1411*437bfbebSnyanmisaka     return  ret;
1412*437bfbebSnyanmisaka }
1413*437bfbebSnyanmisaka 
1414*437bfbebSnyanmisaka const MppHalApi hal_h265d_vdpu384a = {
1415*437bfbebSnyanmisaka     .name = "h265d_vdpu384a",
1416*437bfbebSnyanmisaka     .type = MPP_CTX_DEC,
1417*437bfbebSnyanmisaka     .coding = MPP_VIDEO_CodingHEVC,
1418*437bfbebSnyanmisaka     .ctx_size = sizeof(HalH265dCtx),
1419*437bfbebSnyanmisaka     .flag = 0,
1420*437bfbebSnyanmisaka     .init = hal_h265d_vdpu384a_init,
1421*437bfbebSnyanmisaka     .deinit = hal_h265d_vdpu384a_deinit,
1422*437bfbebSnyanmisaka     .reg_gen = hal_h265d_vdpu384a_gen_regs,
1423*437bfbebSnyanmisaka     .start = hal_h265d_vdpu384a_start,
1424*437bfbebSnyanmisaka     .wait = hal_h265d_vdpu384a_wait,
1425*437bfbebSnyanmisaka     .reset = hal_h265d_vdpu384a_reset,
1426*437bfbebSnyanmisaka     .flush = hal_h265d_vdpu384a_flush,
1427*437bfbebSnyanmisaka     .control = hal_h265d_vdpu384a_control,
1428*437bfbebSnyanmisaka };
1429