1*437bfbebSnyanmisaka /* SPDX-License-Identifier: Apache-2.0 OR MIT */
2*437bfbebSnyanmisaka /*
3*437bfbebSnyanmisaka * Copyright (c) 2024 Rockchip Electronics Co., Ltd.
4*437bfbebSnyanmisaka */
5*437bfbebSnyanmisaka
6*437bfbebSnyanmisaka #define MODULE_TAG "hal_h265d_vdpu383"
7*437bfbebSnyanmisaka
8*437bfbebSnyanmisaka #include <stdio.h>
9*437bfbebSnyanmisaka #include <string.h>
10*437bfbebSnyanmisaka #include <unistd.h>
11*437bfbebSnyanmisaka #include <stdarg.h>
12*437bfbebSnyanmisaka #include <inttypes.h>
13*437bfbebSnyanmisaka #include <ctype.h>
14*437bfbebSnyanmisaka #include <sys/stat.h>
15*437bfbebSnyanmisaka #include <sys/types.h>
16*437bfbebSnyanmisaka
17*437bfbebSnyanmisaka #include "mpp_env.h"
18*437bfbebSnyanmisaka #include "mpp_mem.h"
19*437bfbebSnyanmisaka #include "mpp_bitread.h"
20*437bfbebSnyanmisaka #include "mpp_bitput.h"
21*437bfbebSnyanmisaka #include "mpp_buffer_impl.h"
22*437bfbebSnyanmisaka
23*437bfbebSnyanmisaka #include "h265d_syntax.h"
24*437bfbebSnyanmisaka #include "hal_h265d_debug.h"
25*437bfbebSnyanmisaka #include "hal_h265d_ctx.h"
26*437bfbebSnyanmisaka #include "hal_h265d_com.h"
27*437bfbebSnyanmisaka #include "hal_h265d_vdpu383.h"
28*437bfbebSnyanmisaka #include "vdpu383_h265d.h"
29*437bfbebSnyanmisaka #include "vdpu383_com.h"
30*437bfbebSnyanmisaka
31*437bfbebSnyanmisaka #define HW_RPS
32*437bfbebSnyanmisaka #define PPS_SIZE (112 * 64)//(96x64)
33*437bfbebSnyanmisaka
34*437bfbebSnyanmisaka #define FMT 4
35*437bfbebSnyanmisaka #define CTU 3
36*437bfbebSnyanmisaka
37*437bfbebSnyanmisaka typedef struct {
38*437bfbebSnyanmisaka RK_U32 a;
39*437bfbebSnyanmisaka RK_U32 b;
40*437bfbebSnyanmisaka } FilterdColBufRatio;
41*437bfbebSnyanmisaka
42*437bfbebSnyanmisaka #if 0
43*437bfbebSnyanmisaka static const FilterdColBufRatio filterd_fbc_on[CTU][FMT] = {
44*437bfbebSnyanmisaka /* 400 420 422 444 */
45*437bfbebSnyanmisaka {{0, 0}, {27, 15}, {36, 15}, {52, 15}}, //ctu 16
46*437bfbebSnyanmisaka {{0, 0}, {27, 8}, {36, 8}, {52, 8}}, //ctu 32
47*437bfbebSnyanmisaka {{0, 0}, {27, 5}, {36, 5}, {52, 5}} //ctu 64
48*437bfbebSnyanmisaka };
49*437bfbebSnyanmisaka
50*437bfbebSnyanmisaka static const FilterdColBufRatio filterd_fbc_off[CTU][FMT] = {
51*437bfbebSnyanmisaka /* 400 420 422 444 */
52*437bfbebSnyanmisaka {{0, 0}, {9, 31}, {12, 39}, {12, 39}}, //ctu 16
53*437bfbebSnyanmisaka {{0, 0}, {9, 25}, {12, 33}, {12, 33}}, //ctu 32
54*437bfbebSnyanmisaka {{0, 0}, {9, 21}, {12, 29}, {12, 29}} //ctu 64
55*437bfbebSnyanmisaka };
56*437bfbebSnyanmisaka #endif
57*437bfbebSnyanmisaka
/*
 * Layout of the single hardware info buffer:
 *
 *   [ cabac table ][ info set 0 ][ info set 1 ] ...
 *
 * where every info set is [ sps/pps ][ rps ][ scaling list ].
 * Each region size is passed through MPP_ALIGN(..., SZ_4K).
 */
#define CABAC_TAB_ALIGEND_SIZE  (MPP_ALIGN(27456, SZ_4K))
#define SPSPPS_ALIGNED_SIZE     (MPP_ALIGN(176, SZ_4K))
#define RPS_ALIGEND_SIZE        (MPP_ALIGN(400 * 8, SZ_4K))
#define SCALIST_ALIGNED_SIZE    (MPP_ALIGN(81 * 1360, SZ_4K))
#define INFO_BUFFER_SIZE        (SPSPPS_ALIGNED_SIZE + RPS_ALIGEND_SIZE + SCALIST_ALIGNED_SIZE)
/* Total size for the cabac table plus 'cnt' info sets; 'cnt' is parenthesized so expressions are safe. */
#define ALL_BUFFER_SIZE(cnt)    (CABAC_TAB_ALIGEND_SIZE + INFO_BUFFER_SIZE * (cnt))

/* Byte offsets of each region for info set number 'pos' (0-based). */
#define CABAC_TAB_OFFSET        (0)
#define SPSPPS_OFFSET(pos)      (CABAC_TAB_OFFSET + CABAC_TAB_ALIGEND_SIZE + (INFO_BUFFER_SIZE * (pos)))
#define RPS_OFFSET(pos)         (SPSPPS_OFFSET(pos) + SPSPPS_ALIGNED_SIZE)
#define SCALIST_OFFSET(pos)     (RPS_OFFSET(pos) + RPS_ALIGEND_SIZE)

/* Absolute difference of two values; note that each argument is evaluated twice. */
#define pocdistance(a, b)       (((a) > (b)) ? ((a) - (b)) : ((b) - (a)))
71*437bfbebSnyanmisaka
/*
 * Length helper for 4:2:2 content: aligns val with MPP_ALIGN(val, 16)
 * and returns twice the aligned value.
 */
static RK_U32 rkv_len_align_422(RK_U32 val)
{
    RK_U32 aligned = MPP_ALIGN(val, 16);

    return aligned * 2;
}
76*437bfbebSnyanmisaka
/*
 * Length helper for 4:4:4 content: aligns val with MPP_ALIGN(val, 16)
 * and returns three times the aligned value.
 */
static RK_U32 rkv_len_align_444(RK_U32 val)
{
    RK_U32 aligned = MPP_ALIGN(val, 16);

    return aligned * 3;
}
81*437bfbebSnyanmisaka
vdpu383_setup_scale_origin_bufs(HalH265dCtx * ctx,MppFrame mframe)82*437bfbebSnyanmisaka static MPP_RET vdpu383_setup_scale_origin_bufs(HalH265dCtx *ctx, MppFrame mframe)
83*437bfbebSnyanmisaka {
84*437bfbebSnyanmisaka /* for 8K FrameBuf scale mode */
85*437bfbebSnyanmisaka size_t origin_buf_size = 0;
86*437bfbebSnyanmisaka
87*437bfbebSnyanmisaka origin_buf_size = mpp_frame_get_buf_size(mframe);
88*437bfbebSnyanmisaka
89*437bfbebSnyanmisaka if (!origin_buf_size) {
90*437bfbebSnyanmisaka mpp_err_f("origin_bufs get buf size failed\n");
91*437bfbebSnyanmisaka return MPP_NOK;
92*437bfbebSnyanmisaka }
93*437bfbebSnyanmisaka
94*437bfbebSnyanmisaka if (ctx->origin_bufs) {
95*437bfbebSnyanmisaka hal_bufs_deinit(ctx->origin_bufs);
96*437bfbebSnyanmisaka ctx->origin_bufs = NULL;
97*437bfbebSnyanmisaka }
98*437bfbebSnyanmisaka hal_bufs_init(&ctx->origin_bufs);
99*437bfbebSnyanmisaka if (!ctx->origin_bufs) {
100*437bfbebSnyanmisaka mpp_err_f("origin_bufs init fail\n");
101*437bfbebSnyanmisaka return MPP_ERR_NOMEM;
102*437bfbebSnyanmisaka }
103*437bfbebSnyanmisaka
104*437bfbebSnyanmisaka hal_bufs_setup(ctx->origin_bufs, 16, 1, &origin_buf_size);
105*437bfbebSnyanmisaka
106*437bfbebSnyanmisaka return MPP_OK;
107*437bfbebSnyanmisaka }
108*437bfbebSnyanmisaka
hal_h265d_vdpu383_init(void * hal,MppHalCfg * cfg)109*437bfbebSnyanmisaka static MPP_RET hal_h265d_vdpu383_init(void *hal, MppHalCfg *cfg)
110*437bfbebSnyanmisaka {
111*437bfbebSnyanmisaka RK_S32 ret = 0;
112*437bfbebSnyanmisaka HalH265dCtx *reg_ctx = (HalH265dCtx *)hal;
113*437bfbebSnyanmisaka
114*437bfbebSnyanmisaka mpp_slots_set_prop(reg_ctx->slots, SLOTS_HOR_ALIGN, mpp_align_128_odd_plus_64);
115*437bfbebSnyanmisaka mpp_slots_set_prop(reg_ctx->slots, SLOTS_VER_ALIGN, hevc_ver_align);
116*437bfbebSnyanmisaka
117*437bfbebSnyanmisaka reg_ctx->scaling_qm = mpp_calloc(DXVA_Qmatrix_HEVC, 1);
118*437bfbebSnyanmisaka if (reg_ctx->scaling_qm == NULL) {
119*437bfbebSnyanmisaka mpp_err("scaling_org alloc fail");
120*437bfbebSnyanmisaka return MPP_ERR_MALLOC;
121*437bfbebSnyanmisaka }
122*437bfbebSnyanmisaka
123*437bfbebSnyanmisaka reg_ctx->scaling_rk = mpp_calloc(scalingFactor_t, 1);
124*437bfbebSnyanmisaka reg_ctx->pps_buf = mpp_calloc(RK_U64, 24);
125*437bfbebSnyanmisaka reg_ctx->sw_rps_buf = mpp_calloc(RK_U64, 400);
126*437bfbebSnyanmisaka
127*437bfbebSnyanmisaka if (reg_ctx->scaling_rk == NULL) {
128*437bfbebSnyanmisaka mpp_err("scaling_rk alloc fail");
129*437bfbebSnyanmisaka return MPP_ERR_MALLOC;
130*437bfbebSnyanmisaka }
131*437bfbebSnyanmisaka
132*437bfbebSnyanmisaka if (reg_ctx->group == NULL) {
133*437bfbebSnyanmisaka ret = mpp_buffer_group_get_internal(®_ctx->group, MPP_BUFFER_TYPE_ION);
134*437bfbebSnyanmisaka if (ret) {
135*437bfbebSnyanmisaka mpp_err("h265d mpp_buffer_group_get failed\n");
136*437bfbebSnyanmisaka return ret;
137*437bfbebSnyanmisaka }
138*437bfbebSnyanmisaka }
139*437bfbebSnyanmisaka
140*437bfbebSnyanmisaka {
141*437bfbebSnyanmisaka RK_U32 i = 0;
142*437bfbebSnyanmisaka RK_U32 max_cnt = reg_ctx->fast_mode ? MAX_GEN_REG : 1;
143*437bfbebSnyanmisaka
144*437bfbebSnyanmisaka //!< malloc buffers
145*437bfbebSnyanmisaka ret = mpp_buffer_get(reg_ctx->group, ®_ctx->bufs, ALL_BUFFER_SIZE(max_cnt));
146*437bfbebSnyanmisaka if (ret) {
147*437bfbebSnyanmisaka mpp_err("h265d mpp_buffer_get failed\n");
148*437bfbebSnyanmisaka return ret;
149*437bfbebSnyanmisaka }
150*437bfbebSnyanmisaka
151*437bfbebSnyanmisaka reg_ctx->bufs_fd = mpp_buffer_get_fd(reg_ctx->bufs);
152*437bfbebSnyanmisaka reg_ctx->offset_cabac = CABAC_TAB_OFFSET;
153*437bfbebSnyanmisaka for (i = 0; i < max_cnt; i++) {
154*437bfbebSnyanmisaka reg_ctx->g_buf[i].hw_regs = mpp_calloc_size(void, sizeof(Vdpu383H265dRegSet));
155*437bfbebSnyanmisaka reg_ctx->offset_spspps[i] = SPSPPS_OFFSET(i);
156*437bfbebSnyanmisaka reg_ctx->offset_rps[i] = RPS_OFFSET(i);
157*437bfbebSnyanmisaka reg_ctx->offset_sclst[i] = SCALIST_OFFSET(i);
158*437bfbebSnyanmisaka }
159*437bfbebSnyanmisaka
160*437bfbebSnyanmisaka mpp_buffer_attach_dev(reg_ctx->bufs, reg_ctx->dev);
161*437bfbebSnyanmisaka }
162*437bfbebSnyanmisaka
163*437bfbebSnyanmisaka if (!reg_ctx->fast_mode) {
164*437bfbebSnyanmisaka reg_ctx->hw_regs = reg_ctx->g_buf[0].hw_regs;
165*437bfbebSnyanmisaka reg_ctx->spspps_offset = reg_ctx->offset_spspps[0];
166*437bfbebSnyanmisaka reg_ctx->rps_offset = reg_ctx->offset_rps[0];
167*437bfbebSnyanmisaka reg_ctx->sclst_offset = reg_ctx->offset_sclst[0];
168*437bfbebSnyanmisaka }
169*437bfbebSnyanmisaka
170*437bfbebSnyanmisaka ret = mpp_buffer_write(reg_ctx->bufs, 0, (void*)cabac_table, sizeof(cabac_table));
171*437bfbebSnyanmisaka if (ret) {
172*437bfbebSnyanmisaka mpp_err("h265d write cabac_table data failed\n");
173*437bfbebSnyanmisaka return ret;
174*437bfbebSnyanmisaka }
175*437bfbebSnyanmisaka
176*437bfbebSnyanmisaka if (cfg->hal_fbc_adj_cfg) {
177*437bfbebSnyanmisaka cfg->hal_fbc_adj_cfg->func = vdpu383_afbc_align_calc;
178*437bfbebSnyanmisaka cfg->hal_fbc_adj_cfg->expand = 16;
179*437bfbebSnyanmisaka }
180*437bfbebSnyanmisaka
181*437bfbebSnyanmisaka (void) cfg;
182*437bfbebSnyanmisaka return MPP_OK;
183*437bfbebSnyanmisaka }
184*437bfbebSnyanmisaka
hal_h265d_vdpu383_deinit(void * hal)185*437bfbebSnyanmisaka static MPP_RET hal_h265d_vdpu383_deinit(void *hal)
186*437bfbebSnyanmisaka {
187*437bfbebSnyanmisaka HalH265dCtx *reg_ctx = (HalH265dCtx *)hal;
188*437bfbebSnyanmisaka RK_U32 loop = reg_ctx->fast_mode ? MPP_ARRAY_ELEMS(reg_ctx->g_buf) : 1;
189*437bfbebSnyanmisaka RK_U32 i;
190*437bfbebSnyanmisaka
191*437bfbebSnyanmisaka if (reg_ctx->bufs) {
192*437bfbebSnyanmisaka mpp_buffer_put(reg_ctx->bufs);
193*437bfbebSnyanmisaka reg_ctx->bufs = NULL;
194*437bfbebSnyanmisaka }
195*437bfbebSnyanmisaka
196*437bfbebSnyanmisaka loop = reg_ctx->fast_mode ? MPP_ARRAY_ELEMS(reg_ctx->rcb_buf) : 1;
197*437bfbebSnyanmisaka for (i = 0; i < loop; i++) {
198*437bfbebSnyanmisaka if (reg_ctx->rcb_buf[i]) {
199*437bfbebSnyanmisaka mpp_buffer_put(reg_ctx->rcb_buf[i]);
200*437bfbebSnyanmisaka reg_ctx->rcb_buf[i] = NULL;
201*437bfbebSnyanmisaka }
202*437bfbebSnyanmisaka }
203*437bfbebSnyanmisaka
204*437bfbebSnyanmisaka if (reg_ctx->group) {
205*437bfbebSnyanmisaka mpp_buffer_group_put(reg_ctx->group);
206*437bfbebSnyanmisaka reg_ctx->group = NULL;
207*437bfbebSnyanmisaka }
208*437bfbebSnyanmisaka
209*437bfbebSnyanmisaka for (i = 0; i < loop; i++)
210*437bfbebSnyanmisaka MPP_FREE(reg_ctx->g_buf[i].hw_regs);
211*437bfbebSnyanmisaka
212*437bfbebSnyanmisaka MPP_FREE(reg_ctx->scaling_qm);
213*437bfbebSnyanmisaka MPP_FREE(reg_ctx->scaling_rk);
214*437bfbebSnyanmisaka MPP_FREE(reg_ctx->pps_buf);
215*437bfbebSnyanmisaka MPP_FREE(reg_ctx->sw_rps_buf);
216*437bfbebSnyanmisaka
217*437bfbebSnyanmisaka if (reg_ctx->cmv_bufs) {
218*437bfbebSnyanmisaka hal_bufs_deinit(reg_ctx->cmv_bufs);
219*437bfbebSnyanmisaka reg_ctx->cmv_bufs = NULL;
220*437bfbebSnyanmisaka }
221*437bfbebSnyanmisaka
222*437bfbebSnyanmisaka if (reg_ctx->origin_bufs) {
223*437bfbebSnyanmisaka hal_bufs_deinit(reg_ctx->origin_bufs);
224*437bfbebSnyanmisaka reg_ctx->origin_bufs = NULL;
225*437bfbebSnyanmisaka }
226*437bfbebSnyanmisaka
227*437bfbebSnyanmisaka return MPP_OK;
228*437bfbebSnyanmisaka }
229*437bfbebSnyanmisaka
230*437bfbebSnyanmisaka #define SCALING_LIST_NUM 6
231*437bfbebSnyanmisaka
hal_vdpu383_record_scaling_list(scalingFactor_t * pScalingFactor_out,scalingList_t * pScalingList)232*437bfbebSnyanmisaka void hal_vdpu383_record_scaling_list(scalingFactor_t *pScalingFactor_out, scalingList_t *pScalingList)
233*437bfbebSnyanmisaka {
234*437bfbebSnyanmisaka RK_S32 i;
235*437bfbebSnyanmisaka RK_U32 listId;
236*437bfbebSnyanmisaka BitputCtx_t bp;
237*437bfbebSnyanmisaka
238*437bfbebSnyanmisaka mpp_set_bitput_ctx(&bp, (RK_U64 *)pScalingFactor_out, 170); // 170*64bits
239*437bfbebSnyanmisaka
240*437bfbebSnyanmisaka //-------- following make it by hardware needed --------
241*437bfbebSnyanmisaka //sizeId == 0, block4x4
242*437bfbebSnyanmisaka for (listId = 0; listId < SCALING_LIST_NUM; listId++) {
243*437bfbebSnyanmisaka RK_U8 *p_data = pScalingList->sl[0][listId];
244*437bfbebSnyanmisaka /* dump by block4x4, vectial direction */
245*437bfbebSnyanmisaka for (i = 0; i < 4; i++) {
246*437bfbebSnyanmisaka mpp_put_bits(&bp, p_data[i + 0], 8);
247*437bfbebSnyanmisaka mpp_put_bits(&bp, p_data[i + 4], 8);
248*437bfbebSnyanmisaka mpp_put_bits(&bp, p_data[i + 8], 8);
249*437bfbebSnyanmisaka mpp_put_bits(&bp, p_data[i + 12], 8);
250*437bfbebSnyanmisaka }
251*437bfbebSnyanmisaka }
252*437bfbebSnyanmisaka //sizeId == 1, block8x8
253*437bfbebSnyanmisaka for (listId = 0; listId < SCALING_LIST_NUM; listId++) {
254*437bfbebSnyanmisaka RK_S32 blk4_x = 0, blk4_y = 0;
255*437bfbebSnyanmisaka RK_U8 *p_data = pScalingList->sl[1][listId];
256*437bfbebSnyanmisaka
257*437bfbebSnyanmisaka /* dump by block4x4, vectial direction */
258*437bfbebSnyanmisaka for (blk4_x = 0; blk4_x < 8; blk4_x += 4) {
259*437bfbebSnyanmisaka for (blk4_y = 0; blk4_y < 8; blk4_y += 4) {
260*437bfbebSnyanmisaka RK_S32 pos = blk4_y * 8 + blk4_x;
261*437bfbebSnyanmisaka
262*437bfbebSnyanmisaka for (i = 0; i < 4; i++) {
263*437bfbebSnyanmisaka mpp_put_bits(&bp, p_data[pos + i + 0], 8);
264*437bfbebSnyanmisaka mpp_put_bits(&bp, p_data[pos + i + 8], 8);
265*437bfbebSnyanmisaka mpp_put_bits(&bp, p_data[pos + i + 16], 8);
266*437bfbebSnyanmisaka mpp_put_bits(&bp, p_data[pos + i + 24], 8);
267*437bfbebSnyanmisaka }
268*437bfbebSnyanmisaka }
269*437bfbebSnyanmisaka }
270*437bfbebSnyanmisaka }
271*437bfbebSnyanmisaka //sizeId == 2, block16x16
272*437bfbebSnyanmisaka for (listId = 0; listId < SCALING_LIST_NUM; listId++) {
273*437bfbebSnyanmisaka RK_S32 blk4_x = 0, blk4_y = 0;
274*437bfbebSnyanmisaka RK_U8 *p_data = pScalingList->sl[2][listId];
275*437bfbebSnyanmisaka
276*437bfbebSnyanmisaka /* dump by block4x4, vectial direction */
277*437bfbebSnyanmisaka for (blk4_x = 0; blk4_x < 8; blk4_x += 4) {
278*437bfbebSnyanmisaka for (blk4_y = 0; blk4_y < 8; blk4_y += 4) {
279*437bfbebSnyanmisaka RK_S32 pos = blk4_y * 8 + blk4_x;
280*437bfbebSnyanmisaka
281*437bfbebSnyanmisaka for (i = 0; i < 4; i++) {
282*437bfbebSnyanmisaka mpp_put_bits(&bp, p_data[pos + i + 0], 8);
283*437bfbebSnyanmisaka mpp_put_bits(&bp, p_data[pos + i + 8], 8);
284*437bfbebSnyanmisaka mpp_put_bits(&bp, p_data[pos + i + 16], 8);
285*437bfbebSnyanmisaka mpp_put_bits(&bp, p_data[pos + i + 24], 8);
286*437bfbebSnyanmisaka }
287*437bfbebSnyanmisaka }
288*437bfbebSnyanmisaka }
289*437bfbebSnyanmisaka }
290*437bfbebSnyanmisaka //sizeId == 3, blcok32x32
291*437bfbebSnyanmisaka for (listId = 0; listId < 6; listId++) {
292*437bfbebSnyanmisaka RK_S32 blk4_x = 0, blk4_y = 0;
293*437bfbebSnyanmisaka RK_U8 *p_data = pScalingList->sl[3][listId];
294*437bfbebSnyanmisaka
295*437bfbebSnyanmisaka /* dump by block4x4, vectial direction */
296*437bfbebSnyanmisaka for (blk4_x = 0; blk4_x < 8; blk4_x += 4) {
297*437bfbebSnyanmisaka for (blk4_y = 0; blk4_y < 8; blk4_y += 4) {
298*437bfbebSnyanmisaka RK_S32 pos = blk4_y * 8 + blk4_x;
299*437bfbebSnyanmisaka
300*437bfbebSnyanmisaka for (i = 0; i < 4; i++) {
301*437bfbebSnyanmisaka mpp_put_bits(&bp, p_data[pos + i + 0], 8);
302*437bfbebSnyanmisaka mpp_put_bits(&bp, p_data[pos + i + 8], 8);
303*437bfbebSnyanmisaka mpp_put_bits(&bp, p_data[pos + i + 16], 8);
304*437bfbebSnyanmisaka mpp_put_bits(&bp, p_data[pos + i + 24], 8);
305*437bfbebSnyanmisaka }
306*437bfbebSnyanmisaka }
307*437bfbebSnyanmisaka }
308*437bfbebSnyanmisaka }
309*437bfbebSnyanmisaka //sizeId == 0, block4x4, horiztion direction */
310*437bfbebSnyanmisaka for (listId = 0; listId < SCALING_LIST_NUM; listId++) {
311*437bfbebSnyanmisaka RK_U8 *p_data = pScalingList->sl[0][listId];
312*437bfbebSnyanmisaka
313*437bfbebSnyanmisaka for (i = 0; i < 16; i++)
314*437bfbebSnyanmisaka mpp_put_bits(&bp, p_data[i], 8);
315*437bfbebSnyanmisaka }
316*437bfbebSnyanmisaka
317*437bfbebSnyanmisaka // dump dc value
318*437bfbebSnyanmisaka for (i = 0; i < SCALING_LIST_NUM; i++)//sizeId = 2, 16x16
319*437bfbebSnyanmisaka mpp_put_bits(&bp, pScalingList->sl_dc[0][i], 8);
320*437bfbebSnyanmisaka for (i = 0; i < SCALING_LIST_NUM; i++) //sizeId = 3, 32x32
321*437bfbebSnyanmisaka mpp_put_bits(&bp, pScalingList->sl_dc[1][i], 8);
322*437bfbebSnyanmisaka
323*437bfbebSnyanmisaka mpp_put_align(&bp, 128, 0);
324*437bfbebSnyanmisaka }
325*437bfbebSnyanmisaka
hal_h265d_vdpu383_scalinglist_packet(void * hal,void * ptr,void * dxva)326*437bfbebSnyanmisaka static MPP_RET hal_h265d_vdpu383_scalinglist_packet(void *hal, void *ptr, void *dxva)
327*437bfbebSnyanmisaka {
328*437bfbebSnyanmisaka scalingList_t sl;
329*437bfbebSnyanmisaka RK_U32 i, j, pos;
330*437bfbebSnyanmisaka h265d_dxva2_picture_context_t *dxva_ctx = (h265d_dxva2_picture_context_t*)dxva;
331*437bfbebSnyanmisaka HalH265dCtx *reg_ctx = ( HalH265dCtx *)hal;
332*437bfbebSnyanmisaka
333*437bfbebSnyanmisaka if (!dxva_ctx->pp.scaling_list_enabled_flag) {
334*437bfbebSnyanmisaka return MPP_OK;
335*437bfbebSnyanmisaka }
336*437bfbebSnyanmisaka
337*437bfbebSnyanmisaka if (memcmp((void*)&dxva_ctx->qm, reg_ctx->scaling_qm, sizeof(DXVA_Qmatrix_HEVC))) {
338*437bfbebSnyanmisaka memset(&sl, 0, sizeof(scalingList_t));
339*437bfbebSnyanmisaka
340*437bfbebSnyanmisaka for (i = 0; i < 6; i++) {
341*437bfbebSnyanmisaka for (j = 0; j < 16; j++) {
342*437bfbebSnyanmisaka pos = 4 * hal_hevc_diag_scan4x4_y[j] + hal_hevc_diag_scan4x4_x[j];
343*437bfbebSnyanmisaka sl.sl[0][i][pos] = dxva_ctx->qm.ucScalingLists0[i][j];
344*437bfbebSnyanmisaka }
345*437bfbebSnyanmisaka
346*437bfbebSnyanmisaka for (j = 0; j < 64; j++) {
347*437bfbebSnyanmisaka pos = 8 * hal_hevc_diag_scan8x8_y[j] + hal_hevc_diag_scan8x8_x[j];
348*437bfbebSnyanmisaka sl.sl[1][i][pos] = dxva_ctx->qm.ucScalingLists1[i][j];
349*437bfbebSnyanmisaka sl.sl[2][i][pos] = dxva_ctx->qm.ucScalingLists2[i][j];
350*437bfbebSnyanmisaka
351*437bfbebSnyanmisaka if (i == 0)
352*437bfbebSnyanmisaka sl.sl[3][i][pos] = dxva_ctx->qm.ucScalingLists3[0][j];
353*437bfbebSnyanmisaka else if (i == 3)
354*437bfbebSnyanmisaka sl.sl[3][i][pos] = dxva_ctx->qm.ucScalingLists3[1][j];
355*437bfbebSnyanmisaka else
356*437bfbebSnyanmisaka sl.sl[3][i][pos] = dxva_ctx->qm.ucScalingLists2[i][j];
357*437bfbebSnyanmisaka }
358*437bfbebSnyanmisaka
359*437bfbebSnyanmisaka sl.sl_dc[0][i] = dxva_ctx->qm.ucScalingListDCCoefSizeID2[i];
360*437bfbebSnyanmisaka if (i == 0)
361*437bfbebSnyanmisaka sl.sl_dc[1][i] = dxva_ctx->qm.ucScalingListDCCoefSizeID3[0];
362*437bfbebSnyanmisaka else if (i == 3)
363*437bfbebSnyanmisaka sl.sl_dc[1][i] = dxva_ctx->qm.ucScalingListDCCoefSizeID3[1];
364*437bfbebSnyanmisaka else
365*437bfbebSnyanmisaka sl.sl_dc[1][i] = dxva_ctx->qm.ucScalingListDCCoefSizeID2[i];
366*437bfbebSnyanmisaka }
367*437bfbebSnyanmisaka hal_vdpu383_record_scaling_list((scalingFactor_t *)reg_ctx->scaling_rk, &sl);
368*437bfbebSnyanmisaka }
369*437bfbebSnyanmisaka
370*437bfbebSnyanmisaka memcpy(ptr, reg_ctx->scaling_rk, sizeof(scalingFactor_t));
371*437bfbebSnyanmisaka
372*437bfbebSnyanmisaka return MPP_OK;
373*437bfbebSnyanmisaka }
374*437bfbebSnyanmisaka
hal_h265d_v345_output_pps_packet(void * hal,void * dxva)375*437bfbebSnyanmisaka static RK_S32 hal_h265d_v345_output_pps_packet(void *hal, void *dxva)
376*437bfbebSnyanmisaka {
377*437bfbebSnyanmisaka RK_S32 i;
378*437bfbebSnyanmisaka RK_U32 log2_min_cb_size;
379*437bfbebSnyanmisaka RK_S32 width, height;
380*437bfbebSnyanmisaka HalH265dCtx *reg_ctx = ( HalH265dCtx *)hal;
381*437bfbebSnyanmisaka Vdpu383H265dRegSet *hw_reg = (Vdpu383H265dRegSet*)(reg_ctx->hw_regs);
382*437bfbebSnyanmisaka h265d_dxva2_picture_context_t *dxva_ctx = (h265d_dxva2_picture_context_t*)dxva;
383*437bfbebSnyanmisaka BitputCtx_t bp;
384*437bfbebSnyanmisaka
385*437bfbebSnyanmisaka if (NULL == reg_ctx || dxva_ctx == NULL) {
386*437bfbebSnyanmisaka mpp_err("%s:%s:%d reg_ctx or dxva_ctx is NULL",
387*437bfbebSnyanmisaka __FILE__, __FUNCTION__, __LINE__);
388*437bfbebSnyanmisaka return MPP_ERR_NULL_PTR;
389*437bfbebSnyanmisaka }
390*437bfbebSnyanmisaka
391*437bfbebSnyanmisaka // SPS
392*437bfbebSnyanmisaka {
393*437bfbebSnyanmisaka void *pps_ptr = mpp_buffer_get_ptr(reg_ctx->bufs) + reg_ctx->spspps_offset;
394*437bfbebSnyanmisaka RK_U64 *pps_packet = reg_ctx->pps_buf;
395*437bfbebSnyanmisaka
396*437bfbebSnyanmisaka if (NULL == pps_ptr) {
397*437bfbebSnyanmisaka mpp_err("pps_data get ptr error");
398*437bfbebSnyanmisaka return MPP_ERR_NOMEM;
399*437bfbebSnyanmisaka }
400*437bfbebSnyanmisaka
401*437bfbebSnyanmisaka log2_min_cb_size = dxva_ctx->pp.log2_min_luma_coding_block_size_minus3 + 3;
402*437bfbebSnyanmisaka width = (dxva_ctx->pp.PicWidthInMinCbsY << log2_min_cb_size);
403*437bfbebSnyanmisaka height = (dxva_ctx->pp.PicHeightInMinCbsY << log2_min_cb_size);
404*437bfbebSnyanmisaka
405*437bfbebSnyanmisaka mpp_set_bitput_ctx(&bp, pps_packet, 22); // 22*64bits
406*437bfbebSnyanmisaka
407*437bfbebSnyanmisaka if (dxva_ctx->pp.ps_update_flag) {
408*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.vps_id, 4);
409*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.sps_id, 4);
410*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.chroma_format_idc, 2);
411*437bfbebSnyanmisaka
412*437bfbebSnyanmisaka mpp_put_bits(&bp, width, 16);
413*437bfbebSnyanmisaka mpp_put_bits(&bp, height, 16);
414*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.bit_depth_luma_minus8, 3);
415*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.bit_depth_chroma_minus8, 3);
416*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.log2_max_pic_order_cnt_lsb_minus4 + 4, 5);
417*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.log2_diff_max_min_luma_coding_block_size, 2);
418*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.log2_min_luma_coding_block_size_minus3 + 3, 3);
419*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.log2_min_transform_block_size_minus2 + 2, 3);
420*437bfbebSnyanmisaka
421*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.log2_diff_max_min_transform_block_size, 2);
422*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.max_transform_hierarchy_depth_inter, 3);
423*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.max_transform_hierarchy_depth_intra, 3);
424*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.scaling_list_enabled_flag, 1);
425*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.amp_enabled_flag, 1);
426*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.sample_adaptive_offset_enabled_flag, 1);
427*437bfbebSnyanmisaka ///<-zrh comment ^ 68 bit above
428*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.pcm_enabled_flag, 1);
429*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.pcm_enabled_flag ? (dxva_ctx->pp.pcm_sample_bit_depth_luma_minus1 + 1) : 0, 4);
430*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.pcm_enabled_flag ? (dxva_ctx->pp.pcm_sample_bit_depth_chroma_minus1 + 1) : 0, 4);
431*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.pcm_loop_filter_disabled_flag, 1);
432*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.log2_diff_max_min_pcm_luma_coding_block_size, 3);
433*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.pcm_enabled_flag ? (dxva_ctx->pp.log2_min_pcm_luma_coding_block_size_minus3 + 3) : 0, 3);
434*437bfbebSnyanmisaka
435*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.num_short_term_ref_pic_sets, 7);
436*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.long_term_ref_pics_present_flag, 1);
437*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.num_long_term_ref_pics_sps, 6);
438*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.sps_temporal_mvp_enabled_flag, 1);
439*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.strong_intra_smoothing_enabled_flag, 1);
440*437bfbebSnyanmisaka // SPS extenstion
441*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.transform_skip_rotation_enabled_flag, 1);
442*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.transform_skip_context_enabled_flag, 1);
443*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.strong_intra_smoothing_enabled_flag, 1);
444*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.implicit_rdpcm_enabled_flag, 1);
445*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.explicit_rdpcm_enabled_flag, 1);
446*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.extended_precision_processing_flag, 1);
447*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.intra_smoothing_disabled_flag, 1);
448*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.sps_max_dec_pic_buffering_minus1, 4);
449*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.separate_colour_plane_flag, 1);
450*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.high_precision_offsets_enabled_flag, 1);
451*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.persistent_rice_adaptation_enabled_flag, 1);
452*437bfbebSnyanmisaka
453*437bfbebSnyanmisaka /* PPS */
454*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.pps_id, 6);
455*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.sps_id, 4);
456*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.dependent_slice_segments_enabled_flag, 1);
457*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.output_flag_present_flag, 1);
458*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.num_extra_slice_header_bits, 13);
459*437bfbebSnyanmisaka
460*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.sign_data_hiding_enabled_flag, 1);
461*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.cabac_init_present_flag, 1);
462*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.num_ref_idx_l0_default_active_minus1 + 1, 4);
463*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.num_ref_idx_l1_default_active_minus1 + 1, 4);
464*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.init_qp_minus26, 7);
465*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.constrained_intra_pred_flag, 1);
466*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.transform_skip_enabled_flag, 1);
467*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.cu_qp_delta_enabled_flag, 1);
468*437bfbebSnyanmisaka mpp_put_bits(&bp, log2_min_cb_size + dxva_ctx->pp.log2_diff_max_min_luma_coding_block_size - dxva_ctx->pp.diff_cu_qp_delta_depth, 3);
469*437bfbebSnyanmisaka
470*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.pps_cb_qp_offset, 5);
471*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.pps_cr_qp_offset, 5);
472*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.pps_slice_chroma_qp_offsets_present_flag, 1);
473*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.weighted_pred_flag, 1);
474*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.weighted_bipred_flag, 1);
475*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.transquant_bypass_enabled_flag, 1);
476*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.tiles_enabled_flag, 1);
477*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.entropy_coding_sync_enabled_flag, 1);
478*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.pps_loop_filter_across_slices_enabled_flag, 1);
479*437bfbebSnyanmisaka
480*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.loop_filter_across_tiles_enabled_flag, 1);
481*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.deblocking_filter_override_enabled_flag, 1);
482*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.pps_deblocking_filter_disabled_flag, 1);
483*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.pps_beta_offset_div2, 4);
484*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.pps_tc_offset_div2, 4);
485*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.lists_modification_present_flag, 1);
486*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.log2_parallel_merge_level_minus2 + 2, 3);
487*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.slice_segment_header_extension_present_flag, 1);
488*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 3);
489*437bfbebSnyanmisaka
490*437bfbebSnyanmisaka // PPS externsion
491*437bfbebSnyanmisaka if (dxva_ctx->pp.log2_max_transform_skip_block_size > 2) {
492*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.log2_max_transform_skip_block_size - 2, 2);
493*437bfbebSnyanmisaka } else {
494*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 2);
495*437bfbebSnyanmisaka }
496*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.cross_component_prediction_enabled_flag, 1);
497*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.chroma_qp_offset_list_enabled_flag, 1);
498*437bfbebSnyanmisaka
499*437bfbebSnyanmisaka RK_S32 log2_min_cu_chroma_qp_delta_size = log2_min_cb_size +
500*437bfbebSnyanmisaka dxva_ctx->pp.log2_diff_max_min_luma_coding_block_size -
501*437bfbebSnyanmisaka dxva_ctx->pp.diff_cu_chroma_qp_offset_depth;
502*437bfbebSnyanmisaka mpp_put_bits(&bp, log2_min_cu_chroma_qp_delta_size, 3);
503*437bfbebSnyanmisaka for (i = 0; i < 6; i++)
504*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.cb_qp_offset_list[i], 5);
505*437bfbebSnyanmisaka for (i = 0; i < 6; i++)
506*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.cr_qp_offset_list[i], 5);
507*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.chroma_qp_offset_list_len_minus1, 3);
508*437bfbebSnyanmisaka
509*437bfbebSnyanmisaka /* mvc0 && mvc1 */
510*437bfbebSnyanmisaka mpp_put_bits(&bp, 0xffff, 16);
511*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 1);
512*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 6);
513*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 1);
514*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 1);
515*437bfbebSnyanmisaka } else {
516*437bfbebSnyanmisaka bp.index = 4;
517*437bfbebSnyanmisaka bp.bitpos = 41;
518*437bfbebSnyanmisaka bp.bvalue = bp.pbuf[bp.index] & MPP_GENMASK(bp.bitpos - 1, 0);
519*437bfbebSnyanmisaka }
520*437bfbebSnyanmisaka /* poc info */
521*437bfbebSnyanmisaka {
522*437bfbebSnyanmisaka RK_S32 dpb_valid[15] = {0}, refpic_poc[15] = {0};
523*437bfbebSnyanmisaka
524*437bfbebSnyanmisaka for (i = 0; i < (RK_S32)MPP_ARRAY_ELEMS(dxva_ctx->pp.RefPicList); i++) {
525*437bfbebSnyanmisaka if (dxva_ctx->pp.RefPicList[i].bPicEntry != 0xff &&
526*437bfbebSnyanmisaka dxva_ctx->pp.RefPicList[i].bPicEntry != 0x7f) {
527*437bfbebSnyanmisaka dpb_valid[i] = 1;
528*437bfbebSnyanmisaka refpic_poc[i] = dxva_ctx->pp.PicOrderCntValList[i];
529*437bfbebSnyanmisaka }
530*437bfbebSnyanmisaka }
531*437bfbebSnyanmisaka
532*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 1);
533*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 1);
534*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 1);
535*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.current_poc, 32);
536*437bfbebSnyanmisaka
537*437bfbebSnyanmisaka for (i = 0; i < 15; i++)
538*437bfbebSnyanmisaka mpp_put_bits(&bp, refpic_poc[i], 32);
539*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 32);
540*437bfbebSnyanmisaka for (i = 0; i < 15; i++)
541*437bfbebSnyanmisaka mpp_put_bits(&bp, dpb_valid[i], 1);
542*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 1);
543*437bfbebSnyanmisaka }
544*437bfbebSnyanmisaka
545*437bfbebSnyanmisaka /* tile info */
546*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.tiles_enabled_flag ? (dxva_ctx->pp.num_tile_columns_minus1 + 1) : 1, 5);
547*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.tiles_enabled_flag ? (dxva_ctx->pp.num_tile_rows_minus1 + 1) : 1, 5);
548*437bfbebSnyanmisaka {
549*437bfbebSnyanmisaka /// tiles info begin
550*437bfbebSnyanmisaka RK_U16 column_width[20];
551*437bfbebSnyanmisaka RK_U16 row_height[22];
552*437bfbebSnyanmisaka
553*437bfbebSnyanmisaka memset(column_width, 0, sizeof(column_width));
554*437bfbebSnyanmisaka memset(row_height, 0, sizeof(row_height));
555*437bfbebSnyanmisaka
556*437bfbebSnyanmisaka if (dxva_ctx->pp.tiles_enabled_flag) {
557*437bfbebSnyanmisaka if (dxva_ctx->pp.uniform_spacing_flag == 0) {
558*437bfbebSnyanmisaka RK_S32 maxcuwidth = dxva_ctx->pp.log2_diff_max_min_luma_coding_block_size + log2_min_cb_size;
559*437bfbebSnyanmisaka RK_S32 ctu_width_in_pic = (width +
560*437bfbebSnyanmisaka (1 << maxcuwidth) - 1) / (1 << maxcuwidth) ;
561*437bfbebSnyanmisaka RK_S32 ctu_height_in_pic = (height +
562*437bfbebSnyanmisaka (1 << maxcuwidth) - 1) / (1 << maxcuwidth) ;
563*437bfbebSnyanmisaka RK_S32 sum = 0;
564*437bfbebSnyanmisaka for (i = 0; i < dxva_ctx->pp.num_tile_columns_minus1; i++) {
565*437bfbebSnyanmisaka column_width[i] = dxva_ctx->pp.column_width_minus1[i] + 1;
566*437bfbebSnyanmisaka sum += column_width[i] ;
567*437bfbebSnyanmisaka }
568*437bfbebSnyanmisaka column_width[i] = ctu_width_in_pic - sum;
569*437bfbebSnyanmisaka
570*437bfbebSnyanmisaka sum = 0;
571*437bfbebSnyanmisaka for (i = 0; i < dxva_ctx->pp.num_tile_rows_minus1; i++) {
572*437bfbebSnyanmisaka row_height[i] = dxva_ctx->pp.row_height_minus1[i] + 1;
573*437bfbebSnyanmisaka sum += row_height[i];
574*437bfbebSnyanmisaka }
575*437bfbebSnyanmisaka row_height[i] = ctu_height_in_pic - sum;
576*437bfbebSnyanmisaka } else {
577*437bfbebSnyanmisaka RK_S32 pic_in_cts_width = (width +
578*437bfbebSnyanmisaka (1 << (log2_min_cb_size +
579*437bfbebSnyanmisaka dxva_ctx->pp.log2_diff_max_min_luma_coding_block_size)) - 1)
580*437bfbebSnyanmisaka / (1 << (log2_min_cb_size +
581*437bfbebSnyanmisaka dxva_ctx->pp.log2_diff_max_min_luma_coding_block_size));
582*437bfbebSnyanmisaka RK_S32 pic_in_cts_height = (height +
583*437bfbebSnyanmisaka (1 << (log2_min_cb_size +
584*437bfbebSnyanmisaka dxva_ctx->pp.log2_diff_max_min_luma_coding_block_size)) - 1)
585*437bfbebSnyanmisaka / (1 << (log2_min_cb_size +
586*437bfbebSnyanmisaka dxva_ctx->pp.log2_diff_max_min_luma_coding_block_size));
587*437bfbebSnyanmisaka
588*437bfbebSnyanmisaka for (i = 0; i < dxva_ctx->pp.num_tile_columns_minus1 + 1; i++)
589*437bfbebSnyanmisaka column_width[i] = ((i + 1) * pic_in_cts_width) / (dxva_ctx->pp.num_tile_columns_minus1 + 1) -
590*437bfbebSnyanmisaka (i * pic_in_cts_width) / (dxva_ctx->pp.num_tile_columns_minus1 + 1);
591*437bfbebSnyanmisaka
592*437bfbebSnyanmisaka for (i = 0; i < dxva_ctx->pp.num_tile_rows_minus1 + 1; i++)
593*437bfbebSnyanmisaka row_height[i] = ((i + 1) * pic_in_cts_height) / (dxva_ctx->pp.num_tile_rows_minus1 + 1) -
594*437bfbebSnyanmisaka (i * pic_in_cts_height) / (dxva_ctx->pp.num_tile_rows_minus1 + 1);
595*437bfbebSnyanmisaka }
596*437bfbebSnyanmisaka } else {
597*437bfbebSnyanmisaka RK_S32 MaxCUWidth = (1 << (dxva_ctx->pp.log2_diff_max_min_luma_coding_block_size + log2_min_cb_size));
598*437bfbebSnyanmisaka column_width[0] = (width + MaxCUWidth - 1) / MaxCUWidth;
599*437bfbebSnyanmisaka row_height[0] = (height + MaxCUWidth - 1) / MaxCUWidth;
600*437bfbebSnyanmisaka }
601*437bfbebSnyanmisaka
602*437bfbebSnyanmisaka for (i = 0; i < 20; i++)
603*437bfbebSnyanmisaka mpp_put_bits(&bp, column_width[i], 12);
604*437bfbebSnyanmisaka
605*437bfbebSnyanmisaka for (i = 0; i < 22; i++)
606*437bfbebSnyanmisaka mpp_put_bits(&bp, row_height[i], 12);
607*437bfbebSnyanmisaka }
608*437bfbebSnyanmisaka mpp_put_align(&bp, 64, 0);//128
609*437bfbebSnyanmisaka memcpy(pps_ptr, reg_ctx->pps_buf, 176);
610*437bfbebSnyanmisaka } /* --- end spspps data ------*/
611*437bfbebSnyanmisaka
612*437bfbebSnyanmisaka if (dxva_ctx->pp.scaling_list_enabled_flag) {
613*437bfbebSnyanmisaka RK_U32 addr;
614*437bfbebSnyanmisaka RK_U8 *ptr_scaling = (RK_U8 *)mpp_buffer_get_ptr(reg_ctx->bufs) + reg_ctx->sclst_offset;
615*437bfbebSnyanmisaka
616*437bfbebSnyanmisaka if (dxva_ctx->pp.scaling_list_data_present_flag) {
617*437bfbebSnyanmisaka addr = (dxva_ctx->pp.pps_id + 16) * 1360;
618*437bfbebSnyanmisaka } else if (dxva_ctx->pp.scaling_list_enabled_flag) {
619*437bfbebSnyanmisaka addr = dxva_ctx->pp.sps_id * 1360;
620*437bfbebSnyanmisaka } else {
621*437bfbebSnyanmisaka addr = 80 * 1360;
622*437bfbebSnyanmisaka }
623*437bfbebSnyanmisaka
624*437bfbebSnyanmisaka hal_h265d_vdpu383_scalinglist_packet(hal, ptr_scaling + addr, dxva);
625*437bfbebSnyanmisaka
626*437bfbebSnyanmisaka hw_reg->common_addr.reg132_scanlist_addr = reg_ctx->bufs_fd;
627*437bfbebSnyanmisaka mpp_dev_set_reg_offset(reg_ctx->dev, 132, addr + reg_ctx->sclst_offset);
628*437bfbebSnyanmisaka }
629*437bfbebSnyanmisaka
630*437bfbebSnyanmisaka #ifdef dump
631*437bfbebSnyanmisaka fwrite(pps_ptr, 1, 80 * 64, fp);
632*437bfbebSnyanmisaka RK_U32 *tmp = (RK_U32 *)pps_ptr;
633*437bfbebSnyanmisaka for (i = 0; i < 112 / 4; i++) {
634*437bfbebSnyanmisaka mpp_log("pps[%3d] = 0x%08x\n", i, tmp[i]);
635*437bfbebSnyanmisaka }
636*437bfbebSnyanmisaka #endif
637*437bfbebSnyanmisaka #ifdef DUMP_VDPU383_DATAS
638*437bfbebSnyanmisaka {
639*437bfbebSnyanmisaka char *cur_fname = "global_cfg.dat";
640*437bfbebSnyanmisaka memset(dump_cur_fname_path, 0, sizeof(dump_cur_fname_path));
641*437bfbebSnyanmisaka sprintf(dump_cur_fname_path, "%s/%s", dump_cur_dir, cur_fname);
642*437bfbebSnyanmisaka dump_data_to_file(dump_cur_fname_path, (void *)bp.pbuf, 64 * bp.index + bp.bitpos, 128, 0);
643*437bfbebSnyanmisaka }
644*437bfbebSnyanmisaka #endif
645*437bfbebSnyanmisaka
646*437bfbebSnyanmisaka return 0;
647*437bfbebSnyanmisaka }
648*437bfbebSnyanmisaka
/*
 * Overwrite the per-type RCB sizes in rcb_info for the current HEVC picture.
 *
 * rcb_info : table indexed by the RCB_* ids; only the .size fields are written
 * width    : picture width, aligned to the CTU size with MPP_ALIGN before use
 * height   : picture height, aligned to the CTU size with MPP_ALIGN before use
 * dxva     : h265d_dxva2_picture_context_t holding the picture parameters
 *
 * The tile-row entries are set to 0 when num_tile_rows_minus1 is 0 and the
 * tile-column entry is set to 0 when num_tile_columns_minus1 is 0.
 */
static void h265d_refine_rcb_size(Vdpu383RcbInfo *rcb_info,
                                  RK_S32 width, RK_S32 height, void *dxva)
{
    h265d_dxva2_picture_context_t *pic_ctx = (h265d_dxva2_picture_context_t *)dxva;
    DXVA_PicParams_HEVC *pp = &pic_ctx->pp;
    /* chroma_format_idc: 0 - 400, 1 - 420, 2 - 422, 3 - 444 */
    RK_U32 chroma_fmt_idc = pp->chroma_format_idc;
    RK_U8 bit_depth = MPP_MAX(pp->bit_depth_luma_minus8, pp->bit_depth_chroma_minus8) + 8;
    RK_U8 ctu_size = 1 << (pp->log2_diff_max_min_luma_coding_block_size + pp->log2_min_luma_coding_block_size_minus3 + 3);
    /* number of tile boundaries ("cuts") in each direction */
    RK_U32 row_cuts = pp->num_tile_rows_minus1;
    RK_U32 col_cuts = pp->num_tile_columns_minus1;
    /* extra bits added to the tile variants, 64 * 8 per cut */
    RK_U32 row_cut_bits = row_cuts * 64 * 8;
    RK_U32 col_cut_bits = col_cuts * 64 * 8;
    RK_U32 filterd_row_append;
    RK_U32 row_uv_para = 0;
    RK_U32 col_uv_para = 0;
    RK_U32 bits = 0;

    /* chroma weighting factors used by the filterd formulas; 400 keeps 0 / 0 */
    switch (chroma_fmt_idc) {
    case 1:
        row_uv_para = 1;
        col_uv_para = 1;
        break;
    case 2:
        row_uv_para = 1;
        col_uv_para = 3;
        break;
    case 3:
        row_uv_para = 3;
        col_uv_para = 3;
        break;
    default:
        break;
    }

    width = MPP_ALIGN(width, ctu_size);
    height = MPP_ALIGN(height, ctu_size);

    /* the fixed append is larger once the aligned width exceeds 4096 */
    filterd_row_append = (width > 4096) ? 27648 : 8192;

    /* RCB_STRMD_ROW && RCB_STRMD_TILE_ROW */
    rcb_info[RCB_STRMD_ROW].size = 0;
    rcb_info[RCB_STRMD_TILE_ROW].size = 0;

    /* RCB_INTER_ROW && RCB_INTER_TILE_ROW */
    bits = ((width + 7) / 8) * 174;
    rcb_info[RCB_INTER_ROW].size = MPP_RCB_BYTES(bits);
    bits += row_cut_bits;
    rcb_info[RCB_INTER_TILE_ROW].size = 0;
    if (row_cuts)
        rcb_info[RCB_INTER_TILE_ROW].size = MPP_RCB_BYTES(bits);

    /* RCB_INTRA_ROW && RCB_INTRA_TILE_ROW */
    bits = MPP_ALIGN(width, 512) * (bit_depth + 2);
    bits = bits * 4; //TODO:
    rcb_info[RCB_INTRA_ROW].size = MPP_RCB_BYTES(bits);
    bits += row_cut_bits;
    rcb_info[RCB_INTRA_TILE_ROW].size = 0;
    if (row_cuts)
        rcb_info[RCB_INTRA_TILE_ROW].size = MPP_RCB_BYTES(bits);

    /* RCB_FILTERD_ROW && RCB_FILTERD_PROTECT_ROW && RCB_FILTERD_TILE_ROW */
    bits = (MPP_ALIGN(width, 64) * (1.6 * bit_depth + 0.5) * (8 + 5 * row_uv_para));
    /* save space mode: half for RCB_FILTERD_ROW, half for RCB_FILTERD_PROTECT_ROW */
    rcb_info[RCB_FILTERD_ROW].size = MPP_RCB_BYTES(bits / 2) + filterd_row_append;
    rcb_info[RCB_FILTERD_PROTECT_ROW].size = rcb_info[RCB_FILTERD_ROW].size;
    bits += row_cut_bits;
    rcb_info[RCB_FILTERD_TILE_ROW].size = 0;
    if (row_cuts)
        rcb_info[RCB_FILTERD_TILE_ROW].size = MPP_RCB_BYTES(bits);

    /* RCB_FILTERD_TILE_COL */
    rcb_info[RCB_FILTERD_TILE_COL].size = 0;
    if (col_cuts) {
        bits = (MPP_ALIGN(height, 64) * (1.6 * bit_depth + 0.5) * (16.5 + 5 * col_uv_para)) + col_cut_bits;
        rcb_info[RCB_FILTERD_TILE_COL].size = MPP_RCB_BYTES(bits);
    }
}
724*437bfbebSnyanmisaka
/*
 * Re-create the RCB buffers when a stream property that influences their
 * size has changed since the last call.
 *
 * hal     : HalH265dCtx of this decoder instance
 * dxva    : h265d_dxva2_picture_context_t of the current picture
 * hw_regs : unused
 * width   : picture width handed to the RCB size helpers
 * height  : picture height handed to the RCB size helpers
 *
 * The tracked properties are: tile row count, bit depth, chroma format,
 * CTU size, width and height. When none of them changed nothing is done.
 *
 * NOTE(review): h265d_refine_rcb_size() also depends on
 * num_tile_columns_minus1, which is not part of the change detection below;
 * confirm whether a change of tile columns alone needs a refresh.
 */
static void hal_h265d_rcb_info_update(void *hal, void *dxva,
                                      Vdpu383H265dRegSet *hw_regs,
                                      RK_S32 width, RK_S32 height)
{
    HalH265dCtx *reg_ctx = (HalH265dCtx *)hal;
    h265d_dxva2_picture_context_t *dxva_ctx = (h265d_dxva2_picture_context_t *)dxva;
    DXVA_PicParams_HEVC *pp = &dxva_ctx->pp;
    /* chroma_format_idc: 0 - 400, 1 - 420, 2 - 422, 3 - 444 */
    RK_U32 chroma_fmt_idc = pp->chroma_format_idc;
    RK_U8 bit_depth = MPP_MAX(pp->bit_depth_luma_minus8, pp->bit_depth_chroma_minus8) + 8;
    RK_U8 ctu_size = 1 << (pp->log2_diff_max_min_luma_coding_block_size + pp->log2_min_luma_coding_block_size_minus3 + 3);
    RK_U32 num_tiles = pp->num_tile_rows_minus1 + 1;
    (void)hw_regs;

    if (reg_ctx->num_row_tiles != num_tiles ||
        reg_ctx->bit_depth != bit_depth ||
        reg_ctx->chroma_fmt_idc != chroma_fmt_idc ||
        reg_ctx->ctu_size != ctu_size ||
        reg_ctx->width != width ||
        reg_ctx->height != height) {
        RK_U32 i = 0;
        /* fast mode keeps one RCB buffer per register set, otherwise only one */
        RK_U32 loop = reg_ctx->fast_mode ? MPP_ARRAY_ELEMS(reg_ctx->g_buf) : 1;

        reg_ctx->rcb_buf_size = vdpu383_get_rcb_buf_size((Vdpu383RcbInfo *)reg_ctx->rcb_info, width, height);
        h265d_refine_rcb_size((Vdpu383RcbInfo *)reg_ctx->rcb_info, width, height, dxva_ctx);

        for (i = 0; i < loop; i++) {
            /*
             * Start from NULL so that a failed allocation leaves a NULL slot
             * instead of an indeterminate pointer.
             */
            MppBuffer rcb_buf = NULL;

            if (reg_ctx->rcb_buf[i]) {
                mpp_buffer_put(reg_ctx->rcb_buf[i]);
                reg_ctx->rcb_buf[i] = NULL;
            }
            if (mpp_buffer_get(reg_ctx->group, &rcb_buf, reg_ctx->rcb_buf_size)) {
                mpp_err_f("get rcb buffer %u failed, size %d\n",
                          i, (RK_S32)reg_ctx->rcb_buf_size);
                rcb_buf = NULL;
            }
            reg_ctx->rcb_buf[i] = rcb_buf;
        }

        /* remember the properties the buffers were sized for */
        reg_ctx->num_row_tiles = num_tiles;
        reg_ctx->bit_depth = bit_depth;
        reg_ctx->chroma_fmt_idc = chroma_fmt_idc;
        reg_ctx->ctu_size = ctu_size;
        reg_ctx->width = width;
        reg_ctx->height = height;
    }
}
769*437bfbebSnyanmisaka
hal_h265d_vdpu383_rps(void * dxva,void * rps_buf,void * sw_rps_buf,RK_U32 fast_mode)770*437bfbebSnyanmisaka static RK_S32 hal_h265d_vdpu383_rps(void *dxva, void *rps_buf, void* sw_rps_buf, RK_U32 fast_mode)
771*437bfbebSnyanmisaka {
772*437bfbebSnyanmisaka BitputCtx_t bp;
773*437bfbebSnyanmisaka RK_S32 fifo_len = 400;
774*437bfbebSnyanmisaka RK_S32 i = 0, j = 0;
775*437bfbebSnyanmisaka h265d_dxva2_picture_context_t *dxva_ctx = (h265d_dxva2_picture_context_t*)dxva;
776*437bfbebSnyanmisaka
777*437bfbebSnyanmisaka if (!dxva_ctx->pp.rps_update_flag) {
778*437bfbebSnyanmisaka if (fast_mode) {
779*437bfbebSnyanmisaka memcpy(rps_buf, sw_rps_buf, fifo_len * sizeof(RK_U64));
780*437bfbebSnyanmisaka }
781*437bfbebSnyanmisaka return 0;
782*437bfbebSnyanmisaka }
783*437bfbebSnyanmisaka
784*437bfbebSnyanmisaka mpp_set_bitput_ctx(&bp, (RK_U64*)sw_rps_buf, fifo_len);
785*437bfbebSnyanmisaka
786*437bfbebSnyanmisaka for (i = 0; i < 32; i ++) {
787*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.sps_lt_rps[i].lt_ref_pic_poc_lsb, 16);
788*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.sps_lt_rps[i].used_by_curr_pic_lt_flag, 1);
789*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 15);
790*437bfbebSnyanmisaka }
791*437bfbebSnyanmisaka
792*437bfbebSnyanmisaka for (i = 0; i < 64; i++) {
793*437bfbebSnyanmisaka if (i < dxva_ctx->pp.num_short_term_ref_pic_sets) {
794*437bfbebSnyanmisaka
795*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.sps_st_rps[i].num_negative_pics, 4);
796*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.sps_st_rps[i].num_positive_pics, 4);
797*437bfbebSnyanmisaka for ( j = 0; j < dxva_ctx->pp.sps_st_rps[i].num_negative_pics; j++) {
798*437bfbebSnyanmisaka
799*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.sps_st_rps[i].delta_poc_s0[j], 16);
800*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.sps_st_rps[i].s0_used_flag[j], 1);
801*437bfbebSnyanmisaka }
802*437bfbebSnyanmisaka
803*437bfbebSnyanmisaka for (j = 0; j < dxva_ctx->pp.sps_st_rps[i].num_positive_pics; j++) {
804*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.sps_st_rps[i].delta_poc_s1[j], 16);
805*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_ctx->pp.sps_st_rps[i].s1_used_flag[j], 1);
806*437bfbebSnyanmisaka
807*437bfbebSnyanmisaka }
808*437bfbebSnyanmisaka
809*437bfbebSnyanmisaka for ( j = dxva_ctx->pp.sps_st_rps[i].num_negative_pics + dxva_ctx->pp.sps_st_rps[i].num_positive_pics; j < 15; j++) {
810*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 16);
811*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 1);
812*437bfbebSnyanmisaka }
813*437bfbebSnyanmisaka
814*437bfbebSnyanmisaka } else {
815*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 4);
816*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 4);
817*437bfbebSnyanmisaka for ( j = 0; j < 15; j++) {
818*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 16);
819*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 1);
820*437bfbebSnyanmisaka }
821*437bfbebSnyanmisaka }
822*437bfbebSnyanmisaka mpp_put_align(&bp, 64, 0);
823*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 128);
824*437bfbebSnyanmisaka }
825*437bfbebSnyanmisaka
826*437bfbebSnyanmisaka #ifdef DUMP_VDPU383_DATAS
827*437bfbebSnyanmisaka {
828*437bfbebSnyanmisaka char *cur_fname = "rps_128bit.dat";
829*437bfbebSnyanmisaka memset(dump_cur_fname_path, 0, sizeof(dump_cur_fname_path));
830*437bfbebSnyanmisaka sprintf(dump_cur_fname_path, "%s/%s", dump_cur_dir, cur_fname);
831*437bfbebSnyanmisaka dump_data_to_file(dump_cur_fname_path, (void *)bp.pbuf, 64 * bp.index + bp.bitpos, 128, 0);
832*437bfbebSnyanmisaka }
833*437bfbebSnyanmisaka #endif
834*437bfbebSnyanmisaka
835*437bfbebSnyanmisaka RK_U32 *tmp = (RK_U32 *)sw_rps_buf;
836*437bfbebSnyanmisaka memcpy(rps_buf, sw_rps_buf, fifo_len * sizeof(RK_U64));
837*437bfbebSnyanmisaka
838*437bfbebSnyanmisaka if (hal_h265d_debug & H265H_DBG_RPS) {
839*437bfbebSnyanmisaka for (i = 0; i < 400 * 8 / 4; i++) {
840*437bfbebSnyanmisaka mpp_log("rps[%3d] = 0x%08x\n", i, tmp[i]);
841*437bfbebSnyanmisaka }
842*437bfbebSnyanmisaka }
843*437bfbebSnyanmisaka return 0;
844*437bfbebSnyanmisaka }
845*437bfbebSnyanmisaka
/*
 * Compute the size of one colmv buffer.
 *
 * pic_w : picture width
 * pic_h : picture height
 * ctu_w : block width the picture is divided by (must not be 0)
 *
 * The picture is covered by segments of 64 * 16 bytes each: horizontally a
 * segment spans 64 * 16 * 16 / ctu_w units, vertically it spans ctu_w
 * units. The result is the number of segments times the segment size.
 */
static RK_S32 calc_mv_size(RK_S32 pic_w, RK_S32 pic_h, RK_S32 ctu_w)
{
    /* colmv_block_size = 16, colmv_per_bytes = 16 */
    RK_S32 seg_w = 64 * 16 * 16 / ctu_w;
    RK_S32 segs_per_row = MPP_ALIGN(pic_w, seg_w) / seg_w;
    RK_S32 seg_rows = MPP_ALIGN(pic_h, ctu_w) / ctu_w;

    return segs_per_row * seg_rows * 64 * 16;
}
855*437bfbebSnyanmisaka
hal_h265d_vdpu383_gen_regs(void * hal,HalTaskInfo * syn)856*437bfbebSnyanmisaka static MPP_RET hal_h265d_vdpu383_gen_regs(void *hal, HalTaskInfo *syn)
857*437bfbebSnyanmisaka {
858*437bfbebSnyanmisaka RK_S32 i = 0;
859*437bfbebSnyanmisaka RK_S32 log2_min_cb_size;
860*437bfbebSnyanmisaka RK_S32 width, height;
861*437bfbebSnyanmisaka RK_S32 stride_y, stride_uv, virstrid_y;
862*437bfbebSnyanmisaka Vdpu383H265dRegSet *hw_regs;
863*437bfbebSnyanmisaka RK_S32 ret = MPP_SUCCESS;
864*437bfbebSnyanmisaka MppBuffer streambuf = NULL;
865*437bfbebSnyanmisaka RK_S32 aglin_offset = 0;
866*437bfbebSnyanmisaka RK_S32 valid_ref = -1;
867*437bfbebSnyanmisaka MppBuffer framebuf = NULL;
868*437bfbebSnyanmisaka HalBuf *mv_buf = NULL;
869*437bfbebSnyanmisaka RK_S32 fd = -1;
870*437bfbebSnyanmisaka RK_U32 mv_size = 0;
871*437bfbebSnyanmisaka RK_S32 distance = INT_MAX;
872*437bfbebSnyanmisaka HalH265dCtx *reg_ctx = (HalH265dCtx *)hal;
873*437bfbebSnyanmisaka
874*437bfbebSnyanmisaka (void) fd;
875*437bfbebSnyanmisaka if (syn->dec.flags.parse_err ||
876*437bfbebSnyanmisaka (syn->dec.flags.ref_err && !reg_ctx->cfg->base.disable_error)) {
877*437bfbebSnyanmisaka h265h_dbg(H265H_DBG_TASK_ERR, "%s found task error\n", __FUNCTION__);
878*437bfbebSnyanmisaka return MPP_OK;
879*437bfbebSnyanmisaka }
880*437bfbebSnyanmisaka
881*437bfbebSnyanmisaka h265d_dxva2_picture_context_t *dxva_ctx = (h265d_dxva2_picture_context_t *)syn->dec.syntax.data;
882*437bfbebSnyanmisaka HalBuf *origin_buf = NULL;
883*437bfbebSnyanmisaka
884*437bfbebSnyanmisaka void *rps_ptr = NULL;
885*437bfbebSnyanmisaka if (reg_ctx ->fast_mode) {
886*437bfbebSnyanmisaka for (i = 0; i < MAX_GEN_REG; i++) {
887*437bfbebSnyanmisaka if (!reg_ctx->g_buf[i].use_flag) {
888*437bfbebSnyanmisaka syn->dec.reg_index = i;
889*437bfbebSnyanmisaka
890*437bfbebSnyanmisaka reg_ctx->spspps_offset = reg_ctx->offset_spspps[i];
891*437bfbebSnyanmisaka reg_ctx->rps_offset = reg_ctx->offset_rps[i];
892*437bfbebSnyanmisaka reg_ctx->sclst_offset = reg_ctx->offset_sclst[i];
893*437bfbebSnyanmisaka
894*437bfbebSnyanmisaka reg_ctx->hw_regs = reg_ctx->g_buf[i].hw_regs;
895*437bfbebSnyanmisaka reg_ctx->g_buf[i].use_flag = 1;
896*437bfbebSnyanmisaka break;
897*437bfbebSnyanmisaka }
898*437bfbebSnyanmisaka }
899*437bfbebSnyanmisaka if (i == MAX_GEN_REG) {
900*437bfbebSnyanmisaka mpp_err("hevc rps buf all used");
901*437bfbebSnyanmisaka return MPP_ERR_NOMEM;
902*437bfbebSnyanmisaka }
903*437bfbebSnyanmisaka }
904*437bfbebSnyanmisaka rps_ptr = mpp_buffer_get_ptr(reg_ctx->bufs) + reg_ctx->rps_offset;
905*437bfbebSnyanmisaka if (NULL == rps_ptr) {
906*437bfbebSnyanmisaka
907*437bfbebSnyanmisaka mpp_err("rps_data get ptr error");
908*437bfbebSnyanmisaka return MPP_ERR_NOMEM;
909*437bfbebSnyanmisaka }
910*437bfbebSnyanmisaka
911*437bfbebSnyanmisaka
912*437bfbebSnyanmisaka if (syn->dec.syntax.data == NULL) {
913*437bfbebSnyanmisaka mpp_err("%s:%s:%d dxva is NULL", __FILE__, __FUNCTION__, __LINE__);
914*437bfbebSnyanmisaka return MPP_ERR_NULL_PTR;
915*437bfbebSnyanmisaka }
916*437bfbebSnyanmisaka
917*437bfbebSnyanmisaka #ifdef DUMP_VDPU383_DATAS
918*437bfbebSnyanmisaka {
919*437bfbebSnyanmisaka memset(dump_cur_dir, 0, sizeof(dump_cur_dir));
920*437bfbebSnyanmisaka sprintf(dump_cur_dir, "hevc/Frame%04d", dump_cur_frame);
921*437bfbebSnyanmisaka if (access(dump_cur_dir, 0)) {
922*437bfbebSnyanmisaka if (mkdir(dump_cur_dir))
923*437bfbebSnyanmisaka mpp_err_f("error: mkdir %s\n", dump_cur_dir);
924*437bfbebSnyanmisaka }
925*437bfbebSnyanmisaka dump_cur_frame++;
926*437bfbebSnyanmisaka }
927*437bfbebSnyanmisaka #endif
928*437bfbebSnyanmisaka
929*437bfbebSnyanmisaka /* output pps */
930*437bfbebSnyanmisaka hw_regs = (Vdpu383H265dRegSet*)reg_ctx->hw_regs;
931*437bfbebSnyanmisaka memset(hw_regs, 0, sizeof(Vdpu383H265dRegSet));
932*437bfbebSnyanmisaka
933*437bfbebSnyanmisaka if (NULL == reg_ctx->hw_regs) {
934*437bfbebSnyanmisaka return MPP_ERR_NULL_PTR;
935*437bfbebSnyanmisaka }
936*437bfbebSnyanmisaka
937*437bfbebSnyanmisaka
938*437bfbebSnyanmisaka log2_min_cb_size = dxva_ctx->pp.log2_min_luma_coding_block_size_minus3 + 3;
939*437bfbebSnyanmisaka width = (dxva_ctx->pp.PicWidthInMinCbsY << log2_min_cb_size);
940*437bfbebSnyanmisaka height = (dxva_ctx->pp.PicHeightInMinCbsY << log2_min_cb_size);
941*437bfbebSnyanmisaka mv_size = calc_mv_size(width, height, 1 << log2_min_cb_size) * 2;
942*437bfbebSnyanmisaka
943*437bfbebSnyanmisaka if (reg_ctx->cmv_bufs == NULL || reg_ctx->mv_size < mv_size) {
944*437bfbebSnyanmisaka size_t size = mv_size;
945*437bfbebSnyanmisaka
946*437bfbebSnyanmisaka if (reg_ctx->cmv_bufs) {
947*437bfbebSnyanmisaka hal_bufs_deinit(reg_ctx->cmv_bufs);
948*437bfbebSnyanmisaka reg_ctx->cmv_bufs = NULL;
949*437bfbebSnyanmisaka }
950*437bfbebSnyanmisaka
951*437bfbebSnyanmisaka hal_bufs_init(®_ctx->cmv_bufs);
952*437bfbebSnyanmisaka if (reg_ctx->cmv_bufs == NULL) {
953*437bfbebSnyanmisaka mpp_err_f("colmv bufs init fail");
954*437bfbebSnyanmisaka return MPP_ERR_NULL_PTR;
955*437bfbebSnyanmisaka }
956*437bfbebSnyanmisaka
957*437bfbebSnyanmisaka reg_ctx->mv_size = mv_size;
958*437bfbebSnyanmisaka reg_ctx->mv_count = mpp_buf_slot_get_count(reg_ctx->slots);
959*437bfbebSnyanmisaka hal_bufs_setup(reg_ctx->cmv_bufs, reg_ctx->mv_count, 1, &size);
960*437bfbebSnyanmisaka }
961*437bfbebSnyanmisaka
962*437bfbebSnyanmisaka {
963*437bfbebSnyanmisaka MppFrame mframe = NULL;
964*437bfbebSnyanmisaka RK_U32 ver_virstride;
965*437bfbebSnyanmisaka RK_U32 virstrid_uv;
966*437bfbebSnyanmisaka MppFrameFormat fmt;
967*437bfbebSnyanmisaka RK_U32 chroma_fmt_idc = dxva_ctx->pp.chroma_format_idc;
968*437bfbebSnyanmisaka
969*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->slots, dxva_ctx->pp.CurrPic.Index7Bits,
970*437bfbebSnyanmisaka SLOT_FRAME_PTR, &mframe);
971*437bfbebSnyanmisaka /* for 8K downscale mode*/
972*437bfbebSnyanmisaka if (mpp_frame_get_thumbnail_en(mframe) == MPP_FRAME_THUMBNAIL_ONLY &&
973*437bfbebSnyanmisaka reg_ctx->origin_bufs == NULL) {
974*437bfbebSnyanmisaka vdpu383_setup_scale_origin_bufs(reg_ctx, mframe);
975*437bfbebSnyanmisaka }
976*437bfbebSnyanmisaka
977*437bfbebSnyanmisaka fmt = mpp_frame_get_fmt(mframe);
978*437bfbebSnyanmisaka
979*437bfbebSnyanmisaka stride_y = mpp_frame_get_hor_stride(mframe);
980*437bfbebSnyanmisaka ver_virstride = mpp_frame_get_ver_stride(mframe);
981*437bfbebSnyanmisaka stride_uv = stride_y;
982*437bfbebSnyanmisaka virstrid_y = ver_virstride * stride_y;
983*437bfbebSnyanmisaka if (chroma_fmt_idc == 3)
984*437bfbebSnyanmisaka stride_uv *= 2;
985*437bfbebSnyanmisaka if (chroma_fmt_idc == 3 || chroma_fmt_idc == 2) {
986*437bfbebSnyanmisaka virstrid_uv = stride_uv * ver_virstride;
987*437bfbebSnyanmisaka } else {
988*437bfbebSnyanmisaka virstrid_uv = stride_uv * ver_virstride / 2;
989*437bfbebSnyanmisaka }
990*437bfbebSnyanmisaka if (MPP_FRAME_FMT_IS_FBC(fmt)) {
991*437bfbebSnyanmisaka RK_U32 fbc_hdr_stride = mpp_frame_get_fbc_hdr_stride(mframe);
992*437bfbebSnyanmisaka RK_U32 fbd_offset;
993*437bfbebSnyanmisaka
994*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg9.fbc_e = 1;
995*437bfbebSnyanmisaka hw_regs->h265d_paras.reg68_hor_virstride = fbc_hdr_stride / 64;
996*437bfbebSnyanmisaka fbd_offset = fbc_hdr_stride * MPP_ALIGN(ver_virstride, 64) / 16;
997*437bfbebSnyanmisaka hw_regs->h265d_addrs.reg193_fbc_payload_offset = fbd_offset;
998*437bfbebSnyanmisaka } else if (MPP_FRAME_FMT_IS_TILE(fmt)) {
999*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg9.tile_e = 1;
1000*437bfbebSnyanmisaka if (chroma_fmt_idc == 0) { //yuv400
1001*437bfbebSnyanmisaka hw_regs->h265d_paras.reg68_hor_virstride = stride_y * 4 / 16;
1002*437bfbebSnyanmisaka } else if (chroma_fmt_idc == 2) { //yuv422
1003*437bfbebSnyanmisaka hw_regs->h265d_paras.reg68_hor_virstride = stride_y * 8 / 16;
1004*437bfbebSnyanmisaka } else if (chroma_fmt_idc == 3) { //yuv444
1005*437bfbebSnyanmisaka hw_regs->h265d_paras.reg68_hor_virstride = stride_y * 12 / 16;
1006*437bfbebSnyanmisaka } else { //yuv420
1007*437bfbebSnyanmisaka hw_regs->h265d_paras.reg68_hor_virstride = stride_y * 6 / 16;
1008*437bfbebSnyanmisaka }
1009*437bfbebSnyanmisaka hw_regs->h265d_paras.reg70_y_virstride = (virstrid_y + virstrid_uv) / 16;
1010*437bfbebSnyanmisaka } else {
1011*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg9.fbc_e = 0;
1012*437bfbebSnyanmisaka hw_regs->h265d_paras.reg68_hor_virstride = stride_y >> 4;
1013*437bfbebSnyanmisaka hw_regs->h265d_paras.reg69_raster_uv_hor_virstride = stride_uv >> 4;
1014*437bfbebSnyanmisaka hw_regs->h265d_paras.reg70_y_virstride = virstrid_y >> 4;
1015*437bfbebSnyanmisaka }
1016*437bfbebSnyanmisaka hw_regs->h265d_paras.reg80_error_ref_hor_virstride = hw_regs->h265d_paras.reg68_hor_virstride;
1017*437bfbebSnyanmisaka hw_regs->h265d_paras.reg81_error_ref_raster_uv_hor_virstride = hw_regs->h265d_paras.reg69_raster_uv_hor_virstride;
1018*437bfbebSnyanmisaka hw_regs->h265d_paras.reg82_error_ref_virstride = hw_regs->h265d_paras.reg70_y_virstride;
1019*437bfbebSnyanmisaka }
1020*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->slots, dxva_ctx->pp.CurrPic.Index7Bits,
1021*437bfbebSnyanmisaka SLOT_BUFFER, &framebuf);
1022*437bfbebSnyanmisaka
1023*437bfbebSnyanmisaka if (reg_ctx->origin_bufs) {
1024*437bfbebSnyanmisaka origin_buf = hal_bufs_get_buf(reg_ctx->origin_bufs,
1025*437bfbebSnyanmisaka dxva_ctx->pp.CurrPic.Index7Bits);
1026*437bfbebSnyanmisaka framebuf = origin_buf->buf[0];
1027*437bfbebSnyanmisaka }
1028*437bfbebSnyanmisaka
1029*437bfbebSnyanmisaka hw_regs->h265d_addrs.reg168_decout_base = mpp_buffer_get_fd(framebuf); //just index need map
1030*437bfbebSnyanmisaka hw_regs->h265d_addrs.reg169_error_ref_base = mpp_buffer_get_fd(framebuf);
1031*437bfbebSnyanmisaka /*if out_base is equal to zero it means this frame may error
1032*437bfbebSnyanmisaka we return directly add by csy*/
1033*437bfbebSnyanmisaka
1034*437bfbebSnyanmisaka if (hw_regs->h265d_addrs.reg168_decout_base == 0) {
1035*437bfbebSnyanmisaka return 0;
1036*437bfbebSnyanmisaka }
1037*437bfbebSnyanmisaka
1038*437bfbebSnyanmisaka fd = mpp_buffer_get_fd(framebuf);
1039*437bfbebSnyanmisaka hw_regs->h265d_addrs.reg168_decout_base = fd;
1040*437bfbebSnyanmisaka hw_regs->h265d_addrs.reg192_payload_st_cur_base = fd;
1041*437bfbebSnyanmisaka mv_buf = hal_bufs_get_buf(reg_ctx->cmv_bufs, dxva_ctx->pp.CurrPic.Index7Bits);
1042*437bfbebSnyanmisaka
1043*437bfbebSnyanmisaka hw_regs->h265d_addrs.reg216_colmv_cur_base = mpp_buffer_get_fd(mv_buf->buf[0]);
1044*437bfbebSnyanmisaka #ifdef DUMP_VDPU383_DATAS
1045*437bfbebSnyanmisaka {
1046*437bfbebSnyanmisaka char *cur_fname = "colmv_cur_frame.dat";
1047*437bfbebSnyanmisaka memset(dump_cur_fname_path, 0, sizeof(dump_cur_fname_path));
1048*437bfbebSnyanmisaka sprintf(dump_cur_fname_path, "%s/%s", dump_cur_dir, cur_fname);
1049*437bfbebSnyanmisaka dump_data_to_file(dump_cur_fname_path, (void *)mpp_buffer_get_ptr(mv_buf->buf[0]),
1050*437bfbebSnyanmisaka mpp_buffer_get_size(mv_buf->buf[0]), 64, 0);
1051*437bfbebSnyanmisaka }
1052*437bfbebSnyanmisaka #endif
1053*437bfbebSnyanmisaka
1054*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->packet_slots, syn->dec.input, SLOT_BUFFER,
1055*437bfbebSnyanmisaka &streambuf);
1056*437bfbebSnyanmisaka if ( dxva_ctx->bitstream == NULL) {
1057*437bfbebSnyanmisaka dxva_ctx->bitstream = mpp_buffer_get_ptr(streambuf);
1058*437bfbebSnyanmisaka }
1059*437bfbebSnyanmisaka
1060*437bfbebSnyanmisaka #ifdef DUMP_VDPU383_DATAS
1061*437bfbebSnyanmisaka {
1062*437bfbebSnyanmisaka char *cur_fname = "stream_in_128bit.dat";
1063*437bfbebSnyanmisaka memset(dump_cur_fname_path, 0, sizeof(dump_cur_fname_path));
1064*437bfbebSnyanmisaka sprintf(dump_cur_fname_path, "%s/%s", dump_cur_dir, cur_fname);
1065*437bfbebSnyanmisaka dump_data_to_file(dump_cur_fname_path, (void *)mpp_buffer_get_ptr(streambuf),
1066*437bfbebSnyanmisaka mpp_buffer_get_size(streambuf), 128, 0);
1067*437bfbebSnyanmisaka }
1068*437bfbebSnyanmisaka #endif
1069*437bfbebSnyanmisaka
1070*437bfbebSnyanmisaka hal_h265d_vdpu383_rps(syn->dec.syntax.data, rps_ptr, reg_ctx->sw_rps_buf, reg_ctx->fast_mode);
1071*437bfbebSnyanmisaka
1072*437bfbebSnyanmisaka hw_regs->common_addr.reg128_strm_base = mpp_buffer_get_fd(streambuf);
1073*437bfbebSnyanmisaka hw_regs->h265d_paras.reg66_stream_len = ((dxva_ctx->bitstream_size + 15) & (~15)) + 64;
1074*437bfbebSnyanmisaka aglin_offset = hw_regs->h265d_paras.reg66_stream_len - dxva_ctx->bitstream_size;
1075*437bfbebSnyanmisaka if (aglin_offset > 0)
1076*437bfbebSnyanmisaka memset((void *)(dxva_ctx->bitstream + dxva_ctx->bitstream_size), 0, aglin_offset);
1077*437bfbebSnyanmisaka
1078*437bfbebSnyanmisaka /* common setting */
1079*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg8_dec_mode = 0; // hevc
1080*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg9.buf_empty_en = 0;
1081*437bfbebSnyanmisaka
1082*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg10.strmd_auto_gating_e = 1;
1083*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg10.inter_auto_gating_e = 1;
1084*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg10.intra_auto_gating_e = 1;
1085*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg10.transd_auto_gating_e = 1;
1086*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg10.recon_auto_gating_e = 1;
1087*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg10.filterd_auto_gating_e = 1;
1088*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg10.bus_auto_gating_e = 1;
1089*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg10.ctrl_auto_gating_e = 1;
1090*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg10.rcb_auto_gating_e = 1;
1091*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg10.err_prc_auto_gating_e = 1;
1092*437bfbebSnyanmisaka
1093*437bfbebSnyanmisaka // hw_regs->ctrl_regs.reg11.dec_timeout_dis = 1;
1094*437bfbebSnyanmisaka
1095*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg16.error_proc_disable = 1;
1096*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg16.error_spread_disable = 0;
1097*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg16.roi_error_ctu_cal_en = 0;
1098*437bfbebSnyanmisaka
1099*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg20_cabac_error_en_lowbits = 0xffffffff;
1100*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg21_cabac_error_en_highbits = 0x3ff3f9ff;
1101*437bfbebSnyanmisaka
1102*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg13_core_timeout_threshold = 0xffff;
1103*437bfbebSnyanmisaka
1104*437bfbebSnyanmisaka
1105*437bfbebSnyanmisaka valid_ref = hw_regs->h265d_addrs.reg168_decout_base;
1106*437bfbebSnyanmisaka reg_ctx->error_index[syn->dec.reg_index] = dxva_ctx->pp.CurrPic.Index7Bits;
1107*437bfbebSnyanmisaka
1108*437bfbebSnyanmisaka hw_regs->h265d_addrs.reg169_error_ref_base = valid_ref;
1109*437bfbebSnyanmisaka for (i = 0; i < (RK_S32)MPP_ARRAY_ELEMS(dxva_ctx->pp.RefPicList); i++) {
1110*437bfbebSnyanmisaka if (dxva_ctx->pp.RefPicList[i].bPicEntry != 0xff &&
1111*437bfbebSnyanmisaka dxva_ctx->pp.RefPicList[i].bPicEntry != 0x7f) {
1112*437bfbebSnyanmisaka
1113*437bfbebSnyanmisaka MppFrame mframe = NULL;
1114*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->slots,
1115*437bfbebSnyanmisaka dxva_ctx->pp.RefPicList[i].Index7Bits,
1116*437bfbebSnyanmisaka SLOT_BUFFER, &framebuf);
1117*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->slots, dxva_ctx->pp.RefPicList[i].Index7Bits,
1118*437bfbebSnyanmisaka SLOT_FRAME_PTR, &mframe);
1119*437bfbebSnyanmisaka if (mpp_frame_get_thumbnail_en(mframe) == MPP_FRAME_THUMBNAIL_ONLY) {
1120*437bfbebSnyanmisaka origin_buf = hal_bufs_get_buf(reg_ctx->origin_bufs,
1121*437bfbebSnyanmisaka dxva_ctx->pp.RefPicList[i].Index7Bits);
1122*437bfbebSnyanmisaka framebuf = origin_buf->buf[0];
1123*437bfbebSnyanmisaka }
1124*437bfbebSnyanmisaka if (framebuf != NULL) {
1125*437bfbebSnyanmisaka hw_regs->h265d_addrs.reg170_185_ref_base[i] = mpp_buffer_get_fd(framebuf);
1126*437bfbebSnyanmisaka hw_regs->h265d_addrs.reg195_210_payload_st_ref_base[i] = mpp_buffer_get_fd(framebuf);
1127*437bfbebSnyanmisaka valid_ref = hw_regs->h265d_addrs.reg170_185_ref_base[i];
1128*437bfbebSnyanmisaka if ((pocdistance(dxva_ctx->pp.PicOrderCntValList[i], dxva_ctx->pp.current_poc) < distance)
1129*437bfbebSnyanmisaka && (!mpp_frame_get_errinfo(mframe))) {
1130*437bfbebSnyanmisaka
1131*437bfbebSnyanmisaka distance = pocdistance(dxva_ctx->pp.PicOrderCntValList[i], dxva_ctx->pp.current_poc);
1132*437bfbebSnyanmisaka hw_regs->h265d_addrs.reg169_error_ref_base = hw_regs->h265d_addrs.reg170_185_ref_base[i];
1133*437bfbebSnyanmisaka reg_ctx->error_index[syn->dec.reg_index] = dxva_ctx->pp.RefPicList[i].Index7Bits;
1134*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg16.error_proc_disable = 1;
1135*437bfbebSnyanmisaka }
1136*437bfbebSnyanmisaka } else {
1137*437bfbebSnyanmisaka hw_regs->h265d_addrs.reg170_185_ref_base[i] = valid_ref;
1138*437bfbebSnyanmisaka hw_regs->h265d_addrs.reg195_210_payload_st_ref_base[i] = valid_ref;
1139*437bfbebSnyanmisaka }
1140*437bfbebSnyanmisaka
1141*437bfbebSnyanmisaka mv_buf = hal_bufs_get_buf(reg_ctx->cmv_bufs, dxva_ctx->pp.RefPicList[i].Index7Bits);
1142*437bfbebSnyanmisaka hw_regs->h265d_addrs.reg217_232_colmv_ref_base[i] = mpp_buffer_get_fd(mv_buf->buf[0]);
1143*437bfbebSnyanmisaka }
1144*437bfbebSnyanmisaka }
1145*437bfbebSnyanmisaka
1146*437bfbebSnyanmisaka if ((reg_ctx->error_index[syn->dec.reg_index] == dxva_ctx->pp.CurrPic.Index7Bits) &&
1147*437bfbebSnyanmisaka !dxva_ctx->pp.IntraPicFlag) {
1148*437bfbebSnyanmisaka h265h_dbg(H265H_DBG_TASK_ERR, "current frm may be err, should skip process");
1149*437bfbebSnyanmisaka syn->dec.flags.ref_err = 1;
1150*437bfbebSnyanmisaka return MPP_OK;
1151*437bfbebSnyanmisaka }
1152*437bfbebSnyanmisaka
1153*437bfbebSnyanmisaka /* pps */
1154*437bfbebSnyanmisaka hw_regs->common_addr.reg131_gbl_base = reg_ctx->bufs_fd;
1155*437bfbebSnyanmisaka hw_regs->h265d_paras.reg67_global_len = 0xc; //22 * 8;
1156*437bfbebSnyanmisaka mpp_dev_set_reg_offset(reg_ctx->dev, 131, reg_ctx->spspps_offset);
1157*437bfbebSnyanmisaka
1158*437bfbebSnyanmisaka /* rps */
1159*437bfbebSnyanmisaka hw_regs->common_addr.reg129_rps_base = reg_ctx->bufs_fd;
1160*437bfbebSnyanmisaka mpp_dev_set_reg_offset(reg_ctx->dev, 129, reg_ctx->rps_offset);
1161*437bfbebSnyanmisaka
1162*437bfbebSnyanmisaka hal_h265d_v345_output_pps_packet(hal, syn->dec.syntax.data);
1163*437bfbebSnyanmisaka
1164*437bfbebSnyanmisaka for (i = 0; i < (RK_S32)MPP_ARRAY_ELEMS(dxva_ctx->pp.RefPicList); i++) {
1165*437bfbebSnyanmisaka
1166*437bfbebSnyanmisaka if (dxva_ctx->pp.RefPicList[i].bPicEntry != 0xff &&
1167*437bfbebSnyanmisaka dxva_ctx->pp.RefPicList[i].bPicEntry != 0x7f) {
1168*437bfbebSnyanmisaka MppFrame mframe = NULL;
1169*437bfbebSnyanmisaka
1170*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->slots,
1171*437bfbebSnyanmisaka dxva_ctx->pp.RefPicList[i].Index7Bits,
1172*437bfbebSnyanmisaka SLOT_BUFFER, &framebuf);
1173*437bfbebSnyanmisaka
1174*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->slots, dxva_ctx->pp.RefPicList[i].Index7Bits,
1175*437bfbebSnyanmisaka SLOT_FRAME_PTR, &mframe);
1176*437bfbebSnyanmisaka
1177*437bfbebSnyanmisaka if (framebuf == NULL || mpp_frame_get_errinfo(mframe)) {
1178*437bfbebSnyanmisaka mv_buf = hal_bufs_get_buf(reg_ctx->cmv_bufs, reg_ctx->error_index[syn->dec.reg_index]);
1179*437bfbebSnyanmisaka hw_regs->h265d_addrs.reg170_185_ref_base[i] = hw_regs->h265d_addrs.reg169_error_ref_base;
1180*437bfbebSnyanmisaka hw_regs->h265d_addrs.reg195_210_payload_st_ref_base[i] = hw_regs->h265d_addrs.reg169_error_ref_base;
1181*437bfbebSnyanmisaka hw_regs->h265d_addrs.reg217_232_colmv_ref_base[i] = mpp_buffer_get_fd(mv_buf->buf[0]);
1182*437bfbebSnyanmisaka }
1183*437bfbebSnyanmisaka } else {
1184*437bfbebSnyanmisaka mv_buf = hal_bufs_get_buf(reg_ctx->cmv_bufs, reg_ctx->error_index[syn->dec.reg_index]);
1185*437bfbebSnyanmisaka hw_regs->h265d_addrs.reg170_185_ref_base[i] = hw_regs->h265d_addrs.reg169_error_ref_base;
1186*437bfbebSnyanmisaka hw_regs->h265d_addrs.reg195_210_payload_st_ref_base[i] = hw_regs->h265d_addrs.reg169_error_ref_base;
1187*437bfbebSnyanmisaka hw_regs->h265d_addrs.reg217_232_colmv_ref_base[i] = mpp_buffer_get_fd(mv_buf->buf[0]);
1188*437bfbebSnyanmisaka }
1189*437bfbebSnyanmisaka }
1190*437bfbebSnyanmisaka
1191*437bfbebSnyanmisaka hal_h265d_rcb_info_update(hal, dxva_ctx, hw_regs, width, height);
1192*437bfbebSnyanmisaka vdpu383_setup_rcb(&hw_regs->common_addr, reg_ctx->dev, reg_ctx->fast_mode ?
1193*437bfbebSnyanmisaka reg_ctx->rcb_buf[syn->dec.reg_index] : reg_ctx->rcb_buf[0],
1194*437bfbebSnyanmisaka (Vdpu383RcbInfo *)reg_ctx->rcb_info);
1195*437bfbebSnyanmisaka vdpu383_setup_statistic(&hw_regs->ctrl_regs);
1196*437bfbebSnyanmisaka mpp_buffer_sync_end(reg_ctx->bufs);
1197*437bfbebSnyanmisaka
1198*437bfbebSnyanmisaka {
1199*437bfbebSnyanmisaka //scale down config
1200*437bfbebSnyanmisaka MppFrame mframe = NULL;
1201*437bfbebSnyanmisaka MppBuffer mbuffer = NULL;
1202*437bfbebSnyanmisaka MppFrameThumbnailMode thumbnail_mode;
1203*437bfbebSnyanmisaka
1204*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->slots, dxva_ctx->pp.CurrPic.Index7Bits,
1205*437bfbebSnyanmisaka SLOT_BUFFER, &mbuffer);
1206*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->slots, dxva_ctx->pp.CurrPic.Index7Bits,
1207*437bfbebSnyanmisaka SLOT_FRAME_PTR, &mframe);
1208*437bfbebSnyanmisaka thumbnail_mode = mpp_frame_get_thumbnail_en(mframe);
1209*437bfbebSnyanmisaka switch (thumbnail_mode) {
1210*437bfbebSnyanmisaka case MPP_FRAME_THUMBNAIL_ONLY:
1211*437bfbebSnyanmisaka hw_regs->common_addr.reg133_scale_down_base = mpp_buffer_get_fd(mbuffer);
1212*437bfbebSnyanmisaka origin_buf = hal_bufs_get_buf(reg_ctx->origin_bufs, dxva_ctx->pp.CurrPic.Index7Bits);
1213*437bfbebSnyanmisaka fd = mpp_buffer_get_fd(origin_buf->buf[0]);
1214*437bfbebSnyanmisaka hw_regs->h265d_addrs.reg168_decout_base = fd;
1215*437bfbebSnyanmisaka hw_regs->h265d_addrs.reg192_payload_st_cur_base = fd;
1216*437bfbebSnyanmisaka hw_regs->h265d_addrs.reg169_error_ref_base = fd;
1217*437bfbebSnyanmisaka vdpu383_setup_down_scale(mframe, reg_ctx->dev, &hw_regs->ctrl_regs, (void*)&hw_regs->h265d_paras);
1218*437bfbebSnyanmisaka break;
1219*437bfbebSnyanmisaka case MPP_FRAME_THUMBNAIL_MIXED:
1220*437bfbebSnyanmisaka hw_regs->common_addr.reg133_scale_down_base = mpp_buffer_get_fd(mbuffer);
1221*437bfbebSnyanmisaka vdpu383_setup_down_scale(mframe, reg_ctx->dev, &hw_regs->ctrl_regs, (void*)&hw_regs->h265d_paras);
1222*437bfbebSnyanmisaka break;
1223*437bfbebSnyanmisaka case MPP_FRAME_THUMBNAIL_NONE:
1224*437bfbebSnyanmisaka default:
1225*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg9.scale_down_en = 0;
1226*437bfbebSnyanmisaka break;
1227*437bfbebSnyanmisaka }
1228*437bfbebSnyanmisaka }
1229*437bfbebSnyanmisaka
1230*437bfbebSnyanmisaka return ret;
1231*437bfbebSnyanmisaka }
1232*437bfbebSnyanmisaka
hal_h265d_vdpu383_start(void * hal,HalTaskInfo * task)1233*437bfbebSnyanmisaka static MPP_RET hal_h265d_vdpu383_start(void *hal, HalTaskInfo *task)
1234*437bfbebSnyanmisaka {
1235*437bfbebSnyanmisaka MPP_RET ret = MPP_OK;
1236*437bfbebSnyanmisaka RK_U8* p = NULL;
1237*437bfbebSnyanmisaka Vdpu383H265dRegSet *hw_regs = NULL;
1238*437bfbebSnyanmisaka HalH265dCtx *reg_ctx = (HalH265dCtx *)hal;
1239*437bfbebSnyanmisaka RK_S32 index = task->dec.reg_index;
1240*437bfbebSnyanmisaka
1241*437bfbebSnyanmisaka RK_U32 i;
1242*437bfbebSnyanmisaka
1243*437bfbebSnyanmisaka if (task->dec.flags.parse_err ||
1244*437bfbebSnyanmisaka (task->dec.flags.ref_err && !reg_ctx->cfg->base.disable_error)) {
1245*437bfbebSnyanmisaka h265h_dbg(H265H_DBG_TASK_ERR, "%s found task error\n", __FUNCTION__);
1246*437bfbebSnyanmisaka return MPP_OK;
1247*437bfbebSnyanmisaka }
1248*437bfbebSnyanmisaka
1249*437bfbebSnyanmisaka if (reg_ctx->fast_mode) {
1250*437bfbebSnyanmisaka p = (RK_U8*)reg_ctx->g_buf[index].hw_regs;
1251*437bfbebSnyanmisaka hw_regs = ( Vdpu383H265dRegSet *)reg_ctx->g_buf[index].hw_regs;
1252*437bfbebSnyanmisaka } else {
1253*437bfbebSnyanmisaka p = (RK_U8*)reg_ctx->hw_regs;
1254*437bfbebSnyanmisaka hw_regs = ( Vdpu383H265dRegSet *)reg_ctx->hw_regs;
1255*437bfbebSnyanmisaka }
1256*437bfbebSnyanmisaka
1257*437bfbebSnyanmisaka if (hw_regs == NULL) {
1258*437bfbebSnyanmisaka mpp_err("hal_h265d_start hw_regs is NULL");
1259*437bfbebSnyanmisaka return MPP_ERR_NULL_PTR;
1260*437bfbebSnyanmisaka }
1261*437bfbebSnyanmisaka for (i = 0; i < 68; i++) {
1262*437bfbebSnyanmisaka h265h_dbg(H265H_DBG_REG, "RK_HEVC_DEC: regs[%02d]=%08X\n",
1263*437bfbebSnyanmisaka i, *((RK_U32*)p));
1264*437bfbebSnyanmisaka //mpp_log("RK_HEVC_DEC: regs[%02d]=%08X\n", i, *((RK_U32*)p));
1265*437bfbebSnyanmisaka p += 4;
1266*437bfbebSnyanmisaka }
1267*437bfbebSnyanmisaka
1268*437bfbebSnyanmisaka do {
1269*437bfbebSnyanmisaka MppDevRegWrCfg wr_cfg;
1270*437bfbebSnyanmisaka MppDevRegRdCfg rd_cfg;
1271*437bfbebSnyanmisaka
1272*437bfbebSnyanmisaka wr_cfg.reg = &hw_regs->ctrl_regs;
1273*437bfbebSnyanmisaka wr_cfg.size = sizeof(hw_regs->ctrl_regs);
1274*437bfbebSnyanmisaka wr_cfg.offset = OFFSET_CTRL_REGS;
1275*437bfbebSnyanmisaka ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_REG_WR, &wr_cfg);
1276*437bfbebSnyanmisaka if (ret) {
1277*437bfbebSnyanmisaka mpp_err_f("set register read failed %d\n", ret);
1278*437bfbebSnyanmisaka break;
1279*437bfbebSnyanmisaka }
1280*437bfbebSnyanmisaka
1281*437bfbebSnyanmisaka wr_cfg.reg = &hw_regs->common_addr;
1282*437bfbebSnyanmisaka wr_cfg.size = sizeof(hw_regs->common_addr);
1283*437bfbebSnyanmisaka wr_cfg.offset = OFFSET_COMMON_ADDR_REGS;
1284*437bfbebSnyanmisaka ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_REG_WR, &wr_cfg);
1285*437bfbebSnyanmisaka if (ret) {
1286*437bfbebSnyanmisaka mpp_err_f("set register write failed %d\n", ret);
1287*437bfbebSnyanmisaka break;
1288*437bfbebSnyanmisaka }
1289*437bfbebSnyanmisaka
1290*437bfbebSnyanmisaka wr_cfg.reg = &hw_regs->h265d_paras;
1291*437bfbebSnyanmisaka wr_cfg.size = sizeof(hw_regs->h265d_paras);
1292*437bfbebSnyanmisaka wr_cfg.offset = OFFSET_CODEC_PARAS_REGS;
1293*437bfbebSnyanmisaka ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_REG_WR, &wr_cfg);
1294*437bfbebSnyanmisaka if (ret) {
1295*437bfbebSnyanmisaka mpp_err_f("set register write failed %d\n", ret);
1296*437bfbebSnyanmisaka break;
1297*437bfbebSnyanmisaka }
1298*437bfbebSnyanmisaka
1299*437bfbebSnyanmisaka wr_cfg.reg = &hw_regs->h265d_addrs;
1300*437bfbebSnyanmisaka wr_cfg.size = sizeof(hw_regs->h265d_addrs);
1301*437bfbebSnyanmisaka wr_cfg.offset = OFFSET_CODEC_ADDR_REGS;
1302*437bfbebSnyanmisaka ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_REG_WR, &wr_cfg);
1303*437bfbebSnyanmisaka if (ret) {
1304*437bfbebSnyanmisaka mpp_err_f("set register write failed %d\n", ret);
1305*437bfbebSnyanmisaka break;
1306*437bfbebSnyanmisaka }
1307*437bfbebSnyanmisaka
1308*437bfbebSnyanmisaka rd_cfg.reg = &hw_regs->ctrl_regs.reg15;
1309*437bfbebSnyanmisaka rd_cfg.size = sizeof(hw_regs->ctrl_regs.reg15);
1310*437bfbebSnyanmisaka rd_cfg.offset = OFFSET_INTERRUPT_REGS;
1311*437bfbebSnyanmisaka ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_REG_RD, &rd_cfg);
1312*437bfbebSnyanmisaka if (ret) {
1313*437bfbebSnyanmisaka mpp_err_f("set register read failed %d\n", ret);
1314*437bfbebSnyanmisaka break;
1315*437bfbebSnyanmisaka }
1316*437bfbebSnyanmisaka
1317*437bfbebSnyanmisaka /* rcb info for sram */
1318*437bfbebSnyanmisaka vdpu383_set_rcbinfo(reg_ctx->dev, (Vdpu383RcbInfo*)reg_ctx->rcb_info);
1319*437bfbebSnyanmisaka
1320*437bfbebSnyanmisaka ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_CMD_SEND, NULL);
1321*437bfbebSnyanmisaka if (ret) {
1322*437bfbebSnyanmisaka mpp_err_f("send cmd failed %d\n", ret);
1323*437bfbebSnyanmisaka break;
1324*437bfbebSnyanmisaka }
1325*437bfbebSnyanmisaka } while (0);
1326*437bfbebSnyanmisaka
1327*437bfbebSnyanmisaka return ret;
1328*437bfbebSnyanmisaka }
1329*437bfbebSnyanmisaka
1330*437bfbebSnyanmisaka
hal_h265d_vdpu383_wait(void * hal,HalTaskInfo * task)1331*437bfbebSnyanmisaka static MPP_RET hal_h265d_vdpu383_wait(void *hal, HalTaskInfo *task)
1332*437bfbebSnyanmisaka {
1333*437bfbebSnyanmisaka MPP_RET ret = MPP_OK;
1334*437bfbebSnyanmisaka RK_S32 index = task->dec.reg_index;
1335*437bfbebSnyanmisaka HalH265dCtx *reg_ctx = (HalH265dCtx *)hal;
1336*437bfbebSnyanmisaka RK_U8* p = NULL;
1337*437bfbebSnyanmisaka Vdpu383H265dRegSet *hw_regs = NULL;
1338*437bfbebSnyanmisaka RK_S32 i;
1339*437bfbebSnyanmisaka
1340*437bfbebSnyanmisaka if (reg_ctx->fast_mode) {
1341*437bfbebSnyanmisaka hw_regs = ( Vdpu383H265dRegSet *)reg_ctx->g_buf[index].hw_regs;
1342*437bfbebSnyanmisaka } else {
1343*437bfbebSnyanmisaka hw_regs = ( Vdpu383H265dRegSet *)reg_ctx->hw_regs;
1344*437bfbebSnyanmisaka }
1345*437bfbebSnyanmisaka
1346*437bfbebSnyanmisaka p = (RK_U8*)hw_regs;
1347*437bfbebSnyanmisaka
1348*437bfbebSnyanmisaka if (task->dec.flags.parse_err ||
1349*437bfbebSnyanmisaka (task->dec.flags.ref_err && !reg_ctx->cfg->base.disable_error)) {
1350*437bfbebSnyanmisaka h265h_dbg(H265H_DBG_TASK_ERR, "%s found task error\n", __FUNCTION__);
1351*437bfbebSnyanmisaka goto ERR_PROC;
1352*437bfbebSnyanmisaka }
1353*437bfbebSnyanmisaka
1354*437bfbebSnyanmisaka ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_CMD_POLL, NULL);
1355*437bfbebSnyanmisaka if (ret)
1356*437bfbebSnyanmisaka mpp_err_f("poll cmd failed %d\n", ret);
1357*437bfbebSnyanmisaka
1358*437bfbebSnyanmisaka ERR_PROC:
1359*437bfbebSnyanmisaka if (task->dec.flags.parse_err ||
1360*437bfbebSnyanmisaka task->dec.flags.ref_err ||
1361*437bfbebSnyanmisaka (!hw_regs->ctrl_regs.reg15.rkvdec_frame_rdy_sta) ||
1362*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg15.rkvdec_strm_error_sta ||
1363*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg15.rkvdec_core_timeout_sta ||
1364*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg15.rkvdec_ip_timeout_sta ||
1365*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg15.rkvdec_bus_error_sta ||
1366*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg15.rkvdec_buffer_empty_sta ||
1367*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg15.rkvdec_colmv_ref_error_sta) {
1368*437bfbebSnyanmisaka if (!reg_ctx->fast_mode) {
1369*437bfbebSnyanmisaka if (reg_ctx->dec_cb)
1370*437bfbebSnyanmisaka mpp_callback(reg_ctx->dec_cb, &task->dec);
1371*437bfbebSnyanmisaka } else {
1372*437bfbebSnyanmisaka MppFrame mframe = NULL;
1373*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->slots, task->dec.output,
1374*437bfbebSnyanmisaka SLOT_FRAME_PTR, &mframe);
1375*437bfbebSnyanmisaka if (mframe) {
1376*437bfbebSnyanmisaka reg_ctx->fast_mode_err_found = 1;
1377*437bfbebSnyanmisaka mpp_frame_set_errinfo(mframe, 1);
1378*437bfbebSnyanmisaka }
1379*437bfbebSnyanmisaka }
1380*437bfbebSnyanmisaka } else {
1381*437bfbebSnyanmisaka if (reg_ctx->fast_mode && reg_ctx->fast_mode_err_found) {
1382*437bfbebSnyanmisaka for (i = 0; i < (RK_S32)MPP_ARRAY_ELEMS(task->dec.refer); i++) {
1383*437bfbebSnyanmisaka if (task->dec.refer[i] >= 0) {
1384*437bfbebSnyanmisaka MppFrame frame_ref = NULL;
1385*437bfbebSnyanmisaka
1386*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->slots, task->dec.refer[i],
1387*437bfbebSnyanmisaka SLOT_FRAME_PTR, &frame_ref);
1388*437bfbebSnyanmisaka h265h_dbg(H265H_DBG_FAST_ERR, "refer[%d] %d frame %p\n",
1389*437bfbebSnyanmisaka i, task->dec.refer[i], frame_ref);
1390*437bfbebSnyanmisaka if (frame_ref && mpp_frame_get_errinfo(frame_ref)) {
1391*437bfbebSnyanmisaka MppFrame frame_out = NULL;
1392*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->slots, task->dec.output,
1393*437bfbebSnyanmisaka SLOT_FRAME_PTR, &frame_out);
1394*437bfbebSnyanmisaka mpp_frame_set_errinfo(frame_out, 1);
1395*437bfbebSnyanmisaka break;
1396*437bfbebSnyanmisaka }
1397*437bfbebSnyanmisaka }
1398*437bfbebSnyanmisaka }
1399*437bfbebSnyanmisaka }
1400*437bfbebSnyanmisaka }
1401*437bfbebSnyanmisaka
1402*437bfbebSnyanmisaka for (i = 0; i < 68; i++) {
1403*437bfbebSnyanmisaka if (i == 1) {
1404*437bfbebSnyanmisaka h265h_dbg(H265H_DBG_REG, "RK_HEVC_DEC: regs[%02d]=%08X\n",
1405*437bfbebSnyanmisaka i, *((RK_U32*)p));
1406*437bfbebSnyanmisaka }
1407*437bfbebSnyanmisaka
1408*437bfbebSnyanmisaka if (i == 45) {
1409*437bfbebSnyanmisaka h265h_dbg(H265H_DBG_REG, "RK_HEVC_DEC: regs[%02d]=%08X\n",
1410*437bfbebSnyanmisaka i, *((RK_U32*)p));
1411*437bfbebSnyanmisaka }
1412*437bfbebSnyanmisaka p += 4;
1413*437bfbebSnyanmisaka }
1414*437bfbebSnyanmisaka
1415*437bfbebSnyanmisaka if (reg_ctx->fast_mode) {
1416*437bfbebSnyanmisaka reg_ctx->g_buf[index].use_flag = 0;
1417*437bfbebSnyanmisaka }
1418*437bfbebSnyanmisaka
1419*437bfbebSnyanmisaka return ret;
1420*437bfbebSnyanmisaka }
1421*437bfbebSnyanmisaka
hal_h265d_vdpu383_reset(void * hal)1422*437bfbebSnyanmisaka static MPP_RET hal_h265d_vdpu383_reset(void *hal)
1423*437bfbebSnyanmisaka {
1424*437bfbebSnyanmisaka MPP_RET ret = MPP_OK;
1425*437bfbebSnyanmisaka HalH265dCtx *p_hal = (HalH265dCtx *)hal;
1426*437bfbebSnyanmisaka p_hal->fast_mode_err_found = 0;
1427*437bfbebSnyanmisaka (void)hal;
1428*437bfbebSnyanmisaka return ret;
1429*437bfbebSnyanmisaka }
1430*437bfbebSnyanmisaka
hal_h265d_vdpu383_flush(void * hal)1431*437bfbebSnyanmisaka static MPP_RET hal_h265d_vdpu383_flush(void *hal)
1432*437bfbebSnyanmisaka {
1433*437bfbebSnyanmisaka MPP_RET ret = MPP_OK;
1434*437bfbebSnyanmisaka
1435*437bfbebSnyanmisaka (void)hal;
1436*437bfbebSnyanmisaka return ret;
1437*437bfbebSnyanmisaka }
1438*437bfbebSnyanmisaka
hal_h265d_vdpu383_control(void * hal,MpiCmd cmd_type,void * param)1439*437bfbebSnyanmisaka static MPP_RET hal_h265d_vdpu383_control(void *hal, MpiCmd cmd_type, void *param)
1440*437bfbebSnyanmisaka {
1441*437bfbebSnyanmisaka MPP_RET ret = MPP_OK;
1442*437bfbebSnyanmisaka HalH265dCtx *p_hal = (HalH265dCtx *)hal;
1443*437bfbebSnyanmisaka
1444*437bfbebSnyanmisaka (void)hal;
1445*437bfbebSnyanmisaka (void)param;
1446*437bfbebSnyanmisaka switch ((MpiCmd)cmd_type) {
1447*437bfbebSnyanmisaka case MPP_DEC_SET_FRAME_INFO: {
1448*437bfbebSnyanmisaka MppFrame frame = (MppFrame)param;
1449*437bfbebSnyanmisaka MppFrameFormat fmt = mpp_frame_get_fmt(frame);
1450*437bfbebSnyanmisaka RK_U32 imgwidth = mpp_frame_get_width((MppFrame)param);
1451*437bfbebSnyanmisaka RK_U32 imgheight = mpp_frame_get_height((MppFrame)param);
1452*437bfbebSnyanmisaka
1453*437bfbebSnyanmisaka if (fmt == MPP_FMT_YUV422SP) {
1454*437bfbebSnyanmisaka mpp_slots_set_prop(p_hal->slots, SLOTS_LEN_ALIGN, rkv_len_align_422);
1455*437bfbebSnyanmisaka } else if (fmt == MPP_FMT_YUV444SP || fmt == MPP_FMT_YUV444SP_10BIT) {
1456*437bfbebSnyanmisaka mpp_slots_set_prop(p_hal->slots, SLOTS_LEN_ALIGN, rkv_len_align_444);
1457*437bfbebSnyanmisaka }
1458*437bfbebSnyanmisaka if (MPP_FRAME_FMT_IS_FBC(fmt)) {
1459*437bfbebSnyanmisaka vdpu383_afbc_align_calc(p_hal->slots, frame, 16);
1460*437bfbebSnyanmisaka } else if (imgwidth > 1920 || imgheight > 1088) {
1461*437bfbebSnyanmisaka mpp_slots_set_prop(p_hal->slots, SLOTS_HOR_ALIGN, mpp_align_128_odd_plus_64);
1462*437bfbebSnyanmisaka }
1463*437bfbebSnyanmisaka break;
1464*437bfbebSnyanmisaka }
1465*437bfbebSnyanmisaka case MPP_DEC_GET_THUMBNAIL_FRAME_INFO: {
1466*437bfbebSnyanmisaka vdpu383_update_thumbnail_frame_info((MppFrame)param);
1467*437bfbebSnyanmisaka } break;
1468*437bfbebSnyanmisaka case MPP_DEC_SET_OUTPUT_FORMAT: {
1469*437bfbebSnyanmisaka } break;
1470*437bfbebSnyanmisaka default: {
1471*437bfbebSnyanmisaka } break;
1472*437bfbebSnyanmisaka }
1473*437bfbebSnyanmisaka return ret;
1474*437bfbebSnyanmisaka }
1475*437bfbebSnyanmisaka
1476*437bfbebSnyanmisaka const MppHalApi hal_h265d_vdpu383 = {
1477*437bfbebSnyanmisaka .name = "h265d_vdpu383",
1478*437bfbebSnyanmisaka .type = MPP_CTX_DEC,
1479*437bfbebSnyanmisaka .coding = MPP_VIDEO_CodingHEVC,
1480*437bfbebSnyanmisaka .ctx_size = sizeof(HalH265dCtx),
1481*437bfbebSnyanmisaka .flag = 0,
1482*437bfbebSnyanmisaka .init = hal_h265d_vdpu383_init,
1483*437bfbebSnyanmisaka .deinit = hal_h265d_vdpu383_deinit,
1484*437bfbebSnyanmisaka .reg_gen = hal_h265d_vdpu383_gen_regs,
1485*437bfbebSnyanmisaka .start = hal_h265d_vdpu383_start,
1486*437bfbebSnyanmisaka .wait = hal_h265d_vdpu383_wait,
1487*437bfbebSnyanmisaka .reset = hal_h265d_vdpu383_reset,
1488*437bfbebSnyanmisaka .flush = hal_h265d_vdpu383_flush,
1489*437bfbebSnyanmisaka .control = hal_h265d_vdpu383_control,
1490*437bfbebSnyanmisaka };
1491