1*437bfbebSnyanmisaka /*
2*437bfbebSnyanmisaka * Copyright 2022 Rockchip Electronics Co. LTD
3*437bfbebSnyanmisaka *
4*437bfbebSnyanmisaka * Licensed under the Apache License, Version 2.0 (the "License");
5*437bfbebSnyanmisaka * you may not use this file except in compliance with the License.
6*437bfbebSnyanmisaka * You may obtain a copy of the License at
7*437bfbebSnyanmisaka *
8*437bfbebSnyanmisaka * http://www.apache.org/licenses/LICENSE-2.0
9*437bfbebSnyanmisaka *
10*437bfbebSnyanmisaka * Unless required by applicable law or agreed to in writing, software
11*437bfbebSnyanmisaka * distributed under the License is distributed on an "AS IS" BASIS,
12*437bfbebSnyanmisaka * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13*437bfbebSnyanmisaka * See the License for the specific language governing permissions and
14*437bfbebSnyanmisaka * limitations under the License.
15*437bfbebSnyanmisaka */
16*437bfbebSnyanmisaka
17*437bfbebSnyanmisaka #define MODULE_TAG "hal_h265d_vdpu382"
18*437bfbebSnyanmisaka
19*437bfbebSnyanmisaka #include <stdio.h>
20*437bfbebSnyanmisaka #include <string.h>
21*437bfbebSnyanmisaka
22*437bfbebSnyanmisaka #include "mpp_env.h"
23*437bfbebSnyanmisaka #include "mpp_mem.h"
24*437bfbebSnyanmisaka #include "mpp_bitread.h"
25*437bfbebSnyanmisaka #include "mpp_bitput.h"
26*437bfbebSnyanmisaka
27*437bfbebSnyanmisaka #include "h265d_syntax.h"
28*437bfbebSnyanmisaka #include "hal_h265d_debug.h"
29*437bfbebSnyanmisaka #include "hal_h265d_ctx.h"
30*437bfbebSnyanmisaka #include "hal_h265d_com.h"
31*437bfbebSnyanmisaka #include "hal_h265d_vdpu382.h"
32*437bfbebSnyanmisaka #include "vdpu382_h265d.h"
33*437bfbebSnyanmisaka
34*437bfbebSnyanmisaka /* #define dump */
35*437bfbebSnyanmisaka #ifdef dump
36*437bfbebSnyanmisaka static FILE *fp = NULL;
37*437bfbebSnyanmisaka #endif
38*437bfbebSnyanmisaka
39*437bfbebSnyanmisaka #define HW_RPS
40*437bfbebSnyanmisaka #define PPS_SIZE (112 * 64)//(96x64)
41*437bfbebSnyanmisaka
42*437bfbebSnyanmisaka #define SET_REF_VALID(regs, index, value)\
43*437bfbebSnyanmisaka do{ \
44*437bfbebSnyanmisaka switch(index){\
45*437bfbebSnyanmisaka case 0: regs.reg99.hevc_ref_valid_0 = value; break;\
46*437bfbebSnyanmisaka case 1: regs.reg99.hevc_ref_valid_1 = value; break;\
47*437bfbebSnyanmisaka case 2: regs.reg99.hevc_ref_valid_2 = value; break;\
48*437bfbebSnyanmisaka case 3: regs.reg99.hevc_ref_valid_3 = value; break;\
49*437bfbebSnyanmisaka case 4: regs.reg99.hevc_ref_valid_4 = value; break;\
50*437bfbebSnyanmisaka case 5: regs.reg99.hevc_ref_valid_5 = value; break;\
51*437bfbebSnyanmisaka case 6: regs.reg99.hevc_ref_valid_6 = value; break;\
52*437bfbebSnyanmisaka case 7: regs.reg99.hevc_ref_valid_7 = value; break;\
53*437bfbebSnyanmisaka case 8: regs.reg99.hevc_ref_valid_8 = value; break;\
54*437bfbebSnyanmisaka case 9: regs.reg99.hevc_ref_valid_9 = value; break;\
55*437bfbebSnyanmisaka case 10: regs.reg99.hevc_ref_valid_10 = value; break;\
56*437bfbebSnyanmisaka case 11: regs.reg99.hevc_ref_valid_11 = value; break;\
57*437bfbebSnyanmisaka case 12: regs.reg99.hevc_ref_valid_12 = value; break;\
58*437bfbebSnyanmisaka case 13: regs.reg99.hevc_ref_valid_13 = value; break;\
59*437bfbebSnyanmisaka case 14: regs.reg99.hevc_ref_valid_14 = value; break;\
60*437bfbebSnyanmisaka default: break;}\
61*437bfbebSnyanmisaka }while(0)
62*437bfbebSnyanmisaka
63*437bfbebSnyanmisaka #define FMT 4
64*437bfbebSnyanmisaka #define CTU 3
65*437bfbebSnyanmisaka
66*437bfbebSnyanmisaka typedef struct {
67*437bfbebSnyanmisaka RK_U32 a;
68*437bfbebSnyanmisaka RK_U32 b;
69*437bfbebSnyanmisaka } FilterdColBufRatio;
70*437bfbebSnyanmisaka
71*437bfbebSnyanmisaka static const FilterdColBufRatio filterd_fbc_on[CTU][FMT] = {
72*437bfbebSnyanmisaka /* 400 420 422 444 */
73*437bfbebSnyanmisaka {{0, 0}, {27, 15}, {36, 15}, {52, 15}}, //ctu 16
74*437bfbebSnyanmisaka {{0, 0}, {27, 8}, {36, 8}, {52, 8}}, //ctu 32
75*437bfbebSnyanmisaka {{0, 0}, {27, 5}, {36, 5}, {52, 5}} //ctu 64
76*437bfbebSnyanmisaka };
77*437bfbebSnyanmisaka
78*437bfbebSnyanmisaka static const FilterdColBufRatio filterd_fbc_off[CTU][FMT] = {
79*437bfbebSnyanmisaka /* 400 420 422 444 */
80*437bfbebSnyanmisaka {{0, 0}, {15, 5}, {20, 5}, {20, 5}}, //ctu 16
81*437bfbebSnyanmisaka {{0, 0}, {15, 9}, {20, 9}, {20, 9}}, //ctu 32
82*437bfbebSnyanmisaka {{0, 0}, {15, 16}, {20, 16}, {20, 16}} //ctu 64
83*437bfbebSnyanmisaka };
84*437bfbebSnyanmisaka
85*437bfbebSnyanmisaka #define CABAC_TAB_ALIGEND_SIZE (MPP_ALIGN(27456, SZ_4K))
86*437bfbebSnyanmisaka #define SPSPPS_ALIGNED_SIZE (MPP_ALIGN(112 * 64, SZ_4K))
87*437bfbebSnyanmisaka #define RPS_ALIGEND_SIZE (MPP_ALIGN(400 * 8, SZ_4K))
88*437bfbebSnyanmisaka #define SCALIST_ALIGNED_SIZE (MPP_ALIGN(81 * 1360, SZ_4K))
89*437bfbebSnyanmisaka #define INFO_BUFFER_SIZE (SPSPPS_ALIGNED_SIZE + RPS_ALIGEND_SIZE + SCALIST_ALIGNED_SIZE)
90*437bfbebSnyanmisaka #define ALL_BUFFER_SIZE(cnt) (CABAC_TAB_ALIGEND_SIZE + INFO_BUFFER_SIZE *cnt)
91*437bfbebSnyanmisaka
92*437bfbebSnyanmisaka #define CABAC_TAB_OFFSET (0)
93*437bfbebSnyanmisaka #define SPSPPS_OFFSET(pos) (CABAC_TAB_OFFSET + CABAC_TAB_ALIGEND_SIZE + (INFO_BUFFER_SIZE * pos))
94*437bfbebSnyanmisaka #define RPS_OFFSET(pos) (SPSPPS_OFFSET(pos) + SPSPPS_ALIGNED_SIZE)
95*437bfbebSnyanmisaka #define SCALIST_OFFSET(pos) (RPS_OFFSET(pos) + RPS_ALIGEND_SIZE)
96*437bfbebSnyanmisaka
hal_h265d_vdpu382_init(void * hal,MppHalCfg * cfg)97*437bfbebSnyanmisaka static MPP_RET hal_h265d_vdpu382_init(void *hal, MppHalCfg *cfg)
98*437bfbebSnyanmisaka {
99*437bfbebSnyanmisaka RK_S32 ret = 0;
100*437bfbebSnyanmisaka HalH265dCtx *reg_ctx = (HalH265dCtx *)hal;
101*437bfbebSnyanmisaka
102*437bfbebSnyanmisaka mpp_slots_set_prop(reg_ctx->slots, SLOTS_HOR_ALIGN, hevc_hor_align);
103*437bfbebSnyanmisaka mpp_slots_set_prop(reg_ctx->slots, SLOTS_VER_ALIGN, hevc_ver_align);
104*437bfbebSnyanmisaka
105*437bfbebSnyanmisaka reg_ctx->scaling_qm = mpp_calloc(DXVA_Qmatrix_HEVC, 1);
106*437bfbebSnyanmisaka if (reg_ctx->scaling_qm == NULL) {
107*437bfbebSnyanmisaka mpp_err("scaling_org alloc fail");
108*437bfbebSnyanmisaka return MPP_ERR_MALLOC;
109*437bfbebSnyanmisaka }
110*437bfbebSnyanmisaka
111*437bfbebSnyanmisaka reg_ctx->scaling_rk = mpp_calloc(scalingFactor_t, 1);
112*437bfbebSnyanmisaka reg_ctx->pps_buf = mpp_calloc(RK_U64, 15);
113*437bfbebSnyanmisaka reg_ctx->sw_rps_buf = mpp_calloc(RK_U64, 400);
114*437bfbebSnyanmisaka
115*437bfbebSnyanmisaka if (reg_ctx->scaling_rk == NULL) {
116*437bfbebSnyanmisaka mpp_err("scaling_rk alloc fail");
117*437bfbebSnyanmisaka return MPP_ERR_MALLOC;
118*437bfbebSnyanmisaka }
119*437bfbebSnyanmisaka
120*437bfbebSnyanmisaka if (reg_ctx->group == NULL) {
121*437bfbebSnyanmisaka ret = mpp_buffer_group_get_internal(®_ctx->group, MPP_BUFFER_TYPE_ION);
122*437bfbebSnyanmisaka if (ret) {
123*437bfbebSnyanmisaka mpp_err("h265d mpp_buffer_group_get failed\n");
124*437bfbebSnyanmisaka return ret;
125*437bfbebSnyanmisaka }
126*437bfbebSnyanmisaka }
127*437bfbebSnyanmisaka
128*437bfbebSnyanmisaka {
129*437bfbebSnyanmisaka RK_U32 i = 0;
130*437bfbebSnyanmisaka RK_U32 max_cnt = reg_ctx->fast_mode ? MAX_GEN_REG : 1;
131*437bfbebSnyanmisaka
132*437bfbebSnyanmisaka //!< malloc buffers
133*437bfbebSnyanmisaka ret = mpp_buffer_get(reg_ctx->group, ®_ctx->bufs, ALL_BUFFER_SIZE(max_cnt));
134*437bfbebSnyanmisaka if (ret) {
135*437bfbebSnyanmisaka mpp_err("h265d mpp_buffer_get failed\n");
136*437bfbebSnyanmisaka return ret;
137*437bfbebSnyanmisaka }
138*437bfbebSnyanmisaka
139*437bfbebSnyanmisaka reg_ctx->bufs_fd = mpp_buffer_get_fd(reg_ctx->bufs);
140*437bfbebSnyanmisaka reg_ctx->offset_cabac = CABAC_TAB_OFFSET;
141*437bfbebSnyanmisaka for (i = 0; i < max_cnt; i++) {
142*437bfbebSnyanmisaka reg_ctx->g_buf[i].hw_regs = mpp_calloc_size(void, sizeof(Vdpu382H265dRegSet));
143*437bfbebSnyanmisaka reg_ctx->offset_spspps[i] = SPSPPS_OFFSET(i);
144*437bfbebSnyanmisaka reg_ctx->offset_rps[i] = RPS_OFFSET(i);
145*437bfbebSnyanmisaka reg_ctx->offset_sclst[i] = SCALIST_OFFSET(i);
146*437bfbebSnyanmisaka }
147*437bfbebSnyanmisaka }
148*437bfbebSnyanmisaka
149*437bfbebSnyanmisaka if (!reg_ctx->fast_mode) {
150*437bfbebSnyanmisaka reg_ctx->hw_regs = reg_ctx->g_buf[0].hw_regs;
151*437bfbebSnyanmisaka reg_ctx->spspps_offset = reg_ctx->offset_spspps[0];
152*437bfbebSnyanmisaka reg_ctx->rps_offset = reg_ctx->offset_rps[0];
153*437bfbebSnyanmisaka reg_ctx->sclst_offset = reg_ctx->offset_sclst[0];
154*437bfbebSnyanmisaka }
155*437bfbebSnyanmisaka
156*437bfbebSnyanmisaka ret = mpp_buffer_write(reg_ctx->bufs, 0, (void*)cabac_table, sizeof(cabac_table));
157*437bfbebSnyanmisaka if (ret) {
158*437bfbebSnyanmisaka mpp_err("h265d write cabac_table data failed\n");
159*437bfbebSnyanmisaka return ret;
160*437bfbebSnyanmisaka }
161*437bfbebSnyanmisaka
162*437bfbebSnyanmisaka if (cfg->hal_fbc_adj_cfg) {
163*437bfbebSnyanmisaka cfg->hal_fbc_adj_cfg->func = vdpu382_afbc_align_calc;
164*437bfbebSnyanmisaka cfg->hal_fbc_adj_cfg->expand = 16;
165*437bfbebSnyanmisaka }
166*437bfbebSnyanmisaka
167*437bfbebSnyanmisaka #ifdef dump
168*437bfbebSnyanmisaka fp = fopen("/data/hal.bin", "wb");
169*437bfbebSnyanmisaka #endif
170*437bfbebSnyanmisaka (void) cfg;
171*437bfbebSnyanmisaka return MPP_OK;
172*437bfbebSnyanmisaka }
173*437bfbebSnyanmisaka
hal_h265d_vdpu382_deinit(void * hal)174*437bfbebSnyanmisaka static MPP_RET hal_h265d_vdpu382_deinit(void *hal)
175*437bfbebSnyanmisaka {
176*437bfbebSnyanmisaka HalH265dCtx *reg_ctx = (HalH265dCtx *)hal;
177*437bfbebSnyanmisaka RK_U32 loop = reg_ctx->fast_mode ? MPP_ARRAY_ELEMS(reg_ctx->g_buf) : 1;
178*437bfbebSnyanmisaka RK_U32 i;
179*437bfbebSnyanmisaka
180*437bfbebSnyanmisaka if (reg_ctx->bufs) {
181*437bfbebSnyanmisaka mpp_buffer_put(reg_ctx->bufs);
182*437bfbebSnyanmisaka reg_ctx->bufs = NULL;
183*437bfbebSnyanmisaka }
184*437bfbebSnyanmisaka
185*437bfbebSnyanmisaka loop = reg_ctx->fast_mode ? MPP_ARRAY_ELEMS(reg_ctx->rcb_buf) : 1;
186*437bfbebSnyanmisaka for (i = 0; i < loop; i++) {
187*437bfbebSnyanmisaka if (reg_ctx->rcb_buf[i]) {
188*437bfbebSnyanmisaka mpp_buffer_put(reg_ctx->rcb_buf[i]);
189*437bfbebSnyanmisaka reg_ctx->rcb_buf[i] = NULL;
190*437bfbebSnyanmisaka }
191*437bfbebSnyanmisaka }
192*437bfbebSnyanmisaka
193*437bfbebSnyanmisaka if (reg_ctx->group) {
194*437bfbebSnyanmisaka mpp_buffer_group_put(reg_ctx->group);
195*437bfbebSnyanmisaka reg_ctx->group = NULL;
196*437bfbebSnyanmisaka }
197*437bfbebSnyanmisaka
198*437bfbebSnyanmisaka for (i = 0; i < loop; i++)
199*437bfbebSnyanmisaka MPP_FREE(reg_ctx->g_buf[i].hw_regs);
200*437bfbebSnyanmisaka
201*437bfbebSnyanmisaka MPP_FREE(reg_ctx->scaling_qm);
202*437bfbebSnyanmisaka MPP_FREE(reg_ctx->scaling_rk);
203*437bfbebSnyanmisaka MPP_FREE(reg_ctx->pps_buf);
204*437bfbebSnyanmisaka MPP_FREE(reg_ctx->sw_rps_buf);
205*437bfbebSnyanmisaka
206*437bfbebSnyanmisaka if (reg_ctx->cmv_bufs) {
207*437bfbebSnyanmisaka hal_bufs_deinit(reg_ctx->cmv_bufs);
208*437bfbebSnyanmisaka reg_ctx->cmv_bufs = NULL;
209*437bfbebSnyanmisaka }
210*437bfbebSnyanmisaka
211*437bfbebSnyanmisaka return MPP_OK;
212*437bfbebSnyanmisaka }
213*437bfbebSnyanmisaka
hal_h265d_v382_output_pps_packet(void * hal,void * dxva)214*437bfbebSnyanmisaka static RK_S32 hal_h265d_v382_output_pps_packet(void *hal, void *dxva)
215*437bfbebSnyanmisaka {
216*437bfbebSnyanmisaka RK_S32 fifo_len = 14;//12
217*437bfbebSnyanmisaka RK_S32 i, j;
218*437bfbebSnyanmisaka RK_U32 addr;
219*437bfbebSnyanmisaka RK_U32 log2_min_cb_size;
220*437bfbebSnyanmisaka RK_S32 width, height;
221*437bfbebSnyanmisaka HalH265dCtx *reg_ctx = ( HalH265dCtx *)hal;
222*437bfbebSnyanmisaka Vdpu382H265dRegSet *hw_reg = (Vdpu382H265dRegSet*)(reg_ctx->hw_regs);
223*437bfbebSnyanmisaka h265d_dxva2_picture_context_t *dxva_cxt = (h265d_dxva2_picture_context_t*)dxva;
224*437bfbebSnyanmisaka BitputCtx_t bp;
225*437bfbebSnyanmisaka
226*437bfbebSnyanmisaka if (NULL == reg_ctx || dxva_cxt == NULL) {
227*437bfbebSnyanmisaka mpp_err("%s:%s:%d reg_ctx or dxva_cxt is NULL",
228*437bfbebSnyanmisaka __FILE__, __FUNCTION__, __LINE__);
229*437bfbebSnyanmisaka return MPP_ERR_NULL_PTR;
230*437bfbebSnyanmisaka }
231*437bfbebSnyanmisaka void *pps_ptr = mpp_buffer_get_ptr(reg_ctx->bufs) + reg_ctx->spspps_offset;
232*437bfbebSnyanmisaka if (dxva_cxt->pp.ps_update_flag) {
233*437bfbebSnyanmisaka RK_U64 *pps_packet = reg_ctx->pps_buf;
234*437bfbebSnyanmisaka if (NULL == pps_ptr) {
235*437bfbebSnyanmisaka mpp_err("pps_data get ptr error");
236*437bfbebSnyanmisaka return MPP_ERR_NOMEM;
237*437bfbebSnyanmisaka }
238*437bfbebSnyanmisaka
239*437bfbebSnyanmisaka for (i = 0; i < 14; i++) pps_packet[i] = 0;
240*437bfbebSnyanmisaka
241*437bfbebSnyanmisaka mpp_set_bitput_ctx(&bp, pps_packet, fifo_len);
242*437bfbebSnyanmisaka
243*437bfbebSnyanmisaka // SPS
244*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.vps_id , 4);
245*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.sps_id , 4);
246*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.chroma_format_idc , 2);
247*437bfbebSnyanmisaka
248*437bfbebSnyanmisaka log2_min_cb_size = dxva_cxt->pp.log2_min_luma_coding_block_size_minus3 + 3;
249*437bfbebSnyanmisaka width = (dxva_cxt->pp.PicWidthInMinCbsY << log2_min_cb_size);
250*437bfbebSnyanmisaka height = (dxva_cxt->pp.PicHeightInMinCbsY << log2_min_cb_size);
251*437bfbebSnyanmisaka
252*437bfbebSnyanmisaka mpp_put_bits(&bp, width , 16);
253*437bfbebSnyanmisaka mpp_put_bits(&bp, height , 16);
254*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.bit_depth_luma_minus8 + 8 , 4);
255*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.bit_depth_chroma_minus8 + 8 , 4);
256*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.log2_max_pic_order_cnt_lsb_minus4 + 4 , 5);
257*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size , 2); //log2_maxa_coding_block_depth
258*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.log2_min_luma_coding_block_size_minus3 + 3 , 3);
259*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.log2_min_transform_block_size_minus2 + 2 , 3);
260*437bfbebSnyanmisaka ///<-zrh comment ^ 63 bit above
261*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.log2_diff_max_min_transform_block_size , 2);
262*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.max_transform_hierarchy_depth_inter , 3);
263*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.max_transform_hierarchy_depth_intra , 3);
264*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.scaling_list_enabled_flag , 1);
265*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.amp_enabled_flag , 1);
266*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.sample_adaptive_offset_enabled_flag , 1);
267*437bfbebSnyanmisaka ///<-zrh comment ^ 68 bit above
268*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pcm_enabled_flag , 1);
269*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pcm_enabled_flag ? (dxva_cxt->pp.pcm_sample_bit_depth_luma_minus1 + 1) : 0 , 4);
270*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pcm_enabled_flag ? (dxva_cxt->pp.pcm_sample_bit_depth_chroma_minus1 + 1) : 0 , 4);
271*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pcm_loop_filter_disabled_flag , 1);
272*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.log2_diff_max_min_pcm_luma_coding_block_size , 3);
273*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pcm_enabled_flag ? (dxva_cxt->pp.log2_min_pcm_luma_coding_block_size_minus3 + 3) : 0, 3);
274*437bfbebSnyanmisaka
275*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.num_short_term_ref_pic_sets , 7);
276*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.long_term_ref_pics_present_flag , 1);
277*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.num_long_term_ref_pics_sps , 6);
278*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.sps_temporal_mvp_enabled_flag , 1);
279*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.strong_intra_smoothing_enabled_flag , 1);
280*437bfbebSnyanmisaka ///<-zrh comment ^ 100 bit above
281*437bfbebSnyanmisaka
282*437bfbebSnyanmisaka mpp_put_bits(&bp, 0 , 7 ); //49bits
283*437bfbebSnyanmisaka //yandong change
284*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.sps_max_dec_pic_buffering_minus1, 4);
285*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 3);
286*437bfbebSnyanmisaka mpp_put_align(&bp , 32, 0xf); //128
287*437bfbebSnyanmisaka // PPS
288*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pps_id , 6 );
289*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.sps_id , 4 );
290*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.dependent_slice_segments_enabled_flag , 1 );
291*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.output_flag_present_flag , 1 );
292*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.num_extra_slice_header_bits , 13);
293*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.sign_data_hiding_enabled_flag , 1);
294*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.cabac_init_present_flag , 1);
295*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.num_ref_idx_l0_default_active_minus1 + 1 , 4);//31 bits
296*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.num_ref_idx_l1_default_active_minus1 + 1 , 4);
297*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.init_qp_minus26 , 7);
298*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.constrained_intra_pred_flag , 1);
299*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.transform_skip_enabled_flag , 1);
300*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.cu_qp_delta_enabled_flag , 1); //164
301*437bfbebSnyanmisaka mpp_put_bits(&bp, log2_min_cb_size +
302*437bfbebSnyanmisaka dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size -
303*437bfbebSnyanmisaka dxva_cxt->pp.diff_cu_qp_delta_depth , 3);
304*437bfbebSnyanmisaka
305*437bfbebSnyanmisaka h265h_dbg(H265H_DBG_PPS, "log2_min_cb_size %d %d %d \n", log2_min_cb_size,
306*437bfbebSnyanmisaka dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size, dxva_cxt->pp.diff_cu_qp_delta_depth );
307*437bfbebSnyanmisaka
308*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pps_cb_qp_offset , 5);
309*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pps_cr_qp_offset , 5);
310*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pps_slice_chroma_qp_offsets_present_flag , 1);
311*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.weighted_pred_flag , 1);
312*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.weighted_bipred_flag , 1);
313*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.transquant_bypass_enabled_flag , 1 );
314*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.tiles_enabled_flag , 1 );
315*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.entropy_coding_sync_enabled_flag , 1);
316*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pps_loop_filter_across_slices_enabled_flag , 1);
317*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.loop_filter_across_tiles_enabled_flag , 1); //185
318*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.deblocking_filter_override_enabled_flag , 1);
319*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pps_deblocking_filter_disabled_flag , 1);
320*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pps_beta_offset_div2 , 4);
321*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pps_tc_offset_div2 , 4);
322*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.lists_modification_present_flag , 1);
323*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.log2_parallel_merge_level_minus2 + 2 , 3);
324*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.slice_segment_header_extension_present_flag , 1);
325*437bfbebSnyanmisaka mpp_put_bits(&bp, 0 , 3);
326*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.tiles_enabled_flag ? dxva_cxt->pp.num_tile_columns_minus1 + 1 : 0, 5);
327*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.tiles_enabled_flag ? dxva_cxt->pp.num_tile_rows_minus1 + 1 : 0 , 5 );
328*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 4);//2 //mSps_Pps[i]->mMode
329*437bfbebSnyanmisaka mpp_put_align(&bp, 64, 0xf);
330*437bfbebSnyanmisaka {
331*437bfbebSnyanmisaka /// tiles info begin
332*437bfbebSnyanmisaka RK_U16 column_width[20];
333*437bfbebSnyanmisaka RK_U16 row_height[22];
334*437bfbebSnyanmisaka
335*437bfbebSnyanmisaka memset(column_width, 0, sizeof(column_width));
336*437bfbebSnyanmisaka memset(row_height, 0, sizeof(row_height));
337*437bfbebSnyanmisaka
338*437bfbebSnyanmisaka if (dxva_cxt->pp.tiles_enabled_flag) {
339*437bfbebSnyanmisaka
340*437bfbebSnyanmisaka if (dxva_cxt->pp.uniform_spacing_flag == 0) {
341*437bfbebSnyanmisaka RK_S32 maxcuwidth = dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size + log2_min_cb_size;
342*437bfbebSnyanmisaka RK_S32 ctu_width_in_pic = (width +
343*437bfbebSnyanmisaka (1 << maxcuwidth) - 1) / (1 << maxcuwidth) ;
344*437bfbebSnyanmisaka RK_S32 ctu_height_in_pic = (height +
345*437bfbebSnyanmisaka (1 << maxcuwidth) - 1) / (1 << maxcuwidth) ;
346*437bfbebSnyanmisaka RK_S32 sum = 0;
347*437bfbebSnyanmisaka for (i = 0; i < dxva_cxt->pp.num_tile_columns_minus1; i++) {
348*437bfbebSnyanmisaka column_width[i] = dxva_cxt->pp.column_width_minus1[i] + 1;
349*437bfbebSnyanmisaka sum += column_width[i] ;
350*437bfbebSnyanmisaka }
351*437bfbebSnyanmisaka column_width[i] = ctu_width_in_pic - sum;
352*437bfbebSnyanmisaka
353*437bfbebSnyanmisaka sum = 0;
354*437bfbebSnyanmisaka for (i = 0; i < dxva_cxt->pp.num_tile_rows_minus1; i++) {
355*437bfbebSnyanmisaka row_height[i] = dxva_cxt->pp.row_height_minus1[i] + 1;
356*437bfbebSnyanmisaka sum += row_height[i];
357*437bfbebSnyanmisaka }
358*437bfbebSnyanmisaka row_height[i] = ctu_height_in_pic - sum;
359*437bfbebSnyanmisaka } // end of (pps->uniform_spacing_flag == 0)
360*437bfbebSnyanmisaka else {
361*437bfbebSnyanmisaka
362*437bfbebSnyanmisaka RK_S32 pic_in_cts_width = (width +
363*437bfbebSnyanmisaka (1 << (log2_min_cb_size +
364*437bfbebSnyanmisaka dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size)) - 1)
365*437bfbebSnyanmisaka / (1 << (log2_min_cb_size +
366*437bfbebSnyanmisaka dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size));
367*437bfbebSnyanmisaka RK_S32 pic_in_cts_height = (height +
368*437bfbebSnyanmisaka (1 << (log2_min_cb_size +
369*437bfbebSnyanmisaka dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size)) - 1)
370*437bfbebSnyanmisaka / (1 << (log2_min_cb_size +
371*437bfbebSnyanmisaka dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size));
372*437bfbebSnyanmisaka
373*437bfbebSnyanmisaka for (i = 0; i < dxva_cxt->pp.num_tile_columns_minus1 + 1; i++)
374*437bfbebSnyanmisaka column_width[i] = ((i + 1) * pic_in_cts_width) / (dxva_cxt->pp.num_tile_columns_minus1 + 1) -
375*437bfbebSnyanmisaka (i * pic_in_cts_width) / (dxva_cxt->pp.num_tile_columns_minus1 + 1);
376*437bfbebSnyanmisaka
377*437bfbebSnyanmisaka for (i = 0; i < dxva_cxt->pp.num_tile_rows_minus1 + 1; i++)
378*437bfbebSnyanmisaka row_height[i] = ((i + 1) * pic_in_cts_height) / (dxva_cxt->pp.num_tile_rows_minus1 + 1) -
379*437bfbebSnyanmisaka (i * pic_in_cts_height) / (dxva_cxt->pp.num_tile_rows_minus1 + 1);
380*437bfbebSnyanmisaka }
381*437bfbebSnyanmisaka } // pps->tiles_enabled_flag
382*437bfbebSnyanmisaka else {
383*437bfbebSnyanmisaka RK_S32 MaxCUWidth = (1 << (dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size + log2_min_cb_size));
384*437bfbebSnyanmisaka column_width[0] = (width + MaxCUWidth - 1) / MaxCUWidth;
385*437bfbebSnyanmisaka row_height[0] = (height + MaxCUWidth - 1) / MaxCUWidth;
386*437bfbebSnyanmisaka }
387*437bfbebSnyanmisaka
388*437bfbebSnyanmisaka for (j = 0; j < 20; j++) {
389*437bfbebSnyanmisaka if (column_width[j] > 0)
390*437bfbebSnyanmisaka column_width[j]--;
391*437bfbebSnyanmisaka mpp_put_bits(&bp, column_width[j], 12);
392*437bfbebSnyanmisaka }
393*437bfbebSnyanmisaka
394*437bfbebSnyanmisaka for (j = 0; j < 22; j++) {
395*437bfbebSnyanmisaka if (row_height[j] > 0)
396*437bfbebSnyanmisaka row_height[j]--;
397*437bfbebSnyanmisaka mpp_put_bits(&bp, row_height[j], 12);
398*437bfbebSnyanmisaka }
399*437bfbebSnyanmisaka }
400*437bfbebSnyanmisaka
401*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 32);
402*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 70);
403*437bfbebSnyanmisaka mpp_put_align(&bp, 64, 0xf);//128
404*437bfbebSnyanmisaka }
405*437bfbebSnyanmisaka
406*437bfbebSnyanmisaka if (dxva_cxt->pp.scaling_list_enabled_flag) {
407*437bfbebSnyanmisaka RK_U8 *ptr_scaling = (RK_U8 *)mpp_buffer_get_ptr(reg_ctx->bufs) + reg_ctx->sclst_offset;
408*437bfbebSnyanmisaka
409*437bfbebSnyanmisaka if (dxva_cxt->pp.scaling_list_data_present_flag) {
410*437bfbebSnyanmisaka addr = (dxva_cxt->pp.pps_id + 16) * 1360;
411*437bfbebSnyanmisaka } else if (dxva_cxt->pp.scaling_list_enabled_flag) {
412*437bfbebSnyanmisaka addr = dxva_cxt->pp.sps_id * 1360;
413*437bfbebSnyanmisaka } else {
414*437bfbebSnyanmisaka addr = 80 * 1360;
415*437bfbebSnyanmisaka }
416*437bfbebSnyanmisaka
417*437bfbebSnyanmisaka hal_h265d_output_scalinglist_packet(hal, ptr_scaling + addr, dxva);
418*437bfbebSnyanmisaka
419*437bfbebSnyanmisaka hw_reg->h265d_addr.reg180_scanlist_addr = reg_ctx->bufs_fd;
420*437bfbebSnyanmisaka hw_reg->common.reg012.scanlist_addr_valid_en = 1;
421*437bfbebSnyanmisaka
422*437bfbebSnyanmisaka /* need to config addr */
423*437bfbebSnyanmisaka mpp_dev_set_reg_offset(reg_ctx->dev, 180, addr + reg_ctx->sclst_offset);
424*437bfbebSnyanmisaka }
425*437bfbebSnyanmisaka
426*437bfbebSnyanmisaka for (i = 0; i < 64; i++)
427*437bfbebSnyanmisaka memcpy(pps_ptr + i * 112, reg_ctx->pps_buf, 112);
428*437bfbebSnyanmisaka #ifdef dump
429*437bfbebSnyanmisaka fwrite(pps_ptr, 1, 80 * 64, fp);
430*437bfbebSnyanmisaka RK_U32 *tmp = (RK_U32 *)pps_ptr;
431*437bfbebSnyanmisaka for (i = 0; i < 112 / 4; i++) {
432*437bfbebSnyanmisaka mpp_log("pps[%3d] = 0x%08x\n", i, tmp[i]);
433*437bfbebSnyanmisaka }
434*437bfbebSnyanmisaka #endif
435*437bfbebSnyanmisaka return 0;
436*437bfbebSnyanmisaka }
437*437bfbebSnyanmisaka
h265d_refine_rcb_size(Vdpu382RcbInfo * rcb_info,Vdpu382H265dRegSet * hw_regs,RK_S32 width,RK_S32 height,void * dxva)438*437bfbebSnyanmisaka static void h265d_refine_rcb_size(Vdpu382RcbInfo *rcb_info,
439*437bfbebSnyanmisaka Vdpu382H265dRegSet *hw_regs,
440*437bfbebSnyanmisaka RK_S32 width, RK_S32 height, void *dxva)
441*437bfbebSnyanmisaka {
442*437bfbebSnyanmisaka RK_U32 rcb_bits = 0;
443*437bfbebSnyanmisaka h265d_dxva2_picture_context_t *dxva_cxt = (h265d_dxva2_picture_context_t*)dxva;
444*437bfbebSnyanmisaka DXVA_PicParams_HEVC *pp = &dxva_cxt->pp;
445*437bfbebSnyanmisaka RK_U32 chroma_fmt_idc = pp->chroma_format_idc;//0 400,1 420 ,2 422,3 444
446*437bfbebSnyanmisaka RK_U8 bit_depth = MPP_MAX(pp->bit_depth_luma_minus8, pp->bit_depth_chroma_minus8) + 8;
447*437bfbebSnyanmisaka RK_U8 ctu_size = 1 << (pp->log2_diff_max_min_luma_coding_block_size + pp->log2_min_luma_coding_block_size_minus3 + 3);
448*437bfbebSnyanmisaka RK_U32 tile_col_cut_num = pp->num_tile_columns_minus1;
449*437bfbebSnyanmisaka RK_U32 ext_align_size = tile_col_cut_num * 64 * 8;
450*437bfbebSnyanmisaka
451*437bfbebSnyanmisaka width = MPP_ALIGN(width, ctu_size);
452*437bfbebSnyanmisaka height = MPP_ALIGN(height, ctu_size);
453*437bfbebSnyanmisaka
454*437bfbebSnyanmisaka /* RCB_STRMD_ROW */
455*437bfbebSnyanmisaka if (width >= 8192) {
456*437bfbebSnyanmisaka RK_U32 factor = 64 / ctu_size;
457*437bfbebSnyanmisaka
458*437bfbebSnyanmisaka rcb_bits = (MPP_ALIGN(width, ctu_size) + factor - 1) / factor * 24 + ext_align_size;
459*437bfbebSnyanmisaka } else
460*437bfbebSnyanmisaka rcb_bits = 0;
461*437bfbebSnyanmisaka rcb_info[RCB_STRMD_ROW].size = MPP_RCB_BYTES(rcb_bits);
462*437bfbebSnyanmisaka
463*437bfbebSnyanmisaka /* RCB_TRANSD_ROW */
464*437bfbebSnyanmisaka if (width >= 8192)
465*437bfbebSnyanmisaka rcb_bits = (MPP_ALIGN(width - 8192, 4) << 1) + ext_align_size;
466*437bfbebSnyanmisaka else
467*437bfbebSnyanmisaka rcb_bits = 0;
468*437bfbebSnyanmisaka rcb_info[RCB_TRANSD_ROW].size = MPP_RCB_BYTES(rcb_bits);
469*437bfbebSnyanmisaka
470*437bfbebSnyanmisaka /* RCB_TRANSD_COL */
471*437bfbebSnyanmisaka if (height >= 8192 && tile_col_cut_num)
472*437bfbebSnyanmisaka rcb_bits = tile_col_cut_num ? (MPP_ALIGN(height - 8192, 4) << 1) : 0;
473*437bfbebSnyanmisaka else
474*437bfbebSnyanmisaka rcb_bits = 0;
475*437bfbebSnyanmisaka rcb_info[RCB_TRANSD_COL].size = MPP_RCB_BYTES(rcb_bits);
476*437bfbebSnyanmisaka
477*437bfbebSnyanmisaka /* RCB_INTER_ROW */
478*437bfbebSnyanmisaka rcb_bits = width * 22 + ext_align_size;
479*437bfbebSnyanmisaka rcb_info[RCB_INTER_ROW].size = MPP_RCB_BYTES(rcb_bits);
480*437bfbebSnyanmisaka
481*437bfbebSnyanmisaka /* RCB_INTER_COL */
482*437bfbebSnyanmisaka rcb_bits = tile_col_cut_num ? (height * 22) : 0;
483*437bfbebSnyanmisaka rcb_info[RCB_INTER_COL].size = MPP_RCB_BYTES(rcb_bits);
484*437bfbebSnyanmisaka
485*437bfbebSnyanmisaka /* RCB_INTRA_ROW */
486*437bfbebSnyanmisaka rcb_bits = width * ((chroma_fmt_idc ? 1 : 0) + 1) * 11 + ext_align_size;
487*437bfbebSnyanmisaka rcb_info[RCB_INTRA_ROW].size = MPP_RCB_BYTES(rcb_bits);
488*437bfbebSnyanmisaka
489*437bfbebSnyanmisaka /* RCB_DBLK_ROW */
490*437bfbebSnyanmisaka if (chroma_fmt_idc == 1 || chroma_fmt_idc == 2) {
491*437bfbebSnyanmisaka if (ctu_size == 32)
492*437bfbebSnyanmisaka rcb_bits = width * ( 4 + 6 * bit_depth);
493*437bfbebSnyanmisaka else
494*437bfbebSnyanmisaka rcb_bits = width * ( 2 + 6 * bit_depth);
495*437bfbebSnyanmisaka } else {
496*437bfbebSnyanmisaka if (ctu_size == 32)
497*437bfbebSnyanmisaka rcb_bits = width * ( 4 + 8 * bit_depth);
498*437bfbebSnyanmisaka else
499*437bfbebSnyanmisaka rcb_bits = width * ( 2 + 8 * bit_depth);
500*437bfbebSnyanmisaka }
501*437bfbebSnyanmisaka rcb_bits += (tile_col_cut_num * (bit_depth == 8 ? 256 : 192)) + ext_align_size;
502*437bfbebSnyanmisaka rcb_info[RCB_DBLK_ROW].size = MPP_RCB_BYTES(rcb_bits);
503*437bfbebSnyanmisaka
504*437bfbebSnyanmisaka /* RCB_SAO_ROW */
505*437bfbebSnyanmisaka if (chroma_fmt_idc == 1 || chroma_fmt_idc == 2) {
506*437bfbebSnyanmisaka rcb_bits = width * (128 / ctu_size + 2 * bit_depth);
507*437bfbebSnyanmisaka } else {
508*437bfbebSnyanmisaka rcb_bits = width * (128 / ctu_size + 3 * bit_depth);
509*437bfbebSnyanmisaka }
510*437bfbebSnyanmisaka rcb_bits += (tile_col_cut_num * (bit_depth == 8 ? 160 : 128)) + ext_align_size;
511*437bfbebSnyanmisaka rcb_info[RCB_SAO_ROW].size = MPP_RCB_BYTES(rcb_bits);
512*437bfbebSnyanmisaka
513*437bfbebSnyanmisaka /* RCB_FBC_ROW */
514*437bfbebSnyanmisaka if (hw_regs->common.reg012.fbc_e) {
515*437bfbebSnyanmisaka rcb_bits = width * (chroma_fmt_idc - 1) * 2 * bit_depth;
516*437bfbebSnyanmisaka rcb_bits += (tile_col_cut_num * (bit_depth == 8 ? 128 : 64)) + ext_align_size;
517*437bfbebSnyanmisaka } else
518*437bfbebSnyanmisaka rcb_bits = 0;
519*437bfbebSnyanmisaka rcb_info[RCB_FBC_ROW].size = MPP_RCB_BYTES(rcb_bits);
520*437bfbebSnyanmisaka
521*437bfbebSnyanmisaka /* RCB_FILT_COL */
522*437bfbebSnyanmisaka if (tile_col_cut_num) {
523*437bfbebSnyanmisaka if (hw_regs->common.reg012.fbc_e) {
524*437bfbebSnyanmisaka RK_U32 ctu_idx = ctu_size >> 5;
525*437bfbebSnyanmisaka RK_U32 a = filterd_fbc_on[ctu_idx][chroma_fmt_idc].a;
526*437bfbebSnyanmisaka RK_U32 b = filterd_fbc_on[ctu_idx][chroma_fmt_idc].b;
527*437bfbebSnyanmisaka
528*437bfbebSnyanmisaka rcb_bits = height * (a * bit_depth + b);
529*437bfbebSnyanmisaka } else {
530*437bfbebSnyanmisaka RK_U32 ctu_idx = ctu_size >> 5;
531*437bfbebSnyanmisaka RK_U32 a = filterd_fbc_off[ctu_idx][chroma_fmt_idc].a;
532*437bfbebSnyanmisaka RK_U32 b = filterd_fbc_off[ctu_idx][chroma_fmt_idc].b;
533*437bfbebSnyanmisaka
534*437bfbebSnyanmisaka rcb_bits = height * (a * bit_depth + b);
535*437bfbebSnyanmisaka }
536*437bfbebSnyanmisaka } else
537*437bfbebSnyanmisaka rcb_bits = 0;
538*437bfbebSnyanmisaka rcb_info[RCB_FILT_COL].size = MPP_RCB_BYTES(rcb_bits);
539*437bfbebSnyanmisaka }
540*437bfbebSnyanmisaka
hal_h265d_rcb_info_update(void * hal,void * dxva,Vdpu382H265dRegSet * hw_regs,RK_S32 width,RK_S32 height)541*437bfbebSnyanmisaka static void hal_h265d_rcb_info_update(void *hal, void *dxva,
542*437bfbebSnyanmisaka Vdpu382H265dRegSet *hw_regs,
543*437bfbebSnyanmisaka RK_S32 width, RK_S32 height)
544*437bfbebSnyanmisaka {
545*437bfbebSnyanmisaka HalH265dCtx *reg_ctx = ( HalH265dCtx *)hal;
546*437bfbebSnyanmisaka h265d_dxva2_picture_context_t *dxva_cxt = (h265d_dxva2_picture_context_t*)dxva;
547*437bfbebSnyanmisaka DXVA_PicParams_HEVC *pp = &dxva_cxt->pp;
548*437bfbebSnyanmisaka RK_U32 chroma_fmt_idc = pp->chroma_format_idc;//0 400,1 4202 ,422,3 444
549*437bfbebSnyanmisaka RK_U8 bit_depth = MPP_MAX(pp->bit_depth_luma_minus8, pp->bit_depth_chroma_minus8) + 8;
550*437bfbebSnyanmisaka RK_U8 ctu_size = 1 << (pp->log2_diff_max_min_luma_coding_block_size + pp->log2_min_luma_coding_block_size_minus3 + 3);
551*437bfbebSnyanmisaka RK_U32 num_tiles = pp->num_tile_rows_minus1 + 1;
552*437bfbebSnyanmisaka
553*437bfbebSnyanmisaka if (reg_ctx->num_row_tiles != num_tiles ||
554*437bfbebSnyanmisaka reg_ctx->bit_depth != bit_depth ||
555*437bfbebSnyanmisaka reg_ctx->chroma_fmt_idc != chroma_fmt_idc ||
556*437bfbebSnyanmisaka reg_ctx->ctu_size != ctu_size ||
557*437bfbebSnyanmisaka reg_ctx->width != width ||
558*437bfbebSnyanmisaka reg_ctx->height != height) {
559*437bfbebSnyanmisaka RK_U32 i = 0;
560*437bfbebSnyanmisaka RK_U32 loop = reg_ctx->fast_mode ? MPP_ARRAY_ELEMS(reg_ctx->g_buf) : 1;
561*437bfbebSnyanmisaka
562*437bfbebSnyanmisaka reg_ctx->rcb_buf_size = vdpu382_get_rcb_buf_size((Vdpu382RcbInfo*)reg_ctx->rcb_info, width, height);
563*437bfbebSnyanmisaka h265d_refine_rcb_size((Vdpu382RcbInfo*)reg_ctx->rcb_info, hw_regs, width, height, dxva_cxt);
564*437bfbebSnyanmisaka
565*437bfbebSnyanmisaka for (i = 0; i < loop; i++) {
566*437bfbebSnyanmisaka MppBuffer rcb_buf;
567*437bfbebSnyanmisaka
568*437bfbebSnyanmisaka if (reg_ctx->rcb_buf[i]) {
569*437bfbebSnyanmisaka mpp_buffer_put(reg_ctx->rcb_buf[i]);
570*437bfbebSnyanmisaka reg_ctx->rcb_buf[i] = NULL;
571*437bfbebSnyanmisaka }
572*437bfbebSnyanmisaka mpp_buffer_get(reg_ctx->group, &rcb_buf, reg_ctx->rcb_buf_size);
573*437bfbebSnyanmisaka reg_ctx->rcb_buf[i] = rcb_buf;
574*437bfbebSnyanmisaka }
575*437bfbebSnyanmisaka
576*437bfbebSnyanmisaka reg_ctx->num_row_tiles = num_tiles;
577*437bfbebSnyanmisaka reg_ctx->bit_depth = bit_depth;
578*437bfbebSnyanmisaka reg_ctx->chroma_fmt_idc = chroma_fmt_idc;
579*437bfbebSnyanmisaka reg_ctx->ctu_size = ctu_size;
580*437bfbebSnyanmisaka reg_ctx->width = width;
581*437bfbebSnyanmisaka reg_ctx->height = height;
582*437bfbebSnyanmisaka }
583*437bfbebSnyanmisaka }
584*437bfbebSnyanmisaka
585*437bfbebSnyanmisaka #define SET_POC_HIGNBIT_INFO(regs, index, field, value)\
586*437bfbebSnyanmisaka do{ \
587*437bfbebSnyanmisaka switch(index){\
588*437bfbebSnyanmisaka case 0: regs.reg200.ref0_##field = value; break;\
589*437bfbebSnyanmisaka case 1: regs.reg200.ref1_##field = value; break;\
590*437bfbebSnyanmisaka case 2: regs.reg200.ref2_##field = value; break;\
591*437bfbebSnyanmisaka case 3: regs.reg200.ref3_##field = value; break;\
592*437bfbebSnyanmisaka case 4: regs.reg200.ref4_##field = value; break;\
593*437bfbebSnyanmisaka case 5: regs.reg200.ref5_##field = value; break;\
594*437bfbebSnyanmisaka case 6: regs.reg200.ref6_##field = value; break;\
595*437bfbebSnyanmisaka case 7: regs.reg200.ref7_##field = value; break;\
596*437bfbebSnyanmisaka case 8: regs.reg201.ref8_##field = value; break;\
597*437bfbebSnyanmisaka case 9: regs.reg201.ref9_##field = value; break;\
598*437bfbebSnyanmisaka case 10: regs.reg201.ref10_##field = value; break;\
599*437bfbebSnyanmisaka case 11: regs.reg201.ref11_##field = value; break;\
600*437bfbebSnyanmisaka case 12: regs.reg201.ref12_##field = value; break;\
601*437bfbebSnyanmisaka case 13: regs.reg201.ref13_##field = value; break;\
602*437bfbebSnyanmisaka case 14: regs.reg201.ref14_##field = value; break;\
603*437bfbebSnyanmisaka case 15: regs.reg201.ref15_##field = value; break;\
604*437bfbebSnyanmisaka default: break;}\
605*437bfbebSnyanmisaka }while(0)
606*437bfbebSnyanmisaka
607*437bfbebSnyanmisaka #define pocdistance(a, b) (((a) > (b)) ? ((a) - (b)) : ((b) - (a)))
608*437bfbebSnyanmisaka
hal_h265d_vdpu382_setup_colmv_buf(void * hal,HalTaskInfo * syn)609*437bfbebSnyanmisaka static MPP_RET hal_h265d_vdpu382_setup_colmv_buf(void *hal, HalTaskInfo *syn)
610*437bfbebSnyanmisaka {
611*437bfbebSnyanmisaka HalH265dCtx *reg_ctx = ( HalH265dCtx *)hal;
612*437bfbebSnyanmisaka h265d_dxva2_picture_context_t *dxva_cxt = (h265d_dxva2_picture_context_t *)syn->dec.syntax.data;
613*437bfbebSnyanmisaka DXVA_PicParams_HEVC *pp = &dxva_cxt->pp;
614*437bfbebSnyanmisaka RK_U8 ctu_size = 1 << (pp->log2_diff_max_min_luma_coding_block_size +
615*437bfbebSnyanmisaka pp->log2_min_luma_coding_block_size_minus3 + 3);
616*437bfbebSnyanmisaka RK_U32 log2_min_cb_size = dxva_cxt->pp.log2_min_luma_coding_block_size_minus3 + 3;
617*437bfbebSnyanmisaka
618*437bfbebSnyanmisaka RK_U32 width = (dxva_cxt->pp.PicWidthInMinCbsY << log2_min_cb_size);
619*437bfbebSnyanmisaka RK_U32 height = (dxva_cxt->pp.PicHeightInMinCbsY << log2_min_cb_size);
620*437bfbebSnyanmisaka RK_U32 mv_size = 0, colmv_size = 16, colmv_byte = 16;
621*437bfbebSnyanmisaka RK_U32 compress = reg_ctx->hw_info ? reg_ctx->hw_info->cap_colmv_compress : 1;
622*437bfbebSnyanmisaka
623*437bfbebSnyanmisaka
624*437bfbebSnyanmisaka mv_size = vdpu382_get_colmv_size(width, height, ctu_size, colmv_byte, colmv_size, compress);
625*437bfbebSnyanmisaka
626*437bfbebSnyanmisaka if (reg_ctx->cmv_bufs == NULL || reg_ctx->mv_size < mv_size) {
627*437bfbebSnyanmisaka size_t size = mv_size;
628*437bfbebSnyanmisaka
629*437bfbebSnyanmisaka if (reg_ctx->cmv_bufs) {
630*437bfbebSnyanmisaka hal_bufs_deinit(reg_ctx->cmv_bufs);
631*437bfbebSnyanmisaka reg_ctx->cmv_bufs = NULL;
632*437bfbebSnyanmisaka }
633*437bfbebSnyanmisaka
634*437bfbebSnyanmisaka hal_bufs_init(®_ctx->cmv_bufs);
635*437bfbebSnyanmisaka if (reg_ctx->cmv_bufs == NULL) {
636*437bfbebSnyanmisaka mpp_err_f("colmv bufs init fail");
637*437bfbebSnyanmisaka return MPP_ERR_NOMEM;;
638*437bfbebSnyanmisaka }
639*437bfbebSnyanmisaka
640*437bfbebSnyanmisaka reg_ctx->mv_size = mv_size;
641*437bfbebSnyanmisaka reg_ctx->mv_count = mpp_buf_slot_get_count(reg_ctx->slots);
642*437bfbebSnyanmisaka hal_bufs_setup(reg_ctx->cmv_bufs, reg_ctx->mv_count, 1, &size);
643*437bfbebSnyanmisaka }
644*437bfbebSnyanmisaka
645*437bfbebSnyanmisaka return MPP_OK;
646*437bfbebSnyanmisaka }
647*437bfbebSnyanmisaka
hal_h265d_vdpu382_gen_regs(void * hal,HalTaskInfo * syn)648*437bfbebSnyanmisaka static MPP_RET hal_h265d_vdpu382_gen_regs(void *hal, HalTaskInfo *syn)
649*437bfbebSnyanmisaka {
650*437bfbebSnyanmisaka RK_S32 i = 0;
651*437bfbebSnyanmisaka RK_S32 log2_min_cb_size;
652*437bfbebSnyanmisaka RK_S32 width, height;
653*437bfbebSnyanmisaka RK_S32 stride_y, stride_uv, virstrid_y;
654*437bfbebSnyanmisaka Vdpu382H265dRegSet *hw_regs;
655*437bfbebSnyanmisaka RK_S32 ret = MPP_SUCCESS;
656*437bfbebSnyanmisaka MppBuffer streambuf = NULL;
657*437bfbebSnyanmisaka RK_S32 aglin_offset = 0;
658*437bfbebSnyanmisaka RK_S32 valid_ref = -1;
659*437bfbebSnyanmisaka MppBuffer framebuf = NULL;
660*437bfbebSnyanmisaka HalBuf *mv_buf = NULL;
661*437bfbebSnyanmisaka RK_S32 fd = -1;
662*437bfbebSnyanmisaka RK_S32 distance = INT_MAX;
663*437bfbebSnyanmisaka h265d_dxva2_picture_context_t *dxva_cxt =
664*437bfbebSnyanmisaka (h265d_dxva2_picture_context_t *)syn->dec.syntax.data;
665*437bfbebSnyanmisaka HalH265dCtx *reg_ctx = ( HalH265dCtx *)hal;
666*437bfbebSnyanmisaka void *rps_ptr = NULL;
667*437bfbebSnyanmisaka RK_U32 stream_buf_size = 0;
668*437bfbebSnyanmisaka
669*437bfbebSnyanmisaka if (syn->dec.flags.parse_err ||
670*437bfbebSnyanmisaka (syn->dec.flags.ref_err && !reg_ctx->cfg->base.disable_error)) {
671*437bfbebSnyanmisaka h265h_dbg(H265H_DBG_TASK_ERR, "%s found task error\n", __FUNCTION__);
672*437bfbebSnyanmisaka return MPP_OK;
673*437bfbebSnyanmisaka }
674*437bfbebSnyanmisaka
675*437bfbebSnyanmisaka if (reg_ctx ->fast_mode) {
676*437bfbebSnyanmisaka for (i = 0; i < MAX_GEN_REG; i++) {
677*437bfbebSnyanmisaka if (!reg_ctx->g_buf[i].use_flag) {
678*437bfbebSnyanmisaka syn->dec.reg_index = i;
679*437bfbebSnyanmisaka
680*437bfbebSnyanmisaka reg_ctx->spspps_offset = reg_ctx->offset_spspps[i];
681*437bfbebSnyanmisaka reg_ctx->rps_offset = reg_ctx->offset_rps[i];
682*437bfbebSnyanmisaka reg_ctx->sclst_offset = reg_ctx->offset_sclst[i];
683*437bfbebSnyanmisaka
684*437bfbebSnyanmisaka reg_ctx->hw_regs = reg_ctx->g_buf[i].hw_regs;
685*437bfbebSnyanmisaka reg_ctx->g_buf[i].use_flag = 1;
686*437bfbebSnyanmisaka break;
687*437bfbebSnyanmisaka }
688*437bfbebSnyanmisaka }
689*437bfbebSnyanmisaka if (i == MAX_GEN_REG) {
690*437bfbebSnyanmisaka mpp_err("hevc rps buf all used");
691*437bfbebSnyanmisaka return MPP_ERR_NOMEM;
692*437bfbebSnyanmisaka }
693*437bfbebSnyanmisaka } else {
694*437bfbebSnyanmisaka syn->dec.reg_index = 0;
695*437bfbebSnyanmisaka }
696*437bfbebSnyanmisaka rps_ptr = mpp_buffer_get_ptr(reg_ctx->bufs) + reg_ctx->rps_offset;
697*437bfbebSnyanmisaka if (NULL == rps_ptr) {
698*437bfbebSnyanmisaka
699*437bfbebSnyanmisaka mpp_err("rps_data get ptr error");
700*437bfbebSnyanmisaka return MPP_ERR_NOMEM;
701*437bfbebSnyanmisaka }
702*437bfbebSnyanmisaka
703*437bfbebSnyanmisaka
704*437bfbebSnyanmisaka if (syn->dec.syntax.data == NULL) {
705*437bfbebSnyanmisaka mpp_err("%s:%s:%d dxva is NULL", __FILE__, __FUNCTION__, __LINE__);
706*437bfbebSnyanmisaka return MPP_ERR_NULL_PTR;
707*437bfbebSnyanmisaka }
708*437bfbebSnyanmisaka
709*437bfbebSnyanmisaka /* output pps */
710*437bfbebSnyanmisaka hw_regs = (Vdpu382H265dRegSet*)reg_ctx->hw_regs;
711*437bfbebSnyanmisaka memset(hw_regs, 0, sizeof(Vdpu382H265dRegSet));
712*437bfbebSnyanmisaka
713*437bfbebSnyanmisaka if (NULL == reg_ctx->hw_regs) {
714*437bfbebSnyanmisaka return MPP_ERR_NULL_PTR;
715*437bfbebSnyanmisaka }
716*437bfbebSnyanmisaka
717*437bfbebSnyanmisaka
718*437bfbebSnyanmisaka log2_min_cb_size = dxva_cxt->pp.log2_min_luma_coding_block_size_minus3 + 3;
719*437bfbebSnyanmisaka
720*437bfbebSnyanmisaka width = (dxva_cxt->pp.PicWidthInMinCbsY << log2_min_cb_size);
721*437bfbebSnyanmisaka height = (dxva_cxt->pp.PicHeightInMinCbsY << log2_min_cb_size);
722*437bfbebSnyanmisaka ret = hal_h265d_vdpu382_setup_colmv_buf(hal, syn);
723*437bfbebSnyanmisaka if (ret)
724*437bfbebSnyanmisaka return MPP_ERR_NOMEM;
725*437bfbebSnyanmisaka
726*437bfbebSnyanmisaka {
727*437bfbebSnyanmisaka MppFrame mframe = NULL;
728*437bfbebSnyanmisaka RK_U32 ver_virstride;
729*437bfbebSnyanmisaka
730*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->slots, dxva_cxt->pp.CurrPic.Index7Bits,
731*437bfbebSnyanmisaka SLOT_FRAME_PTR, &mframe);
732*437bfbebSnyanmisaka stride_y = mpp_frame_get_hor_stride(mframe);
733*437bfbebSnyanmisaka ver_virstride = mpp_frame_get_ver_stride(mframe);
734*437bfbebSnyanmisaka stride_uv = stride_y;
735*437bfbebSnyanmisaka virstrid_y = ver_virstride * stride_y;
736*437bfbebSnyanmisaka hw_regs->common.reg013.h26x_error_mode = 1;
737*437bfbebSnyanmisaka hw_regs->common.reg021.error_deb_en = 1;
738*437bfbebSnyanmisaka hw_regs->common.reg021.inter_error_prc_mode = 0;
739*437bfbebSnyanmisaka hw_regs->common.reg021.error_intra_mode = 1;
740*437bfbebSnyanmisaka
741*437bfbebSnyanmisaka hw_regs->common.reg017.slice_num = dxva_cxt->slice_count;
742*437bfbebSnyanmisaka hw_regs->h265d_param.reg64.h26x_rps_mode = 0;
743*437bfbebSnyanmisaka hw_regs->h265d_param.reg64.h26x_frame_orslice = 0;
744*437bfbebSnyanmisaka hw_regs->h265d_param.reg64.h26x_stream_mode = 0;
745*437bfbebSnyanmisaka
746*437bfbebSnyanmisaka if (MPP_FRAME_FMT_IS_FBC(mpp_frame_get_fmt(mframe))) {
747*437bfbebSnyanmisaka RK_U32 fbc_hdr_stride = mpp_frame_get_fbc_hdr_stride(mframe);
748*437bfbebSnyanmisaka RK_U32 fbd_offset = MPP_ALIGN(fbc_hdr_stride * (ver_virstride + 64) / 16, SZ_4K);
749*437bfbebSnyanmisaka
750*437bfbebSnyanmisaka hw_regs->common.reg012.fbc_e = 1;
751*437bfbebSnyanmisaka hw_regs->common.reg018.y_hor_virstride = fbc_hdr_stride >> 4;
752*437bfbebSnyanmisaka hw_regs->common.reg019.uv_hor_virstride = fbc_hdr_stride >> 4;
753*437bfbebSnyanmisaka hw_regs->common.reg020_fbc_payload_off.payload_st_offset = fbd_offset >> 4;
754*437bfbebSnyanmisaka } else {
755*437bfbebSnyanmisaka hw_regs->common.reg012.fbc_e = 0;
756*437bfbebSnyanmisaka hw_regs->common.reg018.y_hor_virstride = stride_y >> 4;
757*437bfbebSnyanmisaka hw_regs->common.reg019.uv_hor_virstride = stride_uv >> 4;
758*437bfbebSnyanmisaka hw_regs->common.reg020_y_virstride.y_virstride = virstrid_y >> 4;
759*437bfbebSnyanmisaka }
760*437bfbebSnyanmisaka }
761*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->slots, dxva_cxt->pp.CurrPic.Index7Bits,
762*437bfbebSnyanmisaka SLOT_BUFFER, &framebuf);
763*437bfbebSnyanmisaka hw_regs->common_addr.reg130_decout_base = mpp_buffer_get_fd(framebuf); //just index need map
764*437bfbebSnyanmisaka /*if out_base is equal to zero it means this frame may error
765*437bfbebSnyanmisaka we return directly add by csy*/
766*437bfbebSnyanmisaka
767*437bfbebSnyanmisaka if (hw_regs->common_addr.reg130_decout_base == 0) {
768*437bfbebSnyanmisaka return 0;
769*437bfbebSnyanmisaka }
770*437bfbebSnyanmisaka fd = mpp_buffer_get_fd(framebuf);
771*437bfbebSnyanmisaka hw_regs->common_addr.reg130_decout_base = fd;
772*437bfbebSnyanmisaka mv_buf = hal_bufs_get_buf(reg_ctx->cmv_bufs, dxva_cxt->pp.CurrPic.Index7Bits);
773*437bfbebSnyanmisaka hw_regs->common_addr.reg131_colmv_cur_base = mpp_buffer_get_fd(mv_buf->buf[0]);
774*437bfbebSnyanmisaka
775*437bfbebSnyanmisaka hw_regs->h265d_param.reg65.cur_top_poc = dxva_cxt->pp.CurrPicOrderCntVal;
776*437bfbebSnyanmisaka
777*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->packet_slots, syn->dec.input, SLOT_BUFFER,
778*437bfbebSnyanmisaka &streambuf);
779*437bfbebSnyanmisaka if ( dxva_cxt->bitstream == NULL) {
780*437bfbebSnyanmisaka dxva_cxt->bitstream = mpp_buffer_get_ptr(streambuf);
781*437bfbebSnyanmisaka }
782*437bfbebSnyanmisaka #ifdef HW_RPS
783*437bfbebSnyanmisaka hw_regs->h265d_param.reg103.ref_pic_layer_same_with_cur = 0xffff;
784*437bfbebSnyanmisaka hal_h265d_slice_hw_rps(syn->dec.syntax.data, rps_ptr, reg_ctx->sw_rps_buf, reg_ctx->fast_mode);
785*437bfbebSnyanmisaka #else
786*437bfbebSnyanmisaka hw_regs->sw_sysctrl.sw_h26x_rps_mode = 1;
787*437bfbebSnyanmisaka hal_h265d_slice_output_rps(syn->dec.syntax.data, rps_ptr);
788*437bfbebSnyanmisaka #endif
789*437bfbebSnyanmisaka
790*437bfbebSnyanmisaka /* cabac table */
791*437bfbebSnyanmisaka hw_regs->h265d_addr.reg197_cabactbl_base = reg_ctx->bufs_fd;
792*437bfbebSnyanmisaka /* pps */
793*437bfbebSnyanmisaka hw_regs->h265d_addr.reg161_pps_base = reg_ctx->bufs_fd;
794*437bfbebSnyanmisaka hw_regs->h265d_addr.reg163_rps_base = reg_ctx->bufs_fd;
795*437bfbebSnyanmisaka
796*437bfbebSnyanmisaka hw_regs->common_addr.reg128_rlc_base = mpp_buffer_get_fd(streambuf);
797*437bfbebSnyanmisaka hw_regs->common_addr.reg129_rlcwrite_base = mpp_buffer_get_fd(streambuf);
798*437bfbebSnyanmisaka stream_buf_size = mpp_buffer_get_size(streambuf);
799*437bfbebSnyanmisaka hw_regs->common.reg016_str_len = ((dxva_cxt->bitstream_size + 15)
800*437bfbebSnyanmisaka & (~15)) + 64;
801*437bfbebSnyanmisaka hw_regs->common.reg016_str_len = stream_buf_size > hw_regs->common.reg016_str_len ?
802*437bfbebSnyanmisaka hw_regs->common.reg016_str_len : stream_buf_size;
803*437bfbebSnyanmisaka
804*437bfbebSnyanmisaka aglin_offset = hw_regs->common.reg016_str_len - dxva_cxt->bitstream_size;
805*437bfbebSnyanmisaka if (aglin_offset > 0) {
806*437bfbebSnyanmisaka memset((void *)(dxva_cxt->bitstream + dxva_cxt->bitstream_size), 0,
807*437bfbebSnyanmisaka aglin_offset);
808*437bfbebSnyanmisaka }
809*437bfbebSnyanmisaka hw_regs->common.reg010.dec_e = 1;
810*437bfbebSnyanmisaka hw_regs->common.reg012.colmv_compress_en = reg_ctx->hw_info ?
811*437bfbebSnyanmisaka reg_ctx->hw_info->cap_colmv_compress : 0;
812*437bfbebSnyanmisaka
813*437bfbebSnyanmisaka hw_regs->common.reg024.cabac_err_en_lowbits = 0xffffdfff;
814*437bfbebSnyanmisaka hw_regs->common.reg025.cabac_err_en_highbits = 0x3ffbf9ff;
815*437bfbebSnyanmisaka
816*437bfbebSnyanmisaka hw_regs->common.reg011.dec_clkgate_e = 1;
817*437bfbebSnyanmisaka hw_regs->common.reg011.err_head_fill_e = 1;
818*437bfbebSnyanmisaka hw_regs->common.reg011.err_colmv_fill_e = 1;
819*437bfbebSnyanmisaka
820*437bfbebSnyanmisaka hw_regs->common.reg026.inter_auto_gating_e = 1;
821*437bfbebSnyanmisaka hw_regs->common.reg026.filterd_auto_gating_e = 1;
822*437bfbebSnyanmisaka hw_regs->common.reg026.strmd_auto_gating_e = 1;
823*437bfbebSnyanmisaka hw_regs->common.reg026.mcp_auto_gating_e = 1;
824*437bfbebSnyanmisaka hw_regs->common.reg026.busifd_auto_gating_e = 1;
825*437bfbebSnyanmisaka hw_regs->common.reg026.dec_ctrl_auto_gating_e = 1;
826*437bfbebSnyanmisaka hw_regs->common.reg026.intra_auto_gating_e = 1;
827*437bfbebSnyanmisaka hw_regs->common.reg026.mc_auto_gating_e = 1;
828*437bfbebSnyanmisaka hw_regs->common.reg026.transd_auto_gating_e = 1;
829*437bfbebSnyanmisaka hw_regs->common.reg026.sram_auto_gating_e = 1;
830*437bfbebSnyanmisaka hw_regs->common.reg026.cru_auto_gating_e = 1;
831*437bfbebSnyanmisaka hw_regs->common.reg026.reg_cfg_gating_en = 1;
832*437bfbebSnyanmisaka hw_regs->common.reg032_timeout_threshold = 0x3ffff;
833*437bfbebSnyanmisaka
834*437bfbebSnyanmisaka valid_ref = hw_regs->common_addr.reg130_decout_base;
835*437bfbebSnyanmisaka reg_ctx->error_index[syn->dec.reg_index] = dxva_cxt->pp.CurrPic.Index7Bits;
836*437bfbebSnyanmisaka hw_regs->common_addr.reg132_error_ref_base = valid_ref;
837*437bfbebSnyanmisaka
838*437bfbebSnyanmisaka memset(&hw_regs->highpoc.reg205, 0, sizeof(RK_U32));
839*437bfbebSnyanmisaka
840*437bfbebSnyanmisaka for (i = 0; i < (RK_S32)MPP_ARRAY_ELEMS(dxva_cxt->pp.RefPicList); i++) {
841*437bfbebSnyanmisaka if (dxva_cxt->pp.RefPicList[i].bPicEntry != 0xff &&
842*437bfbebSnyanmisaka dxva_cxt->pp.RefPicList[i].bPicEntry != 0x7f) {
843*437bfbebSnyanmisaka
844*437bfbebSnyanmisaka MppFrame mframe = NULL;
845*437bfbebSnyanmisaka hw_regs->h265d_param.reg67_82_ref_poc[i] = dxva_cxt->pp.PicOrderCntValList[i];
846*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->slots,
847*437bfbebSnyanmisaka dxva_cxt->pp.RefPicList[i].Index7Bits,
848*437bfbebSnyanmisaka SLOT_BUFFER, &framebuf);
849*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->slots, dxva_cxt->pp.RefPicList[i].Index7Bits,
850*437bfbebSnyanmisaka SLOT_FRAME_PTR, &mframe);
851*437bfbebSnyanmisaka if (framebuf != NULL) {
852*437bfbebSnyanmisaka hw_regs->h265d_addr.reg164_179_ref_base[i] = mpp_buffer_get_fd(framebuf);
853*437bfbebSnyanmisaka valid_ref = hw_regs->h265d_addr.reg164_179_ref_base[i];
854*437bfbebSnyanmisaka // mpp_log("cur poc %d, ref poc %d", dxva_cxt->pp.current_poc, dxva_cxt->pp.PicOrderCntValList[i]);
855*437bfbebSnyanmisaka if ((pocdistance(dxva_cxt->pp.PicOrderCntValList[i], dxva_cxt->pp.current_poc) < distance)
856*437bfbebSnyanmisaka && (!mpp_frame_get_errinfo(mframe))) {
857*437bfbebSnyanmisaka distance = pocdistance(dxva_cxt->pp.PicOrderCntValList[i], dxva_cxt->pp.current_poc);
858*437bfbebSnyanmisaka hw_regs->common_addr.reg132_error_ref_base = hw_regs->h265d_addr.reg164_179_ref_base[i];
859*437bfbebSnyanmisaka reg_ctx->error_index[syn->dec.reg_index] = dxva_cxt->pp.RefPicList[i].Index7Bits;
860*437bfbebSnyanmisaka hw_regs->common.reg021.error_intra_mode = 0;
861*437bfbebSnyanmisaka
862*437bfbebSnyanmisaka }
863*437bfbebSnyanmisaka } else {
864*437bfbebSnyanmisaka hw_regs->h265d_addr.reg164_179_ref_base[i] = valid_ref;
865*437bfbebSnyanmisaka }
866*437bfbebSnyanmisaka
867*437bfbebSnyanmisaka mv_buf = hal_bufs_get_buf(reg_ctx->cmv_bufs, dxva_cxt->pp.RefPicList[i].Index7Bits);
868*437bfbebSnyanmisaka hw_regs->h265d_addr.reg181_196_colmv_base[i] = mpp_buffer_get_fd(mv_buf->buf[0]);
869*437bfbebSnyanmisaka
870*437bfbebSnyanmisaka SET_REF_VALID(hw_regs->h265d_param, i, 1);
871*437bfbebSnyanmisaka }
872*437bfbebSnyanmisaka }
873*437bfbebSnyanmisaka
874*437bfbebSnyanmisaka if ((reg_ctx->error_index[syn->dec.reg_index] == dxva_cxt->pp.CurrPic.Index7Bits) &&
875*437bfbebSnyanmisaka !dxva_cxt->pp.IntraPicFlag) {
876*437bfbebSnyanmisaka h265h_dbg(H265H_DBG_TASK_ERR, "current frm may be err, should skip process");
877*437bfbebSnyanmisaka syn->dec.flags.ref_err = 1;
878*437bfbebSnyanmisaka return MPP_OK;
879*437bfbebSnyanmisaka }
880*437bfbebSnyanmisaka
881*437bfbebSnyanmisaka for (i = 0; i < (RK_S32)MPP_ARRAY_ELEMS(dxva_cxt->pp.RefPicList); i++) {
882*437bfbebSnyanmisaka
883*437bfbebSnyanmisaka if (dxva_cxt->pp.RefPicList[i].bPicEntry != 0xff &&
884*437bfbebSnyanmisaka dxva_cxt->pp.RefPicList[i].bPicEntry != 0x7f) {
885*437bfbebSnyanmisaka MppFrame mframe = NULL;
886*437bfbebSnyanmisaka
887*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->slots,
888*437bfbebSnyanmisaka dxva_cxt->pp.RefPicList[i].Index7Bits,
889*437bfbebSnyanmisaka SLOT_BUFFER, &framebuf);
890*437bfbebSnyanmisaka
891*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->slots, dxva_cxt->pp.RefPicList[i].Index7Bits,
892*437bfbebSnyanmisaka SLOT_FRAME_PTR, &mframe);
893*437bfbebSnyanmisaka
894*437bfbebSnyanmisaka if (framebuf == NULL || mpp_frame_get_errinfo(mframe)) {
895*437bfbebSnyanmisaka mv_buf = hal_bufs_get_buf(reg_ctx->cmv_bufs, reg_ctx->error_index[syn->dec.reg_index]);
896*437bfbebSnyanmisaka hw_regs->h265d_addr.reg164_179_ref_base[i] = hw_regs->common_addr.reg132_error_ref_base;
897*437bfbebSnyanmisaka hw_regs->h265d_addr.reg181_196_colmv_base[i] = mpp_buffer_get_fd(mv_buf->buf[0]);
898*437bfbebSnyanmisaka }
899*437bfbebSnyanmisaka } else {
900*437bfbebSnyanmisaka mv_buf = hal_bufs_get_buf(reg_ctx->cmv_bufs, reg_ctx->error_index[syn->dec.reg_index]);
901*437bfbebSnyanmisaka hw_regs->h265d_addr.reg164_179_ref_base[i] = hw_regs->common_addr.reg132_error_ref_base;
902*437bfbebSnyanmisaka hw_regs->h265d_addr.reg181_196_colmv_base[i] = mpp_buffer_get_fd(mv_buf->buf[0]);
903*437bfbebSnyanmisaka /* mark 3 to differ from current frame */
904*437bfbebSnyanmisaka if (reg_ctx->error_index[syn->dec.reg_index] == dxva_cxt->pp.CurrPic.Index7Bits)
905*437bfbebSnyanmisaka SET_POC_HIGNBIT_INFO(hw_regs->highpoc, i, poc_highbit, 3);
906*437bfbebSnyanmisaka }
907*437bfbebSnyanmisaka }
908*437bfbebSnyanmisaka hal_h265d_v382_output_pps_packet(hal, syn->dec.syntax.data);
909*437bfbebSnyanmisaka
910*437bfbebSnyanmisaka mpp_dev_set_reg_offset(reg_ctx->dev, 161, reg_ctx->spspps_offset);
911*437bfbebSnyanmisaka /* rps */
912*437bfbebSnyanmisaka mpp_dev_set_reg_offset(reg_ctx->dev, 163, reg_ctx->rps_offset);
913*437bfbebSnyanmisaka
914*437bfbebSnyanmisaka hw_regs->common.reg013.cur_pic_is_idr = dxva_cxt->pp.IdrPicFlag;//p_hal->slice_long->idr_flag;
915*437bfbebSnyanmisaka
916*437bfbebSnyanmisaka hw_regs->common.reg011.buf_empty_en = 1;
917*437bfbebSnyanmisaka
918*437bfbebSnyanmisaka hal_h265d_rcb_info_update(hal, dxva_cxt, hw_regs, width, height);
919*437bfbebSnyanmisaka vdpu382_setup_rcb(&hw_regs->common_addr, reg_ctx->dev, reg_ctx->fast_mode ?
920*437bfbebSnyanmisaka reg_ctx->rcb_buf[syn->dec.reg_index] : reg_ctx->rcb_buf[0],
921*437bfbebSnyanmisaka (Vdpu382RcbInfo*)reg_ctx->rcb_info);
922*437bfbebSnyanmisaka {
923*437bfbebSnyanmisaka MppFrame mframe = NULL;
924*437bfbebSnyanmisaka
925*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->slots, dxva_cxt->pp.CurrPic.Index7Bits,
926*437bfbebSnyanmisaka SLOT_FRAME_PTR, &mframe);
927*437bfbebSnyanmisaka
928*437bfbebSnyanmisaka if (mpp_frame_get_thumbnail_en(mframe)) {
929*437bfbebSnyanmisaka hw_regs->h265d_addr.reg198_scale_down_luma_base =
930*437bfbebSnyanmisaka hw_regs->common_addr.reg130_decout_base;
931*437bfbebSnyanmisaka hw_regs->h265d_addr.reg199_scale_down_chorme_base =
932*437bfbebSnyanmisaka hw_regs->common_addr.reg130_decout_base;
933*437bfbebSnyanmisaka vdpu382_setup_down_scale(mframe, reg_ctx->dev, &hw_regs->common);
934*437bfbebSnyanmisaka } else {
935*437bfbebSnyanmisaka hw_regs->h265d_addr.reg198_scale_down_luma_base = 0;
936*437bfbebSnyanmisaka hw_regs->h265d_addr.reg199_scale_down_chorme_base = 0;
937*437bfbebSnyanmisaka hw_regs->common.reg012.scale_down_en = 0;
938*437bfbebSnyanmisaka }
939*437bfbebSnyanmisaka }
940*437bfbebSnyanmisaka vdpu382_setup_statistic(&hw_regs->common, &hw_regs->statistic);
941*437bfbebSnyanmisaka mpp_buffer_sync_end(reg_ctx->bufs);
942*437bfbebSnyanmisaka
943*437bfbebSnyanmisaka return ret;
944*437bfbebSnyanmisaka }
945*437bfbebSnyanmisaka
hal_h265d_vdpu382_start(void * hal,HalTaskInfo * task)946*437bfbebSnyanmisaka static MPP_RET hal_h265d_vdpu382_start(void *hal, HalTaskInfo *task)
947*437bfbebSnyanmisaka {
948*437bfbebSnyanmisaka MPP_RET ret = MPP_OK;
949*437bfbebSnyanmisaka RK_U8* p = NULL;
950*437bfbebSnyanmisaka Vdpu382H265dRegSet *hw_regs = NULL;
951*437bfbebSnyanmisaka HalH265dCtx *reg_ctx = (HalH265dCtx *)hal;
952*437bfbebSnyanmisaka RK_S32 index = task->dec.reg_index;
953*437bfbebSnyanmisaka
954*437bfbebSnyanmisaka RK_U32 i;
955*437bfbebSnyanmisaka
956*437bfbebSnyanmisaka if (task->dec.flags.parse_err ||
957*437bfbebSnyanmisaka (task->dec.flags.ref_err && !reg_ctx->cfg->base.disable_error)) {
958*437bfbebSnyanmisaka h265h_dbg(H265H_DBG_TASK_ERR, "%s found task error\n", __FUNCTION__);
959*437bfbebSnyanmisaka return MPP_OK;
960*437bfbebSnyanmisaka }
961*437bfbebSnyanmisaka
962*437bfbebSnyanmisaka if (reg_ctx->fast_mode) {
963*437bfbebSnyanmisaka p = (RK_U8*)reg_ctx->g_buf[index].hw_regs;
964*437bfbebSnyanmisaka hw_regs = ( Vdpu382H265dRegSet *)reg_ctx->g_buf[index].hw_regs;
965*437bfbebSnyanmisaka } else {
966*437bfbebSnyanmisaka p = (RK_U8*)reg_ctx->hw_regs;
967*437bfbebSnyanmisaka hw_regs = ( Vdpu382H265dRegSet *)reg_ctx->hw_regs;
968*437bfbebSnyanmisaka }
969*437bfbebSnyanmisaka
970*437bfbebSnyanmisaka if (hw_regs == NULL) {
971*437bfbebSnyanmisaka mpp_err("hal_h265d_start hw_regs is NULL");
972*437bfbebSnyanmisaka return MPP_ERR_NULL_PTR;
973*437bfbebSnyanmisaka }
974*437bfbebSnyanmisaka for (i = 0; i < 68; i++) {
975*437bfbebSnyanmisaka h265h_dbg(H265H_DBG_REG, "RK_HEVC_DEC: regs[%02d]=%08X\n",
976*437bfbebSnyanmisaka i, *((RK_U32*)p));
977*437bfbebSnyanmisaka //mpp_log("RK_HEVC_DEC: regs[%02d]=%08X\n", i, *((RK_U32*)p));
978*437bfbebSnyanmisaka p += 4;
979*437bfbebSnyanmisaka }
980*437bfbebSnyanmisaka
981*437bfbebSnyanmisaka do {
982*437bfbebSnyanmisaka MppDevRegWrCfg wr_cfg;
983*437bfbebSnyanmisaka MppDevRegRdCfg rd_cfg;
984*437bfbebSnyanmisaka
985*437bfbebSnyanmisaka wr_cfg.reg = &hw_regs->common;
986*437bfbebSnyanmisaka wr_cfg.size = sizeof(hw_regs->common);
987*437bfbebSnyanmisaka wr_cfg.offset = OFFSET_COMMON_REGS;
988*437bfbebSnyanmisaka
989*437bfbebSnyanmisaka ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_REG_WR, &wr_cfg);
990*437bfbebSnyanmisaka if (ret) {
991*437bfbebSnyanmisaka mpp_err_f("set register write failed %d\n", ret);
992*437bfbebSnyanmisaka break;
993*437bfbebSnyanmisaka }
994*437bfbebSnyanmisaka
995*437bfbebSnyanmisaka wr_cfg.reg = &hw_regs->h265d_param;
996*437bfbebSnyanmisaka wr_cfg.size = sizeof(hw_regs->h265d_param);
997*437bfbebSnyanmisaka wr_cfg.offset = OFFSET_CODEC_PARAMS_REGS;
998*437bfbebSnyanmisaka
999*437bfbebSnyanmisaka ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_REG_WR, &wr_cfg);
1000*437bfbebSnyanmisaka if (ret) {
1001*437bfbebSnyanmisaka mpp_err_f("set register write failed %d\n", ret);
1002*437bfbebSnyanmisaka break;
1003*437bfbebSnyanmisaka }
1004*437bfbebSnyanmisaka
1005*437bfbebSnyanmisaka wr_cfg.reg = &hw_regs->common_addr;
1006*437bfbebSnyanmisaka wr_cfg.size = sizeof(hw_regs->common_addr);
1007*437bfbebSnyanmisaka wr_cfg.offset = OFFSET_COMMON_ADDR_REGS;
1008*437bfbebSnyanmisaka
1009*437bfbebSnyanmisaka ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_REG_WR, &wr_cfg);
1010*437bfbebSnyanmisaka if (ret) {
1011*437bfbebSnyanmisaka mpp_err_f("set register write failed %d\n", ret);
1012*437bfbebSnyanmisaka break;
1013*437bfbebSnyanmisaka }
1014*437bfbebSnyanmisaka
1015*437bfbebSnyanmisaka wr_cfg.reg = &hw_regs->h265d_addr;
1016*437bfbebSnyanmisaka wr_cfg.size = sizeof(hw_regs->h265d_addr);
1017*437bfbebSnyanmisaka wr_cfg.offset = OFFSET_CODEC_ADDR_REGS;
1018*437bfbebSnyanmisaka
1019*437bfbebSnyanmisaka ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_REG_WR, &wr_cfg);
1020*437bfbebSnyanmisaka if (ret) {
1021*437bfbebSnyanmisaka mpp_err_f("set register write failed %d\n", ret);
1022*437bfbebSnyanmisaka break;
1023*437bfbebSnyanmisaka }
1024*437bfbebSnyanmisaka
1025*437bfbebSnyanmisaka wr_cfg.reg = &hw_regs->statistic;
1026*437bfbebSnyanmisaka wr_cfg.size = sizeof(hw_regs->statistic);
1027*437bfbebSnyanmisaka wr_cfg.offset = OFFSET_STATISTIC_REGS;
1028*437bfbebSnyanmisaka
1029*437bfbebSnyanmisaka ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_REG_WR, &wr_cfg);
1030*437bfbebSnyanmisaka if (ret) {
1031*437bfbebSnyanmisaka mpp_err_f("set register write failed %d\n", ret);
1032*437bfbebSnyanmisaka break;
1033*437bfbebSnyanmisaka }
1034*437bfbebSnyanmisaka
1035*437bfbebSnyanmisaka wr_cfg.reg = &hw_regs->highpoc;
1036*437bfbebSnyanmisaka wr_cfg.size = sizeof(hw_regs->highpoc);
1037*437bfbebSnyanmisaka wr_cfg.offset = OFFSET_POC_HIGHBIT_REGS;
1038*437bfbebSnyanmisaka
1039*437bfbebSnyanmisaka ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_REG_WR, &wr_cfg);
1040*437bfbebSnyanmisaka if (ret) {
1041*437bfbebSnyanmisaka mpp_err_f("set register write failed %d\n", ret);
1042*437bfbebSnyanmisaka break;
1043*437bfbebSnyanmisaka }
1044*437bfbebSnyanmisaka
1045*437bfbebSnyanmisaka rd_cfg.reg = &hw_regs->irq_status;
1046*437bfbebSnyanmisaka rd_cfg.size = sizeof(hw_regs->irq_status);
1047*437bfbebSnyanmisaka rd_cfg.offset = OFFSET_INTERRUPT_REGS;
1048*437bfbebSnyanmisaka
1049*437bfbebSnyanmisaka ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_REG_RD, &rd_cfg);
1050*437bfbebSnyanmisaka if (ret) {
1051*437bfbebSnyanmisaka mpp_err_f("set register read failed %d\n", ret);
1052*437bfbebSnyanmisaka break;
1053*437bfbebSnyanmisaka }
1054*437bfbebSnyanmisaka /* rcb info for sram */
1055*437bfbebSnyanmisaka vdpu382_set_rcbinfo(reg_ctx->dev, (Vdpu382RcbInfo*)reg_ctx->rcb_info);
1056*437bfbebSnyanmisaka
1057*437bfbebSnyanmisaka ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_CMD_SEND, NULL);
1058*437bfbebSnyanmisaka if (ret) {
1059*437bfbebSnyanmisaka mpp_err_f("send cmd failed %d\n", ret);
1060*437bfbebSnyanmisaka break;
1061*437bfbebSnyanmisaka }
1062*437bfbebSnyanmisaka } while (0);
1063*437bfbebSnyanmisaka
1064*437bfbebSnyanmisaka return ret;
1065*437bfbebSnyanmisaka }
1066*437bfbebSnyanmisaka
1067*437bfbebSnyanmisaka
hal_h265d_vdpu382_wait(void * hal,HalTaskInfo * task)1068*437bfbebSnyanmisaka static MPP_RET hal_h265d_vdpu382_wait(void *hal, HalTaskInfo *task)
1069*437bfbebSnyanmisaka {
1070*437bfbebSnyanmisaka MPP_RET ret = MPP_OK;
1071*437bfbebSnyanmisaka RK_S32 index = task->dec.reg_index;
1072*437bfbebSnyanmisaka HalH265dCtx *reg_ctx = (HalH265dCtx *)hal;
1073*437bfbebSnyanmisaka RK_U8* p = NULL;
1074*437bfbebSnyanmisaka Vdpu382H265dRegSet *hw_regs = NULL;
1075*437bfbebSnyanmisaka RK_S32 i;
1076*437bfbebSnyanmisaka
1077*437bfbebSnyanmisaka if (reg_ctx->fast_mode) {
1078*437bfbebSnyanmisaka hw_regs = ( Vdpu382H265dRegSet *)reg_ctx->g_buf[index].hw_regs;
1079*437bfbebSnyanmisaka } else {
1080*437bfbebSnyanmisaka hw_regs = ( Vdpu382H265dRegSet *)reg_ctx->hw_regs;
1081*437bfbebSnyanmisaka }
1082*437bfbebSnyanmisaka
1083*437bfbebSnyanmisaka p = (RK_U8*)hw_regs;
1084*437bfbebSnyanmisaka
1085*437bfbebSnyanmisaka if (task->dec.flags.parse_err ||
1086*437bfbebSnyanmisaka (task->dec.flags.ref_err && !reg_ctx->cfg->base.disable_error)) {
1087*437bfbebSnyanmisaka h265h_dbg(H265H_DBG_TASK_ERR, "%s found task error\n", __FUNCTION__);
1088*437bfbebSnyanmisaka goto ERR_PROC;
1089*437bfbebSnyanmisaka }
1090*437bfbebSnyanmisaka
1091*437bfbebSnyanmisaka ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_CMD_POLL, NULL);
1092*437bfbebSnyanmisaka if (ret)
1093*437bfbebSnyanmisaka mpp_err_f("poll cmd failed %d\n", ret);
1094*437bfbebSnyanmisaka
1095*437bfbebSnyanmisaka ERR_PROC:
1096*437bfbebSnyanmisaka if (task->dec.flags.parse_err ||
1097*437bfbebSnyanmisaka task->dec.flags.ref_err ||
1098*437bfbebSnyanmisaka hw_regs->irq_status.reg224.dec_error_sta ||
1099*437bfbebSnyanmisaka hw_regs->irq_status.reg224.buf_empty_sta ||
1100*437bfbebSnyanmisaka hw_regs->irq_status.reg224.dec_bus_sta ||
1101*437bfbebSnyanmisaka !hw_regs->irq_status.reg224.dec_rdy_sta) {
1102*437bfbebSnyanmisaka if (!reg_ctx->fast_mode) {
1103*437bfbebSnyanmisaka if (reg_ctx->dec_cb)
1104*437bfbebSnyanmisaka mpp_callback(reg_ctx->dec_cb, &task->dec);
1105*437bfbebSnyanmisaka } else {
1106*437bfbebSnyanmisaka MppFrame mframe = NULL;
1107*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->slots, task->dec.output,
1108*437bfbebSnyanmisaka SLOT_FRAME_PTR, &mframe);
1109*437bfbebSnyanmisaka if (mframe) {
1110*437bfbebSnyanmisaka reg_ctx->fast_mode_err_found = 1;
1111*437bfbebSnyanmisaka mpp_frame_set_errinfo(mframe, 1);
1112*437bfbebSnyanmisaka }
1113*437bfbebSnyanmisaka }
1114*437bfbebSnyanmisaka } else {
1115*437bfbebSnyanmisaka if (reg_ctx->fast_mode && reg_ctx->fast_mode_err_found) {
1116*437bfbebSnyanmisaka for (i = 0; i < (RK_S32)MPP_ARRAY_ELEMS(task->dec.refer); i++) {
1117*437bfbebSnyanmisaka if (task->dec.refer[i] >= 0) {
1118*437bfbebSnyanmisaka MppFrame frame_ref = NULL;
1119*437bfbebSnyanmisaka
1120*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->slots, task->dec.refer[i],
1121*437bfbebSnyanmisaka SLOT_FRAME_PTR, &frame_ref);
1122*437bfbebSnyanmisaka h265h_dbg(H265H_DBG_FAST_ERR, "refer[%d] %d frame %p\n",
1123*437bfbebSnyanmisaka i, task->dec.refer[i], frame_ref);
1124*437bfbebSnyanmisaka if (frame_ref && mpp_frame_get_errinfo(frame_ref)) {
1125*437bfbebSnyanmisaka MppFrame frame_out = NULL;
1126*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->slots, task->dec.output,
1127*437bfbebSnyanmisaka SLOT_FRAME_PTR, &frame_out);
1128*437bfbebSnyanmisaka mpp_frame_set_errinfo(frame_out, 1);
1129*437bfbebSnyanmisaka break;
1130*437bfbebSnyanmisaka }
1131*437bfbebSnyanmisaka }
1132*437bfbebSnyanmisaka }
1133*437bfbebSnyanmisaka }
1134*437bfbebSnyanmisaka }
1135*437bfbebSnyanmisaka
1136*437bfbebSnyanmisaka for (i = 0; i < 68; i++) {
1137*437bfbebSnyanmisaka if (i == 1) {
1138*437bfbebSnyanmisaka h265h_dbg(H265H_DBG_REG, "RK_HEVC_DEC: regs[%02d]=%08X\n",
1139*437bfbebSnyanmisaka i, *((RK_U32*)p));
1140*437bfbebSnyanmisaka }
1141*437bfbebSnyanmisaka
1142*437bfbebSnyanmisaka if (i == 45) {
1143*437bfbebSnyanmisaka h265h_dbg(H265H_DBG_REG, "RK_HEVC_DEC: regs[%02d]=%08X\n",
1144*437bfbebSnyanmisaka i, *((RK_U32*)p));
1145*437bfbebSnyanmisaka }
1146*437bfbebSnyanmisaka p += 4;
1147*437bfbebSnyanmisaka }
1148*437bfbebSnyanmisaka
1149*437bfbebSnyanmisaka if (reg_ctx->fast_mode) {
1150*437bfbebSnyanmisaka reg_ctx->g_buf[index].use_flag = 0;
1151*437bfbebSnyanmisaka }
1152*437bfbebSnyanmisaka
1153*437bfbebSnyanmisaka return ret;
1154*437bfbebSnyanmisaka }
1155*437bfbebSnyanmisaka
hal_h265d_vdpu382_reset(void * hal)1156*437bfbebSnyanmisaka static MPP_RET hal_h265d_vdpu382_reset(void *hal)
1157*437bfbebSnyanmisaka {
1158*437bfbebSnyanmisaka MPP_RET ret = MPP_OK;
1159*437bfbebSnyanmisaka HalH265dCtx *p_hal = (HalH265dCtx *)hal;
1160*437bfbebSnyanmisaka p_hal->fast_mode_err_found = 0;
1161*437bfbebSnyanmisaka (void)hal;
1162*437bfbebSnyanmisaka return ret;
1163*437bfbebSnyanmisaka }
1164*437bfbebSnyanmisaka
hal_h265d_vdpu382_flush(void * hal)1165*437bfbebSnyanmisaka static MPP_RET hal_h265d_vdpu382_flush(void *hal)
1166*437bfbebSnyanmisaka {
1167*437bfbebSnyanmisaka MPP_RET ret = MPP_OK;
1168*437bfbebSnyanmisaka
1169*437bfbebSnyanmisaka (void)hal;
1170*437bfbebSnyanmisaka return ret;
1171*437bfbebSnyanmisaka }
1172*437bfbebSnyanmisaka
hal_h265d_vdpu382_control(void * hal,MpiCmd cmd_type,void * param)1173*437bfbebSnyanmisaka static MPP_RET hal_h265d_vdpu382_control(void *hal, MpiCmd cmd_type, void *param)
1174*437bfbebSnyanmisaka {
1175*437bfbebSnyanmisaka MPP_RET ret = MPP_OK;
1176*437bfbebSnyanmisaka HalH265dCtx *p_hal = (HalH265dCtx *)hal;
1177*437bfbebSnyanmisaka
1178*437bfbebSnyanmisaka (void)hal;
1179*437bfbebSnyanmisaka switch ((MpiCmd)cmd_type) {
1180*437bfbebSnyanmisaka case MPP_DEC_SET_FRAME_INFO: {
1181*437bfbebSnyanmisaka MppFrame frame = (MppFrame)param;
1182*437bfbebSnyanmisaka MppFrameFormat fmt = mpp_frame_get_fmt(frame);
1183*437bfbebSnyanmisaka
1184*437bfbebSnyanmisaka if (MPP_FRAME_FMT_IS_FBC(fmt)) {
1185*437bfbebSnyanmisaka vdpu382_afbc_align_calc(p_hal->slots, frame, 16);
1186*437bfbebSnyanmisaka }
1187*437bfbebSnyanmisaka break;
1188*437bfbebSnyanmisaka }
1189*437bfbebSnyanmisaka case MPP_DEC_SET_OUTPUT_FORMAT: {
1190*437bfbebSnyanmisaka } break;
1191*437bfbebSnyanmisaka default:
1192*437bfbebSnyanmisaka break;
1193*437bfbebSnyanmisaka }
1194*437bfbebSnyanmisaka return ret;
1195*437bfbebSnyanmisaka }
1196*437bfbebSnyanmisaka
1197*437bfbebSnyanmisaka const MppHalApi hal_h265d_vdpu382 = {
1198*437bfbebSnyanmisaka .name = "h265d_vdpu382",
1199*437bfbebSnyanmisaka .type = MPP_CTX_DEC,
1200*437bfbebSnyanmisaka .coding = MPP_VIDEO_CodingHEVC,
1201*437bfbebSnyanmisaka .ctx_size = sizeof(HalH265dCtx),
1202*437bfbebSnyanmisaka .flag = 0,
1203*437bfbebSnyanmisaka .init = hal_h265d_vdpu382_init,
1204*437bfbebSnyanmisaka .deinit = hal_h265d_vdpu382_deinit,
1205*437bfbebSnyanmisaka .reg_gen = hal_h265d_vdpu382_gen_regs,
1206*437bfbebSnyanmisaka .start = hal_h265d_vdpu382_start,
1207*437bfbebSnyanmisaka .wait = hal_h265d_vdpu382_wait,
1208*437bfbebSnyanmisaka .reset = hal_h265d_vdpu382_reset,
1209*437bfbebSnyanmisaka .flush = hal_h265d_vdpu382_flush,
1210*437bfbebSnyanmisaka .control = hal_h265d_vdpu382_control,
1211*437bfbebSnyanmisaka };
1212