1*437bfbebSnyanmisaka /*
2*437bfbebSnyanmisaka * Copyright 2020 Rockchip Electronics Co. LTD
3*437bfbebSnyanmisaka *
4*437bfbebSnyanmisaka * Licensed under the Apache License, Version 2.0 (the "License");
5*437bfbebSnyanmisaka * you may not use this file except in compliance with the License.
6*437bfbebSnyanmisaka * You may obtain a copy of the License at
7*437bfbebSnyanmisaka *
8*437bfbebSnyanmisaka * http://www.apache.org/licenses/LICENSE-2.0
9*437bfbebSnyanmisaka *
10*437bfbebSnyanmisaka * Unless required by applicable law or agreed to in writing, software
11*437bfbebSnyanmisaka * distributed under the License is distributed on an "AS IS" BASIS,
12*437bfbebSnyanmisaka * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13*437bfbebSnyanmisaka * See the License for the specific language governing permissions and
14*437bfbebSnyanmisaka * limitations under the License.
15*437bfbebSnyanmisaka */
16*437bfbebSnyanmisaka
17*437bfbebSnyanmisaka #define MODULE_TAG "hal_h265d_rkv"
18*437bfbebSnyanmisaka
19*437bfbebSnyanmisaka #include <stdio.h>
20*437bfbebSnyanmisaka #include <string.h>
21*437bfbebSnyanmisaka
22*437bfbebSnyanmisaka #include "mpp_mem.h"
23*437bfbebSnyanmisaka #include "mpp_bitread.h"
24*437bfbebSnyanmisaka #include "mpp_bitput.h"
25*437bfbebSnyanmisaka
26*437bfbebSnyanmisaka #include "hal_h265d_debug.h"
27*437bfbebSnyanmisaka #include "hal_h265d_ctx.h"
28*437bfbebSnyanmisaka #include "hal_h265d_com.h"
29*437bfbebSnyanmisaka #include "hal_h265d_rkv.h"
30*437bfbebSnyanmisaka #include "hal_h265d_rkv_reg.h"
31*437bfbebSnyanmisaka #include "h265d_syntax.h"
32*437bfbebSnyanmisaka
33*437bfbebSnyanmisaka /* #define dump */
34*437bfbebSnyanmisaka #ifdef dump
35*437bfbebSnyanmisaka static FILE *fp = NULL;
36*437bfbebSnyanmisaka #endif
37*437bfbebSnyanmisaka #define HW_RPS
38*437bfbebSnyanmisaka
39*437bfbebSnyanmisaka #define PPS_SIZE (96 * 64)
40*437bfbebSnyanmisaka
hal_h265d_alloc_res(void * hal)41*437bfbebSnyanmisaka static MPP_RET hal_h265d_alloc_res(void *hal)
42*437bfbebSnyanmisaka {
43*437bfbebSnyanmisaka RK_S32 i = 0;
44*437bfbebSnyanmisaka RK_S32 ret = 0;
45*437bfbebSnyanmisaka HalH265dCtx *reg_ctx = (HalH265dCtx *)hal;
46*437bfbebSnyanmisaka if (reg_ctx->fast_mode) {
47*437bfbebSnyanmisaka for (i = 0; i < MAX_GEN_REG; i++) {
48*437bfbebSnyanmisaka reg_ctx->g_buf[i].hw_regs =
49*437bfbebSnyanmisaka mpp_calloc_size(void, sizeof(H265d_REGS_t));
50*437bfbebSnyanmisaka ret = mpp_buffer_get(reg_ctx->group,
51*437bfbebSnyanmisaka ®_ctx->g_buf[i].scaling_list_data,
52*437bfbebSnyanmisaka SCALING_LIST_SIZE);
53*437bfbebSnyanmisaka if (ret) {
54*437bfbebSnyanmisaka mpp_err("h265d scaling_list_data get buffer failed\n");
55*437bfbebSnyanmisaka return ret;
56*437bfbebSnyanmisaka }
57*437bfbebSnyanmisaka
58*437bfbebSnyanmisaka ret = mpp_buffer_get(reg_ctx->group, ®_ctx->g_buf[i].pps_data,
59*437bfbebSnyanmisaka PPS_SIZE);
60*437bfbebSnyanmisaka if (ret) {
61*437bfbebSnyanmisaka mpp_err("h265d pps_data get buffer failed\n");
62*437bfbebSnyanmisaka return ret;
63*437bfbebSnyanmisaka }
64*437bfbebSnyanmisaka
65*437bfbebSnyanmisaka ret = mpp_buffer_get(reg_ctx->group, ®_ctx->g_buf[i].rps_data,
66*437bfbebSnyanmisaka RPS_SIZE);
67*437bfbebSnyanmisaka if (ret) {
68*437bfbebSnyanmisaka mpp_err("h265d rps_data get buffer failed\n");
69*437bfbebSnyanmisaka return ret;
70*437bfbebSnyanmisaka }
71*437bfbebSnyanmisaka }
72*437bfbebSnyanmisaka } else {
73*437bfbebSnyanmisaka reg_ctx->hw_regs = mpp_calloc_size(void, sizeof(H265d_REGS_t));
74*437bfbebSnyanmisaka ret = mpp_buffer_get(reg_ctx->group, ®_ctx->scaling_list_data,
75*437bfbebSnyanmisaka SCALING_LIST_SIZE);
76*437bfbebSnyanmisaka if (ret) {
77*437bfbebSnyanmisaka mpp_err("h265d scaling_list_data get buffer failed\n");
78*437bfbebSnyanmisaka return ret;
79*437bfbebSnyanmisaka }
80*437bfbebSnyanmisaka
81*437bfbebSnyanmisaka ret = mpp_buffer_get(reg_ctx->group, ®_ctx->pps_data, PPS_SIZE);
82*437bfbebSnyanmisaka if (ret) {
83*437bfbebSnyanmisaka mpp_err("h265d pps_data get buffer failed\n");
84*437bfbebSnyanmisaka return ret;
85*437bfbebSnyanmisaka }
86*437bfbebSnyanmisaka
87*437bfbebSnyanmisaka ret = mpp_buffer_get(reg_ctx->group, ®_ctx->rps_data, RPS_SIZE);
88*437bfbebSnyanmisaka if (ret) {
89*437bfbebSnyanmisaka mpp_err("h265d rps_data get buffer failed\n");
90*437bfbebSnyanmisaka return ret;
91*437bfbebSnyanmisaka }
92*437bfbebSnyanmisaka
93*437bfbebSnyanmisaka }
94*437bfbebSnyanmisaka return MPP_OK;
95*437bfbebSnyanmisaka }
96*437bfbebSnyanmisaka
hal_h265d_release_res(void * hal)97*437bfbebSnyanmisaka static MPP_RET hal_h265d_release_res(void *hal)
98*437bfbebSnyanmisaka {
99*437bfbebSnyanmisaka RK_S32 ret = 0;
100*437bfbebSnyanmisaka HalH265dCtx *reg_ctx = ( HalH265dCtx *)hal;
101*437bfbebSnyanmisaka RK_S32 i = 0;
102*437bfbebSnyanmisaka if (reg_ctx->fast_mode) {
103*437bfbebSnyanmisaka for (i = 0; i < MAX_GEN_REG; i++) {
104*437bfbebSnyanmisaka if (reg_ctx->g_buf[i].scaling_list_data) {
105*437bfbebSnyanmisaka ret = mpp_buffer_put(reg_ctx->g_buf[i].scaling_list_data);
106*437bfbebSnyanmisaka if (ret) {
107*437bfbebSnyanmisaka mpp_err("h265d scaling_list_data free buffer failed\n");
108*437bfbebSnyanmisaka return ret;
109*437bfbebSnyanmisaka }
110*437bfbebSnyanmisaka }
111*437bfbebSnyanmisaka if (reg_ctx->g_buf[i].pps_data) {
112*437bfbebSnyanmisaka ret = mpp_buffer_put(reg_ctx->g_buf[i].pps_data);
113*437bfbebSnyanmisaka if (ret) {
114*437bfbebSnyanmisaka mpp_err("h265d pps_data free buffer failed\n");
115*437bfbebSnyanmisaka return ret;
116*437bfbebSnyanmisaka }
117*437bfbebSnyanmisaka }
118*437bfbebSnyanmisaka
119*437bfbebSnyanmisaka if (reg_ctx->g_buf[i].rps_data) {
120*437bfbebSnyanmisaka ret = mpp_buffer_put(reg_ctx->g_buf[i].rps_data);
121*437bfbebSnyanmisaka if (ret) {
122*437bfbebSnyanmisaka mpp_err("h265d rps_data free buffer failed\n");
123*437bfbebSnyanmisaka return ret;
124*437bfbebSnyanmisaka }
125*437bfbebSnyanmisaka }
126*437bfbebSnyanmisaka
127*437bfbebSnyanmisaka if (reg_ctx->g_buf[i].hw_regs) {
128*437bfbebSnyanmisaka mpp_free(reg_ctx->g_buf[i].hw_regs);
129*437bfbebSnyanmisaka reg_ctx->g_buf[i].hw_regs = NULL;
130*437bfbebSnyanmisaka }
131*437bfbebSnyanmisaka }
132*437bfbebSnyanmisaka } else {
133*437bfbebSnyanmisaka if (reg_ctx->scaling_list_data) {
134*437bfbebSnyanmisaka ret = mpp_buffer_put(reg_ctx->scaling_list_data);
135*437bfbebSnyanmisaka if (ret) {
136*437bfbebSnyanmisaka mpp_err("h265d scaling_list_data free buffer failed\n");
137*437bfbebSnyanmisaka return ret;
138*437bfbebSnyanmisaka }
139*437bfbebSnyanmisaka }
140*437bfbebSnyanmisaka if (reg_ctx->pps_data) {
141*437bfbebSnyanmisaka ret = mpp_buffer_put(reg_ctx->pps_data);
142*437bfbebSnyanmisaka if (ret) {
143*437bfbebSnyanmisaka mpp_err("h265d pps_data free buffer failed\n");
144*437bfbebSnyanmisaka return ret;
145*437bfbebSnyanmisaka }
146*437bfbebSnyanmisaka }
147*437bfbebSnyanmisaka
148*437bfbebSnyanmisaka if (reg_ctx->rps_data) {
149*437bfbebSnyanmisaka ret = mpp_buffer_put(reg_ctx->rps_data);
150*437bfbebSnyanmisaka if (ret) {
151*437bfbebSnyanmisaka mpp_err("h265d rps_data free buffer failed\n");
152*437bfbebSnyanmisaka return ret;
153*437bfbebSnyanmisaka }
154*437bfbebSnyanmisaka }
155*437bfbebSnyanmisaka
156*437bfbebSnyanmisaka if (reg_ctx->hw_regs) {
157*437bfbebSnyanmisaka mpp_free(reg_ctx->hw_regs);
158*437bfbebSnyanmisaka reg_ctx->hw_regs = NULL;
159*437bfbebSnyanmisaka }
160*437bfbebSnyanmisaka }
161*437bfbebSnyanmisaka return MPP_OK;
162*437bfbebSnyanmisaka }
163*437bfbebSnyanmisaka
hal_h265d_rkv_init(void * hal,MppHalCfg * cfg)164*437bfbebSnyanmisaka MPP_RET hal_h265d_rkv_init(void *hal, MppHalCfg *cfg)
165*437bfbebSnyanmisaka {
166*437bfbebSnyanmisaka MPP_RET ret = MPP_NOK;
167*437bfbebSnyanmisaka HalH265dCtx *reg_ctx = (HalH265dCtx *)hal;
168*437bfbebSnyanmisaka
169*437bfbebSnyanmisaka mpp_slots_set_prop(reg_ctx->slots, SLOTS_HOR_ALIGN, hevc_hor_align);
170*437bfbebSnyanmisaka mpp_slots_set_prop(reg_ctx->slots, SLOTS_VER_ALIGN, hevc_ver_align);
171*437bfbebSnyanmisaka
172*437bfbebSnyanmisaka reg_ctx->scaling_qm = mpp_calloc(DXVA_Qmatrix_HEVC, 1);
173*437bfbebSnyanmisaka reg_ctx->sw_rps_buf = mpp_calloc(RK_U64, 400);
174*437bfbebSnyanmisaka
175*437bfbebSnyanmisaka if (reg_ctx->scaling_qm == NULL) {
176*437bfbebSnyanmisaka mpp_err("scaling_org alloc fail");
177*437bfbebSnyanmisaka return MPP_ERR_MALLOC;
178*437bfbebSnyanmisaka }
179*437bfbebSnyanmisaka
180*437bfbebSnyanmisaka reg_ctx->scaling_rk = mpp_calloc(scalingFactor_t, 1);
181*437bfbebSnyanmisaka if (reg_ctx->scaling_rk == NULL) {
182*437bfbebSnyanmisaka mpp_err("scaling_rk alloc fail");
183*437bfbebSnyanmisaka return MPP_ERR_MALLOC;
184*437bfbebSnyanmisaka }
185*437bfbebSnyanmisaka
186*437bfbebSnyanmisaka if (reg_ctx->group == NULL) {
187*437bfbebSnyanmisaka ret = mpp_buffer_group_get_internal(®_ctx->group, MPP_BUFFER_TYPE_ION);
188*437bfbebSnyanmisaka if (ret) {
189*437bfbebSnyanmisaka mpp_err("h265d mpp_buffer_group_get failed\n");
190*437bfbebSnyanmisaka return ret;
191*437bfbebSnyanmisaka }
192*437bfbebSnyanmisaka }
193*437bfbebSnyanmisaka
194*437bfbebSnyanmisaka ret = mpp_buffer_get(reg_ctx->group, ®_ctx->cabac_table_data, sizeof(cabac_table));
195*437bfbebSnyanmisaka if (ret) {
196*437bfbebSnyanmisaka mpp_err("h265d cabac_table get buffer failed\n");
197*437bfbebSnyanmisaka return ret;
198*437bfbebSnyanmisaka }
199*437bfbebSnyanmisaka
200*437bfbebSnyanmisaka ret = mpp_buffer_write(reg_ctx->cabac_table_data, 0, (void*)cabac_table, sizeof(cabac_table));
201*437bfbebSnyanmisaka if (ret) {
202*437bfbebSnyanmisaka mpp_err("h265d write cabac_table data failed\n");
203*437bfbebSnyanmisaka return ret;
204*437bfbebSnyanmisaka }
205*437bfbebSnyanmisaka mpp_buffer_sync_end(reg_ctx->cabac_table_data);
206*437bfbebSnyanmisaka
207*437bfbebSnyanmisaka ret = hal_h265d_alloc_res(hal);
208*437bfbebSnyanmisaka if (ret) {
209*437bfbebSnyanmisaka mpp_err("hal_h265d_alloc_res failed\n");
210*437bfbebSnyanmisaka return ret;
211*437bfbebSnyanmisaka }
212*437bfbebSnyanmisaka
213*437bfbebSnyanmisaka #ifdef dump
214*437bfbebSnyanmisaka fp = fopen("/data/hal.bin", "wb");
215*437bfbebSnyanmisaka #endif
216*437bfbebSnyanmisaka (void) cfg;
217*437bfbebSnyanmisaka return MPP_OK;
218*437bfbebSnyanmisaka }
219*437bfbebSnyanmisaka
hal_h265d_rkv_deinit(void * hal)220*437bfbebSnyanmisaka MPP_RET hal_h265d_rkv_deinit(void *hal)
221*437bfbebSnyanmisaka {
222*437bfbebSnyanmisaka RK_S32 ret = 0;
223*437bfbebSnyanmisaka HalH265dCtx *reg_ctx = (HalH265dCtx *)hal;
224*437bfbebSnyanmisaka
225*437bfbebSnyanmisaka ret = mpp_buffer_put(reg_ctx->cabac_table_data);
226*437bfbebSnyanmisaka if (ret) {
227*437bfbebSnyanmisaka mpp_err("h265d cabac_table free buffer failed\n");
228*437bfbebSnyanmisaka return ret;
229*437bfbebSnyanmisaka }
230*437bfbebSnyanmisaka
231*437bfbebSnyanmisaka if (reg_ctx->scaling_qm) {
232*437bfbebSnyanmisaka mpp_free(reg_ctx->scaling_qm);
233*437bfbebSnyanmisaka }
234*437bfbebSnyanmisaka
235*437bfbebSnyanmisaka if (reg_ctx->sw_rps_buf) {
236*437bfbebSnyanmisaka mpp_free(reg_ctx->sw_rps_buf);
237*437bfbebSnyanmisaka }
238*437bfbebSnyanmisaka
239*437bfbebSnyanmisaka if (reg_ctx->scaling_rk) {
240*437bfbebSnyanmisaka mpp_free(reg_ctx->scaling_rk);
241*437bfbebSnyanmisaka }
242*437bfbebSnyanmisaka
243*437bfbebSnyanmisaka hal_h265d_release_res(hal);
244*437bfbebSnyanmisaka
245*437bfbebSnyanmisaka if (reg_ctx->group) {
246*437bfbebSnyanmisaka ret = mpp_buffer_group_put(reg_ctx->group);
247*437bfbebSnyanmisaka if (ret) {
248*437bfbebSnyanmisaka mpp_err("h265d group free buffer failed\n");
249*437bfbebSnyanmisaka return ret;
250*437bfbebSnyanmisaka }
251*437bfbebSnyanmisaka }
252*437bfbebSnyanmisaka return MPP_OK;
253*437bfbebSnyanmisaka }
254*437bfbebSnyanmisaka
hal_h265d_v345_output_pps_packet(void * hal,void * dxva)255*437bfbebSnyanmisaka static RK_S32 hal_h265d_v345_output_pps_packet(void *hal, void *dxva)
256*437bfbebSnyanmisaka {
257*437bfbebSnyanmisaka RK_S32 fifo_len = 12;
258*437bfbebSnyanmisaka RK_S32 i, j;
259*437bfbebSnyanmisaka RK_U32 log2_min_cb_size;
260*437bfbebSnyanmisaka RK_S32 width, height;
261*437bfbebSnyanmisaka HalH265dCtx *reg_ctx = ( HalH265dCtx *)hal;
262*437bfbebSnyanmisaka h265d_dxva2_picture_context_t *dxva_cxt = (h265d_dxva2_picture_context_t*)dxva;
263*437bfbebSnyanmisaka BitputCtx_t bp;
264*437bfbebSnyanmisaka RK_U64 *pps_packet = mpp_calloc(RK_U64, fifo_len + 1);
265*437bfbebSnyanmisaka
266*437bfbebSnyanmisaka if (NULL == reg_ctx || dxva_cxt == NULL) {
267*437bfbebSnyanmisaka mpp_err("%s:%s:%d reg_ctx or dxva_cxt is NULL",
268*437bfbebSnyanmisaka __FILE__, __FUNCTION__, __LINE__);
269*437bfbebSnyanmisaka MPP_FREE(pps_packet);
270*437bfbebSnyanmisaka return MPP_ERR_NULL_PTR;
271*437bfbebSnyanmisaka }
272*437bfbebSnyanmisaka
273*437bfbebSnyanmisaka void *pps_ptr = mpp_buffer_get_ptr(reg_ctx->pps_data);
274*437bfbebSnyanmisaka if (NULL == pps_ptr) {
275*437bfbebSnyanmisaka mpp_err("pps_data get ptr error");
276*437bfbebSnyanmisaka return MPP_ERR_NOMEM;
277*437bfbebSnyanmisaka }
278*437bfbebSnyanmisaka memset(pps_ptr, 0, 96 * 64);
279*437bfbebSnyanmisaka // pps_packet = (RK_U64 *)(pps_ptr + dxva_cxt->pp.pps_id * 80);
280*437bfbebSnyanmisaka
281*437bfbebSnyanmisaka for (i = 0; i < 12; i++) pps_packet[i] = 0;
282*437bfbebSnyanmisaka
283*437bfbebSnyanmisaka mpp_set_bitput_ctx(&bp, pps_packet, fifo_len);
284*437bfbebSnyanmisaka
285*437bfbebSnyanmisaka // SPS
286*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.vps_id , 4);
287*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.sps_id , 4);
288*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.chroma_format_idc , 2);
289*437bfbebSnyanmisaka
290*437bfbebSnyanmisaka log2_min_cb_size = dxva_cxt->pp.log2_min_luma_coding_block_size_minus3 + 3;
291*437bfbebSnyanmisaka width = (dxva_cxt->pp.PicWidthInMinCbsY << log2_min_cb_size);
292*437bfbebSnyanmisaka height = (dxva_cxt->pp.PicHeightInMinCbsY << log2_min_cb_size);
293*437bfbebSnyanmisaka
294*437bfbebSnyanmisaka mpp_put_bits(&bp, width , 13);
295*437bfbebSnyanmisaka mpp_put_bits(&bp, height , 13);
296*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.bit_depth_luma_minus8 + 8 , 4);
297*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.bit_depth_chroma_minus8 + 8 , 4);
298*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.log2_max_pic_order_cnt_lsb_minus4 + 4 , 5);
299*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size , 2); //log2_maxa_coding_block_depth
300*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.log2_min_luma_coding_block_size_minus3 + 3 , 3);
301*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.log2_min_transform_block_size_minus2 + 2 , 3);
302*437bfbebSnyanmisaka ///<-zrh comment ^ 57 bit above
303*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.log2_diff_max_min_transform_block_size , 2);
304*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.max_transform_hierarchy_depth_inter , 3);
305*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.max_transform_hierarchy_depth_intra , 3);
306*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.scaling_list_enabled_flag , 1);
307*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.amp_enabled_flag , 1);
308*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.sample_adaptive_offset_enabled_flag , 1);
309*437bfbebSnyanmisaka ///<-zrh comment ^ 68 bit above
310*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pcm_enabled_flag , 1);
311*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pcm_enabled_flag ? (dxva_cxt->pp.pcm_sample_bit_depth_luma_minus1 + 1) : 0 , 4);
312*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pcm_enabled_flag ? (dxva_cxt->pp.pcm_sample_bit_depth_chroma_minus1 + 1) : 0 , 4);
313*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pcm_loop_filter_disabled_flag , 1);
314*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.log2_diff_max_min_pcm_luma_coding_block_size , 3);
315*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pcm_enabled_flag ? (dxva_cxt->pp.log2_min_pcm_luma_coding_block_size_minus3 + 3) : 0, 3);
316*437bfbebSnyanmisaka
317*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.num_short_term_ref_pic_sets , 7);
318*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.long_term_ref_pics_present_flag , 1);
319*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.num_long_term_ref_pics_sps , 6);
320*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.sps_temporal_mvp_enabled_flag , 1);
321*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.strong_intra_smoothing_enabled_flag , 1);
322*437bfbebSnyanmisaka ///<-zrh comment ^ 100 bit above
323*437bfbebSnyanmisaka
324*437bfbebSnyanmisaka mpp_put_bits(&bp, 0 , 7 );
325*437bfbebSnyanmisaka
326*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.sps_max_dec_pic_buffering_minus1, 4);
327*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 3);
328*437bfbebSnyanmisaka mpp_put_align(&bp , 32, 0xf); //128
329*437bfbebSnyanmisaka
330*437bfbebSnyanmisaka // PPS
331*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pps_id , 6 );
332*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.sps_id , 4 );
333*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.dependent_slice_segments_enabled_flag , 1 );
334*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.output_flag_present_flag , 1 );
335*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.num_extra_slice_header_bits , 13);
336*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.sign_data_hiding_enabled_flag , 1);
337*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.cabac_init_present_flag , 1);
338*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.num_ref_idx_l0_default_active_minus1 + 1 , 4);
339*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.num_ref_idx_l1_default_active_minus1 + 1 , 4);
340*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.init_qp_minus26 , 7);
341*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.constrained_intra_pred_flag , 1);
342*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.transform_skip_enabled_flag , 1);
343*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.cu_qp_delta_enabled_flag , 1); //164
344*437bfbebSnyanmisaka
345*437bfbebSnyanmisaka mpp_put_bits(&bp, log2_min_cb_size +
346*437bfbebSnyanmisaka dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size -
347*437bfbebSnyanmisaka dxva_cxt->pp.diff_cu_qp_delta_depth , 3);
348*437bfbebSnyanmisaka
349*437bfbebSnyanmisaka h265h_dbg(H265H_DBG_PPS, "log2_min_cb_size %d %d %d \n", log2_min_cb_size,
350*437bfbebSnyanmisaka dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size, dxva_cxt->pp.diff_cu_qp_delta_depth );
351*437bfbebSnyanmisaka
352*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pps_cb_qp_offset , 5);
353*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pps_cr_qp_offset , 5);
354*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pps_slice_chroma_qp_offsets_present_flag , 1);
355*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.weighted_pred_flag , 1);
356*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.weighted_bipred_flag , 1);
357*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.transquant_bypass_enabled_flag , 1 );
358*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.tiles_enabled_flag , 1 );
359*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.entropy_coding_sync_enabled_flag , 1);
360*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pps_loop_filter_across_slices_enabled_flag , 1);
361*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.loop_filter_across_tiles_enabled_flag , 1); //185
362*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.deblocking_filter_override_enabled_flag , 1);
363*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pps_deblocking_filter_disabled_flag , 1);
364*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pps_beta_offset_div2 , 4);
365*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pps_tc_offset_div2 , 4);
366*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.lists_modification_present_flag , 1);
367*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.log2_parallel_merge_level_minus2 + 2 , 3);
368*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.slice_segment_header_extension_present_flag , 1);
369*437bfbebSnyanmisaka mpp_put_bits(&bp, 0 , 3);
370*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.tiles_enabled_flag ? dxva_cxt->pp.num_tile_columns_minus1 + 1 : 0, 5);
371*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.tiles_enabled_flag ? dxva_cxt->pp.num_tile_rows_minus1 + 1 : 0 , 5 );
372*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 4); //mSps_Pps[i]->mMode
373*437bfbebSnyanmisaka mpp_put_align(&bp, 64, 0xf);
374*437bfbebSnyanmisaka {
375*437bfbebSnyanmisaka /// tiles info begin
376*437bfbebSnyanmisaka RK_U16 column_width[20];
377*437bfbebSnyanmisaka RK_U16 row_height[22];
378*437bfbebSnyanmisaka
379*437bfbebSnyanmisaka memset(column_width, 0, sizeof(column_width));
380*437bfbebSnyanmisaka memset(row_height, 0, sizeof(row_height));
381*437bfbebSnyanmisaka
382*437bfbebSnyanmisaka if (dxva_cxt->pp.tiles_enabled_flag) {
383*437bfbebSnyanmisaka
384*437bfbebSnyanmisaka if (dxva_cxt->pp.uniform_spacing_flag == 0) {
385*437bfbebSnyanmisaka RK_S32 maxcuwidth = dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size + log2_min_cb_size;
386*437bfbebSnyanmisaka RK_S32 ctu_width_in_pic = (width +
387*437bfbebSnyanmisaka (1 << maxcuwidth) - 1) / (1 << maxcuwidth) ;
388*437bfbebSnyanmisaka RK_S32 ctu_height_in_pic = (height +
389*437bfbebSnyanmisaka (1 << maxcuwidth) - 1) / (1 << maxcuwidth) ;
390*437bfbebSnyanmisaka RK_S32 sum = 0;
391*437bfbebSnyanmisaka for (i = 0; i < dxva_cxt->pp.num_tile_columns_minus1; i++) {
392*437bfbebSnyanmisaka column_width[i] = dxva_cxt->pp.column_width_minus1[i] + 1;
393*437bfbebSnyanmisaka sum += column_width[i] ;
394*437bfbebSnyanmisaka }
395*437bfbebSnyanmisaka column_width[i] = ctu_width_in_pic - sum;
396*437bfbebSnyanmisaka
397*437bfbebSnyanmisaka sum = 0;
398*437bfbebSnyanmisaka for (i = 0; i < dxva_cxt->pp.num_tile_rows_minus1; i++) {
399*437bfbebSnyanmisaka row_height[i] = dxva_cxt->pp.row_height_minus1[i] + 1;
400*437bfbebSnyanmisaka sum += row_height[i];
401*437bfbebSnyanmisaka }
402*437bfbebSnyanmisaka row_height[i] = ctu_height_in_pic - sum;
403*437bfbebSnyanmisaka } // end of (pps->uniform_spacing_flag == 0)
404*437bfbebSnyanmisaka else {
405*437bfbebSnyanmisaka
406*437bfbebSnyanmisaka RK_S32 pic_in_cts_width = (width +
407*437bfbebSnyanmisaka (1 << (log2_min_cb_size +
408*437bfbebSnyanmisaka dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size)) - 1)
409*437bfbebSnyanmisaka / (1 << (log2_min_cb_size +
410*437bfbebSnyanmisaka dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size));
411*437bfbebSnyanmisaka RK_S32 pic_in_cts_height = (height +
412*437bfbebSnyanmisaka (1 << (log2_min_cb_size +
413*437bfbebSnyanmisaka dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size)) - 1)
414*437bfbebSnyanmisaka / (1 << (log2_min_cb_size +
415*437bfbebSnyanmisaka dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size));
416*437bfbebSnyanmisaka
417*437bfbebSnyanmisaka for (i = 0; i < dxva_cxt->pp.num_tile_columns_minus1 + 1; i++)
418*437bfbebSnyanmisaka column_width[i] = ((i + 1) * pic_in_cts_width) / (dxva_cxt->pp.num_tile_columns_minus1 + 1) -
419*437bfbebSnyanmisaka (i * pic_in_cts_width) / (dxva_cxt->pp.num_tile_columns_minus1 + 1);
420*437bfbebSnyanmisaka
421*437bfbebSnyanmisaka for (i = 0; i < dxva_cxt->pp.num_tile_rows_minus1 + 1; i++)
422*437bfbebSnyanmisaka row_height[i] = ((i + 1) * pic_in_cts_height) / (dxva_cxt->pp.num_tile_rows_minus1 + 1) -
423*437bfbebSnyanmisaka (i * pic_in_cts_height) / (dxva_cxt->pp.num_tile_rows_minus1 + 1);
424*437bfbebSnyanmisaka }
425*437bfbebSnyanmisaka } // pps->tiles_enabled_flag
426*437bfbebSnyanmisaka else {
427*437bfbebSnyanmisaka RK_S32 MaxCUWidth = (1 << (dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size + log2_min_cb_size));
428*437bfbebSnyanmisaka column_width[0] = (width + MaxCUWidth - 1) / MaxCUWidth;
429*437bfbebSnyanmisaka row_height[0] = (height + MaxCUWidth - 1) / MaxCUWidth;
430*437bfbebSnyanmisaka }
431*437bfbebSnyanmisaka
432*437bfbebSnyanmisaka for (j = 0; j < 20; j++) {
433*437bfbebSnyanmisaka if (column_width[j] > 0)
434*437bfbebSnyanmisaka column_width[j]--;
435*437bfbebSnyanmisaka mpp_put_bits(&bp, column_width[j], 8);
436*437bfbebSnyanmisaka }
437*437bfbebSnyanmisaka
438*437bfbebSnyanmisaka for (j = 0; j < 22; j++) {
439*437bfbebSnyanmisaka if (row_height[j] > 0)
440*437bfbebSnyanmisaka row_height[j]--;
441*437bfbebSnyanmisaka mpp_put_bits(&bp, row_height[j], 8);
442*437bfbebSnyanmisaka }
443*437bfbebSnyanmisaka }
444*437bfbebSnyanmisaka
445*437bfbebSnyanmisaka {
446*437bfbebSnyanmisaka RK_U8 *ptr_scaling = (RK_U8 *)mpp_buffer_get_ptr(reg_ctx->scaling_list_data);
447*437bfbebSnyanmisaka RK_U32 fd = mpp_buffer_get_fd(reg_ctx->scaling_list_data);
448*437bfbebSnyanmisaka
449*437bfbebSnyanmisaka hal_h265d_output_scalinglist_packet(hal, ptr_scaling, dxva);
450*437bfbebSnyanmisaka mpp_put_bits(&bp, fd, 32);
451*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 60);
452*437bfbebSnyanmisaka mpp_put_align(&bp, 128, 0xf);
453*437bfbebSnyanmisaka }
454*437bfbebSnyanmisaka
455*437bfbebSnyanmisaka for (i = 0; i < 64; i++)
456*437bfbebSnyanmisaka memcpy(pps_ptr + i * 96, pps_packet, 96);
457*437bfbebSnyanmisaka
458*437bfbebSnyanmisaka #ifdef dump
459*437bfbebSnyanmisaka fwrite(pps_ptr, 1, 80 * 64, fp);
460*437bfbebSnyanmisaka RK_U32 *tmp = (RK_U32 *)pps_ptr;
461*437bfbebSnyanmisaka for (i = 0; i < 96 / 4; i++) {
462*437bfbebSnyanmisaka h265h_dbg(H265H_DBG_PPS, "pps[%3d] = 0x%08x\n", i, tmp[i]);
463*437bfbebSnyanmisaka }
464*437bfbebSnyanmisaka #endif
465*437bfbebSnyanmisaka MPP_FREE(pps_packet);
466*437bfbebSnyanmisaka return 0;
467*437bfbebSnyanmisaka }
468*437bfbebSnyanmisaka
hal_h265d_output_pps_packet(void * hal,void * dxva)469*437bfbebSnyanmisaka static RK_S32 hal_h265d_output_pps_packet(void *hal, void *dxva)
470*437bfbebSnyanmisaka {
471*437bfbebSnyanmisaka RK_S32 fifo_len = 10;
472*437bfbebSnyanmisaka RK_S32 i, j;
473*437bfbebSnyanmisaka RK_U32 log2_min_cb_size;
474*437bfbebSnyanmisaka RK_S32 width, height;
475*437bfbebSnyanmisaka HalH265dCtx *reg_ctx = ( HalH265dCtx *)hal;
476*437bfbebSnyanmisaka h265d_dxva2_picture_context_t *dxva_cxt = (h265d_dxva2_picture_context_t*)dxva;
477*437bfbebSnyanmisaka BitputCtx_t bp;
478*437bfbebSnyanmisaka RK_U64 *pps_packet = mpp_calloc(RK_U64, fifo_len + 1);
479*437bfbebSnyanmisaka
480*437bfbebSnyanmisaka if (NULL == reg_ctx || dxva_cxt == NULL) {
481*437bfbebSnyanmisaka mpp_err("%s:%s:%d reg_ctx or dxva_cxt is NULL",
482*437bfbebSnyanmisaka __FILE__, __FUNCTION__, __LINE__);
483*437bfbebSnyanmisaka MPP_FREE(pps_packet);
484*437bfbebSnyanmisaka return MPP_ERR_NULL_PTR;
485*437bfbebSnyanmisaka }
486*437bfbebSnyanmisaka
487*437bfbebSnyanmisaka void *pps_ptr = mpp_buffer_get_ptr(reg_ctx->pps_data);
488*437bfbebSnyanmisaka if (NULL == pps_ptr) {
489*437bfbebSnyanmisaka mpp_err("pps_data get ptr error");
490*437bfbebSnyanmisaka return MPP_ERR_NOMEM;
491*437bfbebSnyanmisaka }
492*437bfbebSnyanmisaka memset(pps_ptr, 0, 80 * 64);
493*437bfbebSnyanmisaka // pps_packet = (RK_U64 *)(pps_ptr + dxva_cxt->pp.pps_id * 80);
494*437bfbebSnyanmisaka
495*437bfbebSnyanmisaka for (i = 0; i < 10; i++) pps_packet[i] = 0;
496*437bfbebSnyanmisaka
497*437bfbebSnyanmisaka mpp_set_bitput_ctx(&bp, pps_packet, fifo_len);
498*437bfbebSnyanmisaka
499*437bfbebSnyanmisaka // SPS
500*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.vps_id , 4);
501*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.sps_id , 4);
502*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.chroma_format_idc , 2);
503*437bfbebSnyanmisaka
504*437bfbebSnyanmisaka log2_min_cb_size = dxva_cxt->pp.log2_min_luma_coding_block_size_minus3 + 3;
505*437bfbebSnyanmisaka width = (dxva_cxt->pp.PicWidthInMinCbsY << log2_min_cb_size);
506*437bfbebSnyanmisaka height = (dxva_cxt->pp.PicHeightInMinCbsY << log2_min_cb_size);
507*437bfbebSnyanmisaka
508*437bfbebSnyanmisaka mpp_put_bits(&bp, width , 13);
509*437bfbebSnyanmisaka mpp_put_bits(&bp, height , 13);
510*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.bit_depth_luma_minus8 + 8 , 4);
511*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.bit_depth_chroma_minus8 + 8 , 4);
512*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.log2_max_pic_order_cnt_lsb_minus4 + 4 , 5);
513*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size , 2); //log2_maxa_coding_block_depth
514*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.log2_min_luma_coding_block_size_minus3 + 3 , 3);
515*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.log2_min_transform_block_size_minus2 + 2 , 3);
516*437bfbebSnyanmisaka ///<-zrh comment ^ 57 bit above
517*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.log2_diff_max_min_transform_block_size , 2);
518*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.max_transform_hierarchy_depth_inter , 3);
519*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.max_transform_hierarchy_depth_intra , 3);
520*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.scaling_list_enabled_flag , 1);
521*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.amp_enabled_flag , 1);
522*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.sample_adaptive_offset_enabled_flag , 1);
523*437bfbebSnyanmisaka ///<-zrh comment ^ 68 bit above
524*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pcm_enabled_flag , 1);
525*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pcm_enabled_flag ? (dxva_cxt->pp.pcm_sample_bit_depth_luma_minus1 + 1) : 0 , 4);
526*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pcm_enabled_flag ? (dxva_cxt->pp.pcm_sample_bit_depth_chroma_minus1 + 1) : 0 , 4);
527*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pcm_loop_filter_disabled_flag , 1);
528*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.log2_diff_max_min_pcm_luma_coding_block_size , 3);
529*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pcm_enabled_flag ? (dxva_cxt->pp.log2_min_pcm_luma_coding_block_size_minus3 + 3) : 0, 3);
530*437bfbebSnyanmisaka
531*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.num_short_term_ref_pic_sets , 7);
532*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.long_term_ref_pics_present_flag , 1);
533*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.num_long_term_ref_pics_sps , 6);
534*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.sps_temporal_mvp_enabled_flag , 1);
535*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.strong_intra_smoothing_enabled_flag , 1);
536*437bfbebSnyanmisaka ///<-zrh comment ^ 100 bit above
537*437bfbebSnyanmisaka
538*437bfbebSnyanmisaka mpp_put_bits(&bp, 0 , 7 );
539*437bfbebSnyanmisaka mpp_put_align(&bp , 32, 0xf);
540*437bfbebSnyanmisaka
541*437bfbebSnyanmisaka // PPS
542*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pps_id , 6 );
543*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.sps_id , 4 );
544*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.dependent_slice_segments_enabled_flag , 1 );
545*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.output_flag_present_flag , 1 );
546*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.num_extra_slice_header_bits , 13);
547*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.sign_data_hiding_enabled_flag , 1);
548*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.cabac_init_present_flag , 1);
549*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.num_ref_idx_l0_default_active_minus1 + 1 , 4);
550*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.num_ref_idx_l1_default_active_minus1 + 1 , 4);
551*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.init_qp_minus26 , 7);
552*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.constrained_intra_pred_flag , 1);
553*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.transform_skip_enabled_flag , 1);
554*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.cu_qp_delta_enabled_flag , 1);
555*437bfbebSnyanmisaka
556*437bfbebSnyanmisaka mpp_put_bits(&bp, log2_min_cb_size +
557*437bfbebSnyanmisaka dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size -
558*437bfbebSnyanmisaka dxva_cxt->pp.diff_cu_qp_delta_depth , 3);
559*437bfbebSnyanmisaka
560*437bfbebSnyanmisaka h265h_dbg(H265H_DBG_PPS, "log2_min_cb_size %d %d %d \n", log2_min_cb_size,
561*437bfbebSnyanmisaka dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size, dxva_cxt->pp.diff_cu_qp_delta_depth );
562*437bfbebSnyanmisaka
563*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pps_cb_qp_offset , 5);
564*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pps_cr_qp_offset , 5);
565*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pps_slice_chroma_qp_offsets_present_flag , 1);
566*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.weighted_pred_flag , 1);
567*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.weighted_bipred_flag , 1);
568*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.transquant_bypass_enabled_flag , 1 );
569*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.tiles_enabled_flag , 1 );
570*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.entropy_coding_sync_enabled_flag , 1);
571*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pps_loop_filter_across_slices_enabled_flag , 1);
572*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.loop_filter_across_tiles_enabled_flag , 1);
573*437bfbebSnyanmisaka
574*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.deblocking_filter_override_enabled_flag , 1);
575*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pps_deblocking_filter_disabled_flag , 1);
576*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pps_beta_offset_div2 , 4);
577*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.pps_tc_offset_div2 , 4);
578*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.lists_modification_present_flag , 1);
579*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.log2_parallel_merge_level_minus2 + 2 , 3);
580*437bfbebSnyanmisaka /*slice_segment_header_extension_present_flag need set 0 */
581*437bfbebSnyanmisaka mpp_put_bits(&bp, 0 , 1);
582*437bfbebSnyanmisaka mpp_put_bits(&bp, 0 , 3);
583*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.num_tile_columns_minus1 + 1, 5);
584*437bfbebSnyanmisaka mpp_put_bits(&bp, dxva_cxt->pp.num_tile_rows_minus1 + 1 , 5 );
585*437bfbebSnyanmisaka mpp_put_bits(&bp, 3, 2); //mSps_Pps[i]->mMode
586*437bfbebSnyanmisaka mpp_put_align(&bp, 64, 0xf);
587*437bfbebSnyanmisaka
588*437bfbebSnyanmisaka {
589*437bfbebSnyanmisaka /// tiles info begin
590*437bfbebSnyanmisaka RK_U16 column_width[20];
591*437bfbebSnyanmisaka RK_U16 row_height[22];
592*437bfbebSnyanmisaka
593*437bfbebSnyanmisaka memset(column_width, 0, sizeof(column_width));
594*437bfbebSnyanmisaka memset(row_height, 0, sizeof(row_height));
595*437bfbebSnyanmisaka
596*437bfbebSnyanmisaka if (dxva_cxt->pp.tiles_enabled_flag) {
597*437bfbebSnyanmisaka if (dxva_cxt->pp.uniform_spacing_flag == 0) {
598*437bfbebSnyanmisaka RK_S32 maxcuwidth = dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size + log2_min_cb_size;
599*437bfbebSnyanmisaka RK_S32 ctu_width_in_pic = (width +
600*437bfbebSnyanmisaka (1 << maxcuwidth) - 1) / (1 << maxcuwidth) ;
601*437bfbebSnyanmisaka RK_S32 ctu_height_in_pic = (height +
602*437bfbebSnyanmisaka (1 << maxcuwidth) - 1) / (1 << maxcuwidth) ;
603*437bfbebSnyanmisaka RK_S32 sum = 0;
604*437bfbebSnyanmisaka for (i = 0; i < dxva_cxt->pp.num_tile_columns_minus1; i++) {
605*437bfbebSnyanmisaka column_width[i] = dxva_cxt->pp.column_width_minus1[i] + 1;
606*437bfbebSnyanmisaka sum += column_width[i] ;
607*437bfbebSnyanmisaka }
608*437bfbebSnyanmisaka column_width[i] = ctu_width_in_pic - sum;
609*437bfbebSnyanmisaka
610*437bfbebSnyanmisaka sum = 0;
611*437bfbebSnyanmisaka for (i = 0; i < dxva_cxt->pp.num_tile_rows_minus1; i++) {
612*437bfbebSnyanmisaka row_height[i] = dxva_cxt->pp.row_height_minus1[i] + 1;
613*437bfbebSnyanmisaka sum += row_height[i];
614*437bfbebSnyanmisaka }
615*437bfbebSnyanmisaka row_height[i] = ctu_height_in_pic - sum;
616*437bfbebSnyanmisaka } // end of (pps->uniform_spacing_flag == 0)
617*437bfbebSnyanmisaka else {
618*437bfbebSnyanmisaka
619*437bfbebSnyanmisaka RK_S32 pic_in_cts_width = (width +
620*437bfbebSnyanmisaka (1 << (log2_min_cb_size +
621*437bfbebSnyanmisaka dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size)) - 1)
622*437bfbebSnyanmisaka / (1 << (log2_min_cb_size +
623*437bfbebSnyanmisaka dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size));
624*437bfbebSnyanmisaka RK_S32 pic_in_cts_height = (height +
625*437bfbebSnyanmisaka (1 << (log2_min_cb_size +
626*437bfbebSnyanmisaka dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size)) - 1)
627*437bfbebSnyanmisaka / (1 << (log2_min_cb_size +
628*437bfbebSnyanmisaka dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size));
629*437bfbebSnyanmisaka
630*437bfbebSnyanmisaka for (i = 0; i < dxva_cxt->pp.num_tile_columns_minus1 + 1; i++)
631*437bfbebSnyanmisaka column_width[i] = ((i + 1) * pic_in_cts_width) / (dxva_cxt->pp.num_tile_columns_minus1 + 1) -
632*437bfbebSnyanmisaka (i * pic_in_cts_width) / (dxva_cxt->pp.num_tile_columns_minus1 + 1);
633*437bfbebSnyanmisaka
634*437bfbebSnyanmisaka for (i = 0; i < dxva_cxt->pp.num_tile_rows_minus1 + 1; i++)
635*437bfbebSnyanmisaka row_height[i] = ((i + 1) * pic_in_cts_height) / (dxva_cxt->pp.num_tile_rows_minus1 + 1) -
636*437bfbebSnyanmisaka (i * pic_in_cts_height) / (dxva_cxt->pp.num_tile_rows_minus1 + 1);
637*437bfbebSnyanmisaka }
638*437bfbebSnyanmisaka } // pps->tiles_enabled_flag
639*437bfbebSnyanmisaka else {
640*437bfbebSnyanmisaka RK_S32 MaxCUWidth = (1 << (dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size + log2_min_cb_size));
641*437bfbebSnyanmisaka column_width[0] = (width + MaxCUWidth - 1) / MaxCUWidth;
642*437bfbebSnyanmisaka row_height[0] = (height + MaxCUWidth - 1) / MaxCUWidth;
643*437bfbebSnyanmisaka }
644*437bfbebSnyanmisaka
645*437bfbebSnyanmisaka for (j = 0; j < 20; j++) {
646*437bfbebSnyanmisaka if (column_width[j] > 0)
647*437bfbebSnyanmisaka column_width[j]--;
648*437bfbebSnyanmisaka mpp_put_bits(&bp, column_width[j], 8);
649*437bfbebSnyanmisaka }
650*437bfbebSnyanmisaka
651*437bfbebSnyanmisaka for (j = 0; j < 22; j++) {
652*437bfbebSnyanmisaka if (row_height[j] > 0)
653*437bfbebSnyanmisaka row_height[j]--;
654*437bfbebSnyanmisaka mpp_put_bits(&bp, row_height[j], 8);
655*437bfbebSnyanmisaka }
656*437bfbebSnyanmisaka }
657*437bfbebSnyanmisaka
658*437bfbebSnyanmisaka {
659*437bfbebSnyanmisaka RK_U8 *ptr_scaling = (RK_U8 *)mpp_buffer_get_ptr(reg_ctx->scaling_list_data);
660*437bfbebSnyanmisaka RK_U32 fd = mpp_buffer_get_fd(reg_ctx->scaling_list_data);
661*437bfbebSnyanmisaka
662*437bfbebSnyanmisaka hal_h265d_output_scalinglist_packet(hal, ptr_scaling, dxva);
663*437bfbebSnyanmisaka mpp_put_bits(&bp, fd, 32);
664*437bfbebSnyanmisaka mpp_put_align(&bp, 64, 0xf);
665*437bfbebSnyanmisaka }
666*437bfbebSnyanmisaka
667*437bfbebSnyanmisaka for (i = 0; i < 64; i++)
668*437bfbebSnyanmisaka memcpy(pps_ptr + i * 80, pps_packet, 80);
669*437bfbebSnyanmisaka
670*437bfbebSnyanmisaka #ifdef dump
671*437bfbebSnyanmisaka fwrite(pps_ptr, 1, 80 * 64, fp);
672*437bfbebSnyanmisaka fflush(fp);
673*437bfbebSnyanmisaka #endif
674*437bfbebSnyanmisaka
675*437bfbebSnyanmisaka MPP_FREE(pps_packet);
676*437bfbebSnyanmisaka return 0;
677*437bfbebSnyanmisaka }
678*437bfbebSnyanmisaka
update_stream_buffer(MppBuffer streambuf,HalTaskInfo * syn)679*437bfbebSnyanmisaka static void update_stream_buffer(MppBuffer streambuf, HalTaskInfo *syn)
680*437bfbebSnyanmisaka {
681*437bfbebSnyanmisaka h265d_dxva2_picture_context_t *dxva_cxt =
682*437bfbebSnyanmisaka (h265d_dxva2_picture_context_t *)syn->dec.syntax.data;
683*437bfbebSnyanmisaka RK_U8 *ptr = (RK_U8*)mpp_buffer_get_ptr(streambuf);
684*437bfbebSnyanmisaka RK_U8 bit_left = 0;
685*437bfbebSnyanmisaka RK_U16 start_byte, end_byte, i = 0;
686*437bfbebSnyanmisaka RK_U32 stream_size = dxva_cxt->bitstream_size;
687*437bfbebSnyanmisaka RK_U8 *buf = NULL;
688*437bfbebSnyanmisaka RK_U8 *temp = NULL;
689*437bfbebSnyanmisaka RK_U32 cut_byte = 0, cut_byte_acc = 0;
690*437bfbebSnyanmisaka
691*437bfbebSnyanmisaka for (i = 0; i < dxva_cxt->slice_count; i++) {
692*437bfbebSnyanmisaka if (dxva_cxt->slice_cut_param[i].is_enable) {
693*437bfbebSnyanmisaka
694*437bfbebSnyanmisaka bit_left = 8 - (dxva_cxt->slice_cut_param[i].start_bit & 0x7);
695*437bfbebSnyanmisaka start_byte = dxva_cxt->slice_cut_param[i].start_bit >> 3;
696*437bfbebSnyanmisaka end_byte = (dxva_cxt->slice_cut_param[i].end_bit + 7) >> 3;
697*437bfbebSnyanmisaka buf = ptr + (dxva_cxt->slice_short[i].BSNALunitDataLocation - cut_byte_acc);
698*437bfbebSnyanmisaka temp = buf + start_byte;
699*437bfbebSnyanmisaka
700*437bfbebSnyanmisaka h265h_dbg(H265H_DBG_FUNCTION, "start bit %d start byte[%d] 0x%x end bit %d end byte[%d] 0x%x\n",
701*437bfbebSnyanmisaka dxva_cxt->slice_cut_param[i].start_bit, start_byte, buf[start_byte],
702*437bfbebSnyanmisaka dxva_cxt->slice_cut_param[i].end_bit, end_byte, buf[end_byte]);
703*437bfbebSnyanmisaka if (bit_left < 8) {
704*437bfbebSnyanmisaka *temp = (*temp >> bit_left) << bit_left;
705*437bfbebSnyanmisaka *temp |= 1 << (bit_left - 1);
706*437bfbebSnyanmisaka } else {
707*437bfbebSnyanmisaka *temp = 0x80;
708*437bfbebSnyanmisaka }
709*437bfbebSnyanmisaka if ((dxva_cxt->slice_cut_param[i].end_bit & 0x7) == 0 && buf[end_byte] == 0x80)
710*437bfbebSnyanmisaka end_byte += 1;
711*437bfbebSnyanmisaka
712*437bfbebSnyanmisaka h265h_dbg(H265H_DBG_FUNCTION, "i %d location %d count %d SliceBytesInBuffer %d bitstream_size %d\n",
713*437bfbebSnyanmisaka i, dxva_cxt->slice_short[i].BSNALunitDataLocation, dxva_cxt->slice_count,
714*437bfbebSnyanmisaka dxva_cxt->slice_short[i].SliceBytesInBuffer, dxva_cxt->bitstream_size);
715*437bfbebSnyanmisaka
716*437bfbebSnyanmisaka memmove(buf + start_byte + 1, buf + end_byte,
717*437bfbebSnyanmisaka stream_size - dxva_cxt->slice_short[i].BSNALunitDataLocation - end_byte);
718*437bfbebSnyanmisaka
719*437bfbebSnyanmisaka cut_byte = end_byte - start_byte - 1;
720*437bfbebSnyanmisaka dxva_cxt->slice_short[i].SliceBytesInBuffer -= cut_byte;
721*437bfbebSnyanmisaka dxva_cxt->bitstream_size -= cut_byte;
722*437bfbebSnyanmisaka cut_byte_acc += cut_byte;
723*437bfbebSnyanmisaka }
724*437bfbebSnyanmisaka }
725*437bfbebSnyanmisaka }
726*437bfbebSnyanmisaka
hal_h265d_rkv_gen_regs(void * hal,HalTaskInfo * syn)727*437bfbebSnyanmisaka MPP_RET hal_h265d_rkv_gen_regs(void *hal, HalTaskInfo *syn)
728*437bfbebSnyanmisaka {
729*437bfbebSnyanmisaka RK_S32 i = 0;
730*437bfbebSnyanmisaka RK_S32 stride_y, stride_uv, virstrid_y, virstrid_yuv;
731*437bfbebSnyanmisaka H265d_REGS_t *hw_regs;
732*437bfbebSnyanmisaka RK_S32 ret = MPP_SUCCESS;
733*437bfbebSnyanmisaka MppBuffer streambuf = NULL;
734*437bfbebSnyanmisaka RK_S32 aglin_offset = 0;
735*437bfbebSnyanmisaka RK_S32 valid_ref = -1;
736*437bfbebSnyanmisaka MppBuffer framebuf = NULL;
737*437bfbebSnyanmisaka RK_U32 sw_ref_valid = 0;
738*437bfbebSnyanmisaka RK_U32 stream_buf_size = 0;
739*437bfbebSnyanmisaka HalH265dCtx *reg_ctx = ( HalH265dCtx *)hal;
740*437bfbebSnyanmisaka MppFrame mframe;
741*437bfbebSnyanmisaka
742*437bfbebSnyanmisaka if (syn->dec.flags.parse_err ||
743*437bfbebSnyanmisaka (syn->dec.flags.ref_err && !reg_ctx->cfg->base.disable_error)) {
744*437bfbebSnyanmisaka h265h_dbg(H265H_DBG_TASK_ERR, "%s found task error\n", __FUNCTION__);
745*437bfbebSnyanmisaka return MPP_OK;
746*437bfbebSnyanmisaka }
747*437bfbebSnyanmisaka
748*437bfbebSnyanmisaka h265d_dxva2_picture_context_t *dxva_cxt =
749*437bfbebSnyanmisaka (h265d_dxva2_picture_context_t *)syn->dec.syntax.data;
750*437bfbebSnyanmisaka
751*437bfbebSnyanmisaka void *rps_ptr = NULL;
752*437bfbebSnyanmisaka if (reg_ctx ->fast_mode) {
753*437bfbebSnyanmisaka for (i = 0; i < MAX_GEN_REG; i++) {
754*437bfbebSnyanmisaka if (!reg_ctx->g_buf[i].use_flag) {
755*437bfbebSnyanmisaka syn->dec.reg_index = i;
756*437bfbebSnyanmisaka reg_ctx->rps_data = reg_ctx->g_buf[i].rps_data;
757*437bfbebSnyanmisaka reg_ctx->scaling_list_data =
758*437bfbebSnyanmisaka reg_ctx->g_buf[i].scaling_list_data;
759*437bfbebSnyanmisaka reg_ctx->pps_data = reg_ctx->g_buf[i].pps_data;
760*437bfbebSnyanmisaka reg_ctx->hw_regs = reg_ctx->g_buf[i].hw_regs;
761*437bfbebSnyanmisaka reg_ctx->g_buf[i].use_flag = 1;
762*437bfbebSnyanmisaka break;
763*437bfbebSnyanmisaka }
764*437bfbebSnyanmisaka }
765*437bfbebSnyanmisaka if (i == MAX_GEN_REG) {
766*437bfbebSnyanmisaka mpp_err("hevc rps buf all used");
767*437bfbebSnyanmisaka return MPP_ERR_NOMEM;
768*437bfbebSnyanmisaka }
769*437bfbebSnyanmisaka } else {
770*437bfbebSnyanmisaka syn->dec.reg_index = 0;
771*437bfbebSnyanmisaka }
772*437bfbebSnyanmisaka rps_ptr = mpp_buffer_get_ptr(reg_ctx->rps_data);
773*437bfbebSnyanmisaka if (NULL == rps_ptr) {
774*437bfbebSnyanmisaka
775*437bfbebSnyanmisaka mpp_err("rps_data get ptr error");
776*437bfbebSnyanmisaka return MPP_ERR_NOMEM;
777*437bfbebSnyanmisaka }
778*437bfbebSnyanmisaka
779*437bfbebSnyanmisaka
780*437bfbebSnyanmisaka if (syn->dec.syntax.data == NULL) {
781*437bfbebSnyanmisaka mpp_err("%s:%s:%d dxva is NULL", __FILE__, __FUNCTION__, __LINE__);
782*437bfbebSnyanmisaka return MPP_ERR_NULL_PTR;
783*437bfbebSnyanmisaka }
784*437bfbebSnyanmisaka
785*437bfbebSnyanmisaka /* output pps */
786*437bfbebSnyanmisaka if (reg_ctx->is_v345) {
787*437bfbebSnyanmisaka hal_h265d_v345_output_pps_packet(hal, syn->dec.syntax.data);
788*437bfbebSnyanmisaka } else {
789*437bfbebSnyanmisaka hal_h265d_output_pps_packet(hal, syn->dec.syntax.data);
790*437bfbebSnyanmisaka }
791*437bfbebSnyanmisaka
792*437bfbebSnyanmisaka if (NULL == reg_ctx->hw_regs) {
793*437bfbebSnyanmisaka return MPP_ERR_NULL_PTR;
794*437bfbebSnyanmisaka }
795*437bfbebSnyanmisaka
796*437bfbebSnyanmisaka hw_regs = (H265d_REGS_t*)reg_ctx->hw_regs;
797*437bfbebSnyanmisaka memset(hw_regs, 0, sizeof(H265d_REGS_t));
798*437bfbebSnyanmisaka
799*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->slots, dxva_cxt->pp.CurrPic.Index7Bits,
800*437bfbebSnyanmisaka SLOT_FRAME_PTR, &mframe);
801*437bfbebSnyanmisaka stride_y = mpp_frame_get_hor_stride(mframe);
802*437bfbebSnyanmisaka stride_uv = mpp_frame_get_hor_stride(mframe);
803*437bfbebSnyanmisaka virstrid_y = mpp_frame_get_ver_stride(mframe) * stride_y;
804*437bfbebSnyanmisaka virstrid_yuv = virstrid_y + stride_uv * mpp_frame_get_ver_stride(mframe) / 2;
805*437bfbebSnyanmisaka
806*437bfbebSnyanmisaka hw_regs->sw_picparameter.sw_slice_num = dxva_cxt->slice_count;
807*437bfbebSnyanmisaka hw_regs->sw_picparameter.sw_y_hor_virstride = stride_y >> 4;
808*437bfbebSnyanmisaka hw_regs->sw_picparameter.sw_uv_hor_virstride = stride_uv >> 4;
809*437bfbebSnyanmisaka hw_regs->sw_y_virstride = virstrid_y >> 4;
810*437bfbebSnyanmisaka hw_regs->sw_yuv_virstride = virstrid_yuv >> 4;
811*437bfbebSnyanmisaka hw_regs->sw_sysctrl.sw_h26x_rps_mode = 0;
812*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->slots, dxva_cxt->pp.CurrPic.Index7Bits,
813*437bfbebSnyanmisaka SLOT_BUFFER, &framebuf);
814*437bfbebSnyanmisaka hw_regs->sw_decout_base = mpp_buffer_get_fd(framebuf); //just index need map
815*437bfbebSnyanmisaka
816*437bfbebSnyanmisaka /*if out_base is equal to zero it means this frame may error
817*437bfbebSnyanmisaka we return directly add by csy*/
818*437bfbebSnyanmisaka
819*437bfbebSnyanmisaka if (hw_regs->sw_decout_base == 0) {
820*437bfbebSnyanmisaka return 0;
821*437bfbebSnyanmisaka }
822*437bfbebSnyanmisaka
823*437bfbebSnyanmisaka hw_regs->sw_cur_poc = dxva_cxt->pp.CurrPicOrderCntVal;
824*437bfbebSnyanmisaka
825*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->packet_slots, syn->dec.input, SLOT_BUFFER,
826*437bfbebSnyanmisaka &streambuf);
827*437bfbebSnyanmisaka
828*437bfbebSnyanmisaka if ( dxva_cxt->bitstream == NULL) {
829*437bfbebSnyanmisaka dxva_cxt->bitstream = mpp_buffer_get_ptr(streambuf);
830*437bfbebSnyanmisaka }
831*437bfbebSnyanmisaka if (reg_ctx->is_v345) {
832*437bfbebSnyanmisaka #ifdef HW_RPS
833*437bfbebSnyanmisaka hw_regs->sw_sysctrl.sw_wait_reset_en = 1;
834*437bfbebSnyanmisaka hw_regs->v345_reg_ends.reg064_mvc0.refp_layer_same_with_cur = 0xffff;
835*437bfbebSnyanmisaka hal_h265d_slice_hw_rps(syn->dec.syntax.data, rps_ptr, reg_ctx->sw_rps_buf, reg_ctx->fast_mode);
836*437bfbebSnyanmisaka #else
837*437bfbebSnyanmisaka hw_regs->sw_sysctrl.sw_h26x_rps_mode = 1;
838*437bfbebSnyanmisaka hal_h265d_slice_output_rps(syn->dec.syntax.data, rps_ptr);
839*437bfbebSnyanmisaka #endif
840*437bfbebSnyanmisaka } else {
841*437bfbebSnyanmisaka hal_h265d_slice_output_rps(syn->dec.syntax.data, rps_ptr);
842*437bfbebSnyanmisaka }
843*437bfbebSnyanmisaka
844*437bfbebSnyanmisaka if (dxva_cxt->pp.slice_segment_header_extension_present_flag && !reg_ctx->is_v345) {
845*437bfbebSnyanmisaka update_stream_buffer(streambuf, syn);
846*437bfbebSnyanmisaka mpp_buffer_sync_end(streambuf);
847*437bfbebSnyanmisaka }
848*437bfbebSnyanmisaka
849*437bfbebSnyanmisaka hw_regs->sw_cabactbl_base = mpp_buffer_get_fd(reg_ctx->cabac_table_data);
850*437bfbebSnyanmisaka hw_regs->sw_pps_base = mpp_buffer_get_fd(reg_ctx->pps_data);
851*437bfbebSnyanmisaka hw_regs->sw_rps_base = mpp_buffer_get_fd(reg_ctx->rps_data);
852*437bfbebSnyanmisaka hw_regs->sw_strm_rlc_base = mpp_buffer_get_fd(streambuf);
853*437bfbebSnyanmisaka stream_buf_size = mpp_buffer_get_size(streambuf);
854*437bfbebSnyanmisaka
855*437bfbebSnyanmisaka hw_regs->sw_stream_len = ((dxva_cxt->bitstream_size + 15)
856*437bfbebSnyanmisaka & (~15)) + 64;
857*437bfbebSnyanmisaka hw_regs->sw_stream_len = stream_buf_size > hw_regs->sw_stream_len ?
858*437bfbebSnyanmisaka hw_regs->sw_stream_len : stream_buf_size;
859*437bfbebSnyanmisaka
860*437bfbebSnyanmisaka aglin_offset = hw_regs->sw_stream_len - dxva_cxt->bitstream_size;
861*437bfbebSnyanmisaka if (aglin_offset > 0) {
862*437bfbebSnyanmisaka memset((void *)(dxva_cxt->bitstream + dxva_cxt->bitstream_size), 0,
863*437bfbebSnyanmisaka aglin_offset);
864*437bfbebSnyanmisaka }
865*437bfbebSnyanmisaka hw_regs->sw_interrupt.sw_dec_e = 1;
866*437bfbebSnyanmisaka hw_regs->sw_interrupt.sw_dec_timeout_e = 1;
867*437bfbebSnyanmisaka hw_regs->sw_interrupt.sw_wr_ddr_align_en = dxva_cxt->pp.tiles_enabled_flag
868*437bfbebSnyanmisaka ? 0 : 1;
869*437bfbebSnyanmisaka
870*437bfbebSnyanmisaka ///find s->rps_model[i] position, and set register
871*437bfbebSnyanmisaka hw_regs->cabac_error_en = 0xfdfffffd;
872*437bfbebSnyanmisaka hw_regs->rkv_reg_ends.extern_error_en = 0x30000000;
873*437bfbebSnyanmisaka
874*437bfbebSnyanmisaka valid_ref = hw_regs->sw_decout_base;
875*437bfbebSnyanmisaka for (i = 0; i < (RK_S32)MPP_ARRAY_ELEMS(dxva_cxt->pp.RefPicList); i++) {
876*437bfbebSnyanmisaka if (dxva_cxt->pp.RefPicList[i].bPicEntry != 0xff &&
877*437bfbebSnyanmisaka dxva_cxt->pp.RefPicList[i].bPicEntry != 0x7f) {
878*437bfbebSnyanmisaka hw_regs->sw_refer_poc[i] = dxva_cxt->pp.PicOrderCntValList[i];
879*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->slots,
880*437bfbebSnyanmisaka dxva_cxt->pp.RefPicList[i].Index7Bits,
881*437bfbebSnyanmisaka SLOT_BUFFER, &framebuf);
882*437bfbebSnyanmisaka if (framebuf != NULL) {
883*437bfbebSnyanmisaka hw_regs->sw_refer_base[i] = mpp_buffer_get_fd(framebuf);
884*437bfbebSnyanmisaka valid_ref = hw_regs->sw_refer_base[i];
885*437bfbebSnyanmisaka } else {
886*437bfbebSnyanmisaka hw_regs->sw_refer_base[i] = valid_ref;
887*437bfbebSnyanmisaka }
888*437bfbebSnyanmisaka sw_ref_valid |= (1 << i);
889*437bfbebSnyanmisaka } else {
890*437bfbebSnyanmisaka hw_regs->sw_refer_base[i] = hw_regs->sw_decout_base;
891*437bfbebSnyanmisaka }
892*437bfbebSnyanmisaka }
893*437bfbebSnyanmisaka
894*437bfbebSnyanmisaka if (sw_ref_valid) {
895*437bfbebSnyanmisaka mpp_dev_set_reg_offset(reg_ctx->dev, 10, sw_ref_valid & 0xf);
896*437bfbebSnyanmisaka mpp_dev_set_reg_offset(reg_ctx->dev, 11, ((sw_ref_valid >> 4) & 0xf));
897*437bfbebSnyanmisaka mpp_dev_set_reg_offset(reg_ctx->dev, 12, ((sw_ref_valid >> 8) & 0xf));
898*437bfbebSnyanmisaka mpp_dev_set_reg_offset(reg_ctx->dev, 13, ((sw_ref_valid >> 12) & 0xf));
899*437bfbebSnyanmisaka }
900*437bfbebSnyanmisaka mpp_buffer_sync_end(reg_ctx->scaling_list_data);
901*437bfbebSnyanmisaka mpp_buffer_sync_end(reg_ctx->pps_data);
902*437bfbebSnyanmisaka mpp_buffer_sync_end(reg_ctx->rps_data);
903*437bfbebSnyanmisaka
904*437bfbebSnyanmisaka return ret;
905*437bfbebSnyanmisaka }
906*437bfbebSnyanmisaka
hal_h265d_rkv_start(void * hal,HalTaskInfo * task)907*437bfbebSnyanmisaka MPP_RET hal_h265d_rkv_start(void *hal, HalTaskInfo *task)
908*437bfbebSnyanmisaka {
909*437bfbebSnyanmisaka MPP_RET ret = MPP_OK;
910*437bfbebSnyanmisaka H265d_REGS_t *hw_regs = NULL;
911*437bfbebSnyanmisaka HalH265dCtx *reg_ctx = (HalH265dCtx *)hal;
912*437bfbebSnyanmisaka RK_S32 index = task->dec.reg_index;
913*437bfbebSnyanmisaka
914*437bfbebSnyanmisaka RK_U32 i;
915*437bfbebSnyanmisaka
916*437bfbebSnyanmisaka if (task->dec.flags.parse_err ||
917*437bfbebSnyanmisaka (task->dec.flags.ref_err && !reg_ctx->cfg->base.disable_error)) {
918*437bfbebSnyanmisaka h265h_dbg(H265H_DBG_TASK_ERR, "%s found task error\n", __FUNCTION__);
919*437bfbebSnyanmisaka return MPP_OK;
920*437bfbebSnyanmisaka }
921*437bfbebSnyanmisaka
922*437bfbebSnyanmisaka if (reg_ctx->fast_mode) {
923*437bfbebSnyanmisaka hw_regs = ( H265d_REGS_t *)reg_ctx->g_buf[index].hw_regs;
924*437bfbebSnyanmisaka } else {
925*437bfbebSnyanmisaka hw_regs = ( H265d_REGS_t *)reg_ctx->hw_regs;
926*437bfbebSnyanmisaka }
927*437bfbebSnyanmisaka
928*437bfbebSnyanmisaka if (hw_regs == NULL) {
929*437bfbebSnyanmisaka mpp_err("hal_h265d_start hw_regs is NULL");
930*437bfbebSnyanmisaka return MPP_ERR_NULL_PTR;
931*437bfbebSnyanmisaka }
932*437bfbebSnyanmisaka
933*437bfbebSnyanmisaka do {
934*437bfbebSnyanmisaka MppDevRegWrCfg wr_cfg;
935*437bfbebSnyanmisaka MppDevRegRdCfg rd_cfg;
936*437bfbebSnyanmisaka
937*437bfbebSnyanmisaka RK_U32 reg_size = (reg_ctx->is_v341 || reg_ctx->is_v345) ? V345_HEVC_REGISTERS :
938*437bfbebSnyanmisaka (reg_ctx->client_type == VPU_CLIENT_RKVDEC) ?
939*437bfbebSnyanmisaka RKVDEC_V1_REGISTERS : RKVDEC_HEVC_REGISTERS;
940*437bfbebSnyanmisaka
941*437bfbebSnyanmisaka reg_size *= sizeof(RK_U32);
942*437bfbebSnyanmisaka
943*437bfbebSnyanmisaka wr_cfg.reg = hw_regs;
944*437bfbebSnyanmisaka wr_cfg.size = reg_size;
945*437bfbebSnyanmisaka wr_cfg.offset = 0;
946*437bfbebSnyanmisaka
947*437bfbebSnyanmisaka if (hal_h265d_debug & H265H_DBG_REG) {
948*437bfbebSnyanmisaka for (i = 0; i < reg_size / sizeof(RK_U32); i++)
949*437bfbebSnyanmisaka h265h_dbg(H265H_DBG_REG, "RK_HEVC_DEC: regs[%02d]=%08X\n", i, ((RK_U32 *)hw_regs)[i]);
950*437bfbebSnyanmisaka }
951*437bfbebSnyanmisaka
952*437bfbebSnyanmisaka ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_REG_WR, &wr_cfg);
953*437bfbebSnyanmisaka if (ret) {
954*437bfbebSnyanmisaka mpp_err_f("set register write failed %d\n", ret);
955*437bfbebSnyanmisaka break;
956*437bfbebSnyanmisaka }
957*437bfbebSnyanmisaka
958*437bfbebSnyanmisaka rd_cfg.reg = hw_regs;
959*437bfbebSnyanmisaka rd_cfg.size = reg_size;
960*437bfbebSnyanmisaka rd_cfg.offset = 0;
961*437bfbebSnyanmisaka
962*437bfbebSnyanmisaka ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_REG_RD, &rd_cfg);
963*437bfbebSnyanmisaka if (ret) {
964*437bfbebSnyanmisaka mpp_err_f("set register read failed %d\n", ret);
965*437bfbebSnyanmisaka break;
966*437bfbebSnyanmisaka }
967*437bfbebSnyanmisaka
968*437bfbebSnyanmisaka ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_CMD_SEND, NULL);
969*437bfbebSnyanmisaka if (ret) {
970*437bfbebSnyanmisaka mpp_err_f("send cmd failed %d\n", ret);
971*437bfbebSnyanmisaka break;
972*437bfbebSnyanmisaka }
973*437bfbebSnyanmisaka } while (0);
974*437bfbebSnyanmisaka
975*437bfbebSnyanmisaka return ret;
976*437bfbebSnyanmisaka }
977*437bfbebSnyanmisaka
hal_h265d_rkv_wait(void * hal,HalTaskInfo * task)978*437bfbebSnyanmisaka MPP_RET hal_h265d_rkv_wait(void *hal, HalTaskInfo *task)
979*437bfbebSnyanmisaka {
980*437bfbebSnyanmisaka MPP_RET ret = MPP_OK;
981*437bfbebSnyanmisaka RK_S32 index = task->dec.reg_index;
982*437bfbebSnyanmisaka HalH265dCtx *reg_ctx = (HalH265dCtx *)hal;
983*437bfbebSnyanmisaka H265d_REGS_t *hw_regs = NULL;
984*437bfbebSnyanmisaka RK_S32 i;
985*437bfbebSnyanmisaka
986*437bfbebSnyanmisaka if (reg_ctx->fast_mode) {
987*437bfbebSnyanmisaka hw_regs = ( H265d_REGS_t *)reg_ctx->g_buf[index].hw_regs;
988*437bfbebSnyanmisaka } else {
989*437bfbebSnyanmisaka hw_regs = ( H265d_REGS_t *)reg_ctx->hw_regs;
990*437bfbebSnyanmisaka }
991*437bfbebSnyanmisaka
992*437bfbebSnyanmisaka if (task->dec.flags.parse_err ||
993*437bfbebSnyanmisaka (task->dec.flags.ref_err && !reg_ctx->cfg->base.disable_error)) {
994*437bfbebSnyanmisaka h265h_dbg(H265H_DBG_TASK_ERR, "%s found task error\n", __FUNCTION__);
995*437bfbebSnyanmisaka goto ERR_PROC;
996*437bfbebSnyanmisaka }
997*437bfbebSnyanmisaka
998*437bfbebSnyanmisaka ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_CMD_POLL, NULL);
999*437bfbebSnyanmisaka if (ret)
1000*437bfbebSnyanmisaka mpp_err_f("poll cmd failed %d\n", ret);
1001*437bfbebSnyanmisaka
1002*437bfbebSnyanmisaka ERR_PROC:
1003*437bfbebSnyanmisaka if (task->dec.flags.parse_err ||
1004*437bfbebSnyanmisaka task->dec.flags.ref_err ||
1005*437bfbebSnyanmisaka hw_regs->sw_interrupt.sw_dec_error_sta ||
1006*437bfbebSnyanmisaka hw_regs->sw_interrupt.sw_dec_timeout_sta ||
1007*437bfbebSnyanmisaka hw_regs->sw_interrupt.sw_dec_empty_sta) {
1008*437bfbebSnyanmisaka if (!reg_ctx->fast_mode) {
1009*437bfbebSnyanmisaka if (reg_ctx->dec_cb)
1010*437bfbebSnyanmisaka mpp_callback(reg_ctx->dec_cb, &task->dec);
1011*437bfbebSnyanmisaka } else {
1012*437bfbebSnyanmisaka MppFrame mframe = NULL;
1013*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->slots, task->dec.output,
1014*437bfbebSnyanmisaka SLOT_FRAME_PTR, &mframe);
1015*437bfbebSnyanmisaka if (mframe) {
1016*437bfbebSnyanmisaka reg_ctx->fast_mode_err_found = 1;
1017*437bfbebSnyanmisaka mpp_frame_set_errinfo(mframe, 1);
1018*437bfbebSnyanmisaka }
1019*437bfbebSnyanmisaka }
1020*437bfbebSnyanmisaka } else {
1021*437bfbebSnyanmisaka if (reg_ctx->fast_mode && reg_ctx->fast_mode_err_found) {
1022*437bfbebSnyanmisaka for (i = 0; i < (RK_S32)MPP_ARRAY_ELEMS(task->dec.refer); i++) {
1023*437bfbebSnyanmisaka if (task->dec.refer[i] >= 0) {
1024*437bfbebSnyanmisaka MppFrame frame_ref = NULL;
1025*437bfbebSnyanmisaka
1026*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->slots, task->dec.refer[i],
1027*437bfbebSnyanmisaka SLOT_FRAME_PTR, &frame_ref);
1028*437bfbebSnyanmisaka h265h_dbg(H265H_DBG_FAST_ERR, "refer[%d] %d frame %p\n",
1029*437bfbebSnyanmisaka i, task->dec.refer[i], frame_ref);
1030*437bfbebSnyanmisaka if (frame_ref && mpp_frame_get_errinfo(frame_ref)) {
1031*437bfbebSnyanmisaka MppFrame frame_out = NULL;
1032*437bfbebSnyanmisaka mpp_buf_slot_get_prop(reg_ctx->slots, task->dec.output,
1033*437bfbebSnyanmisaka SLOT_FRAME_PTR, &frame_out);
1034*437bfbebSnyanmisaka mpp_frame_set_errinfo(frame_out, 1);
1035*437bfbebSnyanmisaka break;
1036*437bfbebSnyanmisaka }
1037*437bfbebSnyanmisaka }
1038*437bfbebSnyanmisaka }
1039*437bfbebSnyanmisaka }
1040*437bfbebSnyanmisaka }
1041*437bfbebSnyanmisaka
1042*437bfbebSnyanmisaka if (hal_h265d_debug & H265H_DBG_REG) {
1043*437bfbebSnyanmisaka h265h_dbg(H265H_DBG_REG, "RK_HEVC_DEC: regs[1]=0x%08X, regs[45]=0x%08x\n", ((RK_U32 *)hw_regs)[1], ((RK_U32 *)hw_regs)[45]);
1044*437bfbebSnyanmisaka }
1045*437bfbebSnyanmisaka
1046*437bfbebSnyanmisaka if (reg_ctx->fast_mode) {
1047*437bfbebSnyanmisaka reg_ctx->g_buf[index].use_flag = 0;
1048*437bfbebSnyanmisaka }
1049*437bfbebSnyanmisaka
1050*437bfbebSnyanmisaka return ret;
1051*437bfbebSnyanmisaka }
1052*437bfbebSnyanmisaka
hal_h265d_rkv_reset(void * hal)1053*437bfbebSnyanmisaka MPP_RET hal_h265d_rkv_reset(void *hal)
1054*437bfbebSnyanmisaka {
1055*437bfbebSnyanmisaka MPP_RET ret = MPP_OK;
1056*437bfbebSnyanmisaka HalH265dCtx *p_hal = (HalH265dCtx *)hal;
1057*437bfbebSnyanmisaka
1058*437bfbebSnyanmisaka p_hal->fast_mode_err_found = 0;
1059*437bfbebSnyanmisaka
1060*437bfbebSnyanmisaka return ret;
1061*437bfbebSnyanmisaka }
1062*437bfbebSnyanmisaka
1063*437bfbebSnyanmisaka const MppHalApi hal_h265d_rkv = {
1064*437bfbebSnyanmisaka .name = "h265d_rkdec",
1065*437bfbebSnyanmisaka .type = MPP_CTX_DEC,
1066*437bfbebSnyanmisaka .coding = MPP_VIDEO_CodingHEVC,
1067*437bfbebSnyanmisaka .ctx_size = sizeof(HalH265dCtx),
1068*437bfbebSnyanmisaka .flag = 0,
1069*437bfbebSnyanmisaka .init = hal_h265d_rkv_init,
1070*437bfbebSnyanmisaka .deinit = hal_h265d_rkv_deinit,
1071*437bfbebSnyanmisaka .reg_gen = hal_h265d_rkv_gen_regs,
1072*437bfbebSnyanmisaka .start = hal_h265d_rkv_start,
1073*437bfbebSnyanmisaka .wait = hal_h265d_rkv_wait,
1074*437bfbebSnyanmisaka .reset = hal_h265d_rkv_reset,
1075*437bfbebSnyanmisaka .flush = NULL,
1076*437bfbebSnyanmisaka .control = NULL,
1077*437bfbebSnyanmisaka };
1078