xref: /rockchip-linux_mpp/mpp/hal/rkdec/h265d/hal_h265d_rkv.c (revision 437bfbeb9567cca9cd9080e3f6954aa9d6a94f18)
1*437bfbebSnyanmisaka /*
2*437bfbebSnyanmisaka  * Copyright 2020 Rockchip Electronics Co. LTD
3*437bfbebSnyanmisaka  *
4*437bfbebSnyanmisaka  * Licensed under the Apache License, Version 2.0 (the "License");
5*437bfbebSnyanmisaka  * you may not use this file except in compliance with the License.
6*437bfbebSnyanmisaka  * You may obtain a copy of the License at
7*437bfbebSnyanmisaka  *
8*437bfbebSnyanmisaka  *      http://www.apache.org/licenses/LICENSE-2.0
9*437bfbebSnyanmisaka  *
10*437bfbebSnyanmisaka  * Unless required by applicable law or agreed to in writing, software
11*437bfbebSnyanmisaka  * distributed under the License is distributed on an "AS IS" BASIS,
12*437bfbebSnyanmisaka  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13*437bfbebSnyanmisaka  * See the License for the specific language governing permissions and
14*437bfbebSnyanmisaka  * limitations under the License.
15*437bfbebSnyanmisaka  */
16*437bfbebSnyanmisaka 
17*437bfbebSnyanmisaka #define MODULE_TAG "hal_h265d_rkv"
18*437bfbebSnyanmisaka 
19*437bfbebSnyanmisaka #include <stdio.h>
20*437bfbebSnyanmisaka #include <string.h>
21*437bfbebSnyanmisaka 
22*437bfbebSnyanmisaka #include "mpp_mem.h"
23*437bfbebSnyanmisaka #include "mpp_bitread.h"
24*437bfbebSnyanmisaka #include "mpp_bitput.h"
25*437bfbebSnyanmisaka 
26*437bfbebSnyanmisaka #include "hal_h265d_debug.h"
27*437bfbebSnyanmisaka #include "hal_h265d_ctx.h"
28*437bfbebSnyanmisaka #include "hal_h265d_com.h"
29*437bfbebSnyanmisaka #include "hal_h265d_rkv.h"
30*437bfbebSnyanmisaka #include "hal_h265d_rkv_reg.h"
31*437bfbebSnyanmisaka #include "h265d_syntax.h"
32*437bfbebSnyanmisaka 
33*437bfbebSnyanmisaka /* #define dump */
34*437bfbebSnyanmisaka #ifdef dump
35*437bfbebSnyanmisaka static FILE *fp = NULL;
36*437bfbebSnyanmisaka #endif
37*437bfbebSnyanmisaka #define HW_RPS
38*437bfbebSnyanmisaka 
39*437bfbebSnyanmisaka #define PPS_SIZE                (96 * 64)
40*437bfbebSnyanmisaka 
hal_h265d_alloc_res(void * hal)41*437bfbebSnyanmisaka static MPP_RET hal_h265d_alloc_res(void *hal)
42*437bfbebSnyanmisaka {
43*437bfbebSnyanmisaka     RK_S32 i = 0;
44*437bfbebSnyanmisaka     RK_S32 ret = 0;
45*437bfbebSnyanmisaka     HalH265dCtx *reg_ctx = (HalH265dCtx *)hal;
46*437bfbebSnyanmisaka     if (reg_ctx->fast_mode) {
47*437bfbebSnyanmisaka         for (i = 0; i < MAX_GEN_REG; i++) {
48*437bfbebSnyanmisaka             reg_ctx->g_buf[i].hw_regs =
49*437bfbebSnyanmisaka                 mpp_calloc_size(void, sizeof(H265d_REGS_t));
50*437bfbebSnyanmisaka             ret = mpp_buffer_get(reg_ctx->group,
51*437bfbebSnyanmisaka                                  &reg_ctx->g_buf[i].scaling_list_data,
52*437bfbebSnyanmisaka                                  SCALING_LIST_SIZE);
53*437bfbebSnyanmisaka             if (ret) {
54*437bfbebSnyanmisaka                 mpp_err("h265d scaling_list_data get buffer failed\n");
55*437bfbebSnyanmisaka                 return ret;
56*437bfbebSnyanmisaka             }
57*437bfbebSnyanmisaka 
58*437bfbebSnyanmisaka             ret = mpp_buffer_get(reg_ctx->group, &reg_ctx->g_buf[i].pps_data,
59*437bfbebSnyanmisaka                                  PPS_SIZE);
60*437bfbebSnyanmisaka             if (ret) {
61*437bfbebSnyanmisaka                 mpp_err("h265d pps_data get buffer failed\n");
62*437bfbebSnyanmisaka                 return ret;
63*437bfbebSnyanmisaka             }
64*437bfbebSnyanmisaka 
65*437bfbebSnyanmisaka             ret = mpp_buffer_get(reg_ctx->group, &reg_ctx->g_buf[i].rps_data,
66*437bfbebSnyanmisaka                                  RPS_SIZE);
67*437bfbebSnyanmisaka             if (ret) {
68*437bfbebSnyanmisaka                 mpp_err("h265d rps_data get buffer failed\n");
69*437bfbebSnyanmisaka                 return ret;
70*437bfbebSnyanmisaka             }
71*437bfbebSnyanmisaka         }
72*437bfbebSnyanmisaka     } else {
73*437bfbebSnyanmisaka         reg_ctx->hw_regs = mpp_calloc_size(void, sizeof(H265d_REGS_t));
74*437bfbebSnyanmisaka         ret = mpp_buffer_get(reg_ctx->group, &reg_ctx->scaling_list_data,
75*437bfbebSnyanmisaka                              SCALING_LIST_SIZE);
76*437bfbebSnyanmisaka         if (ret) {
77*437bfbebSnyanmisaka             mpp_err("h265d scaling_list_data get buffer failed\n");
78*437bfbebSnyanmisaka             return ret;
79*437bfbebSnyanmisaka         }
80*437bfbebSnyanmisaka 
81*437bfbebSnyanmisaka         ret = mpp_buffer_get(reg_ctx->group, &reg_ctx->pps_data, PPS_SIZE);
82*437bfbebSnyanmisaka         if (ret) {
83*437bfbebSnyanmisaka             mpp_err("h265d pps_data get buffer failed\n");
84*437bfbebSnyanmisaka             return ret;
85*437bfbebSnyanmisaka         }
86*437bfbebSnyanmisaka 
87*437bfbebSnyanmisaka         ret = mpp_buffer_get(reg_ctx->group, &reg_ctx->rps_data, RPS_SIZE);
88*437bfbebSnyanmisaka         if (ret) {
89*437bfbebSnyanmisaka             mpp_err("h265d rps_data get buffer failed\n");
90*437bfbebSnyanmisaka             return ret;
91*437bfbebSnyanmisaka         }
92*437bfbebSnyanmisaka 
93*437bfbebSnyanmisaka     }
94*437bfbebSnyanmisaka     return MPP_OK;
95*437bfbebSnyanmisaka }
96*437bfbebSnyanmisaka 
hal_h265d_release_res(void * hal)97*437bfbebSnyanmisaka static MPP_RET hal_h265d_release_res(void *hal)
98*437bfbebSnyanmisaka {
99*437bfbebSnyanmisaka     RK_S32 ret = 0;
100*437bfbebSnyanmisaka     HalH265dCtx *reg_ctx = ( HalH265dCtx *)hal;
101*437bfbebSnyanmisaka     RK_S32 i = 0;
102*437bfbebSnyanmisaka     if (reg_ctx->fast_mode) {
103*437bfbebSnyanmisaka         for (i = 0; i < MAX_GEN_REG; i++) {
104*437bfbebSnyanmisaka             if (reg_ctx->g_buf[i].scaling_list_data) {
105*437bfbebSnyanmisaka                 ret = mpp_buffer_put(reg_ctx->g_buf[i].scaling_list_data);
106*437bfbebSnyanmisaka                 if (ret) {
107*437bfbebSnyanmisaka                     mpp_err("h265d scaling_list_data free buffer failed\n");
108*437bfbebSnyanmisaka                     return ret;
109*437bfbebSnyanmisaka                 }
110*437bfbebSnyanmisaka             }
111*437bfbebSnyanmisaka             if (reg_ctx->g_buf[i].pps_data) {
112*437bfbebSnyanmisaka                 ret = mpp_buffer_put(reg_ctx->g_buf[i].pps_data);
113*437bfbebSnyanmisaka                 if (ret) {
114*437bfbebSnyanmisaka                     mpp_err("h265d pps_data free buffer failed\n");
115*437bfbebSnyanmisaka                     return ret;
116*437bfbebSnyanmisaka                 }
117*437bfbebSnyanmisaka             }
118*437bfbebSnyanmisaka 
119*437bfbebSnyanmisaka             if (reg_ctx->g_buf[i].rps_data) {
120*437bfbebSnyanmisaka                 ret = mpp_buffer_put(reg_ctx->g_buf[i].rps_data);
121*437bfbebSnyanmisaka                 if (ret) {
122*437bfbebSnyanmisaka                     mpp_err("h265d rps_data free buffer failed\n");
123*437bfbebSnyanmisaka                     return ret;
124*437bfbebSnyanmisaka                 }
125*437bfbebSnyanmisaka             }
126*437bfbebSnyanmisaka 
127*437bfbebSnyanmisaka             if (reg_ctx->g_buf[i].hw_regs) {
128*437bfbebSnyanmisaka                 mpp_free(reg_ctx->g_buf[i].hw_regs);
129*437bfbebSnyanmisaka                 reg_ctx->g_buf[i].hw_regs = NULL;
130*437bfbebSnyanmisaka             }
131*437bfbebSnyanmisaka         }
132*437bfbebSnyanmisaka     } else {
133*437bfbebSnyanmisaka         if (reg_ctx->scaling_list_data) {
134*437bfbebSnyanmisaka             ret = mpp_buffer_put(reg_ctx->scaling_list_data);
135*437bfbebSnyanmisaka             if (ret) {
136*437bfbebSnyanmisaka                 mpp_err("h265d scaling_list_data free buffer failed\n");
137*437bfbebSnyanmisaka                 return ret;
138*437bfbebSnyanmisaka             }
139*437bfbebSnyanmisaka         }
140*437bfbebSnyanmisaka         if (reg_ctx->pps_data) {
141*437bfbebSnyanmisaka             ret = mpp_buffer_put(reg_ctx->pps_data);
142*437bfbebSnyanmisaka             if (ret) {
143*437bfbebSnyanmisaka                 mpp_err("h265d pps_data free buffer failed\n");
144*437bfbebSnyanmisaka                 return ret;
145*437bfbebSnyanmisaka             }
146*437bfbebSnyanmisaka         }
147*437bfbebSnyanmisaka 
148*437bfbebSnyanmisaka         if (reg_ctx->rps_data) {
149*437bfbebSnyanmisaka             ret = mpp_buffer_put(reg_ctx->rps_data);
150*437bfbebSnyanmisaka             if (ret) {
151*437bfbebSnyanmisaka                 mpp_err("h265d rps_data free buffer failed\n");
152*437bfbebSnyanmisaka                 return ret;
153*437bfbebSnyanmisaka             }
154*437bfbebSnyanmisaka         }
155*437bfbebSnyanmisaka 
156*437bfbebSnyanmisaka         if (reg_ctx->hw_regs) {
157*437bfbebSnyanmisaka             mpp_free(reg_ctx->hw_regs);
158*437bfbebSnyanmisaka             reg_ctx->hw_regs = NULL;
159*437bfbebSnyanmisaka         }
160*437bfbebSnyanmisaka     }
161*437bfbebSnyanmisaka     return MPP_OK;
162*437bfbebSnyanmisaka }
163*437bfbebSnyanmisaka 
hal_h265d_rkv_init(void * hal,MppHalCfg * cfg)164*437bfbebSnyanmisaka MPP_RET hal_h265d_rkv_init(void *hal, MppHalCfg *cfg)
165*437bfbebSnyanmisaka {
166*437bfbebSnyanmisaka     MPP_RET ret = MPP_NOK;
167*437bfbebSnyanmisaka     HalH265dCtx *reg_ctx = (HalH265dCtx *)hal;
168*437bfbebSnyanmisaka 
169*437bfbebSnyanmisaka     mpp_slots_set_prop(reg_ctx->slots, SLOTS_HOR_ALIGN, hevc_hor_align);
170*437bfbebSnyanmisaka     mpp_slots_set_prop(reg_ctx->slots, SLOTS_VER_ALIGN, hevc_ver_align);
171*437bfbebSnyanmisaka 
172*437bfbebSnyanmisaka     reg_ctx->scaling_qm = mpp_calloc(DXVA_Qmatrix_HEVC, 1);
173*437bfbebSnyanmisaka     reg_ctx->sw_rps_buf = mpp_calloc(RK_U64, 400);
174*437bfbebSnyanmisaka 
175*437bfbebSnyanmisaka     if (reg_ctx->scaling_qm == NULL) {
176*437bfbebSnyanmisaka         mpp_err("scaling_org alloc fail");
177*437bfbebSnyanmisaka         return MPP_ERR_MALLOC;
178*437bfbebSnyanmisaka     }
179*437bfbebSnyanmisaka 
180*437bfbebSnyanmisaka     reg_ctx->scaling_rk = mpp_calloc(scalingFactor_t, 1);
181*437bfbebSnyanmisaka     if (reg_ctx->scaling_rk == NULL) {
182*437bfbebSnyanmisaka         mpp_err("scaling_rk alloc fail");
183*437bfbebSnyanmisaka         return MPP_ERR_MALLOC;
184*437bfbebSnyanmisaka     }
185*437bfbebSnyanmisaka 
186*437bfbebSnyanmisaka     if (reg_ctx->group == NULL) {
187*437bfbebSnyanmisaka         ret = mpp_buffer_group_get_internal(&reg_ctx->group, MPP_BUFFER_TYPE_ION);
188*437bfbebSnyanmisaka         if (ret) {
189*437bfbebSnyanmisaka             mpp_err("h265d mpp_buffer_group_get failed\n");
190*437bfbebSnyanmisaka             return ret;
191*437bfbebSnyanmisaka         }
192*437bfbebSnyanmisaka     }
193*437bfbebSnyanmisaka 
194*437bfbebSnyanmisaka     ret = mpp_buffer_get(reg_ctx->group, &reg_ctx->cabac_table_data, sizeof(cabac_table));
195*437bfbebSnyanmisaka     if (ret) {
196*437bfbebSnyanmisaka         mpp_err("h265d cabac_table get buffer failed\n");
197*437bfbebSnyanmisaka         return ret;
198*437bfbebSnyanmisaka     }
199*437bfbebSnyanmisaka 
200*437bfbebSnyanmisaka     ret = mpp_buffer_write(reg_ctx->cabac_table_data, 0, (void*)cabac_table, sizeof(cabac_table));
201*437bfbebSnyanmisaka     if (ret) {
202*437bfbebSnyanmisaka         mpp_err("h265d write cabac_table data failed\n");
203*437bfbebSnyanmisaka         return ret;
204*437bfbebSnyanmisaka     }
205*437bfbebSnyanmisaka     mpp_buffer_sync_end(reg_ctx->cabac_table_data);
206*437bfbebSnyanmisaka 
207*437bfbebSnyanmisaka     ret = hal_h265d_alloc_res(hal);
208*437bfbebSnyanmisaka     if (ret) {
209*437bfbebSnyanmisaka         mpp_err("hal_h265d_alloc_res failed\n");
210*437bfbebSnyanmisaka         return ret;
211*437bfbebSnyanmisaka     }
212*437bfbebSnyanmisaka 
213*437bfbebSnyanmisaka #ifdef dump
214*437bfbebSnyanmisaka     fp = fopen("/data/hal.bin", "wb");
215*437bfbebSnyanmisaka #endif
216*437bfbebSnyanmisaka     (void) cfg;
217*437bfbebSnyanmisaka     return MPP_OK;
218*437bfbebSnyanmisaka }
219*437bfbebSnyanmisaka 
hal_h265d_rkv_deinit(void * hal)220*437bfbebSnyanmisaka MPP_RET hal_h265d_rkv_deinit(void *hal)
221*437bfbebSnyanmisaka {
222*437bfbebSnyanmisaka     RK_S32 ret = 0;
223*437bfbebSnyanmisaka     HalH265dCtx *reg_ctx = (HalH265dCtx *)hal;
224*437bfbebSnyanmisaka 
225*437bfbebSnyanmisaka     ret = mpp_buffer_put(reg_ctx->cabac_table_data);
226*437bfbebSnyanmisaka     if (ret) {
227*437bfbebSnyanmisaka         mpp_err("h265d cabac_table free buffer failed\n");
228*437bfbebSnyanmisaka         return ret;
229*437bfbebSnyanmisaka     }
230*437bfbebSnyanmisaka 
231*437bfbebSnyanmisaka     if (reg_ctx->scaling_qm) {
232*437bfbebSnyanmisaka         mpp_free(reg_ctx->scaling_qm);
233*437bfbebSnyanmisaka     }
234*437bfbebSnyanmisaka 
235*437bfbebSnyanmisaka     if (reg_ctx->sw_rps_buf) {
236*437bfbebSnyanmisaka         mpp_free(reg_ctx->sw_rps_buf);
237*437bfbebSnyanmisaka     }
238*437bfbebSnyanmisaka 
239*437bfbebSnyanmisaka     if (reg_ctx->scaling_rk) {
240*437bfbebSnyanmisaka         mpp_free(reg_ctx->scaling_rk);
241*437bfbebSnyanmisaka     }
242*437bfbebSnyanmisaka 
243*437bfbebSnyanmisaka     hal_h265d_release_res(hal);
244*437bfbebSnyanmisaka 
245*437bfbebSnyanmisaka     if (reg_ctx->group) {
246*437bfbebSnyanmisaka         ret = mpp_buffer_group_put(reg_ctx->group);
247*437bfbebSnyanmisaka         if (ret) {
248*437bfbebSnyanmisaka             mpp_err("h265d group free buffer failed\n");
249*437bfbebSnyanmisaka             return ret;
250*437bfbebSnyanmisaka         }
251*437bfbebSnyanmisaka     }
252*437bfbebSnyanmisaka     return MPP_OK;
253*437bfbebSnyanmisaka }
254*437bfbebSnyanmisaka 
hal_h265d_v345_output_pps_packet(void * hal,void * dxva)255*437bfbebSnyanmisaka static RK_S32 hal_h265d_v345_output_pps_packet(void *hal, void *dxva)
256*437bfbebSnyanmisaka {
257*437bfbebSnyanmisaka     RK_S32 fifo_len = 12;
258*437bfbebSnyanmisaka     RK_S32 i, j;
259*437bfbebSnyanmisaka     RK_U32 log2_min_cb_size;
260*437bfbebSnyanmisaka     RK_S32 width, height;
261*437bfbebSnyanmisaka     HalH265dCtx *reg_ctx = ( HalH265dCtx *)hal;
262*437bfbebSnyanmisaka     h265d_dxva2_picture_context_t *dxva_cxt = (h265d_dxva2_picture_context_t*)dxva;
263*437bfbebSnyanmisaka     BitputCtx_t bp;
264*437bfbebSnyanmisaka     RK_U64 *pps_packet = mpp_calloc(RK_U64, fifo_len + 1);
265*437bfbebSnyanmisaka 
266*437bfbebSnyanmisaka     if (NULL == reg_ctx || dxva_cxt == NULL) {
267*437bfbebSnyanmisaka         mpp_err("%s:%s:%d reg_ctx or dxva_cxt is NULL",
268*437bfbebSnyanmisaka                 __FILE__, __FUNCTION__, __LINE__);
269*437bfbebSnyanmisaka         MPP_FREE(pps_packet);
270*437bfbebSnyanmisaka         return MPP_ERR_NULL_PTR;
271*437bfbebSnyanmisaka     }
272*437bfbebSnyanmisaka 
273*437bfbebSnyanmisaka     void *pps_ptr = mpp_buffer_get_ptr(reg_ctx->pps_data);
274*437bfbebSnyanmisaka     if (NULL == pps_ptr) {
275*437bfbebSnyanmisaka         mpp_err("pps_data get ptr error");
276*437bfbebSnyanmisaka         return MPP_ERR_NOMEM;
277*437bfbebSnyanmisaka     }
278*437bfbebSnyanmisaka     memset(pps_ptr, 0, 96 * 64);
279*437bfbebSnyanmisaka     // pps_packet = (RK_U64 *)(pps_ptr + dxva_cxt->pp.pps_id * 80);
280*437bfbebSnyanmisaka 
281*437bfbebSnyanmisaka     for (i = 0; i < 12; i++) pps_packet[i] = 0;
282*437bfbebSnyanmisaka 
283*437bfbebSnyanmisaka     mpp_set_bitput_ctx(&bp, pps_packet, fifo_len);
284*437bfbebSnyanmisaka 
285*437bfbebSnyanmisaka     // SPS
286*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.vps_id                            , 4);
287*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.sps_id                            , 4);
288*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.chroma_format_idc                 , 2);
289*437bfbebSnyanmisaka 
290*437bfbebSnyanmisaka     log2_min_cb_size = dxva_cxt->pp.log2_min_luma_coding_block_size_minus3 + 3;
291*437bfbebSnyanmisaka     width = (dxva_cxt->pp.PicWidthInMinCbsY << log2_min_cb_size);
292*437bfbebSnyanmisaka     height = (dxva_cxt->pp.PicHeightInMinCbsY << log2_min_cb_size);
293*437bfbebSnyanmisaka 
294*437bfbebSnyanmisaka     mpp_put_bits(&bp, width                                          , 13);
295*437bfbebSnyanmisaka     mpp_put_bits(&bp, height                                         , 13);
296*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.bit_depth_luma_minus8 + 8         , 4);
297*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.bit_depth_chroma_minus8 + 8       , 4);
298*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.log2_max_pic_order_cnt_lsb_minus4 + 4      , 5);
299*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size   , 2); //log2_maxa_coding_block_depth
300*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.log2_min_luma_coding_block_size_minus3 + 3 , 3);
301*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.log2_min_transform_block_size_minus2 + 2   , 3);
302*437bfbebSnyanmisaka     ///<-zrh comment ^  57 bit above
303*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.log2_diff_max_min_transform_block_size     , 2);
304*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.max_transform_hierarchy_depth_inter        , 3);
305*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.max_transform_hierarchy_depth_intra        , 3);
306*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.scaling_list_enabled_flag                  , 1);
307*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.amp_enabled_flag                           , 1);
308*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.sample_adaptive_offset_enabled_flag        , 1);
309*437bfbebSnyanmisaka     ///<-zrh comment ^  68 bit above
310*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.pcm_enabled_flag                           , 1);
311*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.pcm_enabled_flag ? (dxva_cxt->pp.pcm_sample_bit_depth_luma_minus1 + 1) : 0  , 4);
312*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.pcm_enabled_flag ? (dxva_cxt->pp.pcm_sample_bit_depth_chroma_minus1 + 1) : 0 , 4);
313*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.pcm_loop_filter_disabled_flag                                               , 1);
314*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.log2_diff_max_min_pcm_luma_coding_block_size                                , 3);
315*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.pcm_enabled_flag ? (dxva_cxt->pp.log2_min_pcm_luma_coding_block_size_minus3 + 3) : 0, 3);
316*437bfbebSnyanmisaka 
317*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.num_short_term_ref_pic_sets             , 7);
318*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.long_term_ref_pics_present_flag         , 1);
319*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.num_long_term_ref_pics_sps              , 6);
320*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.sps_temporal_mvp_enabled_flag           , 1);
321*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.strong_intra_smoothing_enabled_flag     , 1);
322*437bfbebSnyanmisaka     ///<-zrh comment ^ 100 bit above
323*437bfbebSnyanmisaka 
324*437bfbebSnyanmisaka     mpp_put_bits(&bp, 0                                                    , 7 );
325*437bfbebSnyanmisaka 
326*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.sps_max_dec_pic_buffering_minus1,       4);
327*437bfbebSnyanmisaka     mpp_put_bits(&bp, 0, 3);
328*437bfbebSnyanmisaka     mpp_put_align(&bp                                                        , 32, 0xf); //128
329*437bfbebSnyanmisaka 
330*437bfbebSnyanmisaka     // PPS
331*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.pps_id                                    , 6 );
332*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.sps_id                                    , 4 );
333*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.dependent_slice_segments_enabled_flag     , 1 );
334*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.output_flag_present_flag                  , 1 );
335*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.num_extra_slice_header_bits               , 13);
336*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.sign_data_hiding_enabled_flag , 1);
337*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.cabac_init_present_flag                   , 1);
338*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.num_ref_idx_l0_default_active_minus1 + 1  , 4);
339*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.num_ref_idx_l1_default_active_minus1 + 1  , 4);
340*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.init_qp_minus26                           , 7);
341*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.constrained_intra_pred_flag               , 1);
342*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.transform_skip_enabled_flag               , 1);
343*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.cu_qp_delta_enabled_flag                  , 1); //164
344*437bfbebSnyanmisaka 
345*437bfbebSnyanmisaka     mpp_put_bits(&bp, log2_min_cb_size +
346*437bfbebSnyanmisaka                  dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size -
347*437bfbebSnyanmisaka                  dxva_cxt->pp.diff_cu_qp_delta_depth                             , 3);
348*437bfbebSnyanmisaka 
349*437bfbebSnyanmisaka     h265h_dbg(H265H_DBG_PPS, "log2_min_cb_size %d %d %d \n", log2_min_cb_size,
350*437bfbebSnyanmisaka               dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size, dxva_cxt->pp.diff_cu_qp_delta_depth );
351*437bfbebSnyanmisaka 
352*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.pps_cb_qp_offset                            , 5);
353*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.pps_cr_qp_offset                            , 5);
354*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.pps_slice_chroma_qp_offsets_present_flag    , 1);
355*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.weighted_pred_flag                          , 1);
356*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.weighted_bipred_flag                        , 1);
357*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.transquant_bypass_enabled_flag              , 1 );
358*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.tiles_enabled_flag                          , 1 );
359*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.entropy_coding_sync_enabled_flag            , 1);
360*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.pps_loop_filter_across_slices_enabled_flag  , 1);
361*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.loop_filter_across_tiles_enabled_flag       , 1); //185
362*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.deblocking_filter_override_enabled_flag     , 1);
363*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.pps_deblocking_filter_disabled_flag         , 1);
364*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.pps_beta_offset_div2                        , 4);
365*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.pps_tc_offset_div2                          , 4);
366*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.lists_modification_present_flag             , 1);
367*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.log2_parallel_merge_level_minus2 + 2        , 3);
368*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.slice_segment_header_extension_present_flag , 1);
369*437bfbebSnyanmisaka     mpp_put_bits(&bp, 0                                                        , 3);
370*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.tiles_enabled_flag ? dxva_cxt->pp.num_tile_columns_minus1 + 1 : 0, 5);
371*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.tiles_enabled_flag ? dxva_cxt->pp.num_tile_rows_minus1 + 1 : 0 , 5 );
372*437bfbebSnyanmisaka     mpp_put_bits(&bp, 0, 4); //mSps_Pps[i]->mMode
373*437bfbebSnyanmisaka     mpp_put_align(&bp, 64, 0xf);
374*437bfbebSnyanmisaka     {
375*437bfbebSnyanmisaka         /// tiles info begin
376*437bfbebSnyanmisaka         RK_U16 column_width[20];
377*437bfbebSnyanmisaka         RK_U16 row_height[22];
378*437bfbebSnyanmisaka 
379*437bfbebSnyanmisaka         memset(column_width, 0, sizeof(column_width));
380*437bfbebSnyanmisaka         memset(row_height, 0, sizeof(row_height));
381*437bfbebSnyanmisaka 
382*437bfbebSnyanmisaka         if (dxva_cxt->pp.tiles_enabled_flag) {
383*437bfbebSnyanmisaka 
384*437bfbebSnyanmisaka             if (dxva_cxt->pp.uniform_spacing_flag == 0) {
385*437bfbebSnyanmisaka                 RK_S32 maxcuwidth = dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size + log2_min_cb_size;
386*437bfbebSnyanmisaka                 RK_S32 ctu_width_in_pic = (width +
387*437bfbebSnyanmisaka                                            (1 << maxcuwidth) - 1) / (1 << maxcuwidth) ;
388*437bfbebSnyanmisaka                 RK_S32 ctu_height_in_pic = (height +
389*437bfbebSnyanmisaka                                             (1 << maxcuwidth) - 1) / (1 << maxcuwidth) ;
390*437bfbebSnyanmisaka                 RK_S32 sum = 0;
391*437bfbebSnyanmisaka                 for (i = 0; i < dxva_cxt->pp.num_tile_columns_minus1; i++) {
392*437bfbebSnyanmisaka                     column_width[i] = dxva_cxt->pp.column_width_minus1[i] + 1;
393*437bfbebSnyanmisaka                     sum += column_width[i]  ;
394*437bfbebSnyanmisaka                 }
395*437bfbebSnyanmisaka                 column_width[i] = ctu_width_in_pic - sum;
396*437bfbebSnyanmisaka 
397*437bfbebSnyanmisaka                 sum = 0;
398*437bfbebSnyanmisaka                 for (i = 0; i < dxva_cxt->pp.num_tile_rows_minus1; i++) {
399*437bfbebSnyanmisaka                     row_height[i] = dxva_cxt->pp.row_height_minus1[i] + 1;
400*437bfbebSnyanmisaka                     sum += row_height[i];
401*437bfbebSnyanmisaka                 }
402*437bfbebSnyanmisaka                 row_height[i] = ctu_height_in_pic - sum;
403*437bfbebSnyanmisaka             } // end of (pps->uniform_spacing_flag == 0)
404*437bfbebSnyanmisaka             else {
405*437bfbebSnyanmisaka 
406*437bfbebSnyanmisaka                 RK_S32    pic_in_cts_width = (width +
407*437bfbebSnyanmisaka                                               (1 << (log2_min_cb_size +
408*437bfbebSnyanmisaka                                                      dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size)) - 1)
409*437bfbebSnyanmisaka                                              / (1 << (log2_min_cb_size +
410*437bfbebSnyanmisaka                                                       dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size));
411*437bfbebSnyanmisaka                 RK_S32 pic_in_cts_height = (height +
412*437bfbebSnyanmisaka                                             (1 << (log2_min_cb_size +
413*437bfbebSnyanmisaka                                                    dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size)) - 1)
414*437bfbebSnyanmisaka                                            / (1 << (log2_min_cb_size +
415*437bfbebSnyanmisaka                                                     dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size));
416*437bfbebSnyanmisaka 
417*437bfbebSnyanmisaka                 for (i = 0; i < dxva_cxt->pp.num_tile_columns_minus1 + 1; i++)
418*437bfbebSnyanmisaka                     column_width[i] = ((i + 1) * pic_in_cts_width) / (dxva_cxt->pp.num_tile_columns_minus1 + 1) -
419*437bfbebSnyanmisaka                                       (i * pic_in_cts_width) / (dxva_cxt->pp.num_tile_columns_minus1 + 1);
420*437bfbebSnyanmisaka 
421*437bfbebSnyanmisaka                 for (i = 0; i < dxva_cxt->pp.num_tile_rows_minus1 + 1; i++)
422*437bfbebSnyanmisaka                     row_height[i] = ((i + 1) * pic_in_cts_height) / (dxva_cxt->pp.num_tile_rows_minus1 + 1) -
423*437bfbebSnyanmisaka                                     (i * pic_in_cts_height) / (dxva_cxt->pp.num_tile_rows_minus1 + 1);
424*437bfbebSnyanmisaka             }
425*437bfbebSnyanmisaka         } // pps->tiles_enabled_flag
426*437bfbebSnyanmisaka         else {
427*437bfbebSnyanmisaka             RK_S32 MaxCUWidth = (1 << (dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size + log2_min_cb_size));
428*437bfbebSnyanmisaka             column_width[0] = (width  + MaxCUWidth - 1) / MaxCUWidth;
429*437bfbebSnyanmisaka             row_height[0]   = (height + MaxCUWidth - 1) / MaxCUWidth;
430*437bfbebSnyanmisaka         }
431*437bfbebSnyanmisaka 
432*437bfbebSnyanmisaka         for (j = 0; j < 20; j++) {
433*437bfbebSnyanmisaka             if (column_width[j] > 0)
434*437bfbebSnyanmisaka                 column_width[j]--;
435*437bfbebSnyanmisaka             mpp_put_bits(&bp, column_width[j], 8);
436*437bfbebSnyanmisaka         }
437*437bfbebSnyanmisaka 
438*437bfbebSnyanmisaka         for (j = 0; j < 22; j++) {
439*437bfbebSnyanmisaka             if (row_height[j] > 0)
440*437bfbebSnyanmisaka                 row_height[j]--;
441*437bfbebSnyanmisaka             mpp_put_bits(&bp, row_height[j], 8);
442*437bfbebSnyanmisaka         }
443*437bfbebSnyanmisaka     }
444*437bfbebSnyanmisaka 
445*437bfbebSnyanmisaka     {
446*437bfbebSnyanmisaka         RK_U8 *ptr_scaling = (RK_U8 *)mpp_buffer_get_ptr(reg_ctx->scaling_list_data);
447*437bfbebSnyanmisaka         RK_U32 fd = mpp_buffer_get_fd(reg_ctx->scaling_list_data);
448*437bfbebSnyanmisaka 
449*437bfbebSnyanmisaka         hal_h265d_output_scalinglist_packet(hal, ptr_scaling, dxva);
450*437bfbebSnyanmisaka         mpp_put_bits(&bp, fd, 32);
451*437bfbebSnyanmisaka         mpp_put_bits(&bp, 0, 60);
452*437bfbebSnyanmisaka         mpp_put_align(&bp, 128, 0xf);
453*437bfbebSnyanmisaka     }
454*437bfbebSnyanmisaka 
455*437bfbebSnyanmisaka     for (i = 0; i < 64; i++)
456*437bfbebSnyanmisaka         memcpy(pps_ptr + i * 96, pps_packet, 96);
457*437bfbebSnyanmisaka 
458*437bfbebSnyanmisaka #ifdef dump
459*437bfbebSnyanmisaka     fwrite(pps_ptr, 1, 80 * 64, fp);
460*437bfbebSnyanmisaka     RK_U32 *tmp = (RK_U32 *)pps_ptr;
461*437bfbebSnyanmisaka     for (i = 0; i < 96 / 4; i++) {
462*437bfbebSnyanmisaka         h265h_dbg(H265H_DBG_PPS, "pps[%3d] = 0x%08x\n", i, tmp[i]);
463*437bfbebSnyanmisaka     }
464*437bfbebSnyanmisaka #endif
465*437bfbebSnyanmisaka     MPP_FREE(pps_packet);
466*437bfbebSnyanmisaka     return 0;
467*437bfbebSnyanmisaka }
468*437bfbebSnyanmisaka 
hal_h265d_output_pps_packet(void * hal,void * dxva)469*437bfbebSnyanmisaka static RK_S32 hal_h265d_output_pps_packet(void *hal, void *dxva)
470*437bfbebSnyanmisaka {
471*437bfbebSnyanmisaka     RK_S32 fifo_len = 10;
472*437bfbebSnyanmisaka     RK_S32 i, j;
473*437bfbebSnyanmisaka     RK_U32 log2_min_cb_size;
474*437bfbebSnyanmisaka     RK_S32 width, height;
475*437bfbebSnyanmisaka     HalH265dCtx *reg_ctx = ( HalH265dCtx *)hal;
476*437bfbebSnyanmisaka     h265d_dxva2_picture_context_t *dxva_cxt = (h265d_dxva2_picture_context_t*)dxva;
477*437bfbebSnyanmisaka     BitputCtx_t bp;
478*437bfbebSnyanmisaka     RK_U64 *pps_packet = mpp_calloc(RK_U64, fifo_len + 1);
479*437bfbebSnyanmisaka 
480*437bfbebSnyanmisaka     if (NULL == reg_ctx || dxva_cxt == NULL) {
481*437bfbebSnyanmisaka         mpp_err("%s:%s:%d reg_ctx or dxva_cxt is NULL",
482*437bfbebSnyanmisaka                 __FILE__, __FUNCTION__, __LINE__);
483*437bfbebSnyanmisaka         MPP_FREE(pps_packet);
484*437bfbebSnyanmisaka         return MPP_ERR_NULL_PTR;
485*437bfbebSnyanmisaka     }
486*437bfbebSnyanmisaka 
487*437bfbebSnyanmisaka     void *pps_ptr = mpp_buffer_get_ptr(reg_ctx->pps_data);
488*437bfbebSnyanmisaka     if (NULL == pps_ptr) {
489*437bfbebSnyanmisaka         mpp_err("pps_data get ptr error");
490*437bfbebSnyanmisaka         return MPP_ERR_NOMEM;
491*437bfbebSnyanmisaka     }
492*437bfbebSnyanmisaka     memset(pps_ptr, 0, 80 * 64);
493*437bfbebSnyanmisaka     // pps_packet = (RK_U64 *)(pps_ptr + dxva_cxt->pp.pps_id * 80);
494*437bfbebSnyanmisaka 
495*437bfbebSnyanmisaka     for (i = 0; i < 10; i++) pps_packet[i] = 0;
496*437bfbebSnyanmisaka 
497*437bfbebSnyanmisaka     mpp_set_bitput_ctx(&bp, pps_packet, fifo_len);
498*437bfbebSnyanmisaka 
499*437bfbebSnyanmisaka     // SPS
500*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.vps_id                            , 4);
501*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.sps_id                            , 4);
502*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.chroma_format_idc                 , 2);
503*437bfbebSnyanmisaka 
504*437bfbebSnyanmisaka     log2_min_cb_size = dxva_cxt->pp.log2_min_luma_coding_block_size_minus3 + 3;
505*437bfbebSnyanmisaka     width = (dxva_cxt->pp.PicWidthInMinCbsY << log2_min_cb_size);
506*437bfbebSnyanmisaka     height = (dxva_cxt->pp.PicHeightInMinCbsY << log2_min_cb_size);
507*437bfbebSnyanmisaka 
508*437bfbebSnyanmisaka     mpp_put_bits(&bp, width                                          , 13);
509*437bfbebSnyanmisaka     mpp_put_bits(&bp, height                                         , 13);
510*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.bit_depth_luma_minus8 + 8         , 4);
511*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.bit_depth_chroma_minus8 + 8       , 4);
512*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.log2_max_pic_order_cnt_lsb_minus4 + 4      , 5);
513*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size   , 2); //log2_maxa_coding_block_depth
514*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.log2_min_luma_coding_block_size_minus3 + 3 , 3);
515*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.log2_min_transform_block_size_minus2 + 2   , 3);
516*437bfbebSnyanmisaka     ///<-zrh comment ^  57 bit above
517*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.log2_diff_max_min_transform_block_size     , 2);
518*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.max_transform_hierarchy_depth_inter        , 3);
519*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.max_transform_hierarchy_depth_intra        , 3);
520*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.scaling_list_enabled_flag                  , 1);
521*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.amp_enabled_flag                           , 1);
522*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.sample_adaptive_offset_enabled_flag        , 1);
523*437bfbebSnyanmisaka     ///<-zrh comment ^  68 bit above
524*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.pcm_enabled_flag                           , 1);
525*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.pcm_enabled_flag ? (dxva_cxt->pp.pcm_sample_bit_depth_luma_minus1 + 1) : 0  , 4);
526*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.pcm_enabled_flag ? (dxva_cxt->pp.pcm_sample_bit_depth_chroma_minus1 + 1) : 0 , 4);
527*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.pcm_loop_filter_disabled_flag                                               , 1);
528*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.log2_diff_max_min_pcm_luma_coding_block_size                                , 3);
529*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.pcm_enabled_flag ? (dxva_cxt->pp.log2_min_pcm_luma_coding_block_size_minus3 + 3) : 0, 3);
530*437bfbebSnyanmisaka 
531*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.num_short_term_ref_pic_sets             , 7);
532*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.long_term_ref_pics_present_flag         , 1);
533*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.num_long_term_ref_pics_sps              , 6);
534*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.sps_temporal_mvp_enabled_flag           , 1);
535*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.strong_intra_smoothing_enabled_flag     , 1);
536*437bfbebSnyanmisaka     ///<-zrh comment ^ 100 bit above
537*437bfbebSnyanmisaka 
538*437bfbebSnyanmisaka     mpp_put_bits(&bp, 0                                                    , 7 );
539*437bfbebSnyanmisaka     mpp_put_align(&bp                                                         , 32, 0xf);
540*437bfbebSnyanmisaka 
541*437bfbebSnyanmisaka     // PPS
542*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.pps_id                                    , 6 );
543*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.sps_id                                    , 4 );
544*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.dependent_slice_segments_enabled_flag     , 1 );
545*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.output_flag_present_flag                  , 1 );
546*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.num_extra_slice_header_bits               , 13);
547*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.sign_data_hiding_enabled_flag , 1);
548*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.cabac_init_present_flag                   , 1);
549*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.num_ref_idx_l0_default_active_minus1 + 1  , 4);
550*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.num_ref_idx_l1_default_active_minus1 + 1  , 4);
551*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.init_qp_minus26                           , 7);
552*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.constrained_intra_pred_flag               , 1);
553*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.transform_skip_enabled_flag               , 1);
554*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.cu_qp_delta_enabled_flag                  , 1);
555*437bfbebSnyanmisaka 
556*437bfbebSnyanmisaka     mpp_put_bits(&bp, log2_min_cb_size +
557*437bfbebSnyanmisaka                  dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size -
558*437bfbebSnyanmisaka                  dxva_cxt->pp.diff_cu_qp_delta_depth                             , 3);
559*437bfbebSnyanmisaka 
560*437bfbebSnyanmisaka     h265h_dbg(H265H_DBG_PPS, "log2_min_cb_size %d %d %d \n", log2_min_cb_size,
561*437bfbebSnyanmisaka               dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size, dxva_cxt->pp.diff_cu_qp_delta_depth );
562*437bfbebSnyanmisaka 
563*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.pps_cb_qp_offset                            , 5);
564*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.pps_cr_qp_offset                            , 5);
565*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.pps_slice_chroma_qp_offsets_present_flag    , 1);
566*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.weighted_pred_flag                          , 1);
567*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.weighted_bipred_flag                        , 1);
568*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.transquant_bypass_enabled_flag              , 1 );
569*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.tiles_enabled_flag                          , 1 );
570*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.entropy_coding_sync_enabled_flag            , 1);
571*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.pps_loop_filter_across_slices_enabled_flag  , 1);
572*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.loop_filter_across_tiles_enabled_flag       , 1);
573*437bfbebSnyanmisaka 
574*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.deblocking_filter_override_enabled_flag     , 1);
575*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.pps_deblocking_filter_disabled_flag         , 1);
576*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.pps_beta_offset_div2                        , 4);
577*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.pps_tc_offset_div2                          , 4);
578*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.lists_modification_present_flag             , 1);
579*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.log2_parallel_merge_level_minus2 + 2        , 3);
580*437bfbebSnyanmisaka     /*slice_segment_header_extension_present_flag need set 0 */
581*437bfbebSnyanmisaka     mpp_put_bits(&bp, 0                                                        , 1);
582*437bfbebSnyanmisaka     mpp_put_bits(&bp, 0                                                        , 3);
583*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.num_tile_columns_minus1 + 1, 5);
584*437bfbebSnyanmisaka     mpp_put_bits(&bp, dxva_cxt->pp.num_tile_rows_minus1 + 1 , 5 );
585*437bfbebSnyanmisaka     mpp_put_bits(&bp, 3, 2); //mSps_Pps[i]->mMode
586*437bfbebSnyanmisaka     mpp_put_align(&bp, 64, 0xf);
587*437bfbebSnyanmisaka 
588*437bfbebSnyanmisaka     {
589*437bfbebSnyanmisaka         /// tiles info begin
590*437bfbebSnyanmisaka         RK_U16 column_width[20];
591*437bfbebSnyanmisaka         RK_U16 row_height[22];
592*437bfbebSnyanmisaka 
593*437bfbebSnyanmisaka         memset(column_width, 0, sizeof(column_width));
594*437bfbebSnyanmisaka         memset(row_height, 0, sizeof(row_height));
595*437bfbebSnyanmisaka 
596*437bfbebSnyanmisaka         if (dxva_cxt->pp.tiles_enabled_flag) {
597*437bfbebSnyanmisaka             if (dxva_cxt->pp.uniform_spacing_flag == 0) {
598*437bfbebSnyanmisaka                 RK_S32 maxcuwidth = dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size + log2_min_cb_size;
599*437bfbebSnyanmisaka                 RK_S32 ctu_width_in_pic = (width +
600*437bfbebSnyanmisaka                                            (1 << maxcuwidth) - 1) / (1 << maxcuwidth) ;
601*437bfbebSnyanmisaka                 RK_S32 ctu_height_in_pic = (height +
602*437bfbebSnyanmisaka                                             (1 << maxcuwidth) - 1) / (1 << maxcuwidth) ;
603*437bfbebSnyanmisaka                 RK_S32 sum = 0;
604*437bfbebSnyanmisaka                 for (i = 0; i < dxva_cxt->pp.num_tile_columns_minus1; i++) {
605*437bfbebSnyanmisaka                     column_width[i] = dxva_cxt->pp.column_width_minus1[i] + 1;
606*437bfbebSnyanmisaka                     sum += column_width[i]  ;
607*437bfbebSnyanmisaka                 }
608*437bfbebSnyanmisaka                 column_width[i] = ctu_width_in_pic - sum;
609*437bfbebSnyanmisaka 
610*437bfbebSnyanmisaka                 sum = 0;
611*437bfbebSnyanmisaka                 for (i = 0; i < dxva_cxt->pp.num_tile_rows_minus1; i++) {
612*437bfbebSnyanmisaka                     row_height[i] = dxva_cxt->pp.row_height_minus1[i] + 1;
613*437bfbebSnyanmisaka                     sum += row_height[i];
614*437bfbebSnyanmisaka                 }
615*437bfbebSnyanmisaka                 row_height[i] = ctu_height_in_pic - sum;
616*437bfbebSnyanmisaka             } // end of (pps->uniform_spacing_flag == 0)
617*437bfbebSnyanmisaka             else {
618*437bfbebSnyanmisaka 
619*437bfbebSnyanmisaka                 RK_S32    pic_in_cts_width = (width +
620*437bfbebSnyanmisaka                                               (1 << (log2_min_cb_size +
621*437bfbebSnyanmisaka                                                      dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size)) - 1)
622*437bfbebSnyanmisaka                                              / (1 << (log2_min_cb_size +
623*437bfbebSnyanmisaka                                                       dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size));
624*437bfbebSnyanmisaka                 RK_S32 pic_in_cts_height = (height +
625*437bfbebSnyanmisaka                                             (1 << (log2_min_cb_size +
626*437bfbebSnyanmisaka                                                    dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size)) - 1)
627*437bfbebSnyanmisaka                                            / (1 << (log2_min_cb_size +
628*437bfbebSnyanmisaka                                                     dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size));
629*437bfbebSnyanmisaka 
630*437bfbebSnyanmisaka                 for (i = 0; i < dxva_cxt->pp.num_tile_columns_minus1 + 1; i++)
631*437bfbebSnyanmisaka                     column_width[i] = ((i + 1) * pic_in_cts_width) / (dxva_cxt->pp.num_tile_columns_minus1 + 1) -
632*437bfbebSnyanmisaka                                       (i * pic_in_cts_width) / (dxva_cxt->pp.num_tile_columns_minus1 + 1);
633*437bfbebSnyanmisaka 
634*437bfbebSnyanmisaka                 for (i = 0; i < dxva_cxt->pp.num_tile_rows_minus1 + 1; i++)
635*437bfbebSnyanmisaka                     row_height[i] = ((i + 1) * pic_in_cts_height) / (dxva_cxt->pp.num_tile_rows_minus1 + 1) -
636*437bfbebSnyanmisaka                                     (i * pic_in_cts_height) / (dxva_cxt->pp.num_tile_rows_minus1 + 1);
637*437bfbebSnyanmisaka             }
638*437bfbebSnyanmisaka         } // pps->tiles_enabled_flag
639*437bfbebSnyanmisaka         else {
640*437bfbebSnyanmisaka             RK_S32 MaxCUWidth = (1 << (dxva_cxt->pp.log2_diff_max_min_luma_coding_block_size + log2_min_cb_size));
641*437bfbebSnyanmisaka             column_width[0] = (width  + MaxCUWidth - 1) / MaxCUWidth;
642*437bfbebSnyanmisaka             row_height[0]   = (height + MaxCUWidth - 1) / MaxCUWidth;
643*437bfbebSnyanmisaka         }
644*437bfbebSnyanmisaka 
645*437bfbebSnyanmisaka         for (j = 0; j < 20; j++) {
646*437bfbebSnyanmisaka             if (column_width[j] > 0)
647*437bfbebSnyanmisaka                 column_width[j]--;
648*437bfbebSnyanmisaka             mpp_put_bits(&bp, column_width[j], 8);
649*437bfbebSnyanmisaka         }
650*437bfbebSnyanmisaka 
651*437bfbebSnyanmisaka         for (j = 0; j < 22; j++) {
652*437bfbebSnyanmisaka             if (row_height[j] > 0)
653*437bfbebSnyanmisaka                 row_height[j]--;
654*437bfbebSnyanmisaka             mpp_put_bits(&bp, row_height[j], 8);
655*437bfbebSnyanmisaka         }
656*437bfbebSnyanmisaka     }
657*437bfbebSnyanmisaka 
658*437bfbebSnyanmisaka     {
659*437bfbebSnyanmisaka         RK_U8 *ptr_scaling = (RK_U8 *)mpp_buffer_get_ptr(reg_ctx->scaling_list_data);
660*437bfbebSnyanmisaka         RK_U32 fd = mpp_buffer_get_fd(reg_ctx->scaling_list_data);
661*437bfbebSnyanmisaka 
662*437bfbebSnyanmisaka         hal_h265d_output_scalinglist_packet(hal, ptr_scaling, dxva);
663*437bfbebSnyanmisaka         mpp_put_bits(&bp, fd, 32);
664*437bfbebSnyanmisaka         mpp_put_align(&bp, 64, 0xf);
665*437bfbebSnyanmisaka     }
666*437bfbebSnyanmisaka 
667*437bfbebSnyanmisaka     for (i = 0; i < 64; i++)
668*437bfbebSnyanmisaka         memcpy(pps_ptr + i * 80, pps_packet, 80);
669*437bfbebSnyanmisaka 
670*437bfbebSnyanmisaka #ifdef dump
671*437bfbebSnyanmisaka     fwrite(pps_ptr, 1, 80 * 64, fp);
672*437bfbebSnyanmisaka     fflush(fp);
673*437bfbebSnyanmisaka #endif
674*437bfbebSnyanmisaka 
675*437bfbebSnyanmisaka     MPP_FREE(pps_packet);
676*437bfbebSnyanmisaka     return 0;
677*437bfbebSnyanmisaka }
678*437bfbebSnyanmisaka 
update_stream_buffer(MppBuffer streambuf,HalTaskInfo * syn)679*437bfbebSnyanmisaka static void update_stream_buffer(MppBuffer streambuf, HalTaskInfo *syn)
680*437bfbebSnyanmisaka {
681*437bfbebSnyanmisaka     h265d_dxva2_picture_context_t *dxva_cxt =
682*437bfbebSnyanmisaka         (h265d_dxva2_picture_context_t *)syn->dec.syntax.data;
683*437bfbebSnyanmisaka     RK_U8 *ptr = (RK_U8*)mpp_buffer_get_ptr(streambuf);
684*437bfbebSnyanmisaka     RK_U8 bit_left = 0;
685*437bfbebSnyanmisaka     RK_U16 start_byte, end_byte, i = 0;
686*437bfbebSnyanmisaka     RK_U32 stream_size = dxva_cxt->bitstream_size;
687*437bfbebSnyanmisaka     RK_U8 *buf = NULL;
688*437bfbebSnyanmisaka     RK_U8 *temp = NULL;
689*437bfbebSnyanmisaka     RK_U32 cut_byte = 0, cut_byte_acc = 0;
690*437bfbebSnyanmisaka 
691*437bfbebSnyanmisaka     for (i = 0; i < dxva_cxt->slice_count; i++) {
692*437bfbebSnyanmisaka         if (dxva_cxt->slice_cut_param[i].is_enable) {
693*437bfbebSnyanmisaka 
694*437bfbebSnyanmisaka             bit_left = 8 - (dxva_cxt->slice_cut_param[i].start_bit & 0x7);
695*437bfbebSnyanmisaka             start_byte = dxva_cxt->slice_cut_param[i].start_bit >> 3;
696*437bfbebSnyanmisaka             end_byte = (dxva_cxt->slice_cut_param[i].end_bit + 7) >> 3;
697*437bfbebSnyanmisaka             buf = ptr + (dxva_cxt->slice_short[i].BSNALunitDataLocation - cut_byte_acc);
698*437bfbebSnyanmisaka             temp = buf + start_byte;
699*437bfbebSnyanmisaka 
700*437bfbebSnyanmisaka             h265h_dbg(H265H_DBG_FUNCTION, "start bit %d start byte[%d] 0x%x end bit %d end byte[%d] 0x%x\n",
701*437bfbebSnyanmisaka                       dxva_cxt->slice_cut_param[i].start_bit, start_byte, buf[start_byte],
702*437bfbebSnyanmisaka                       dxva_cxt->slice_cut_param[i].end_bit, end_byte, buf[end_byte]);
703*437bfbebSnyanmisaka             if (bit_left < 8) {
704*437bfbebSnyanmisaka                 *temp = (*temp >> bit_left) << bit_left;
705*437bfbebSnyanmisaka                 *temp |= 1 << (bit_left - 1);
706*437bfbebSnyanmisaka             } else {
707*437bfbebSnyanmisaka                 *temp = 0x80;
708*437bfbebSnyanmisaka             }
709*437bfbebSnyanmisaka             if ((dxva_cxt->slice_cut_param[i].end_bit & 0x7) == 0 && buf[end_byte] == 0x80)
710*437bfbebSnyanmisaka                 end_byte += 1;
711*437bfbebSnyanmisaka 
712*437bfbebSnyanmisaka             h265h_dbg(H265H_DBG_FUNCTION, "i %d location %d count %d SliceBytesInBuffer %d bitstream_size %d\n",
713*437bfbebSnyanmisaka                       i, dxva_cxt->slice_short[i].BSNALunitDataLocation, dxva_cxt->slice_count,
714*437bfbebSnyanmisaka                       dxva_cxt->slice_short[i].SliceBytesInBuffer, dxva_cxt->bitstream_size);
715*437bfbebSnyanmisaka 
716*437bfbebSnyanmisaka             memmove(buf + start_byte + 1, buf + end_byte,
717*437bfbebSnyanmisaka                     stream_size - dxva_cxt->slice_short[i].BSNALunitDataLocation - end_byte);
718*437bfbebSnyanmisaka 
719*437bfbebSnyanmisaka             cut_byte = end_byte - start_byte - 1;
720*437bfbebSnyanmisaka             dxva_cxt->slice_short[i].SliceBytesInBuffer -= cut_byte;
721*437bfbebSnyanmisaka             dxva_cxt->bitstream_size -= cut_byte;
722*437bfbebSnyanmisaka             cut_byte_acc += cut_byte;
723*437bfbebSnyanmisaka         }
724*437bfbebSnyanmisaka     }
725*437bfbebSnyanmisaka }
726*437bfbebSnyanmisaka 
hal_h265d_rkv_gen_regs(void * hal,HalTaskInfo * syn)727*437bfbebSnyanmisaka MPP_RET hal_h265d_rkv_gen_regs(void *hal,  HalTaskInfo *syn)
728*437bfbebSnyanmisaka {
729*437bfbebSnyanmisaka     RK_S32 i = 0;
730*437bfbebSnyanmisaka     RK_S32 stride_y, stride_uv, virstrid_y, virstrid_yuv;
731*437bfbebSnyanmisaka     H265d_REGS_t *hw_regs;
732*437bfbebSnyanmisaka     RK_S32 ret = MPP_SUCCESS;
733*437bfbebSnyanmisaka     MppBuffer streambuf = NULL;
734*437bfbebSnyanmisaka     RK_S32 aglin_offset = 0;
735*437bfbebSnyanmisaka     RK_S32 valid_ref = -1;
736*437bfbebSnyanmisaka     MppBuffer framebuf = NULL;
737*437bfbebSnyanmisaka     RK_U32 sw_ref_valid = 0;
738*437bfbebSnyanmisaka     RK_U32 stream_buf_size = 0;
739*437bfbebSnyanmisaka     HalH265dCtx *reg_ctx = ( HalH265dCtx *)hal;
740*437bfbebSnyanmisaka     MppFrame mframe;
741*437bfbebSnyanmisaka 
742*437bfbebSnyanmisaka     if (syn->dec.flags.parse_err ||
743*437bfbebSnyanmisaka         (syn->dec.flags.ref_err && !reg_ctx->cfg->base.disable_error)) {
744*437bfbebSnyanmisaka         h265h_dbg(H265H_DBG_TASK_ERR, "%s found task error\n", __FUNCTION__);
745*437bfbebSnyanmisaka         return MPP_OK;
746*437bfbebSnyanmisaka     }
747*437bfbebSnyanmisaka 
748*437bfbebSnyanmisaka     h265d_dxva2_picture_context_t *dxva_cxt =
749*437bfbebSnyanmisaka         (h265d_dxva2_picture_context_t *)syn->dec.syntax.data;
750*437bfbebSnyanmisaka 
751*437bfbebSnyanmisaka     void *rps_ptr = NULL;
752*437bfbebSnyanmisaka     if (reg_ctx ->fast_mode) {
753*437bfbebSnyanmisaka         for (i = 0; i < MAX_GEN_REG; i++) {
754*437bfbebSnyanmisaka             if (!reg_ctx->g_buf[i].use_flag) {
755*437bfbebSnyanmisaka                 syn->dec.reg_index = i;
756*437bfbebSnyanmisaka                 reg_ctx->rps_data = reg_ctx->g_buf[i].rps_data;
757*437bfbebSnyanmisaka                 reg_ctx->scaling_list_data =
758*437bfbebSnyanmisaka                     reg_ctx->g_buf[i].scaling_list_data;
759*437bfbebSnyanmisaka                 reg_ctx->pps_data = reg_ctx->g_buf[i].pps_data;
760*437bfbebSnyanmisaka                 reg_ctx->hw_regs = reg_ctx->g_buf[i].hw_regs;
761*437bfbebSnyanmisaka                 reg_ctx->g_buf[i].use_flag = 1;
762*437bfbebSnyanmisaka                 break;
763*437bfbebSnyanmisaka             }
764*437bfbebSnyanmisaka         }
765*437bfbebSnyanmisaka         if (i == MAX_GEN_REG) {
766*437bfbebSnyanmisaka             mpp_err("hevc rps buf all used");
767*437bfbebSnyanmisaka             return MPP_ERR_NOMEM;
768*437bfbebSnyanmisaka         }
769*437bfbebSnyanmisaka     } else {
770*437bfbebSnyanmisaka         syn->dec.reg_index = 0;
771*437bfbebSnyanmisaka     }
772*437bfbebSnyanmisaka     rps_ptr = mpp_buffer_get_ptr(reg_ctx->rps_data);
773*437bfbebSnyanmisaka     if (NULL == rps_ptr) {
774*437bfbebSnyanmisaka 
775*437bfbebSnyanmisaka         mpp_err("rps_data get ptr error");
776*437bfbebSnyanmisaka         return MPP_ERR_NOMEM;
777*437bfbebSnyanmisaka     }
778*437bfbebSnyanmisaka 
779*437bfbebSnyanmisaka 
780*437bfbebSnyanmisaka     if (syn->dec.syntax.data == NULL) {
781*437bfbebSnyanmisaka         mpp_err("%s:%s:%d dxva is NULL", __FILE__, __FUNCTION__, __LINE__);
782*437bfbebSnyanmisaka         return MPP_ERR_NULL_PTR;
783*437bfbebSnyanmisaka     }
784*437bfbebSnyanmisaka 
785*437bfbebSnyanmisaka     /* output pps */
786*437bfbebSnyanmisaka     if (reg_ctx->is_v345) {
787*437bfbebSnyanmisaka         hal_h265d_v345_output_pps_packet(hal, syn->dec.syntax.data);
788*437bfbebSnyanmisaka     } else {
789*437bfbebSnyanmisaka         hal_h265d_output_pps_packet(hal, syn->dec.syntax.data);
790*437bfbebSnyanmisaka     }
791*437bfbebSnyanmisaka 
792*437bfbebSnyanmisaka     if (NULL == reg_ctx->hw_regs) {
793*437bfbebSnyanmisaka         return MPP_ERR_NULL_PTR;
794*437bfbebSnyanmisaka     }
795*437bfbebSnyanmisaka 
796*437bfbebSnyanmisaka     hw_regs = (H265d_REGS_t*)reg_ctx->hw_regs;
797*437bfbebSnyanmisaka     memset(hw_regs, 0, sizeof(H265d_REGS_t));
798*437bfbebSnyanmisaka 
799*437bfbebSnyanmisaka     mpp_buf_slot_get_prop(reg_ctx->slots, dxva_cxt->pp.CurrPic.Index7Bits,
800*437bfbebSnyanmisaka                           SLOT_FRAME_PTR, &mframe);
801*437bfbebSnyanmisaka     stride_y = mpp_frame_get_hor_stride(mframe);
802*437bfbebSnyanmisaka     stride_uv = mpp_frame_get_hor_stride(mframe);
803*437bfbebSnyanmisaka     virstrid_y = mpp_frame_get_ver_stride(mframe) * stride_y;
804*437bfbebSnyanmisaka     virstrid_yuv  = virstrid_y + stride_uv * mpp_frame_get_ver_stride(mframe) / 2;
805*437bfbebSnyanmisaka 
806*437bfbebSnyanmisaka     hw_regs->sw_picparameter.sw_slice_num = dxva_cxt->slice_count;
807*437bfbebSnyanmisaka     hw_regs->sw_picparameter.sw_y_hor_virstride = stride_y >> 4;
808*437bfbebSnyanmisaka     hw_regs->sw_picparameter.sw_uv_hor_virstride = stride_uv >> 4;
809*437bfbebSnyanmisaka     hw_regs->sw_y_virstride = virstrid_y >> 4;
810*437bfbebSnyanmisaka     hw_regs->sw_yuv_virstride = virstrid_yuv >> 4;
811*437bfbebSnyanmisaka     hw_regs->sw_sysctrl.sw_h26x_rps_mode = 0;
812*437bfbebSnyanmisaka     mpp_buf_slot_get_prop(reg_ctx->slots, dxva_cxt->pp.CurrPic.Index7Bits,
813*437bfbebSnyanmisaka                           SLOT_BUFFER, &framebuf);
814*437bfbebSnyanmisaka     hw_regs->sw_decout_base  = mpp_buffer_get_fd(framebuf); //just index need map
815*437bfbebSnyanmisaka 
816*437bfbebSnyanmisaka     /*if out_base is equal to zero it means this frame may error
817*437bfbebSnyanmisaka     we return directly add by csy*/
818*437bfbebSnyanmisaka 
819*437bfbebSnyanmisaka     if (hw_regs->sw_decout_base == 0) {
820*437bfbebSnyanmisaka         return 0;
821*437bfbebSnyanmisaka     }
822*437bfbebSnyanmisaka 
823*437bfbebSnyanmisaka     hw_regs->sw_cur_poc = dxva_cxt->pp.CurrPicOrderCntVal;
824*437bfbebSnyanmisaka 
825*437bfbebSnyanmisaka     mpp_buf_slot_get_prop(reg_ctx->packet_slots, syn->dec.input, SLOT_BUFFER,
826*437bfbebSnyanmisaka                           &streambuf);
827*437bfbebSnyanmisaka 
828*437bfbebSnyanmisaka     if ( dxva_cxt->bitstream == NULL) {
829*437bfbebSnyanmisaka         dxva_cxt->bitstream = mpp_buffer_get_ptr(streambuf);
830*437bfbebSnyanmisaka     }
831*437bfbebSnyanmisaka     if (reg_ctx->is_v345) {
832*437bfbebSnyanmisaka #ifdef HW_RPS
833*437bfbebSnyanmisaka         hw_regs->sw_sysctrl.sw_wait_reset_en = 1;
834*437bfbebSnyanmisaka         hw_regs->v345_reg_ends.reg064_mvc0.refp_layer_same_with_cur = 0xffff;
835*437bfbebSnyanmisaka         hal_h265d_slice_hw_rps(syn->dec.syntax.data, rps_ptr, reg_ctx->sw_rps_buf, reg_ctx->fast_mode);
836*437bfbebSnyanmisaka #else
837*437bfbebSnyanmisaka         hw_regs->sw_sysctrl.sw_h26x_rps_mode = 1;
838*437bfbebSnyanmisaka         hal_h265d_slice_output_rps(syn->dec.syntax.data, rps_ptr);
839*437bfbebSnyanmisaka #endif
840*437bfbebSnyanmisaka     } else {
841*437bfbebSnyanmisaka         hal_h265d_slice_output_rps(syn->dec.syntax.data, rps_ptr);
842*437bfbebSnyanmisaka     }
843*437bfbebSnyanmisaka 
844*437bfbebSnyanmisaka     if (dxva_cxt->pp.slice_segment_header_extension_present_flag && !reg_ctx->is_v345) {
845*437bfbebSnyanmisaka         update_stream_buffer(streambuf, syn);
846*437bfbebSnyanmisaka         mpp_buffer_sync_end(streambuf);
847*437bfbebSnyanmisaka     }
848*437bfbebSnyanmisaka 
849*437bfbebSnyanmisaka     hw_regs->sw_cabactbl_base   =  mpp_buffer_get_fd(reg_ctx->cabac_table_data);
850*437bfbebSnyanmisaka     hw_regs->sw_pps_base        =  mpp_buffer_get_fd(reg_ctx->pps_data);
851*437bfbebSnyanmisaka     hw_regs->sw_rps_base        =  mpp_buffer_get_fd(reg_ctx->rps_data);
852*437bfbebSnyanmisaka     hw_regs->sw_strm_rlc_base   =  mpp_buffer_get_fd(streambuf);
853*437bfbebSnyanmisaka     stream_buf_size             =  mpp_buffer_get_size(streambuf);
854*437bfbebSnyanmisaka 
855*437bfbebSnyanmisaka     hw_regs->sw_stream_len      = ((dxva_cxt->bitstream_size + 15)
856*437bfbebSnyanmisaka                                    & (~15)) + 64;
857*437bfbebSnyanmisaka     hw_regs->sw_stream_len      = stream_buf_size >  hw_regs->sw_stream_len ?
858*437bfbebSnyanmisaka                                   hw_regs->sw_stream_len : stream_buf_size;
859*437bfbebSnyanmisaka 
860*437bfbebSnyanmisaka     aglin_offset =  hw_regs->sw_stream_len - dxva_cxt->bitstream_size;
861*437bfbebSnyanmisaka     if (aglin_offset > 0) {
862*437bfbebSnyanmisaka         memset((void *)(dxva_cxt->bitstream + dxva_cxt->bitstream_size), 0,
863*437bfbebSnyanmisaka                aglin_offset);
864*437bfbebSnyanmisaka     }
865*437bfbebSnyanmisaka     hw_regs->sw_interrupt.sw_dec_e         = 1;
866*437bfbebSnyanmisaka     hw_regs->sw_interrupt.sw_dec_timeout_e = 1;
867*437bfbebSnyanmisaka     hw_regs->sw_interrupt.sw_wr_ddr_align_en = dxva_cxt->pp.tiles_enabled_flag
868*437bfbebSnyanmisaka                                                ? 0 : 1;
869*437bfbebSnyanmisaka 
870*437bfbebSnyanmisaka     ///find s->rps_model[i] position, and set register
871*437bfbebSnyanmisaka     hw_regs->cabac_error_en = 0xfdfffffd;
872*437bfbebSnyanmisaka     hw_regs->rkv_reg_ends.extern_error_en = 0x30000000;
873*437bfbebSnyanmisaka 
874*437bfbebSnyanmisaka     valid_ref = hw_regs->sw_decout_base;
875*437bfbebSnyanmisaka     for (i = 0; i < (RK_S32)MPP_ARRAY_ELEMS(dxva_cxt->pp.RefPicList); i++) {
876*437bfbebSnyanmisaka         if (dxva_cxt->pp.RefPicList[i].bPicEntry != 0xff &&
877*437bfbebSnyanmisaka             dxva_cxt->pp.RefPicList[i].bPicEntry != 0x7f) {
878*437bfbebSnyanmisaka             hw_regs->sw_refer_poc[i] = dxva_cxt->pp.PicOrderCntValList[i];
879*437bfbebSnyanmisaka             mpp_buf_slot_get_prop(reg_ctx->slots,
880*437bfbebSnyanmisaka                                   dxva_cxt->pp.RefPicList[i].Index7Bits,
881*437bfbebSnyanmisaka                                   SLOT_BUFFER, &framebuf);
882*437bfbebSnyanmisaka             if (framebuf != NULL) {
883*437bfbebSnyanmisaka                 hw_regs->sw_refer_base[i] = mpp_buffer_get_fd(framebuf);
884*437bfbebSnyanmisaka                 valid_ref = hw_regs->sw_refer_base[i];
885*437bfbebSnyanmisaka             } else {
886*437bfbebSnyanmisaka                 hw_regs->sw_refer_base[i] = valid_ref;
887*437bfbebSnyanmisaka             }
888*437bfbebSnyanmisaka             sw_ref_valid          |=   (1 << i);
889*437bfbebSnyanmisaka         } else {
890*437bfbebSnyanmisaka             hw_regs->sw_refer_base[i] = hw_regs->sw_decout_base;
891*437bfbebSnyanmisaka         }
892*437bfbebSnyanmisaka     }
893*437bfbebSnyanmisaka 
894*437bfbebSnyanmisaka     if (sw_ref_valid) {
895*437bfbebSnyanmisaka         mpp_dev_set_reg_offset(reg_ctx->dev, 10, sw_ref_valid & 0xf);
896*437bfbebSnyanmisaka         mpp_dev_set_reg_offset(reg_ctx->dev, 11, ((sw_ref_valid >> 4) & 0xf));
897*437bfbebSnyanmisaka         mpp_dev_set_reg_offset(reg_ctx->dev, 12, ((sw_ref_valid >> 8) & 0xf));
898*437bfbebSnyanmisaka         mpp_dev_set_reg_offset(reg_ctx->dev, 13, ((sw_ref_valid >> 12) & 0xf));
899*437bfbebSnyanmisaka     }
900*437bfbebSnyanmisaka     mpp_buffer_sync_end(reg_ctx->scaling_list_data);
901*437bfbebSnyanmisaka     mpp_buffer_sync_end(reg_ctx->pps_data);
902*437bfbebSnyanmisaka     mpp_buffer_sync_end(reg_ctx->rps_data);
903*437bfbebSnyanmisaka 
904*437bfbebSnyanmisaka     return ret;
905*437bfbebSnyanmisaka }
906*437bfbebSnyanmisaka 
hal_h265d_rkv_start(void * hal,HalTaskInfo * task)907*437bfbebSnyanmisaka MPP_RET hal_h265d_rkv_start(void *hal, HalTaskInfo *task)
908*437bfbebSnyanmisaka {
909*437bfbebSnyanmisaka     MPP_RET ret = MPP_OK;
910*437bfbebSnyanmisaka     H265d_REGS_t *hw_regs = NULL;
911*437bfbebSnyanmisaka     HalH265dCtx *reg_ctx = (HalH265dCtx *)hal;
912*437bfbebSnyanmisaka     RK_S32 index =  task->dec.reg_index;
913*437bfbebSnyanmisaka 
914*437bfbebSnyanmisaka     RK_U32 i;
915*437bfbebSnyanmisaka 
916*437bfbebSnyanmisaka     if (task->dec.flags.parse_err ||
917*437bfbebSnyanmisaka         (task->dec.flags.ref_err && !reg_ctx->cfg->base.disable_error)) {
918*437bfbebSnyanmisaka         h265h_dbg(H265H_DBG_TASK_ERR, "%s found task error\n", __FUNCTION__);
919*437bfbebSnyanmisaka         return MPP_OK;
920*437bfbebSnyanmisaka     }
921*437bfbebSnyanmisaka 
922*437bfbebSnyanmisaka     if (reg_ctx->fast_mode) {
923*437bfbebSnyanmisaka         hw_regs = ( H265d_REGS_t *)reg_ctx->g_buf[index].hw_regs;
924*437bfbebSnyanmisaka     } else {
925*437bfbebSnyanmisaka         hw_regs = ( H265d_REGS_t *)reg_ctx->hw_regs;
926*437bfbebSnyanmisaka     }
927*437bfbebSnyanmisaka 
928*437bfbebSnyanmisaka     if (hw_regs == NULL) {
929*437bfbebSnyanmisaka         mpp_err("hal_h265d_start hw_regs is NULL");
930*437bfbebSnyanmisaka         return MPP_ERR_NULL_PTR;
931*437bfbebSnyanmisaka     }
932*437bfbebSnyanmisaka 
933*437bfbebSnyanmisaka     do {
934*437bfbebSnyanmisaka         MppDevRegWrCfg wr_cfg;
935*437bfbebSnyanmisaka         MppDevRegRdCfg rd_cfg;
936*437bfbebSnyanmisaka 
937*437bfbebSnyanmisaka         RK_U32 reg_size = (reg_ctx->is_v341 || reg_ctx->is_v345) ? V345_HEVC_REGISTERS :
938*437bfbebSnyanmisaka                           (reg_ctx->client_type == VPU_CLIENT_RKVDEC) ?
939*437bfbebSnyanmisaka                           RKVDEC_V1_REGISTERS : RKVDEC_HEVC_REGISTERS;
940*437bfbebSnyanmisaka 
941*437bfbebSnyanmisaka         reg_size *= sizeof(RK_U32);
942*437bfbebSnyanmisaka 
943*437bfbebSnyanmisaka         wr_cfg.reg = hw_regs;
944*437bfbebSnyanmisaka         wr_cfg.size = reg_size;
945*437bfbebSnyanmisaka         wr_cfg.offset = 0;
946*437bfbebSnyanmisaka 
947*437bfbebSnyanmisaka         if (hal_h265d_debug & H265H_DBG_REG) {
948*437bfbebSnyanmisaka             for (i = 0; i < reg_size / sizeof(RK_U32); i++)
949*437bfbebSnyanmisaka                 h265h_dbg(H265H_DBG_REG, "RK_HEVC_DEC: regs[%02d]=%08X\n", i, ((RK_U32 *)hw_regs)[i]);
950*437bfbebSnyanmisaka         }
951*437bfbebSnyanmisaka 
952*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_REG_WR, &wr_cfg);
953*437bfbebSnyanmisaka         if (ret) {
954*437bfbebSnyanmisaka             mpp_err_f("set register write failed %d\n", ret);
955*437bfbebSnyanmisaka             break;
956*437bfbebSnyanmisaka         }
957*437bfbebSnyanmisaka 
958*437bfbebSnyanmisaka         rd_cfg.reg = hw_regs;
959*437bfbebSnyanmisaka         rd_cfg.size = reg_size;
960*437bfbebSnyanmisaka         rd_cfg.offset = 0;
961*437bfbebSnyanmisaka 
962*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_REG_RD, &rd_cfg);
963*437bfbebSnyanmisaka         if (ret) {
964*437bfbebSnyanmisaka             mpp_err_f("set register read failed %d\n", ret);
965*437bfbebSnyanmisaka             break;
966*437bfbebSnyanmisaka         }
967*437bfbebSnyanmisaka 
968*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_CMD_SEND, NULL);
969*437bfbebSnyanmisaka         if (ret) {
970*437bfbebSnyanmisaka             mpp_err_f("send cmd failed %d\n", ret);
971*437bfbebSnyanmisaka             break;
972*437bfbebSnyanmisaka         }
973*437bfbebSnyanmisaka     } while (0);
974*437bfbebSnyanmisaka 
975*437bfbebSnyanmisaka     return ret;
976*437bfbebSnyanmisaka }
977*437bfbebSnyanmisaka 
hal_h265d_rkv_wait(void * hal,HalTaskInfo * task)978*437bfbebSnyanmisaka MPP_RET hal_h265d_rkv_wait(void *hal, HalTaskInfo *task)
979*437bfbebSnyanmisaka {
980*437bfbebSnyanmisaka     MPP_RET ret = MPP_OK;
981*437bfbebSnyanmisaka     RK_S32 index =  task->dec.reg_index;
982*437bfbebSnyanmisaka     HalH265dCtx *reg_ctx = (HalH265dCtx *)hal;
983*437bfbebSnyanmisaka     H265d_REGS_t *hw_regs = NULL;
984*437bfbebSnyanmisaka     RK_S32 i;
985*437bfbebSnyanmisaka 
986*437bfbebSnyanmisaka     if (reg_ctx->fast_mode) {
987*437bfbebSnyanmisaka         hw_regs = ( H265d_REGS_t *)reg_ctx->g_buf[index].hw_regs;
988*437bfbebSnyanmisaka     } else {
989*437bfbebSnyanmisaka         hw_regs = ( H265d_REGS_t *)reg_ctx->hw_regs;
990*437bfbebSnyanmisaka     }
991*437bfbebSnyanmisaka 
992*437bfbebSnyanmisaka     if (task->dec.flags.parse_err ||
993*437bfbebSnyanmisaka         (task->dec.flags.ref_err && !reg_ctx->cfg->base.disable_error)) {
994*437bfbebSnyanmisaka         h265h_dbg(H265H_DBG_TASK_ERR, "%s found task error\n", __FUNCTION__);
995*437bfbebSnyanmisaka         goto ERR_PROC;
996*437bfbebSnyanmisaka     }
997*437bfbebSnyanmisaka 
998*437bfbebSnyanmisaka     ret = mpp_dev_ioctl(reg_ctx->dev, MPP_DEV_CMD_POLL, NULL);
999*437bfbebSnyanmisaka     if (ret)
1000*437bfbebSnyanmisaka         mpp_err_f("poll cmd failed %d\n", ret);
1001*437bfbebSnyanmisaka 
1002*437bfbebSnyanmisaka ERR_PROC:
1003*437bfbebSnyanmisaka     if (task->dec.flags.parse_err ||
1004*437bfbebSnyanmisaka         task->dec.flags.ref_err ||
1005*437bfbebSnyanmisaka         hw_regs->sw_interrupt.sw_dec_error_sta ||
1006*437bfbebSnyanmisaka         hw_regs->sw_interrupt.sw_dec_timeout_sta ||
1007*437bfbebSnyanmisaka         hw_regs->sw_interrupt.sw_dec_empty_sta) {
1008*437bfbebSnyanmisaka         if (!reg_ctx->fast_mode) {
1009*437bfbebSnyanmisaka             if (reg_ctx->dec_cb)
1010*437bfbebSnyanmisaka                 mpp_callback(reg_ctx->dec_cb, &task->dec);
1011*437bfbebSnyanmisaka         } else {
1012*437bfbebSnyanmisaka             MppFrame mframe = NULL;
1013*437bfbebSnyanmisaka             mpp_buf_slot_get_prop(reg_ctx->slots, task->dec.output,
1014*437bfbebSnyanmisaka                                   SLOT_FRAME_PTR, &mframe);
1015*437bfbebSnyanmisaka             if (mframe) {
1016*437bfbebSnyanmisaka                 reg_ctx->fast_mode_err_found = 1;
1017*437bfbebSnyanmisaka                 mpp_frame_set_errinfo(mframe, 1);
1018*437bfbebSnyanmisaka             }
1019*437bfbebSnyanmisaka         }
1020*437bfbebSnyanmisaka     } else {
1021*437bfbebSnyanmisaka         if (reg_ctx->fast_mode && reg_ctx->fast_mode_err_found) {
1022*437bfbebSnyanmisaka             for (i = 0; i < (RK_S32)MPP_ARRAY_ELEMS(task->dec.refer); i++) {
1023*437bfbebSnyanmisaka                 if (task->dec.refer[i] >= 0) {
1024*437bfbebSnyanmisaka                     MppFrame frame_ref = NULL;
1025*437bfbebSnyanmisaka 
1026*437bfbebSnyanmisaka                     mpp_buf_slot_get_prop(reg_ctx->slots, task->dec.refer[i],
1027*437bfbebSnyanmisaka                                           SLOT_FRAME_PTR, &frame_ref);
1028*437bfbebSnyanmisaka                     h265h_dbg(H265H_DBG_FAST_ERR, "refer[%d] %d frame %p\n",
1029*437bfbebSnyanmisaka                               i, task->dec.refer[i], frame_ref);
1030*437bfbebSnyanmisaka                     if (frame_ref && mpp_frame_get_errinfo(frame_ref)) {
1031*437bfbebSnyanmisaka                         MppFrame frame_out = NULL;
1032*437bfbebSnyanmisaka                         mpp_buf_slot_get_prop(reg_ctx->slots, task->dec.output,
1033*437bfbebSnyanmisaka                                               SLOT_FRAME_PTR, &frame_out);
1034*437bfbebSnyanmisaka                         mpp_frame_set_errinfo(frame_out, 1);
1035*437bfbebSnyanmisaka                         break;
1036*437bfbebSnyanmisaka                     }
1037*437bfbebSnyanmisaka                 }
1038*437bfbebSnyanmisaka             }
1039*437bfbebSnyanmisaka         }
1040*437bfbebSnyanmisaka     }
1041*437bfbebSnyanmisaka 
1042*437bfbebSnyanmisaka     if (hal_h265d_debug & H265H_DBG_REG) {
1043*437bfbebSnyanmisaka         h265h_dbg(H265H_DBG_REG, "RK_HEVC_DEC: regs[1]=0x%08X, regs[45]=0x%08x\n", ((RK_U32 *)hw_regs)[1], ((RK_U32 *)hw_regs)[45]);
1044*437bfbebSnyanmisaka     }
1045*437bfbebSnyanmisaka 
1046*437bfbebSnyanmisaka     if (reg_ctx->fast_mode) {
1047*437bfbebSnyanmisaka         reg_ctx->g_buf[index].use_flag = 0;
1048*437bfbebSnyanmisaka     }
1049*437bfbebSnyanmisaka 
1050*437bfbebSnyanmisaka     return ret;
1051*437bfbebSnyanmisaka }
1052*437bfbebSnyanmisaka 
hal_h265d_rkv_reset(void * hal)1053*437bfbebSnyanmisaka MPP_RET hal_h265d_rkv_reset(void *hal)
1054*437bfbebSnyanmisaka {
1055*437bfbebSnyanmisaka     MPP_RET ret = MPP_OK;
1056*437bfbebSnyanmisaka     HalH265dCtx *p_hal = (HalH265dCtx *)hal;
1057*437bfbebSnyanmisaka 
1058*437bfbebSnyanmisaka     p_hal->fast_mode_err_found = 0;
1059*437bfbebSnyanmisaka 
1060*437bfbebSnyanmisaka     return ret;
1061*437bfbebSnyanmisaka }
1062*437bfbebSnyanmisaka 
1063*437bfbebSnyanmisaka const MppHalApi hal_h265d_rkv = {
1064*437bfbebSnyanmisaka     .name = "h265d_rkdec",
1065*437bfbebSnyanmisaka     .type = MPP_CTX_DEC,
1066*437bfbebSnyanmisaka     .coding = MPP_VIDEO_CodingHEVC,
1067*437bfbebSnyanmisaka     .ctx_size = sizeof(HalH265dCtx),
1068*437bfbebSnyanmisaka     .flag = 0,
1069*437bfbebSnyanmisaka     .init = hal_h265d_rkv_init,
1070*437bfbebSnyanmisaka     .deinit = hal_h265d_rkv_deinit,
1071*437bfbebSnyanmisaka     .reg_gen = hal_h265d_rkv_gen_regs,
1072*437bfbebSnyanmisaka     .start = hal_h265d_rkv_start,
1073*437bfbebSnyanmisaka     .wait = hal_h265d_rkv_wait,
1074*437bfbebSnyanmisaka     .reset = hal_h265d_rkv_reset,
1075*437bfbebSnyanmisaka     .flush = NULL,
1076*437bfbebSnyanmisaka     .control = NULL,
1077*437bfbebSnyanmisaka };
1078