xref: /rockchip-linux_mpp/mpp/hal/rkdec/avs2d/hal_avs2d_vdpu383.c (revision 437bfbeb9567cca9cd9080e3f6954aa9d6a94f18)
1*437bfbebSnyanmisaka /* SPDX-License-Identifier: Apache-2.0 OR MIT */
2*437bfbebSnyanmisaka /*
3*437bfbebSnyanmisaka  * Copyright (c) 2024 Rockchip Electronics Co., Ltd.
4*437bfbebSnyanmisaka  */
5*437bfbebSnyanmisaka 
6*437bfbebSnyanmisaka #define MODULE_TAG "hal_avs2d_vdpu383"
7*437bfbebSnyanmisaka 
8*437bfbebSnyanmisaka #include <string.h>
9*437bfbebSnyanmisaka #include <stdio.h>
10*437bfbebSnyanmisaka 
11*437bfbebSnyanmisaka #include "mpp_env.h"
12*437bfbebSnyanmisaka #include "mpp_log.h"
13*437bfbebSnyanmisaka #include "mpp_mem.h"
14*437bfbebSnyanmisaka #include "mpp_common.h"
15*437bfbebSnyanmisaka #include "mpp_debug.h"
16*437bfbebSnyanmisaka #include "mpp_bitput.h"
17*437bfbebSnyanmisaka #include "mpp_buffer_impl.h"
18*437bfbebSnyanmisaka 
19*437bfbebSnyanmisaka #include "avs2d_syntax.h"
20*437bfbebSnyanmisaka #include "vdpu383_com.h"
21*437bfbebSnyanmisaka #include "vdpu383_avs2d.h"
22*437bfbebSnyanmisaka #include "hal_avs2d_global.h"
23*437bfbebSnyanmisaka #include "hal_avs2d_vdpu383.h"
24*437bfbebSnyanmisaka #include "mpp_dec_cb_param.h"
25*437bfbebSnyanmisaka 
26*437bfbebSnyanmisaka #define VDPU383_FAST_REG_SET_CNT    (3)
27*437bfbebSnyanmisaka #define MAX_REF_NUM                 (8)
28*437bfbebSnyanmisaka #define AVS2_383_SHPH_SIZE          (208)            /* bytes */
29*437bfbebSnyanmisaka #define AVS2_383_SCALIST_SIZE       (80)             /* bytes */
30*437bfbebSnyanmisaka #define VDPU34x_TOTAL_REG_CNT       (278)
31*437bfbebSnyanmisaka 
32*437bfbebSnyanmisaka #define AVS2_383_SHPH_ALIGNED_SIZE          (MPP_ALIGN(AVS2_383_SHPH_SIZE, SZ_4K))
33*437bfbebSnyanmisaka #define AVS2_383_SCALIST_ALIGNED_SIZE       (MPP_ALIGN(AVS2_383_SCALIST_SIZE, SZ_4K))
34*437bfbebSnyanmisaka #define AVS2_383_STREAM_INFO_SET_SIZE       (AVS2_383_SHPH_ALIGNED_SIZE + \
35*437bfbebSnyanmisaka                                             AVS2_383_SCALIST_ALIGNED_SIZE)
36*437bfbebSnyanmisaka #define AVS2_ALL_TBL_BUF_SIZE(cnt)          (AVS2_383_STREAM_INFO_SET_SIZE * (cnt))
37*437bfbebSnyanmisaka #define AVS2_SHPH_OFFSET(pos)               (AVS2_383_STREAM_INFO_SET_SIZE * (pos))
38*437bfbebSnyanmisaka #define AVS2_SCALIST_OFFSET(pos)            (AVS2_SHPH_OFFSET(pos) + AVS2_383_SHPH_ALIGNED_SIZE)
39*437bfbebSnyanmisaka 
40*437bfbebSnyanmisaka #define COLMV_COMPRESS_EN       (1)
41*437bfbebSnyanmisaka #define COLMV_BLOCK_SIZE        (16)
42*437bfbebSnyanmisaka #define COLMV_BYTES             (16)
43*437bfbebSnyanmisaka 
44*437bfbebSnyanmisaka typedef struct avs2d_buf_t {
45*437bfbebSnyanmisaka     RK_U32                  valid;
46*437bfbebSnyanmisaka     RK_U32                  offset_shph;
47*437bfbebSnyanmisaka     RK_U32                  offset_sclst;
48*437bfbebSnyanmisaka     Vdpu383Avs2dRegSet      *regs;
49*437bfbebSnyanmisaka } Avs2dRkvBuf_t;
50*437bfbebSnyanmisaka 
51*437bfbebSnyanmisaka typedef struct avs2d_reg_ctx_t {
52*437bfbebSnyanmisaka     Avs2dRkvBuf_t           reg_buf[VDPU383_FAST_REG_SET_CNT];
53*437bfbebSnyanmisaka 
54*437bfbebSnyanmisaka     RK_U32                  shph_offset;
55*437bfbebSnyanmisaka     RK_U32                  sclst_offset;
56*437bfbebSnyanmisaka 
57*437bfbebSnyanmisaka     Vdpu383Avs2dRegSet      *regs;
58*437bfbebSnyanmisaka 
59*437bfbebSnyanmisaka     RK_U8                   shph_dat[AVS2_383_SHPH_SIZE];
60*437bfbebSnyanmisaka     RK_U8                   scalist_dat[AVS2_383_SCALIST_SIZE];
61*437bfbebSnyanmisaka 
62*437bfbebSnyanmisaka     MppBuffer               bufs;
63*437bfbebSnyanmisaka     RK_S32                  bufs_fd;
64*437bfbebSnyanmisaka     void                    *bufs_ptr;
65*437bfbebSnyanmisaka 
66*437bfbebSnyanmisaka     MppBuffer               rcb_buf[VDPU383_FAST_REG_SET_CNT];
67*437bfbebSnyanmisaka     RK_S32                  rcb_buf_size;
68*437bfbebSnyanmisaka     Vdpu383RcbInfo          rcb_info[RCB_BUF_COUNT];
69*437bfbebSnyanmisaka     RK_U32                  reg_out[VDPU34x_TOTAL_REG_CNT];
70*437bfbebSnyanmisaka 
71*437bfbebSnyanmisaka } Avs2dRkvRegCtx_t;
72*437bfbebSnyanmisaka 
73*437bfbebSnyanmisaka MPP_RET hal_avs2d_vdpu383_deinit(void *hal);
avs2d_ver_align(RK_U32 val)74*437bfbebSnyanmisaka static RK_U32 avs2d_ver_align(RK_U32 val)
75*437bfbebSnyanmisaka {
76*437bfbebSnyanmisaka     return MPP_ALIGN(val, 16);
77*437bfbebSnyanmisaka }
78*437bfbebSnyanmisaka 
avs2d_len_align(RK_U32 val)79*437bfbebSnyanmisaka static RK_U32 avs2d_len_align(RK_U32 val)
80*437bfbebSnyanmisaka {
81*437bfbebSnyanmisaka     return (2 * MPP_ALIGN(val, 16));
82*437bfbebSnyanmisaka }
83*437bfbebSnyanmisaka 
prepare_header(Avs2dHalCtx_t * p_hal,RK_U8 * data,RK_U32 len)84*437bfbebSnyanmisaka static MPP_RET prepare_header(Avs2dHalCtx_t *p_hal, RK_U8 *data, RK_U32 len)
85*437bfbebSnyanmisaka {
86*437bfbebSnyanmisaka     RK_U32 i, j;
87*437bfbebSnyanmisaka     BitputCtx_t bp;
88*437bfbebSnyanmisaka     RK_U64 *bit_buf = (RK_U64 *)data;
89*437bfbebSnyanmisaka     Avs2dSyntax_t *syntax = &p_hal->syntax;
90*437bfbebSnyanmisaka     PicParams_Avs2d *pp   = &syntax->pp;
91*437bfbebSnyanmisaka     AlfParams_Avs2d *alfp = &syntax->alfp;
92*437bfbebSnyanmisaka     RefParams_Avs2d *refp = &syntax->refp;
93*437bfbebSnyanmisaka     WqmParams_Avs2d *wqmp = &syntax->wqmp;
94*437bfbebSnyanmisaka 
95*437bfbebSnyanmisaka     memset(data, 0, len);
96*437bfbebSnyanmisaka 
97*437bfbebSnyanmisaka     mpp_set_bitput_ctx(&bp, bit_buf, len);
98*437bfbebSnyanmisaka 
99*437bfbebSnyanmisaka     //!< sequence header syntax
100*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->chroma_format_idc, 2);
101*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->pic_width_in_luma_samples, 16);
102*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->pic_height_in_luma_samples, 16);
103*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->bit_depth_luma_minus8, 3);
104*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->bit_depth_chroma_minus8, 3);
105*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->lcu_size, 3);
106*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->progressive_sequence, 1);
107*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->field_coded_sequence, 1);
108*437bfbebSnyanmisaka 
109*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->secondary_transform_enable_flag, 1);
110*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->sample_adaptive_offset_enable_flag, 1);
111*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->adaptive_loop_filter_enable_flag, 1);
112*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->pmvr_enable_flag, 1);
113*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->cross_slice_loopfilter_enable_flag, 1);
114*437bfbebSnyanmisaka 
115*437bfbebSnyanmisaka     //!< picture header syntax
116*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->picture_type, 3);
117*437bfbebSnyanmisaka     mpp_put_bits(&bp, refp->ref_pic_num, 3);
118*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->scene_reference_enable_flag, 1);
119*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->bottom_field_picture_flag, 1);
120*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->fixed_picture_qp, 1);
121*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->picture_qp, 7);
122*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->loop_filter_disable_flag, 1);
123*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->alpha_c_offset, 5);
124*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->beta_offset, 5);
125*437bfbebSnyanmisaka 
126*437bfbebSnyanmisaka     //!< weight quant param
127*437bfbebSnyanmisaka     mpp_put_bits(&bp, wqmp->chroma_quant_param_delta_cb, 6);
128*437bfbebSnyanmisaka     mpp_put_bits(&bp, wqmp->chroma_quant_param_delta_cr, 6);
129*437bfbebSnyanmisaka     mpp_put_bits(&bp, wqmp->pic_weight_quant_enable_flag, 1);
130*437bfbebSnyanmisaka 
131*437bfbebSnyanmisaka     //!< alf param
132*437bfbebSnyanmisaka     mpp_put_bits(&bp, alfp->enable_pic_alf_y, 1);
133*437bfbebSnyanmisaka     mpp_put_bits(&bp, alfp->enable_pic_alf_cb, 1);
134*437bfbebSnyanmisaka     mpp_put_bits(&bp, alfp->enable_pic_alf_cr, 1);
135*437bfbebSnyanmisaka 
136*437bfbebSnyanmisaka     mpp_put_bits(&bp, alfp->alf_filter_num_minus1, 4);
137*437bfbebSnyanmisaka     for (i = 0; i < 16; i++)
138*437bfbebSnyanmisaka         mpp_put_bits(&bp, alfp->alf_coeff_idx_tab[i], 4);
139*437bfbebSnyanmisaka 
140*437bfbebSnyanmisaka     for (i = 0; i < 16; i++)
141*437bfbebSnyanmisaka         for (j = 0; j < 9; j++)
142*437bfbebSnyanmisaka             mpp_put_bits(&bp, alfp->alf_coeff_y[i][j], 7);
143*437bfbebSnyanmisaka 
144*437bfbebSnyanmisaka     for (j = 0; j < 9; j++)
145*437bfbebSnyanmisaka         mpp_put_bits(&bp, alfp->alf_coeff_cb[j], 7);
146*437bfbebSnyanmisaka 
147*437bfbebSnyanmisaka     for (j = 0; j < 9; j++)
148*437bfbebSnyanmisaka         mpp_put_bits(&bp, alfp->alf_coeff_cr[j], 7);
149*437bfbebSnyanmisaka 
150*437bfbebSnyanmisaka     /* other flags */
151*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->multi_hypothesis_skip_enable_flag, 1);
152*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->dual_hypothesis_prediction_enable_flag, 1);
153*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->weighted_skip_enable_flag, 1);
154*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->asymmetrc_motion_partitions_enable_flag, 1);
155*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->nonsquare_quadtree_transform_enable_flag, 1);
156*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->nonsquare_intra_prediction_enable_flag, 1);
157*437bfbebSnyanmisaka 
158*437bfbebSnyanmisaka     //!< picture reference params
159*437bfbebSnyanmisaka     mpp_put_bits(&bp, pp->cur_poc, 32);
160*437bfbebSnyanmisaka     for (i = 0; i < 8; i++)
161*437bfbebSnyanmisaka         mpp_put_bits(&bp, (i < refp->ref_pic_num) ? refp->ref_poc_list[i] : 0, 32);
162*437bfbebSnyanmisaka     for (i = 0; i < 8; i++)
163*437bfbebSnyanmisaka         mpp_put_bits(&bp, (i < refp->ref_pic_num) ? pp->field_coded_sequence : 0, 1);
164*437bfbebSnyanmisaka     for (i = 0; i < 8; i++)
165*437bfbebSnyanmisaka         mpp_put_bits(&bp, (i < refp->ref_pic_num) ? pp->bottom_field_picture_flag : 0, 1);
166*437bfbebSnyanmisaka     for (i = 0; i < 8; i++)
167*437bfbebSnyanmisaka         mpp_put_bits(&bp, (i < refp->ref_pic_num), 1);
168*437bfbebSnyanmisaka 
169*437bfbebSnyanmisaka     return MPP_OK;
170*437bfbebSnyanmisaka }
171*437bfbebSnyanmisaka 
prepare_scalist(Avs2dHalCtx_t * p_hal,RK_U8 * data,RK_U32 len)172*437bfbebSnyanmisaka static MPP_RET prepare_scalist(Avs2dHalCtx_t *p_hal, RK_U8 *data, RK_U32 len)
173*437bfbebSnyanmisaka {
174*437bfbebSnyanmisaka     Avs2dSyntax_t *syntax = &p_hal->syntax;
175*437bfbebSnyanmisaka     WqmParams_Avs2d *wqmp = &syntax->wqmp;
176*437bfbebSnyanmisaka     RK_U32 i = 0;
177*437bfbebSnyanmisaka     RK_U32 n = 0;
178*437bfbebSnyanmisaka 
179*437bfbebSnyanmisaka     if (!wqmp->pic_weight_quant_enable_flag)
180*437bfbebSnyanmisaka         return MPP_OK;
181*437bfbebSnyanmisaka 
182*437bfbebSnyanmisaka     memset(data, 0, len);
183*437bfbebSnyanmisaka 
184*437bfbebSnyanmisaka     /* dump by block4x4, vectial direction */
185*437bfbebSnyanmisaka     for (i = 0; i < 4; i++) {
186*437bfbebSnyanmisaka         data[n++] = wqmp->wq_matrix[0][i + 0];
187*437bfbebSnyanmisaka         data[n++] = wqmp->wq_matrix[0][i + 4];
188*437bfbebSnyanmisaka         data[n++] = wqmp->wq_matrix[0][i + 8];
189*437bfbebSnyanmisaka         data[n++] = wqmp->wq_matrix[0][i + 12];
190*437bfbebSnyanmisaka     }
191*437bfbebSnyanmisaka 
192*437bfbebSnyanmisaka     /* block8x8 */
193*437bfbebSnyanmisaka     {
194*437bfbebSnyanmisaka         RK_S32 blk4_x = 0, blk4_y = 0;
195*437bfbebSnyanmisaka 
196*437bfbebSnyanmisaka         /* dump by block4x4, vectial direction */
197*437bfbebSnyanmisaka         for (blk4_x = 0; blk4_x < 8; blk4_x += 4) {
198*437bfbebSnyanmisaka             for (blk4_y = 0; blk4_y < 8; blk4_y += 4) {
199*437bfbebSnyanmisaka                 RK_S32 pos = blk4_y * 8 + blk4_x;
200*437bfbebSnyanmisaka 
201*437bfbebSnyanmisaka                 for (i = 0; i < 4; i++) {
202*437bfbebSnyanmisaka                     data[n++] = wqmp->wq_matrix[1][pos + i + 0];
203*437bfbebSnyanmisaka                     data[n++] = wqmp->wq_matrix[1][pos + i + 8];
204*437bfbebSnyanmisaka                     data[n++] = wqmp->wq_matrix[1][pos + i + 16];
205*437bfbebSnyanmisaka                     data[n++] = wqmp->wq_matrix[1][pos + i + 24];
206*437bfbebSnyanmisaka                 }
207*437bfbebSnyanmisaka             }
208*437bfbebSnyanmisaka         }
209*437bfbebSnyanmisaka     }
210*437bfbebSnyanmisaka 
211*437bfbebSnyanmisaka     return MPP_OK;
212*437bfbebSnyanmisaka }
213*437bfbebSnyanmisaka 
get_frame_fd(Avs2dHalCtx_t * p_hal,RK_S32 idx)214*437bfbebSnyanmisaka static RK_S32 get_frame_fd(Avs2dHalCtx_t *p_hal, RK_S32 idx)
215*437bfbebSnyanmisaka {
216*437bfbebSnyanmisaka     RK_S32 ret_fd = 0;
217*437bfbebSnyanmisaka     MppBuffer mbuffer = NULL;
218*437bfbebSnyanmisaka 
219*437bfbebSnyanmisaka     mpp_buf_slot_get_prop(p_hal->frame_slots, idx, SLOT_BUFFER, &mbuffer);
220*437bfbebSnyanmisaka     ret_fd = mpp_buffer_get_fd(mbuffer);
221*437bfbebSnyanmisaka 
222*437bfbebSnyanmisaka     return ret_fd;
223*437bfbebSnyanmisaka }
224*437bfbebSnyanmisaka 
get_packet_fd(Avs2dHalCtx_t * p_hal,RK_S32 idx)225*437bfbebSnyanmisaka static RK_S32 get_packet_fd(Avs2dHalCtx_t *p_hal, RK_S32 idx)
226*437bfbebSnyanmisaka {
227*437bfbebSnyanmisaka     RK_S32 ret_fd = 0;
228*437bfbebSnyanmisaka     MppBuffer mbuffer = NULL;
229*437bfbebSnyanmisaka 
230*437bfbebSnyanmisaka     mpp_buf_slot_get_prop(p_hal->packet_slots, idx, SLOT_BUFFER, &mbuffer);
231*437bfbebSnyanmisaka     ret_fd =  mpp_buffer_get_fd(mbuffer);
232*437bfbebSnyanmisaka 
233*437bfbebSnyanmisaka     return ret_fd;
234*437bfbebSnyanmisaka }
235*437bfbebSnyanmisaka 
init_ctrl_regs(Vdpu383Avs2dRegSet * regs)236*437bfbebSnyanmisaka static void init_ctrl_regs(Vdpu383Avs2dRegSet *regs)
237*437bfbebSnyanmisaka {
238*437bfbebSnyanmisaka     Vdpu383CtrlReg *ctrl_regs = &regs->ctrl_regs;
239*437bfbebSnyanmisaka 
240*437bfbebSnyanmisaka     ctrl_regs->reg8_dec_mode = 3;  // AVS2
241*437bfbebSnyanmisaka     ctrl_regs->reg9.buf_empty_en = 1;
242*437bfbebSnyanmisaka 
243*437bfbebSnyanmisaka     ctrl_regs->reg10.strmd_auto_gating_e      = 1;
244*437bfbebSnyanmisaka     ctrl_regs->reg10.inter_auto_gating_e      = 1;
245*437bfbebSnyanmisaka     ctrl_regs->reg10.intra_auto_gating_e      = 1;
246*437bfbebSnyanmisaka     ctrl_regs->reg10.transd_auto_gating_e     = 1;
247*437bfbebSnyanmisaka     ctrl_regs->reg10.recon_auto_gating_e      = 1;
248*437bfbebSnyanmisaka     ctrl_regs->reg10.filterd_auto_gating_e    = 1;
249*437bfbebSnyanmisaka     ctrl_regs->reg10.bus_auto_gating_e        = 1;
250*437bfbebSnyanmisaka     ctrl_regs->reg10.ctrl_auto_gating_e       = 1;
251*437bfbebSnyanmisaka     ctrl_regs->reg10.rcb_auto_gating_e        = 1;
252*437bfbebSnyanmisaka     ctrl_regs->reg10.err_prc_auto_gating_e    = 1;
253*437bfbebSnyanmisaka 
254*437bfbebSnyanmisaka     ctrl_regs->reg13_core_timeout_threshold = 0xffffff;
255*437bfbebSnyanmisaka 
256*437bfbebSnyanmisaka     ctrl_regs->reg16.error_proc_disable = 1;
257*437bfbebSnyanmisaka     ctrl_regs->reg16.error_spread_disable = 0;
258*437bfbebSnyanmisaka     ctrl_regs->reg16.roi_error_ctu_cal_en = 0;
259*437bfbebSnyanmisaka 
260*437bfbebSnyanmisaka     ctrl_regs->reg20_cabac_error_en_lowbits = 0xffffffff;
261*437bfbebSnyanmisaka     ctrl_regs->reg21_cabac_error_en_highbits = 0x3fffffff;
262*437bfbebSnyanmisaka 
263*437bfbebSnyanmisaka     /* performance */
264*437bfbebSnyanmisaka     ctrl_regs->reg28.axi_perf_work_e = 1;
265*437bfbebSnyanmisaka     ctrl_regs->reg28.axi_cnt_type = 1;
266*437bfbebSnyanmisaka     ctrl_regs->reg28.rd_latency_id = 0xb;
267*437bfbebSnyanmisaka     ctrl_regs->reg28.rd_latency_thr = 0;
268*437bfbebSnyanmisaka 
269*437bfbebSnyanmisaka     ctrl_regs->reg29.addr_align_type = 2;
270*437bfbebSnyanmisaka     ctrl_regs->reg29.ar_cnt_id_type = 0;
271*437bfbebSnyanmisaka     ctrl_regs->reg29.aw_cnt_id_type = 0;
272*437bfbebSnyanmisaka     ctrl_regs->reg29.ar_count_id = 0xa;
273*437bfbebSnyanmisaka     ctrl_regs->reg29.aw_count_id = 0;
274*437bfbebSnyanmisaka     ctrl_regs->reg29.rd_band_width_mode = 0;
275*437bfbebSnyanmisaka }
276*437bfbebSnyanmisaka 
avs2d_refine_rcb_size(Vdpu383RcbInfo * rcb_info,RK_S32 width,RK_S32 height,void * dxva)277*437bfbebSnyanmisaka static void avs2d_refine_rcb_size(Vdpu383RcbInfo *rcb_info,
278*437bfbebSnyanmisaka                                   RK_S32 width, RK_S32 height, void *dxva)
279*437bfbebSnyanmisaka {
280*437bfbebSnyanmisaka     (void) height;
281*437bfbebSnyanmisaka     Avs2dSyntax_t *syntax = dxva;
282*437bfbebSnyanmisaka     RK_U8 ctu_size = 1 << syntax->pp.lcu_size;
283*437bfbebSnyanmisaka     RK_U8 bit_depth = syntax->pp.bit_depth_chroma_minus8 + 8;
284*437bfbebSnyanmisaka     RK_U32 rcb_bits = 0;
285*437bfbebSnyanmisaka     RK_U32 filterd_row_append = 8192;
286*437bfbebSnyanmisaka 
287*437bfbebSnyanmisaka     width = MPP_ALIGN(width, ctu_size);
288*437bfbebSnyanmisaka 
289*437bfbebSnyanmisaka     /* RCB_STRMD_ROW && RCB_STRMD_TILE_ROW*/
290*437bfbebSnyanmisaka     if (width > 8192)
291*437bfbebSnyanmisaka         rcb_bits = ((width + 63) / 64) * 112;
292*437bfbebSnyanmisaka     else
293*437bfbebSnyanmisaka         rcb_bits = 0;
294*437bfbebSnyanmisaka     rcb_info[RCB_STRMD_ROW].size = MPP_RCB_BYTES(rcb_bits);
295*437bfbebSnyanmisaka     rcb_info[RCB_STRMD_TILE_ROW].size = 0;
296*437bfbebSnyanmisaka 
297*437bfbebSnyanmisaka     /* RCB_INTER_ROW && RCB_INTER_TILE_ROW*/
298*437bfbebSnyanmisaka     rcb_bits = ((width + 7) / 8) * 166;
299*437bfbebSnyanmisaka     rcb_info[RCB_INTER_ROW].size = MPP_RCB_BYTES(rcb_bits);
300*437bfbebSnyanmisaka     rcb_info[RCB_INTER_TILE_ROW].size = 0;
301*437bfbebSnyanmisaka 
302*437bfbebSnyanmisaka     /* RCB_INTRA_ROW && RCB_INTRA_TILE_ROW*/
303*437bfbebSnyanmisaka     rcb_bits = MPP_ALIGN(width, 512) * (bit_depth + 2);
304*437bfbebSnyanmisaka     rcb_bits = rcb_bits * 3; //TODO:
305*437bfbebSnyanmisaka     rcb_info[RCB_INTRA_ROW].size = MPP_RCB_BYTES(rcb_bits);
306*437bfbebSnyanmisaka     rcb_info[RCB_INTRA_TILE_ROW].size = 0;
307*437bfbebSnyanmisaka 
308*437bfbebSnyanmisaka     /* RCB_FILTERD_ROW && RCB_FILTERD_TILE_ROW*/
309*437bfbebSnyanmisaka     if (width > 4096)
310*437bfbebSnyanmisaka         filterd_row_append = 27648;
311*437bfbebSnyanmisaka     rcb_bits = MPP_ALIGN(width, 64) * (30 * bit_depth + 9);
312*437bfbebSnyanmisaka     rcb_info[RCB_FILTERD_ROW].size = filterd_row_append + MPP_RCB_BYTES(rcb_bits / 2);
313*437bfbebSnyanmisaka     rcb_info[RCB_FILTERD_PROTECT_ROW].size = filterd_row_append + MPP_RCB_BYTES(rcb_bits / 2);
314*437bfbebSnyanmisaka     rcb_info[RCB_FILTERD_TILE_ROW].size = 0;
315*437bfbebSnyanmisaka 
316*437bfbebSnyanmisaka     /* RCB_FILTERD_TILE_COL */
317*437bfbebSnyanmisaka     rcb_info[RCB_FILTERD_TILE_COL].size = 0;
318*437bfbebSnyanmisaka }
319*437bfbebSnyanmisaka 
hal_avs2d_rcb_info_update(void * hal,Vdpu383Avs2dRegSet * regs)320*437bfbebSnyanmisaka static void hal_avs2d_rcb_info_update(void *hal, Vdpu383Avs2dRegSet *regs)
321*437bfbebSnyanmisaka {
322*437bfbebSnyanmisaka     MPP_RET ret = MPP_OK;
323*437bfbebSnyanmisaka     Avs2dHalCtx_t *p_hal = (Avs2dHalCtx_t *)hal;
324*437bfbebSnyanmisaka     Avs2dRkvRegCtx_t *reg_ctx = (Avs2dRkvRegCtx_t *)p_hal->reg_ctx;
325*437bfbebSnyanmisaka     RK_S32 width = p_hal->syntax.pp.pic_width_in_luma_samples;
326*437bfbebSnyanmisaka     RK_S32 height = p_hal->syntax.pp.pic_height_in_luma_samples;
327*437bfbebSnyanmisaka     RK_S32 i = 0;
328*437bfbebSnyanmisaka     RK_S32 loop = p_hal->fast_mode ? MPP_ARRAY_ELEMS(reg_ctx->reg_buf) : 1;
329*437bfbebSnyanmisaka 
330*437bfbebSnyanmisaka     (void) regs;
331*437bfbebSnyanmisaka 
332*437bfbebSnyanmisaka     reg_ctx->rcb_buf_size = vdpu383_get_rcb_buf_size(reg_ctx->rcb_info, width, height);
333*437bfbebSnyanmisaka     avs2d_refine_rcb_size(reg_ctx->rcb_info, width, height, (void *)&p_hal->syntax);
334*437bfbebSnyanmisaka 
335*437bfbebSnyanmisaka     for (i = 0; i < loop; i++) {
336*437bfbebSnyanmisaka         MppBuffer rcb_buf = NULL;
337*437bfbebSnyanmisaka 
338*437bfbebSnyanmisaka         if (reg_ctx->rcb_buf[i]) {
339*437bfbebSnyanmisaka             mpp_buffer_put(reg_ctx->rcb_buf[i]);
340*437bfbebSnyanmisaka             reg_ctx->rcb_buf[i] = NULL;
341*437bfbebSnyanmisaka         }
342*437bfbebSnyanmisaka 
343*437bfbebSnyanmisaka         ret = mpp_buffer_get(p_hal->buf_group, &rcb_buf, reg_ctx->rcb_buf_size);
344*437bfbebSnyanmisaka         if (ret)
345*437bfbebSnyanmisaka             mpp_err_f("AVS2D mpp_buffer_group_get failed\n");
346*437bfbebSnyanmisaka 
347*437bfbebSnyanmisaka         reg_ctx->rcb_buf[i] = rcb_buf;
348*437bfbebSnyanmisaka     }
349*437bfbebSnyanmisaka }
350*437bfbebSnyanmisaka 
fill_registers(Avs2dHalCtx_t * p_hal,Vdpu383Avs2dRegSet * regs,HalTaskInfo * task)351*437bfbebSnyanmisaka static MPP_RET fill_registers(Avs2dHalCtx_t *p_hal, Vdpu383Avs2dRegSet *regs, HalTaskInfo *task)
352*437bfbebSnyanmisaka {
353*437bfbebSnyanmisaka     MPP_RET ret = MPP_OK;
354*437bfbebSnyanmisaka     RK_U32 i;
355*437bfbebSnyanmisaka     MppFrame mframe = NULL;
356*437bfbebSnyanmisaka     Avs2dSyntax_t *syntax = &p_hal->syntax;
357*437bfbebSnyanmisaka     RefParams_Avs2d *refp = &syntax->refp;
358*437bfbebSnyanmisaka     HalDecTask *task_dec  = &task->dec;
359*437bfbebSnyanmisaka 
360*437bfbebSnyanmisaka     RK_U32 is_fbc = 0;
361*437bfbebSnyanmisaka     RK_U32 is_tile = 0;
362*437bfbebSnyanmisaka     HalBuf *mv_buf = NULL;
363*437bfbebSnyanmisaka 
364*437bfbebSnyanmisaka     mpp_buf_slot_get_prop(p_hal->frame_slots, task_dec->output, SLOT_FRAME_PTR, &mframe);
365*437bfbebSnyanmisaka     is_fbc = MPP_FRAME_FMT_IS_FBC(mpp_frame_get_fmt(mframe));
366*437bfbebSnyanmisaka     is_tile = MPP_FRAME_FMT_IS_TILE(mpp_frame_get_fmt(mframe));
367*437bfbebSnyanmisaka 
368*437bfbebSnyanmisaka     //!< caculate the yuv_frame_size
369*437bfbebSnyanmisaka     {
370*437bfbebSnyanmisaka         RK_U32 hor_virstride = 0;
371*437bfbebSnyanmisaka         RK_U32 ver_virstride = 0;
372*437bfbebSnyanmisaka         RK_U32 y_virstride = 0;
373*437bfbebSnyanmisaka         RK_U32 uv_virstride = 0;
374*437bfbebSnyanmisaka 
375*437bfbebSnyanmisaka         hor_virstride = mpp_frame_get_hor_stride(mframe);
376*437bfbebSnyanmisaka         ver_virstride = mpp_frame_get_ver_stride(mframe);
377*437bfbebSnyanmisaka         y_virstride = hor_virstride * ver_virstride;
378*437bfbebSnyanmisaka         uv_virstride = hor_virstride * ver_virstride / 2;
379*437bfbebSnyanmisaka         AVS2D_HAL_TRACE("is_fbc %d y_virstride %d, hor_virstride %d, ver_virstride %d\n",
380*437bfbebSnyanmisaka                         is_fbc, y_virstride, hor_virstride, ver_virstride);
381*437bfbebSnyanmisaka 
382*437bfbebSnyanmisaka         if (is_fbc) {
383*437bfbebSnyanmisaka             RK_U32 fbc_hdr_stride = mpp_frame_get_fbc_hdr_stride(mframe);
384*437bfbebSnyanmisaka             RK_U32 fbd_offset;
385*437bfbebSnyanmisaka 
386*437bfbebSnyanmisaka             regs->ctrl_regs.reg9.fbc_e = 1;
387*437bfbebSnyanmisaka             regs->avs2d_paras.reg68_hor_virstride = fbc_hdr_stride / 64;
388*437bfbebSnyanmisaka             fbd_offset = regs->avs2d_paras.reg68_hor_virstride * MPP_ALIGN(ver_virstride, 64) * 4;
389*437bfbebSnyanmisaka             regs->avs2d_addrs.reg193_fbc_payload_offset = fbd_offset;
390*437bfbebSnyanmisaka         } else if (is_tile) {
391*437bfbebSnyanmisaka             regs->ctrl_regs.reg9.tile_e = 1;
392*437bfbebSnyanmisaka             regs->avs2d_paras.reg68_hor_virstride = hor_virstride * 6 / 16;
393*437bfbebSnyanmisaka             regs->avs2d_paras.reg70_y_virstride = (y_virstride + uv_virstride) / 16;
394*437bfbebSnyanmisaka         } else {
395*437bfbebSnyanmisaka             regs->ctrl_regs.reg9.fbc_e = 0;
396*437bfbebSnyanmisaka             regs->ctrl_regs.reg9.tile_e = 0;
397*437bfbebSnyanmisaka             regs->avs2d_paras.reg68_hor_virstride = hor_virstride / 16;
398*437bfbebSnyanmisaka             regs->avs2d_paras.reg69_raster_uv_hor_virstride = hor_virstride / 16;
399*437bfbebSnyanmisaka             regs->avs2d_paras.reg70_y_virstride = y_virstride / 16;
400*437bfbebSnyanmisaka         }
401*437bfbebSnyanmisaka     }
402*437bfbebSnyanmisaka 
403*437bfbebSnyanmisaka     // set current
404*437bfbebSnyanmisaka     {
405*437bfbebSnyanmisaka         RK_S32 fd = get_frame_fd(p_hal, task_dec->output);
406*437bfbebSnyanmisaka 
407*437bfbebSnyanmisaka         mpp_assert(fd >= 0);
408*437bfbebSnyanmisaka 
409*437bfbebSnyanmisaka         regs->avs2d_addrs.reg168_decout_base = fd;
410*437bfbebSnyanmisaka         regs->avs2d_addrs.reg192_payload_st_cur_base = fd;
411*437bfbebSnyanmisaka         mv_buf = hal_bufs_get_buf(p_hal->cmv_bufs, task_dec->output);
412*437bfbebSnyanmisaka         regs->avs2d_addrs.reg216_colmv_cur_base = mpp_buffer_get_fd(mv_buf->buf[0]);
413*437bfbebSnyanmisaka         AVS2D_HAL_TRACE("cur frame index %d, fd %d, colmv fd %d", task_dec->output, fd, regs->avs2d_addrs.reg216_colmv_cur_base);
414*437bfbebSnyanmisaka 
415*437bfbebSnyanmisaka         // TODO: set up error_ref_base
416*437bfbebSnyanmisaka         // regs->avs2d_addr.reg169_err_ref_base.base = regs->avs2d_addr.reg216_colmv_cur_base.base;
417*437bfbebSnyanmisaka     }
418*437bfbebSnyanmisaka 
419*437bfbebSnyanmisaka     // set reference
420*437bfbebSnyanmisaka     {
421*437bfbebSnyanmisaka         RK_S32 valid_slot = -1;
422*437bfbebSnyanmisaka 
423*437bfbebSnyanmisaka         AVS2D_HAL_TRACE("num of ref %d", refp->ref_pic_num);
424*437bfbebSnyanmisaka 
425*437bfbebSnyanmisaka         for (i = 0; i < refp->ref_pic_num; i++) {
426*437bfbebSnyanmisaka             if (task_dec->refer[i] < 0)
427*437bfbebSnyanmisaka                 continue;
428*437bfbebSnyanmisaka 
429*437bfbebSnyanmisaka             valid_slot = i;
430*437bfbebSnyanmisaka             break;
431*437bfbebSnyanmisaka         }
432*437bfbebSnyanmisaka 
433*437bfbebSnyanmisaka         for (i = 0; i < MAX_REF_NUM; i++) {
434*437bfbebSnyanmisaka             if (i < refp->ref_pic_num) {
435*437bfbebSnyanmisaka                 MppFrame frame_ref = NULL;
436*437bfbebSnyanmisaka 
437*437bfbebSnyanmisaka                 RK_S32 slot_idx = task_dec->refer[i] < 0 ? task_dec->refer[valid_slot] : task_dec->refer[i];
438*437bfbebSnyanmisaka 
439*437bfbebSnyanmisaka                 if (slot_idx < 0) {
440*437bfbebSnyanmisaka                     AVS2D_HAL_TRACE("missing ref, could not found valid ref");
441*437bfbebSnyanmisaka                     task->dec.flags.ref_err = 1;
442*437bfbebSnyanmisaka                     return ret = MPP_ERR_UNKNOW;
443*437bfbebSnyanmisaka                 }
444*437bfbebSnyanmisaka 
445*437bfbebSnyanmisaka                 mpp_buf_slot_get_prop(p_hal->frame_slots, slot_idx, SLOT_FRAME_PTR, &frame_ref);
446*437bfbebSnyanmisaka 
447*437bfbebSnyanmisaka                 if (frame_ref) {
448*437bfbebSnyanmisaka                     regs->avs2d_addrs.reg170_185_ref_base[i] = get_frame_fd(p_hal, slot_idx);
449*437bfbebSnyanmisaka                     regs->avs2d_addrs.reg195_210_payload_st_ref_base[i] = get_frame_fd(p_hal, slot_idx);
450*437bfbebSnyanmisaka                     mv_buf = hal_bufs_get_buf(p_hal->cmv_bufs, slot_idx);
451*437bfbebSnyanmisaka                     regs->avs2d_addrs.reg217_232_colmv_ref_base[i] = mpp_buffer_get_fd(mv_buf->buf[0]);
452*437bfbebSnyanmisaka                 }
453*437bfbebSnyanmisaka             }
454*437bfbebSnyanmisaka         }
455*437bfbebSnyanmisaka 
456*437bfbebSnyanmisaka         if (p_hal->syntax.refp.scene_ref_enable && p_hal->syntax.refp.scene_ref_slot_idx >= 0) {
457*437bfbebSnyanmisaka             MppFrame scene_ref = NULL;
458*437bfbebSnyanmisaka             RK_S32 slot_idx = p_hal->syntax.refp.scene_ref_slot_idx;
459*437bfbebSnyanmisaka             RK_S32 replace_idx = p_hal->syntax.refp.scene_ref_replace_pos;
460*437bfbebSnyanmisaka 
461*437bfbebSnyanmisaka             mpp_buf_slot_get_prop(p_hal->frame_slots, slot_idx, SLOT_FRAME_PTR, &scene_ref);
462*437bfbebSnyanmisaka 
463*437bfbebSnyanmisaka             if (scene_ref) {
464*437bfbebSnyanmisaka                 regs->avs2d_addrs.reg170_185_ref_base[replace_idx] = get_frame_fd(p_hal, slot_idx);
465*437bfbebSnyanmisaka                 regs->avs2d_addrs.reg195_210_payload_st_ref_base[replace_idx] = regs->avs2d_addrs.reg170_185_ref_base[replace_idx];
466*437bfbebSnyanmisaka                 mv_buf = hal_bufs_get_buf(p_hal->cmv_bufs, slot_idx);
467*437bfbebSnyanmisaka                 regs->avs2d_addrs.reg217_232_colmv_ref_base[replace_idx] = mpp_buffer_get_fd(mv_buf->buf[0]);
468*437bfbebSnyanmisaka             }
469*437bfbebSnyanmisaka         }
470*437bfbebSnyanmisaka 
471*437bfbebSnyanmisaka         regs->avs2d_addrs.reg169_error_ref_base = regs->avs2d_addrs.reg170_185_ref_base[0];
472*437bfbebSnyanmisaka         regs->avs2d_addrs.reg194_payload_st_error_ref_base = regs->avs2d_addrs.reg195_210_payload_st_ref_base[0];
473*437bfbebSnyanmisaka     }
474*437bfbebSnyanmisaka 
475*437bfbebSnyanmisaka     // set rlc
476*437bfbebSnyanmisaka     regs->common_addr.reg128_strm_base = get_packet_fd(p_hal, task_dec->input);
477*437bfbebSnyanmisaka     AVS2D_HAL_TRACE("packet fd %d from slot %d", regs->common_addr.reg128_strm_base, task_dec->input);
478*437bfbebSnyanmisaka 
479*437bfbebSnyanmisaka     regs->avs2d_paras.reg66_stream_len = MPP_ALIGN(mpp_packet_get_length(task_dec->input_packet), 16) + 64;
480*437bfbebSnyanmisaka 
481*437bfbebSnyanmisaka     {
482*437bfbebSnyanmisaka         //scale down config
483*437bfbebSnyanmisaka         mpp_buf_slot_get_prop(p_hal->frame_slots, task_dec->output,
484*437bfbebSnyanmisaka                               SLOT_FRAME_PTR, &mframe);
485*437bfbebSnyanmisaka         if (mpp_frame_get_thumbnail_en(mframe)) {
486*437bfbebSnyanmisaka             regs->common_addr.reg133_scale_down_base = regs->avs2d_addrs.reg168_decout_base;
487*437bfbebSnyanmisaka             vdpu383_setup_down_scale(mframe, p_hal->dev, &regs->ctrl_regs,
488*437bfbebSnyanmisaka                                      (void *)&regs->avs2d_paras);
489*437bfbebSnyanmisaka         } else {
490*437bfbebSnyanmisaka             regs->ctrl_regs.reg9.scale_down_en = 0;
491*437bfbebSnyanmisaka         }
492*437bfbebSnyanmisaka     }
493*437bfbebSnyanmisaka 
494*437bfbebSnyanmisaka     return ret;
495*437bfbebSnyanmisaka }
496*437bfbebSnyanmisaka 
hal_avs2d_vdpu383_deinit(void * hal)497*437bfbebSnyanmisaka MPP_RET hal_avs2d_vdpu383_deinit(void *hal)
498*437bfbebSnyanmisaka {
499*437bfbebSnyanmisaka     MPP_RET ret = MPP_OK;
500*437bfbebSnyanmisaka     RK_U32 i, loop;
501*437bfbebSnyanmisaka     Avs2dHalCtx_t *p_hal = (Avs2dHalCtx_t *)hal;
502*437bfbebSnyanmisaka     Avs2dRkvRegCtx_t *reg_ctx = (Avs2dRkvRegCtx_t *)p_hal->reg_ctx;
503*437bfbebSnyanmisaka 
504*437bfbebSnyanmisaka     AVS2D_HAL_TRACE("In.");
505*437bfbebSnyanmisaka 
506*437bfbebSnyanmisaka     INP_CHECK(ret, NULL == reg_ctx);
507*437bfbebSnyanmisaka 
508*437bfbebSnyanmisaka     //!< malloc buffers
509*437bfbebSnyanmisaka     loop = p_hal->fast_mode ? MPP_ARRAY_ELEMS(reg_ctx->reg_buf) : 1;
510*437bfbebSnyanmisaka     for (i = 0; i < loop; i++) {
511*437bfbebSnyanmisaka         if (reg_ctx->rcb_buf[i]) {
512*437bfbebSnyanmisaka             mpp_buffer_put(reg_ctx->rcb_buf[i]);
513*437bfbebSnyanmisaka             reg_ctx->rcb_buf[i] = NULL;
514*437bfbebSnyanmisaka         }
515*437bfbebSnyanmisaka 
516*437bfbebSnyanmisaka         MPP_FREE(reg_ctx->reg_buf[i].regs);
517*437bfbebSnyanmisaka     }
518*437bfbebSnyanmisaka 
519*437bfbebSnyanmisaka     if (reg_ctx->bufs) {
520*437bfbebSnyanmisaka         mpp_buffer_put(reg_ctx->bufs);
521*437bfbebSnyanmisaka         reg_ctx->bufs = NULL;
522*437bfbebSnyanmisaka     }
523*437bfbebSnyanmisaka 
524*437bfbebSnyanmisaka     if (p_hal->cmv_bufs) {
525*437bfbebSnyanmisaka         hal_bufs_deinit(p_hal->cmv_bufs);
526*437bfbebSnyanmisaka         p_hal->cmv_bufs = NULL;
527*437bfbebSnyanmisaka     }
528*437bfbebSnyanmisaka 
529*437bfbebSnyanmisaka     MPP_FREE(p_hal->reg_ctx);
530*437bfbebSnyanmisaka 
531*437bfbebSnyanmisaka __RETURN:
532*437bfbebSnyanmisaka     AVS2D_HAL_TRACE("Out. ret %d", ret);
533*437bfbebSnyanmisaka     return ret;
534*437bfbebSnyanmisaka }
535*437bfbebSnyanmisaka 
hal_avs2d_vdpu383_init(void * hal,MppHalCfg * cfg)536*437bfbebSnyanmisaka MPP_RET hal_avs2d_vdpu383_init(void *hal, MppHalCfg *cfg)
537*437bfbebSnyanmisaka {
538*437bfbebSnyanmisaka     MPP_RET ret = MPP_OK;
539*437bfbebSnyanmisaka     RK_U32 i, loop;
540*437bfbebSnyanmisaka     Avs2dRkvRegCtx_t *reg_ctx;
541*437bfbebSnyanmisaka     Avs2dHalCtx_t *p_hal = (Avs2dHalCtx_t *)hal;
542*437bfbebSnyanmisaka 
543*437bfbebSnyanmisaka     AVS2D_HAL_TRACE("In.");
544*437bfbebSnyanmisaka 
545*437bfbebSnyanmisaka     INP_CHECK(ret, NULL == p_hal);
546*437bfbebSnyanmisaka 
547*437bfbebSnyanmisaka     MEM_CHECK(ret, p_hal->reg_ctx = mpp_calloc_size(void, sizeof(Avs2dRkvRegCtx_t)));
548*437bfbebSnyanmisaka     reg_ctx = (Avs2dRkvRegCtx_t *)p_hal->reg_ctx;
549*437bfbebSnyanmisaka 
550*437bfbebSnyanmisaka     //!< malloc buffers
551*437bfbebSnyanmisaka     loop = p_hal->fast_mode ? MPP_ARRAY_ELEMS(reg_ctx->reg_buf) : 1;
552*437bfbebSnyanmisaka     FUN_CHECK(ret = mpp_buffer_get(p_hal->buf_group, &reg_ctx->bufs, AVS2_ALL_TBL_BUF_SIZE(loop)));
553*437bfbebSnyanmisaka     reg_ctx->bufs_fd = mpp_buffer_get_fd(reg_ctx->bufs);
554*437bfbebSnyanmisaka     reg_ctx->bufs_ptr = mpp_buffer_get_ptr(reg_ctx->bufs);
555*437bfbebSnyanmisaka     mpp_buffer_attach_dev(reg_ctx->bufs, p_hal->dev);
556*437bfbebSnyanmisaka 
557*437bfbebSnyanmisaka     for (i = 0; i < loop; i++) {
558*437bfbebSnyanmisaka         reg_ctx->reg_buf[i].regs = mpp_calloc(Vdpu383Avs2dRegSet, 1);
559*437bfbebSnyanmisaka         init_ctrl_regs(reg_ctx->reg_buf[i].regs);
560*437bfbebSnyanmisaka         reg_ctx->reg_buf[i].offset_shph = AVS2_SHPH_OFFSET(i);
561*437bfbebSnyanmisaka         reg_ctx->reg_buf[i].offset_sclst = AVS2_SCALIST_OFFSET(i);
562*437bfbebSnyanmisaka     }
563*437bfbebSnyanmisaka 
564*437bfbebSnyanmisaka     if (!p_hal->fast_mode) {
565*437bfbebSnyanmisaka         reg_ctx->regs = reg_ctx->reg_buf[0].regs;
566*437bfbebSnyanmisaka         reg_ctx->shph_offset = reg_ctx->reg_buf[0].offset_shph;
567*437bfbebSnyanmisaka         reg_ctx->sclst_offset = reg_ctx->reg_buf[0].offset_sclst;
568*437bfbebSnyanmisaka     }
569*437bfbebSnyanmisaka 
570*437bfbebSnyanmisaka     mpp_slots_set_prop(p_hal->frame_slots, SLOTS_HOR_ALIGN, mpp_align_128_odd_plus_64);
571*437bfbebSnyanmisaka     mpp_slots_set_prop(p_hal->frame_slots, SLOTS_VER_ALIGN, avs2d_ver_align);
572*437bfbebSnyanmisaka     mpp_slots_set_prop(p_hal->frame_slots, SLOTS_LEN_ALIGN, avs2d_len_align);
573*437bfbebSnyanmisaka 
574*437bfbebSnyanmisaka __RETURN:
575*437bfbebSnyanmisaka     AVS2D_HAL_TRACE("Out. ret %d", ret);
576*437bfbebSnyanmisaka     (void)cfg;
577*437bfbebSnyanmisaka     return ret;
578*437bfbebSnyanmisaka __FAILED:
579*437bfbebSnyanmisaka     hal_avs2d_vdpu383_deinit(p_hal);
580*437bfbebSnyanmisaka     AVS2D_HAL_TRACE("Out. ret %d", ret);
581*437bfbebSnyanmisaka     return ret;
582*437bfbebSnyanmisaka }
583*437bfbebSnyanmisaka 
calc_mv_size(RK_S32 pic_w,RK_S32 pic_h,RK_S32 ctu_w)584*437bfbebSnyanmisaka static RK_S32 calc_mv_size(RK_S32 pic_w, RK_S32 pic_h, RK_S32 ctu_w)
585*437bfbebSnyanmisaka {
586*437bfbebSnyanmisaka     RK_S32 seg_w = 64 * 16 * 16 / ctu_w; // colmv_block_size = 16, colmv_per_bytes = 16
587*437bfbebSnyanmisaka     RK_S32 seg_cnt_w = MPP_ALIGN(pic_w, seg_w) / seg_w;
588*437bfbebSnyanmisaka     RK_S32 seg_cnt_h = MPP_ALIGN(pic_h, ctu_w) / ctu_w;
589*437bfbebSnyanmisaka     RK_S32 mv_size   = seg_cnt_w * seg_cnt_h * 64 * 16;
590*437bfbebSnyanmisaka 
591*437bfbebSnyanmisaka     return mv_size;
592*437bfbebSnyanmisaka }
593*437bfbebSnyanmisaka 
set_up_colmv_buf(void * hal)594*437bfbebSnyanmisaka static MPP_RET set_up_colmv_buf(void *hal)
595*437bfbebSnyanmisaka {
596*437bfbebSnyanmisaka     MPP_RET ret = MPP_OK;
597*437bfbebSnyanmisaka     Avs2dHalCtx_t *p_hal = (Avs2dHalCtx_t *)hal;
598*437bfbebSnyanmisaka     Avs2dSyntax_t *syntax = &p_hal->syntax;
599*437bfbebSnyanmisaka     PicParams_Avs2d *pp   = &syntax->pp;
600*437bfbebSnyanmisaka     RK_U32 ctu_size = 1 << (p_hal->syntax.pp.lcu_size);
601*437bfbebSnyanmisaka     RK_S32 mv_size = calc_mv_size(pp->pic_width_in_luma_samples,
602*437bfbebSnyanmisaka                                   pp->pic_height_in_luma_samples * (1 + pp->field_coded_sequence),
603*437bfbebSnyanmisaka                                   ctu_size);
604*437bfbebSnyanmisaka 
605*437bfbebSnyanmisaka     AVS2D_HAL_TRACE("mv_size %d", mv_size);
606*437bfbebSnyanmisaka 
607*437bfbebSnyanmisaka     if (p_hal->cmv_bufs == NULL || p_hal->mv_size < (RK_U32)mv_size) {
608*437bfbebSnyanmisaka         size_t size = mv_size;
609*437bfbebSnyanmisaka 
610*437bfbebSnyanmisaka         if (p_hal->cmv_bufs) {
611*437bfbebSnyanmisaka             hal_bufs_deinit(p_hal->cmv_bufs);
612*437bfbebSnyanmisaka             p_hal->cmv_bufs = NULL;
613*437bfbebSnyanmisaka         }
614*437bfbebSnyanmisaka 
615*437bfbebSnyanmisaka         hal_bufs_init(&p_hal->cmv_bufs);
616*437bfbebSnyanmisaka         if (p_hal->cmv_bufs == NULL) {
617*437bfbebSnyanmisaka             mpp_err_f("colmv bufs init fail");
618*437bfbebSnyanmisaka             ret = MPP_ERR_INIT;
619*437bfbebSnyanmisaka             goto __RETURN;
620*437bfbebSnyanmisaka         }
621*437bfbebSnyanmisaka 
622*437bfbebSnyanmisaka         p_hal->mv_size = mv_size;
623*437bfbebSnyanmisaka         p_hal->mv_count = mpp_buf_slot_get_count(p_hal->frame_slots);
624*437bfbebSnyanmisaka         hal_bufs_setup(p_hal->cmv_bufs, p_hal->mv_count, 1, &size);
625*437bfbebSnyanmisaka     }
626*437bfbebSnyanmisaka 
627*437bfbebSnyanmisaka __RETURN:
628*437bfbebSnyanmisaka     return ret;
629*437bfbebSnyanmisaka }
630*437bfbebSnyanmisaka 
hal_avs2d_vdpu383_gen_regs(void * hal,HalTaskInfo * task)631*437bfbebSnyanmisaka MPP_RET hal_avs2d_vdpu383_gen_regs(void *hal, HalTaskInfo *task)
632*437bfbebSnyanmisaka {
633*437bfbebSnyanmisaka     MPP_RET ret = MPP_OK;
634*437bfbebSnyanmisaka     Avs2dRkvRegCtx_t *reg_ctx;
635*437bfbebSnyanmisaka     Avs2dHalCtx_t *p_hal = (Avs2dHalCtx_t *)hal;
636*437bfbebSnyanmisaka     Vdpu383Avs2dRegSet *regs = NULL;
637*437bfbebSnyanmisaka 
638*437bfbebSnyanmisaka     AVS2D_HAL_TRACE("In.");
639*437bfbebSnyanmisaka 
640*437bfbebSnyanmisaka     INP_CHECK(ret, NULL == p_hal);
641*437bfbebSnyanmisaka     if ((task->dec.flags.parse_err || task->dec.flags.ref_err) &&
642*437bfbebSnyanmisaka         !p_hal->cfg->base.disable_error) {
643*437bfbebSnyanmisaka         ret = MPP_NOK;
644*437bfbebSnyanmisaka         goto __RETURN;
645*437bfbebSnyanmisaka     }
646*437bfbebSnyanmisaka 
647*437bfbebSnyanmisaka     ret = set_up_colmv_buf(p_hal);
648*437bfbebSnyanmisaka     if (ret)
649*437bfbebSnyanmisaka         goto __RETURN;
650*437bfbebSnyanmisaka 
651*437bfbebSnyanmisaka     reg_ctx = (Avs2dRkvRegCtx_t *)p_hal->reg_ctx;
652*437bfbebSnyanmisaka 
653*437bfbebSnyanmisaka     if (p_hal->fast_mode) {
654*437bfbebSnyanmisaka         RK_U32 i = 0;
655*437bfbebSnyanmisaka 
656*437bfbebSnyanmisaka         for (i = 0; i <  MPP_ARRAY_ELEMS(reg_ctx->reg_buf); i++) {
657*437bfbebSnyanmisaka             if (!reg_ctx->reg_buf[i].valid) {
658*437bfbebSnyanmisaka                 task->dec.reg_index = i;
659*437bfbebSnyanmisaka                 regs = reg_ctx->reg_buf[i].regs;
660*437bfbebSnyanmisaka                 reg_ctx->shph_offset = reg_ctx->reg_buf[i].offset_shph;
661*437bfbebSnyanmisaka                 reg_ctx->sclst_offset = reg_ctx->reg_buf[i].offset_sclst;
662*437bfbebSnyanmisaka                 reg_ctx->regs = reg_ctx->reg_buf[i].regs;
663*437bfbebSnyanmisaka                 reg_ctx->reg_buf[i].valid = 1;
664*437bfbebSnyanmisaka                 break;
665*437bfbebSnyanmisaka             }
666*437bfbebSnyanmisaka         }
667*437bfbebSnyanmisaka 
668*437bfbebSnyanmisaka         mpp_assert(regs);
669*437bfbebSnyanmisaka     }
670*437bfbebSnyanmisaka 
671*437bfbebSnyanmisaka     regs = reg_ctx->regs;
672*437bfbebSnyanmisaka 
673*437bfbebSnyanmisaka     prepare_header(p_hal, reg_ctx->shph_dat, sizeof(reg_ctx->shph_dat) / 8);
674*437bfbebSnyanmisaka     prepare_scalist(p_hal, reg_ctx->scalist_dat, sizeof(reg_ctx->scalist_dat));
675*437bfbebSnyanmisaka 
676*437bfbebSnyanmisaka     ret = fill_registers(p_hal, regs, task);
677*437bfbebSnyanmisaka 
678*437bfbebSnyanmisaka     if (ret)
679*437bfbebSnyanmisaka         goto __RETURN;
680*437bfbebSnyanmisaka 
681*437bfbebSnyanmisaka     {
682*437bfbebSnyanmisaka         memcpy(reg_ctx->bufs_ptr + reg_ctx->shph_offset, reg_ctx->shph_dat, sizeof(reg_ctx->shph_dat));
683*437bfbebSnyanmisaka         memcpy(reg_ctx->bufs_ptr + reg_ctx->sclst_offset, reg_ctx->scalist_dat, sizeof(reg_ctx->scalist_dat));
684*437bfbebSnyanmisaka 
685*437bfbebSnyanmisaka         regs->common_addr.reg131_gbl_base = reg_ctx->bufs_fd;
686*437bfbebSnyanmisaka         mpp_dev_set_reg_offset(p_hal->dev, 131, reg_ctx->shph_offset);
687*437bfbebSnyanmisaka         regs->avs2d_paras.reg67_global_len = AVS2_383_SHPH_SIZE;
688*437bfbebSnyanmisaka 
689*437bfbebSnyanmisaka         regs->common_addr.reg132_scanlist_addr = reg_ctx->bufs_fd;
690*437bfbebSnyanmisaka         mpp_dev_set_reg_offset(p_hal->dev, 132, reg_ctx->sclst_offset);
691*437bfbebSnyanmisaka     }
692*437bfbebSnyanmisaka 
693*437bfbebSnyanmisaka     // set rcb
694*437bfbebSnyanmisaka     {
695*437bfbebSnyanmisaka         hal_avs2d_rcb_info_update(p_hal, regs);
696*437bfbebSnyanmisaka         vdpu383_setup_rcb(&regs->common_addr, p_hal->dev, p_hal->fast_mode ?
697*437bfbebSnyanmisaka                           reg_ctx->rcb_buf[task->dec.reg_index] : reg_ctx->rcb_buf[0],
698*437bfbebSnyanmisaka                           reg_ctx->rcb_info);
699*437bfbebSnyanmisaka 
700*437bfbebSnyanmisaka     }
701*437bfbebSnyanmisaka 
702*437bfbebSnyanmisaka     vdpu383_setup_statistic(&regs->ctrl_regs);
703*437bfbebSnyanmisaka     mpp_buffer_sync_end(reg_ctx->bufs);
704*437bfbebSnyanmisaka 
705*437bfbebSnyanmisaka __RETURN:
706*437bfbebSnyanmisaka     AVS2D_HAL_TRACE("Out. ret %d", ret);
707*437bfbebSnyanmisaka     return ret;
708*437bfbebSnyanmisaka }
709*437bfbebSnyanmisaka 
hal_avs2d_vdpu383_start(void * hal,HalTaskInfo * task)710*437bfbebSnyanmisaka MPP_RET hal_avs2d_vdpu383_start(void *hal, HalTaskInfo *task)
711*437bfbebSnyanmisaka {
712*437bfbebSnyanmisaka     MPP_RET ret = MPP_OK;
713*437bfbebSnyanmisaka     Vdpu383Avs2dRegSet *regs = NULL;
714*437bfbebSnyanmisaka     Avs2dRkvRegCtx_t *reg_ctx;
715*437bfbebSnyanmisaka     MppDev dev = NULL;
716*437bfbebSnyanmisaka     Avs2dHalCtx_t *p_hal = (Avs2dHalCtx_t *)hal;
717*437bfbebSnyanmisaka 
718*437bfbebSnyanmisaka     AVS2D_HAL_TRACE("In.");
719*437bfbebSnyanmisaka     INP_CHECK(ret, NULL == p_hal);
720*437bfbebSnyanmisaka 
721*437bfbebSnyanmisaka     if ((task->dec.flags.parse_err || task->dec.flags.ref_err) &&
722*437bfbebSnyanmisaka         !p_hal->cfg->base.disable_error) {
723*437bfbebSnyanmisaka         goto __RETURN;
724*437bfbebSnyanmisaka     }
725*437bfbebSnyanmisaka 
726*437bfbebSnyanmisaka     reg_ctx = (Avs2dRkvRegCtx_t *)p_hal->reg_ctx;
727*437bfbebSnyanmisaka     regs = p_hal->fast_mode ? reg_ctx->reg_buf[task->dec.reg_index].regs : reg_ctx->regs;
728*437bfbebSnyanmisaka     dev = p_hal->dev;
729*437bfbebSnyanmisaka 
730*437bfbebSnyanmisaka     p_hal->frame_no++;
731*437bfbebSnyanmisaka 
732*437bfbebSnyanmisaka     do {
733*437bfbebSnyanmisaka         MppDevRegWrCfg wr_cfg;
734*437bfbebSnyanmisaka         MppDevRegRdCfg rd_cfg;
735*437bfbebSnyanmisaka 
736*437bfbebSnyanmisaka         wr_cfg.reg = &regs->ctrl_regs;
737*437bfbebSnyanmisaka         wr_cfg.size = sizeof(regs->ctrl_regs);
738*437bfbebSnyanmisaka         wr_cfg.offset = OFFSET_CTRL_REGS;
739*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &wr_cfg);
740*437bfbebSnyanmisaka         if (ret) {
741*437bfbebSnyanmisaka             mpp_err_f("set register write failed %d\n", ret);
742*437bfbebSnyanmisaka             break;
743*437bfbebSnyanmisaka         }
744*437bfbebSnyanmisaka 
745*437bfbebSnyanmisaka         wr_cfg.reg = &regs->common_addr;
746*437bfbebSnyanmisaka         wr_cfg.size = sizeof(regs->common_addr);
747*437bfbebSnyanmisaka         wr_cfg.offset = OFFSET_COMMON_ADDR_REGS;
748*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &wr_cfg);
749*437bfbebSnyanmisaka         if (ret) {
750*437bfbebSnyanmisaka             mpp_err_f("set register write failed %d\n", ret);
751*437bfbebSnyanmisaka             break;
752*437bfbebSnyanmisaka         }
753*437bfbebSnyanmisaka 
754*437bfbebSnyanmisaka         wr_cfg.reg = &regs->avs2d_paras;
755*437bfbebSnyanmisaka         wr_cfg.size = sizeof(regs->avs2d_paras);
756*437bfbebSnyanmisaka         wr_cfg.offset = OFFSET_CODEC_PARAS_REGS;
757*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &wr_cfg);
758*437bfbebSnyanmisaka         if (ret) {
759*437bfbebSnyanmisaka             mpp_err_f("set register write failed %d\n", ret);
760*437bfbebSnyanmisaka             break;
761*437bfbebSnyanmisaka         }
762*437bfbebSnyanmisaka 
763*437bfbebSnyanmisaka         wr_cfg.reg = &regs->avs2d_addrs;
764*437bfbebSnyanmisaka         wr_cfg.size = sizeof(regs->avs2d_addrs);
765*437bfbebSnyanmisaka         wr_cfg.offset = OFFSET_CODEC_ADDR_REGS;
766*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &wr_cfg);
767*437bfbebSnyanmisaka         if (ret) {
768*437bfbebSnyanmisaka             mpp_err_f("set register write failed %d\n", ret);
769*437bfbebSnyanmisaka             break;
770*437bfbebSnyanmisaka         }
771*437bfbebSnyanmisaka 
772*437bfbebSnyanmisaka         rd_cfg.reg = &regs->ctrl_regs.reg15;
773*437bfbebSnyanmisaka         rd_cfg.size = sizeof(regs->ctrl_regs.reg15);
774*437bfbebSnyanmisaka         rd_cfg.offset = OFFSET_INTERRUPT_REGS;
775*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(dev, MPP_DEV_REG_RD, &rd_cfg);
776*437bfbebSnyanmisaka         if (ret) {
777*437bfbebSnyanmisaka             mpp_err_f("set register read failed %d\n", ret);
778*437bfbebSnyanmisaka             break;
779*437bfbebSnyanmisaka         }
780*437bfbebSnyanmisaka 
781*437bfbebSnyanmisaka         if (avs2d_hal_debug & AVS2D_HAL_DBG_REG) {
782*437bfbebSnyanmisaka             memset(reg_ctx->reg_out, 0, sizeof(reg_ctx->reg_out));
783*437bfbebSnyanmisaka             rd_cfg.reg = reg_ctx->reg_out;
784*437bfbebSnyanmisaka             rd_cfg.size = sizeof(reg_ctx->reg_out);
785*437bfbebSnyanmisaka             rd_cfg.offset = 0;
786*437bfbebSnyanmisaka             ret = mpp_dev_ioctl(dev, MPP_DEV_REG_RD, &rd_cfg);
787*437bfbebSnyanmisaka         }
788*437bfbebSnyanmisaka 
789*437bfbebSnyanmisaka         /* rcb info for sram */
790*437bfbebSnyanmisaka         vdpu383_set_rcbinfo(dev, (Vdpu383RcbInfo*)reg_ctx->rcb_info);
791*437bfbebSnyanmisaka 
792*437bfbebSnyanmisaka         // send request to hardware
793*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(dev, MPP_DEV_CMD_SEND, NULL);
794*437bfbebSnyanmisaka         if (ret) {
795*437bfbebSnyanmisaka             mpp_err_f("send cmd failed %d\n", ret);
796*437bfbebSnyanmisaka             break;
797*437bfbebSnyanmisaka         }
798*437bfbebSnyanmisaka 
799*437bfbebSnyanmisaka     } while (0);
800*437bfbebSnyanmisaka 
801*437bfbebSnyanmisaka __RETURN:
802*437bfbebSnyanmisaka     AVS2D_HAL_TRACE("Out.");
803*437bfbebSnyanmisaka     return ret;
804*437bfbebSnyanmisaka }
805*437bfbebSnyanmisaka 
fetch_data(RK_U32 fmt,RK_U8 * line,RK_U32 num)806*437bfbebSnyanmisaka static RK_U8 fetch_data(RK_U32 fmt, RK_U8 *line, RK_U32 num)
807*437bfbebSnyanmisaka {
808*437bfbebSnyanmisaka     RK_U32 offset = 0;
809*437bfbebSnyanmisaka     RK_U32 value = 0;
810*437bfbebSnyanmisaka 
811*437bfbebSnyanmisaka     if (fmt == MPP_FMT_YUV420SP_10BIT) {
812*437bfbebSnyanmisaka         offset = (num * 2) & 7;
813*437bfbebSnyanmisaka         value = (line[num * 10 / 8] >> offset) |
814*437bfbebSnyanmisaka                 (line[num * 10 / 8 + 1] << (8 - offset));
815*437bfbebSnyanmisaka 
816*437bfbebSnyanmisaka         value = (value & 0x3ff) >> 2;
817*437bfbebSnyanmisaka     } else if (fmt == MPP_FMT_YUV420SP) {
818*437bfbebSnyanmisaka         value = line[num];
819*437bfbebSnyanmisaka     }
820*437bfbebSnyanmisaka 
821*437bfbebSnyanmisaka     return value;
822*437bfbebSnyanmisaka }
823*437bfbebSnyanmisaka 
hal_avs2d_vdpu383_dump_yuv(void * hal,HalTaskInfo * task)824*437bfbebSnyanmisaka static MPP_RET hal_avs2d_vdpu383_dump_yuv(void *hal, HalTaskInfo *task)
825*437bfbebSnyanmisaka {
826*437bfbebSnyanmisaka     MPP_RET ret = MPP_OK;
827*437bfbebSnyanmisaka     Avs2dHalCtx_t *p_hal = (Avs2dHalCtx_t *)hal;
828*437bfbebSnyanmisaka 
829*437bfbebSnyanmisaka     MppFrameFormat fmt = MPP_FMT_YUV420SP;
830*437bfbebSnyanmisaka     RK_U32 vir_w = 0;
831*437bfbebSnyanmisaka     RK_U32 vir_h = 0;
832*437bfbebSnyanmisaka     RK_U32 i = 0;
833*437bfbebSnyanmisaka     RK_U32 j = 0;
834*437bfbebSnyanmisaka     FILE *fp_stream = NULL;
835*437bfbebSnyanmisaka     char name[50];
836*437bfbebSnyanmisaka     MppBuffer buffer = NULL;
837*437bfbebSnyanmisaka     MppFrame frame;
838*437bfbebSnyanmisaka     void *base = NULL;
839*437bfbebSnyanmisaka 
840*437bfbebSnyanmisaka     ret = mpp_buf_slot_get_prop(p_hal->frame_slots, task->dec.output, SLOT_FRAME_PTR, &frame);
841*437bfbebSnyanmisaka 
842*437bfbebSnyanmisaka     if (ret != MPP_OK || frame == NULL)
843*437bfbebSnyanmisaka         mpp_log_f("failed to get frame slot %d", task->dec.output);
844*437bfbebSnyanmisaka 
845*437bfbebSnyanmisaka     ret = mpp_buf_slot_get_prop(p_hal->frame_slots, task->dec.output, SLOT_BUFFER, &buffer);
846*437bfbebSnyanmisaka 
847*437bfbebSnyanmisaka     if (ret != MPP_OK || buffer == NULL)
848*437bfbebSnyanmisaka         mpp_log_f("failed to get frame buffer slot %d", task->dec.output);
849*437bfbebSnyanmisaka 
850*437bfbebSnyanmisaka     AVS2D_HAL_TRACE("frame slot %d, fd %d\n", task->dec.output, mpp_buffer_get_fd(buffer));
851*437bfbebSnyanmisaka     base = mpp_buffer_get_ptr(buffer);
852*437bfbebSnyanmisaka     vir_w = mpp_frame_get_hor_stride(frame);
853*437bfbebSnyanmisaka     vir_h = mpp_frame_get_ver_stride(frame);
854*437bfbebSnyanmisaka     fmt = mpp_frame_get_fmt(frame);
855*437bfbebSnyanmisaka     snprintf(name, sizeof(name), "/data/tmp/rkv_out_%dx%d_nv12_%03d.yuv", vir_w, vir_h,
856*437bfbebSnyanmisaka              p_hal->frame_no);
857*437bfbebSnyanmisaka     fp_stream = fopen(name, "wb");
858*437bfbebSnyanmisaka 
859*437bfbebSnyanmisaka     if (fmt != MPP_FMT_YUV420SP_10BIT) {
860*437bfbebSnyanmisaka         fwrite(base, 1, vir_w * vir_h * 3 / 2, fp_stream);
861*437bfbebSnyanmisaka     } else {
862*437bfbebSnyanmisaka         RK_U8 tmp = 0;
863*437bfbebSnyanmisaka         for (i = 0; i < vir_h; i++) {
864*437bfbebSnyanmisaka             for (j = 0; j < vir_w; j++) {
865*437bfbebSnyanmisaka                 tmp = fetch_data(fmt, base, j);
866*437bfbebSnyanmisaka                 fwrite(&tmp, 1, 1, fp_stream);
867*437bfbebSnyanmisaka             }
868*437bfbebSnyanmisaka             base += vir_w;
869*437bfbebSnyanmisaka         }
870*437bfbebSnyanmisaka 
871*437bfbebSnyanmisaka         for (i = 0; i < vir_h / 2; i++) {
872*437bfbebSnyanmisaka             for (j = 0; j < vir_w; j++) {
873*437bfbebSnyanmisaka                 tmp = fetch_data(fmt, base, j);
874*437bfbebSnyanmisaka                 fwrite(&tmp, 1, 1, fp_stream);
875*437bfbebSnyanmisaka             }
876*437bfbebSnyanmisaka             base += vir_w;
877*437bfbebSnyanmisaka         }
878*437bfbebSnyanmisaka     }
879*437bfbebSnyanmisaka     fclose(fp_stream);
880*437bfbebSnyanmisaka 
881*437bfbebSnyanmisaka     return ret;
882*437bfbebSnyanmisaka }
883*437bfbebSnyanmisaka 
hal_avs2d_vdpu383_wait(void * hal,HalTaskInfo * task)884*437bfbebSnyanmisaka MPP_RET hal_avs2d_vdpu383_wait(void *hal, HalTaskInfo *task)
885*437bfbebSnyanmisaka {
886*437bfbebSnyanmisaka     MPP_RET ret = MPP_OK;
887*437bfbebSnyanmisaka     Avs2dHalCtx_t *p_hal = (Avs2dHalCtx_t *)hal;
888*437bfbebSnyanmisaka     Avs2dRkvRegCtx_t *reg_ctx;
889*437bfbebSnyanmisaka     Vdpu383Avs2dRegSet *regs;
890*437bfbebSnyanmisaka 
891*437bfbebSnyanmisaka     INP_CHECK(ret, NULL == p_hal);
892*437bfbebSnyanmisaka     reg_ctx = (Avs2dRkvRegCtx_t *)p_hal->reg_ctx;
893*437bfbebSnyanmisaka     regs = p_hal->fast_mode ? reg_ctx->reg_buf[task->dec.reg_index].regs : reg_ctx->regs;
894*437bfbebSnyanmisaka 
895*437bfbebSnyanmisaka     if ((task->dec.flags.parse_err || task->dec.flags.ref_err) &&
896*437bfbebSnyanmisaka         !p_hal->cfg->base.disable_error) {
897*437bfbebSnyanmisaka         AVS2D_HAL_DBG(AVS2D_HAL_DBG_ERROR, "found task error.\n");
898*437bfbebSnyanmisaka         ret = MPP_NOK;
899*437bfbebSnyanmisaka         goto __RETURN;
900*437bfbebSnyanmisaka     } else {
901*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(p_hal->dev, MPP_DEV_CMD_POLL, NULL);
902*437bfbebSnyanmisaka         if (ret)
903*437bfbebSnyanmisaka             mpp_err_f("poll cmd failed %d\n", ret);
904*437bfbebSnyanmisaka     }
905*437bfbebSnyanmisaka 
906*437bfbebSnyanmisaka     if (avs2d_hal_debug & AVS2D_HAL_DBG_OUT)
907*437bfbebSnyanmisaka         hal_avs2d_vdpu383_dump_yuv(hal, task);
908*437bfbebSnyanmisaka 
909*437bfbebSnyanmisaka     AVS2D_HAL_TRACE("read irq_status 0x%08x\n", regs->ctrl_regs.reg19);
910*437bfbebSnyanmisaka 
911*437bfbebSnyanmisaka     if (p_hal->dec_cb) {
912*437bfbebSnyanmisaka         DecCbHalDone param;
913*437bfbebSnyanmisaka 
914*437bfbebSnyanmisaka         param.task = (void *)&task->dec;
915*437bfbebSnyanmisaka         param.regs = (RK_U32 *)regs;
916*437bfbebSnyanmisaka 
917*437bfbebSnyanmisaka         if ((!regs->ctrl_regs.reg15.rkvdec_frame_rdy_sta) ||
918*437bfbebSnyanmisaka             regs->ctrl_regs.reg15.rkvdec_strm_error_sta ||
919*437bfbebSnyanmisaka             regs->ctrl_regs.reg15.rkvdec_core_timeout_sta ||
920*437bfbebSnyanmisaka             regs->ctrl_regs.reg15.rkvdec_ip_timeout_sta ||
921*437bfbebSnyanmisaka             regs->ctrl_regs.reg15.rkvdec_bus_error_sta ||
922*437bfbebSnyanmisaka             regs->ctrl_regs.reg15.rkvdec_buffer_empty_sta ||
923*437bfbebSnyanmisaka             regs->ctrl_regs.reg15.rkvdec_colmv_ref_error_sta)
924*437bfbebSnyanmisaka             param.hard_err = 1;
925*437bfbebSnyanmisaka         else
926*437bfbebSnyanmisaka             param.hard_err = 0;
927*437bfbebSnyanmisaka 
928*437bfbebSnyanmisaka         task->dec.flags.ref_info_valid = 0;
929*437bfbebSnyanmisaka 
930*437bfbebSnyanmisaka         AVS2D_HAL_TRACE("hal frame %d hard_err= %d", p_hal->frame_no, param.hard_err);
931*437bfbebSnyanmisaka 
932*437bfbebSnyanmisaka         mpp_callback(p_hal->dec_cb, &param);
933*437bfbebSnyanmisaka     }
934*437bfbebSnyanmisaka 
935*437bfbebSnyanmisaka     memset(&regs->ctrl_regs.reg19, 0, sizeof(RK_U32));
936*437bfbebSnyanmisaka     if (p_hal->fast_mode)
937*437bfbebSnyanmisaka         reg_ctx->reg_buf[task->dec.reg_index].valid = 0;
938*437bfbebSnyanmisaka 
939*437bfbebSnyanmisaka __RETURN:
940*437bfbebSnyanmisaka     AVS2D_HAL_TRACE("Out. ret %d", ret);
941*437bfbebSnyanmisaka     return ret;
942*437bfbebSnyanmisaka }
943*437bfbebSnyanmisaka 
944*437bfbebSnyanmisaka const MppHalApi hal_avs2d_vdpu383 = {
945*437bfbebSnyanmisaka     .name     = "avs2d_vdpu383",
946*437bfbebSnyanmisaka     .type     = MPP_CTX_DEC,
947*437bfbebSnyanmisaka     .coding   = MPP_VIDEO_CodingAVS2,
948*437bfbebSnyanmisaka     .ctx_size = sizeof(Avs2dRkvRegCtx_t),
949*437bfbebSnyanmisaka     .flag     = 0,
950*437bfbebSnyanmisaka     .init     = hal_avs2d_vdpu383_init,
951*437bfbebSnyanmisaka     .deinit   = hal_avs2d_vdpu383_deinit,
952*437bfbebSnyanmisaka     .reg_gen  = hal_avs2d_vdpu383_gen_regs,
953*437bfbebSnyanmisaka     .start    = hal_avs2d_vdpu383_start,
954*437bfbebSnyanmisaka     .wait     = hal_avs2d_vdpu383_wait,
955*437bfbebSnyanmisaka     .reset    = NULL,
956*437bfbebSnyanmisaka     .flush    = NULL,
957*437bfbebSnyanmisaka     .control  = NULL,
958*437bfbebSnyanmisaka };
959