1*437bfbebSnyanmisaka /*
2*437bfbebSnyanmisaka * Copyright 2022 Rockchip Electronics Co. LTD
3*437bfbebSnyanmisaka *
4*437bfbebSnyanmisaka * Licensed under the Apache License, Version 2.0 (the "License");
5*437bfbebSnyanmisaka * you may not use this file except in compliance with the License.
6*437bfbebSnyanmisaka * You may obtain a copy of the License at
7*437bfbebSnyanmisaka *
8*437bfbebSnyanmisaka * http://www.apache.org/licenses/LICENSE-2.0
9*437bfbebSnyanmisaka *
10*437bfbebSnyanmisaka * Unless required by applicable law or agreed to in writing, software
11*437bfbebSnyanmisaka * distributed under the License is distributed on an "AS IS" BASIS,
12*437bfbebSnyanmisaka * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13*437bfbebSnyanmisaka * See the License for the specific language governing permissions and
14*437bfbebSnyanmisaka * limitations under the License.
15*437bfbebSnyanmisaka */
16*437bfbebSnyanmisaka
17*437bfbebSnyanmisaka #define MODULE_TAG "hal_avs2d_vdpu382"
18*437bfbebSnyanmisaka
19*437bfbebSnyanmisaka #include <string.h>
20*437bfbebSnyanmisaka #include <stdio.h>
21*437bfbebSnyanmisaka
22*437bfbebSnyanmisaka #include "mpp_log.h"
23*437bfbebSnyanmisaka #include "mpp_mem.h"
24*437bfbebSnyanmisaka #include "mpp_common.h"
25*437bfbebSnyanmisaka #include "mpp_debug.h"
26*437bfbebSnyanmisaka #include "mpp_bitput.h"
27*437bfbebSnyanmisaka
28*437bfbebSnyanmisaka #include "avs2d_syntax.h"
29*437bfbebSnyanmisaka #include "hal_avs2d_api.h"
30*437bfbebSnyanmisaka #include "hal_avs2d_vdpu382.h"
31*437bfbebSnyanmisaka #include "mpp_dec_cb_param.h"
32*437bfbebSnyanmisaka #include "vdpu382_avs2d.h"
33*437bfbebSnyanmisaka
34*437bfbebSnyanmisaka #define VDPU382_FAST_REG_SET_CNT (3)
35*437bfbebSnyanmisaka #define MAX_REF_NUM (8)
36*437bfbebSnyanmisaka #define AVS2_RKV_SHPH_SIZE (1408 / 8) /* bytes */
37*437bfbebSnyanmisaka #define AVS2_RKV_SCALIST_SIZE (80 + 128) /* bytes */
38*437bfbebSnyanmisaka #define VDPU382_TOTAL_REG_CNT (278)
39*437bfbebSnyanmisaka
40*437bfbebSnyanmisaka #define AVS2_RKV_SHPH_ALIGNED_SIZE (MPP_ALIGN(AVS2_RKV_SHPH_SIZE, SZ_4K))
41*437bfbebSnyanmisaka #define AVS2_RKV_SCALIST_ALIGNED_SIZE (MPP_ALIGN(AVS2_RKV_SCALIST_SIZE, SZ_4K))
42*437bfbebSnyanmisaka #define AVS2_RKV_STREAM_INFO_SET_SIZE (AVS2_RKV_SHPH_ALIGNED_SIZE + \
43*437bfbebSnyanmisaka AVS2_RKV_SCALIST_ALIGNED_SIZE)
44*437bfbebSnyanmisaka #define AVS2_ALL_TBL_BUF_SIZE(cnt) (AVS2_RKV_STREAM_INFO_SET_SIZE * (cnt))
45*437bfbebSnyanmisaka #define AVS2_SHPH_OFFSET(pos) (AVS2_RKV_STREAM_INFO_SET_SIZE * (pos))
46*437bfbebSnyanmisaka #define AVS2_SCALIST_OFFSET(pos) (AVS2_SHPH_OFFSET(pos) + AVS2_RKV_SHPH_ALIGNED_SIZE)
47*437bfbebSnyanmisaka
48*437bfbebSnyanmisaka #define COLMV_COMPRESS_EN (1)
49*437bfbebSnyanmisaka #define COLMV_BLOCK_SIZE (16)
50*437bfbebSnyanmisaka #define COLMV_BYTES (16)
51*437bfbebSnyanmisaka
52*437bfbebSnyanmisaka typedef struct avs2d_buf_t {
53*437bfbebSnyanmisaka RK_U32 valid;
54*437bfbebSnyanmisaka RK_U32 offset_shph;
55*437bfbebSnyanmisaka RK_U32 offset_sclst;
56*437bfbebSnyanmisaka Vdpu382Avs2dRegSet *regs;
57*437bfbebSnyanmisaka } Avs2dVdpu382Buf_t;
58*437bfbebSnyanmisaka
59*437bfbebSnyanmisaka typedef struct avs2d_reg_ctx_t {
60*437bfbebSnyanmisaka Avs2dVdpu382Buf_t reg_buf[VDPU382_FAST_REG_SET_CNT];
61*437bfbebSnyanmisaka
62*437bfbebSnyanmisaka RK_U32 shph_offset;
63*437bfbebSnyanmisaka RK_U32 sclst_offset;
64*437bfbebSnyanmisaka
65*437bfbebSnyanmisaka Vdpu382Avs2dRegSet *regs;
66*437bfbebSnyanmisaka
67*437bfbebSnyanmisaka RK_U8 shph_dat[AVS2_RKV_SHPH_SIZE];
68*437bfbebSnyanmisaka RK_U8 scalist_dat[AVS2_RKV_SCALIST_SIZE];
69*437bfbebSnyanmisaka
70*437bfbebSnyanmisaka MppBuffer bufs;
71*437bfbebSnyanmisaka RK_S32 bufs_fd;
72*437bfbebSnyanmisaka void *bufs_ptr;
73*437bfbebSnyanmisaka
74*437bfbebSnyanmisaka MppBuffer rcb_buf[VDPU382_FAST_REG_SET_CNT];
75*437bfbebSnyanmisaka RK_S32 rcb_buf_size;
76*437bfbebSnyanmisaka Vdpu382RcbInfo rcb_info[RCB_BUF_COUNT];
77*437bfbebSnyanmisaka RK_U32 reg_out[VDPU382_TOTAL_REG_CNT];
78*437bfbebSnyanmisaka
79*437bfbebSnyanmisaka } Avs2dVdpu382RegCtx_t;
80*437bfbebSnyanmisaka
81*437bfbebSnyanmisaka MPP_RET hal_avs2d_vdpu382_deinit(void *hal);
avs2d_ver_align(RK_U32 val)82*437bfbebSnyanmisaka static RK_U32 avs2d_ver_align(RK_U32 val)
83*437bfbebSnyanmisaka {
84*437bfbebSnyanmisaka return MPP_ALIGN(val, 16);
85*437bfbebSnyanmisaka }
86*437bfbebSnyanmisaka
avs2d_hor_align(RK_U32 val)87*437bfbebSnyanmisaka static RK_U32 avs2d_hor_align(RK_U32 val)
88*437bfbebSnyanmisaka {
89*437bfbebSnyanmisaka
90*437bfbebSnyanmisaka return MPP_ALIGN(val, 16);
91*437bfbebSnyanmisaka }
92*437bfbebSnyanmisaka
avs2d_len_align(RK_U32 val)93*437bfbebSnyanmisaka static RK_U32 avs2d_len_align(RK_U32 val)
94*437bfbebSnyanmisaka {
95*437bfbebSnyanmisaka return (2 * MPP_ALIGN(val, 16));
96*437bfbebSnyanmisaka }
97*437bfbebSnyanmisaka
avs2d_hor_align_64(RK_U32 val)98*437bfbebSnyanmisaka static RK_U32 avs2d_hor_align_64(RK_U32 val)
99*437bfbebSnyanmisaka {
100*437bfbebSnyanmisaka return MPP_ALIGN(val, 64);
101*437bfbebSnyanmisaka }
102*437bfbebSnyanmisaka
prepare_header(Avs2dHalCtx_t * p_hal,RK_U8 * data,RK_U32 len)103*437bfbebSnyanmisaka static MPP_RET prepare_header(Avs2dHalCtx_t *p_hal, RK_U8 *data, RK_U32 len)
104*437bfbebSnyanmisaka {
105*437bfbebSnyanmisaka RK_U32 i, j;
106*437bfbebSnyanmisaka BitputCtx_t bp;
107*437bfbebSnyanmisaka RK_U64 *bit_buf = (RK_U64 *)data;
108*437bfbebSnyanmisaka Avs2dSyntax_t *syntax = &p_hal->syntax;
109*437bfbebSnyanmisaka PicParams_Avs2d *pp = &syntax->pp;
110*437bfbebSnyanmisaka AlfParams_Avs2d *alfp = &syntax->alfp;
111*437bfbebSnyanmisaka RefParams_Avs2d *refp = &syntax->refp;
112*437bfbebSnyanmisaka WqmParams_Avs2d *wqmp = &syntax->wqmp;
113*437bfbebSnyanmisaka
114*437bfbebSnyanmisaka memset(data, 0, len);
115*437bfbebSnyanmisaka
116*437bfbebSnyanmisaka mpp_set_bitput_ctx(&bp, bit_buf, len);
117*437bfbebSnyanmisaka //!< sequence header syntax
118*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->chroma_format_idc, 2);
119*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->pic_width_in_luma_samples, 16);
120*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->pic_height_in_luma_samples, 16);
121*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->bit_depth_luma_minus8, 3);
122*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->bit_depth_chroma_minus8, 3);
123*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->lcu_size, 3);
124*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->progressive_sequence, 1);
125*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->field_coded_sequence, 1);
126*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->multi_hypothesis_skip_enable_flag, 1);
127*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->dual_hypothesis_prediction_enable_flag, 1);
128*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->weighted_skip_enable_flag, 1);
129*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->asymmetrc_motion_partitions_enable_flag, 1);
130*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->nonsquare_quadtree_transform_enable_flag, 1);
131*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->nonsquare_intra_prediction_enable_flag, 1);
132*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->secondary_transform_enable_flag, 1);
133*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->sample_adaptive_offset_enable_flag, 1);
134*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->adaptive_loop_filter_enable_flag, 1);
135*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->pmvr_enable_flag, 1);
136*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->cross_slice_loopfilter_enable_flag, 1);
137*437bfbebSnyanmisaka //!< picture header syntax
138*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->picture_type, 3);
139*437bfbebSnyanmisaka mpp_put_bits(&bp, refp->ref_pic_num, 3);
140*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->scene_reference_enable_flag, 1);
141*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->bottom_field_picture_flag, 1);
142*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->fixed_picture_qp, 1);
143*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->picture_qp, 7);
144*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->loop_filter_disable_flag, 1);
145*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->alpha_c_offset, 5);
146*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->beta_offset, 5);
147*437bfbebSnyanmisaka //!< weight quant param
148*437bfbebSnyanmisaka mpp_put_bits(&bp, wqmp->chroma_quant_param_delta_cb, 6);
149*437bfbebSnyanmisaka mpp_put_bits(&bp, wqmp->chroma_quant_param_delta_cr, 6);
150*437bfbebSnyanmisaka mpp_put_bits(&bp, wqmp->pic_weight_quant_enable_flag, 1);
151*437bfbebSnyanmisaka //!< alf param
152*437bfbebSnyanmisaka mpp_put_bits(&bp, alfp->enable_pic_alf_y, 1);
153*437bfbebSnyanmisaka mpp_put_bits(&bp, alfp->enable_pic_alf_cb, 1);
154*437bfbebSnyanmisaka mpp_put_bits(&bp, alfp->enable_pic_alf_cr, 1);
155*437bfbebSnyanmisaka
156*437bfbebSnyanmisaka if (alfp->enable_pic_alf_y) {
157*437bfbebSnyanmisaka RK_U32 alf_filter_num = alfp->alf_filter_num_minus1 + 1;
158*437bfbebSnyanmisaka mpp_put_bits(&bp, alfp->alf_filter_num_minus1, 4);
159*437bfbebSnyanmisaka
160*437bfbebSnyanmisaka for (i = 0; i < 16; i++)
161*437bfbebSnyanmisaka mpp_put_bits(&bp, alfp->alf_coeff_idx_tab[i], 4);
162*437bfbebSnyanmisaka
163*437bfbebSnyanmisaka for (i = 0; i < alf_filter_num; i++) {
164*437bfbebSnyanmisaka for (j = 0; j < 9; j++) {
165*437bfbebSnyanmisaka mpp_put_bits(&bp, alfp->alf_coeff_y[i][j], 7);
166*437bfbebSnyanmisaka }
167*437bfbebSnyanmisaka }
168*437bfbebSnyanmisaka }
169*437bfbebSnyanmisaka
170*437bfbebSnyanmisaka if (alfp->enable_pic_alf_cb) {
171*437bfbebSnyanmisaka for (j = 0; j < 9; j++)
172*437bfbebSnyanmisaka mpp_put_bits(&bp, alfp->alf_coeff_cb[j], 7);
173*437bfbebSnyanmisaka }
174*437bfbebSnyanmisaka
175*437bfbebSnyanmisaka if (alfp->enable_pic_alf_cr) {
176*437bfbebSnyanmisaka for (j = 0; j < 9; j++)
177*437bfbebSnyanmisaka mpp_put_bits(&bp, alfp->alf_coeff_cr[j], 7);
178*437bfbebSnyanmisaka }
179*437bfbebSnyanmisaka
180*437bfbebSnyanmisaka mpp_put_align(&bp, 128, 0);
181*437bfbebSnyanmisaka
182*437bfbebSnyanmisaka return MPP_OK;
183*437bfbebSnyanmisaka }
184*437bfbebSnyanmisaka
prepare_scalist(Avs2dHalCtx_t * p_hal,RK_U8 * data,RK_U32 len)185*437bfbebSnyanmisaka static MPP_RET prepare_scalist(Avs2dHalCtx_t *p_hal, RK_U8 *data, RK_U32 len)
186*437bfbebSnyanmisaka {
187*437bfbebSnyanmisaka RK_U32 i, j;
188*437bfbebSnyanmisaka RK_U32 size_id, block_size;
189*437bfbebSnyanmisaka BitputCtx_t bp;
190*437bfbebSnyanmisaka RK_U64 *bit_buf = (RK_U64 *)data;
191*437bfbebSnyanmisaka Avs2dSyntax_t *syntax = &p_hal->syntax;
192*437bfbebSnyanmisaka WqmParams_Avs2d *wqmp = &syntax->wqmp;
193*437bfbebSnyanmisaka
194*437bfbebSnyanmisaka if (!wqmp->pic_weight_quant_enable_flag)
195*437bfbebSnyanmisaka return MPP_OK;
196*437bfbebSnyanmisaka
197*437bfbebSnyanmisaka memset(data, 0, len);
198*437bfbebSnyanmisaka
199*437bfbebSnyanmisaka mpp_set_bitput_ctx(&bp, bit_buf, len);
200*437bfbebSnyanmisaka
201*437bfbebSnyanmisaka for (size_id = 0; size_id < 2; size_id++) {
202*437bfbebSnyanmisaka block_size = MPP_MIN(1 << (size_id + 2), 8);
203*437bfbebSnyanmisaka for (i = 0; i < block_size; i++) {
204*437bfbebSnyanmisaka for (j = 0 ; j < block_size; j++)
205*437bfbebSnyanmisaka //!< row col reversed
206*437bfbebSnyanmisaka mpp_put_bits(&bp, wqmp->wq_matrix[size_id][size_id * j + i], 8);
207*437bfbebSnyanmisaka }
208*437bfbebSnyanmisaka }
209*437bfbebSnyanmisaka
210*437bfbebSnyanmisaka return MPP_OK;
211*437bfbebSnyanmisaka }
212*437bfbebSnyanmisaka
get_frame_fd(Avs2dHalCtx_t * p_hal,RK_S32 idx)213*437bfbebSnyanmisaka static RK_S32 get_frame_fd(Avs2dHalCtx_t *p_hal, RK_S32 idx)
214*437bfbebSnyanmisaka {
215*437bfbebSnyanmisaka RK_S32 ret_fd = 0;
216*437bfbebSnyanmisaka MppBuffer mbuffer = NULL;
217*437bfbebSnyanmisaka
218*437bfbebSnyanmisaka mpp_buf_slot_get_prop(p_hal->frame_slots, idx, SLOT_BUFFER, &mbuffer);
219*437bfbebSnyanmisaka ret_fd = mpp_buffer_get_fd(mbuffer);
220*437bfbebSnyanmisaka
221*437bfbebSnyanmisaka return ret_fd;
222*437bfbebSnyanmisaka }
223*437bfbebSnyanmisaka
get_packet_fd(Avs2dHalCtx_t * p_hal,RK_S32 idx)224*437bfbebSnyanmisaka static RK_S32 get_packet_fd(Avs2dHalCtx_t *p_hal, RK_S32 idx)
225*437bfbebSnyanmisaka {
226*437bfbebSnyanmisaka RK_S32 ret_fd = 0;
227*437bfbebSnyanmisaka MppBuffer mbuffer = NULL;
228*437bfbebSnyanmisaka
229*437bfbebSnyanmisaka mpp_buf_slot_get_prop(p_hal->packet_slots, idx, SLOT_BUFFER, &mbuffer);
230*437bfbebSnyanmisaka ret_fd = mpp_buffer_get_fd(mbuffer);
231*437bfbebSnyanmisaka
232*437bfbebSnyanmisaka return ret_fd;
233*437bfbebSnyanmisaka }
234*437bfbebSnyanmisaka
init_common_regs(Vdpu382Avs2dRegSet * regs)235*437bfbebSnyanmisaka static MPP_RET init_common_regs(Vdpu382Avs2dRegSet *regs)
236*437bfbebSnyanmisaka {
237*437bfbebSnyanmisaka Vdpu382RegCommon *common = ®s->common;
238*437bfbebSnyanmisaka
239*437bfbebSnyanmisaka common->reg009.dec_mode = 3; // AVS2
240*437bfbebSnyanmisaka common->reg015.rlc_mode = 0;
241*437bfbebSnyanmisaka
242*437bfbebSnyanmisaka common->reg011.buf_empty_en = 1;
243*437bfbebSnyanmisaka common->reg011.err_head_fill_e = 1;
244*437bfbebSnyanmisaka common->reg011.err_colmv_fill_e = 1;
245*437bfbebSnyanmisaka
246*437bfbebSnyanmisaka common->reg010.dec_e = 1;
247*437bfbebSnyanmisaka
248*437bfbebSnyanmisaka common->reg013.h26x_error_mode = 0;
249*437bfbebSnyanmisaka common->reg021.inter_error_prc_mode = 0;
250*437bfbebSnyanmisaka common->reg021.error_deb_en = 0;
251*437bfbebSnyanmisaka common->reg021.error_intra_mode = 0;
252*437bfbebSnyanmisaka
253*437bfbebSnyanmisaka common->reg024.cabac_err_en_lowbits = 0xffffffdf;
254*437bfbebSnyanmisaka common->reg025.cabac_err_en_highbits = 0x3dffffff;
255*437bfbebSnyanmisaka
256*437bfbebSnyanmisaka common->reg026.inter_auto_gating_e = 1;
257*437bfbebSnyanmisaka common->reg026.filterd_auto_gating_e = 1;
258*437bfbebSnyanmisaka common->reg026.strmd_auto_gating_e = 1;
259*437bfbebSnyanmisaka common->reg026.mcp_auto_gating_e = 1;
260*437bfbebSnyanmisaka common->reg026.busifd_auto_gating_e = 1;
261*437bfbebSnyanmisaka common->reg026.dec_ctrl_auto_gating_e = 1;
262*437bfbebSnyanmisaka common->reg026.intra_auto_gating_e = 1;
263*437bfbebSnyanmisaka common->reg026.mc_auto_gating_e = 1;
264*437bfbebSnyanmisaka common->reg026.transd_auto_gating_e = 1;
265*437bfbebSnyanmisaka common->reg026.sram_auto_gating_e = 1;
266*437bfbebSnyanmisaka common->reg026.cru_auto_gating_e = 1;
267*437bfbebSnyanmisaka common->reg026.reg_cfg_gating_en = 1;
268*437bfbebSnyanmisaka
269*437bfbebSnyanmisaka common->reg032_timeout_threshold = 0x3fffff;
270*437bfbebSnyanmisaka
271*437bfbebSnyanmisaka common->reg011.dec_clkgate_e = 1;
272*437bfbebSnyanmisaka
273*437bfbebSnyanmisaka common->reg013.stmerror_waitdecfifo_empty = 1;
274*437bfbebSnyanmisaka common->reg012.colmv_compress_en = COLMV_COMPRESS_EN;
275*437bfbebSnyanmisaka common->reg012.info_collect_en = 1;
276*437bfbebSnyanmisaka common->reg012.error_info_en = 0;
277*437bfbebSnyanmisaka
278*437bfbebSnyanmisaka return MPP_OK;
279*437bfbebSnyanmisaka }
280*437bfbebSnyanmisaka
avs2d_refine_rcb_size(Vdpu382RcbInfo * rcb_info,Vdpu382Avs2dRegSet * hw_regs,RK_S32 width,RK_S32 height,void * dxva)281*437bfbebSnyanmisaka static void avs2d_refine_rcb_size(Vdpu382RcbInfo *rcb_info,
282*437bfbebSnyanmisaka Vdpu382Avs2dRegSet *hw_regs,
283*437bfbebSnyanmisaka RK_S32 width, RK_S32 height, void *dxva)
284*437bfbebSnyanmisaka {
285*437bfbebSnyanmisaka (void) height;
286*437bfbebSnyanmisaka Avs2dSyntax_t *syntax = dxva;
287*437bfbebSnyanmisaka RK_U8 ctu_size = 1 << syntax->pp.lcu_size;
288*437bfbebSnyanmisaka RK_U32 chroma_fmt_idc = syntax->pp.chroma_format_idc;
289*437bfbebSnyanmisaka RK_U8 bit_depth = syntax->pp.bit_depth_chroma_minus8 + 8;
290*437bfbebSnyanmisaka RK_U32 rcb_bits = 0;
291*437bfbebSnyanmisaka
292*437bfbebSnyanmisaka width = MPP_ALIGN(width, ctu_size);
293*437bfbebSnyanmisaka
294*437bfbebSnyanmisaka /* RCB_STRMD_ROW */
295*437bfbebSnyanmisaka if (width >= 8192) {
296*437bfbebSnyanmisaka RK_U32 factor = 64 / ctu_size;
297*437bfbebSnyanmisaka
298*437bfbebSnyanmisaka rcb_bits = (MPP_ALIGN(width, ctu_size) + factor - 1) / factor * 24;
299*437bfbebSnyanmisaka } else
300*437bfbebSnyanmisaka rcb_bits = 0;
301*437bfbebSnyanmisaka rcb_info[RCB_STRMD_ROW].size = MPP_RCB_BYTES(rcb_bits);
302*437bfbebSnyanmisaka
303*437bfbebSnyanmisaka /* RCB_TRANSD_ROW */
304*437bfbebSnyanmisaka if (width >= 8192)
305*437bfbebSnyanmisaka rcb_bits = (MPP_ALIGN(width - 8192, 4) << 1);
306*437bfbebSnyanmisaka else
307*437bfbebSnyanmisaka rcb_bits = 0;
308*437bfbebSnyanmisaka rcb_info[RCB_TRANSD_ROW].size = MPP_RCB_BYTES(rcb_bits);
309*437bfbebSnyanmisaka
310*437bfbebSnyanmisaka /* RCB_TRANSD_COL */
311*437bfbebSnyanmisaka rcb_info[RCB_TRANSD_COL].size = 0;
312*437bfbebSnyanmisaka
313*437bfbebSnyanmisaka /* RCB_INTER_ROW */
314*437bfbebSnyanmisaka rcb_bits = width * 21;
315*437bfbebSnyanmisaka rcb_info[RCB_INTER_ROW].size = MPP_RCB_BYTES(rcb_bits);
316*437bfbebSnyanmisaka
317*437bfbebSnyanmisaka /* RCB_INTER_COL */
318*437bfbebSnyanmisaka rcb_info[RCB_INTER_COL].size = 0;
319*437bfbebSnyanmisaka
320*437bfbebSnyanmisaka /* RCB_INTRA_ROW */
321*437bfbebSnyanmisaka rcb_bits = width * ((chroma_fmt_idc ? 1 : 0) + 1) * 11;
322*437bfbebSnyanmisaka rcb_info[RCB_INTRA_ROW].size = MPP_RCB_BYTES(rcb_bits);
323*437bfbebSnyanmisaka
324*437bfbebSnyanmisaka /* RCB_DBLK_ROW */
325*437bfbebSnyanmisaka if (chroma_fmt_idc == 1 ) {
326*437bfbebSnyanmisaka if (ctu_size == 32)
327*437bfbebSnyanmisaka rcb_bits = width * ( 4 + 8 * bit_depth);
328*437bfbebSnyanmisaka else
329*437bfbebSnyanmisaka rcb_bits = width * ( 2 + 8 * bit_depth);
330*437bfbebSnyanmisaka } else
331*437bfbebSnyanmisaka rcb_bits = 0;
332*437bfbebSnyanmisaka rcb_info[RCB_DBLK_ROW].size = MPP_RCB_BYTES(rcb_bits);
333*437bfbebSnyanmisaka
334*437bfbebSnyanmisaka /* RCB_SAO_ROW */
335*437bfbebSnyanmisaka if (chroma_fmt_idc == 1 || chroma_fmt_idc == 2) {
336*437bfbebSnyanmisaka rcb_bits = width * (128 / ctu_size + 2 * bit_depth);
337*437bfbebSnyanmisaka } else {
338*437bfbebSnyanmisaka rcb_bits = width * (128 / ctu_size + 3 * bit_depth);
339*437bfbebSnyanmisaka }
340*437bfbebSnyanmisaka rcb_info[RCB_SAO_ROW].size = MPP_RCB_BYTES(rcb_bits);
341*437bfbebSnyanmisaka
342*437bfbebSnyanmisaka /* RCB_FBC_ROW */
343*437bfbebSnyanmisaka if (hw_regs->common.reg012.fbc_e)
344*437bfbebSnyanmisaka rcb_bits = width * 4 * bit_depth;
345*437bfbebSnyanmisaka else
346*437bfbebSnyanmisaka rcb_bits = 0;
347*437bfbebSnyanmisaka rcb_info[RCB_FBC_ROW].size = MPP_RCB_BYTES(rcb_bits);
348*437bfbebSnyanmisaka
349*437bfbebSnyanmisaka /* RCB_FILT_COL */
350*437bfbebSnyanmisaka rcb_info[RCB_FILT_COL].size = 0;
351*437bfbebSnyanmisaka return;
352*437bfbebSnyanmisaka }
353*437bfbebSnyanmisaka
hal_avs2d_rcb_info_update(void * hal,Vdpu382Avs2dRegSet * hw_regs)354*437bfbebSnyanmisaka static void hal_avs2d_rcb_info_update(void *hal, Vdpu382Avs2dRegSet *hw_regs)
355*437bfbebSnyanmisaka {
356*437bfbebSnyanmisaka MPP_RET ret = MPP_OK;
357*437bfbebSnyanmisaka Avs2dHalCtx_t *p_hal = (Avs2dHalCtx_t *)hal;
358*437bfbebSnyanmisaka Avs2dVdpu382RegCtx_t *reg_ctx = (Avs2dVdpu382RegCtx_t *)p_hal->reg_ctx;
359*437bfbebSnyanmisaka RK_S32 width = p_hal->syntax.pp.pic_width_in_luma_samples;
360*437bfbebSnyanmisaka RK_S32 height = p_hal->syntax.pp.pic_height_in_luma_samples;
361*437bfbebSnyanmisaka RK_S32 i = 0;
362*437bfbebSnyanmisaka RK_S32 loop = p_hal->fast_mode ? MPP_ARRAY_ELEMS(reg_ctx->reg_buf) : 1;
363*437bfbebSnyanmisaka
364*437bfbebSnyanmisaka reg_ctx->rcb_buf_size = vdpu382_get_rcb_buf_size(reg_ctx->rcb_info, width, height);
365*437bfbebSnyanmisaka avs2d_refine_rcb_size(reg_ctx->rcb_info, hw_regs, width, height, (void *)&p_hal->syntax);
366*437bfbebSnyanmisaka
367*437bfbebSnyanmisaka for (i = 0; i < loop; i++) {
368*437bfbebSnyanmisaka MppBuffer rcb_buf = NULL;
369*437bfbebSnyanmisaka
370*437bfbebSnyanmisaka if (reg_ctx->rcb_buf[i]) {
371*437bfbebSnyanmisaka mpp_buffer_put(reg_ctx->rcb_buf[i]);
372*437bfbebSnyanmisaka reg_ctx->rcb_buf[i] = NULL;
373*437bfbebSnyanmisaka }
374*437bfbebSnyanmisaka
375*437bfbebSnyanmisaka ret = mpp_buffer_get(p_hal->buf_group, &rcb_buf, reg_ctx->rcb_buf_size);
376*437bfbebSnyanmisaka
377*437bfbebSnyanmisaka if (ret)
378*437bfbebSnyanmisaka mpp_err_f("AVS2D mpp_buffer_group_get failed\n");
379*437bfbebSnyanmisaka
380*437bfbebSnyanmisaka reg_ctx->rcb_buf[i] = rcb_buf;
381*437bfbebSnyanmisaka }
382*437bfbebSnyanmisaka }
383*437bfbebSnyanmisaka
fill_registers(Avs2dHalCtx_t * p_hal,Vdpu382Avs2dRegSet * p_regs,HalTaskInfo * task)384*437bfbebSnyanmisaka static MPP_RET fill_registers(Avs2dHalCtx_t *p_hal, Vdpu382Avs2dRegSet *p_regs, HalTaskInfo *task)
385*437bfbebSnyanmisaka {
386*437bfbebSnyanmisaka MPP_RET ret = MPP_OK;
387*437bfbebSnyanmisaka RK_U32 i;
388*437bfbebSnyanmisaka MppFrame mframe = NULL;
389*437bfbebSnyanmisaka Avs2dSyntax_t *syntax = &p_hal->syntax;
390*437bfbebSnyanmisaka PicParams_Avs2d *pp = &syntax->pp;
391*437bfbebSnyanmisaka RefParams_Avs2d *refp = &syntax->refp;
392*437bfbebSnyanmisaka HalDecTask *task_dec = &task->dec;
393*437bfbebSnyanmisaka Vdpu382RegCommon *common = &p_regs->common;
394*437bfbebSnyanmisaka RK_U32 is_fbc = 0;
395*437bfbebSnyanmisaka HalBuf *mv_buf = NULL;
396*437bfbebSnyanmisaka
397*437bfbebSnyanmisaka mpp_buf_slot_get_prop(p_hal->frame_slots, task_dec->output, SLOT_FRAME_PTR, &mframe);
398*437bfbebSnyanmisaka is_fbc = MPP_FRAME_FMT_IS_FBC(mpp_frame_get_fmt(mframe));
399*437bfbebSnyanmisaka
400*437bfbebSnyanmisaka //!< caculate the yuv_frame_size
401*437bfbebSnyanmisaka {
402*437bfbebSnyanmisaka RK_U32 hor_virstride = 0;
403*437bfbebSnyanmisaka RK_U32 ver_virstride = 0;
404*437bfbebSnyanmisaka RK_U32 y_virstride = 0;
405*437bfbebSnyanmisaka
406*437bfbebSnyanmisaka hor_virstride = mpp_frame_get_hor_stride(mframe);
407*437bfbebSnyanmisaka ver_virstride = mpp_frame_get_ver_stride(mframe);
408*437bfbebSnyanmisaka y_virstride = hor_virstride * ver_virstride;
409*437bfbebSnyanmisaka AVS2D_HAL_TRACE("is_fbc %d y_virstride %d, hor_virstride %d, ver_virstride %d\n", is_fbc, y_virstride, hor_virstride, ver_virstride);
410*437bfbebSnyanmisaka
411*437bfbebSnyanmisaka if (is_fbc) {
412*437bfbebSnyanmisaka RK_U32 fbc_hdr_stride = mpp_frame_get_fbc_hdr_stride(mframe);
413*437bfbebSnyanmisaka RK_U32 fbd_offset = MPP_ALIGN(fbc_hdr_stride * (ver_virstride + 16) / 16, SZ_4K);
414*437bfbebSnyanmisaka
415*437bfbebSnyanmisaka common->reg012.fbc_e = 1;
416*437bfbebSnyanmisaka common->reg018.y_hor_virstride = fbc_hdr_stride / 16;
417*437bfbebSnyanmisaka common->reg019.uv_hor_virstride = fbc_hdr_stride / 16;
418*437bfbebSnyanmisaka common->reg020_fbc_payload_off.payload_st_offset = fbd_offset >> 4;
419*437bfbebSnyanmisaka } else {
420*437bfbebSnyanmisaka common->reg012.fbc_e = 0;
421*437bfbebSnyanmisaka common->reg018.y_hor_virstride = hor_virstride / 16;
422*437bfbebSnyanmisaka common->reg019.uv_hor_virstride = hor_virstride / 16;
423*437bfbebSnyanmisaka common->reg020_y_virstride.y_virstride = y_virstride / 16;
424*437bfbebSnyanmisaka }
425*437bfbebSnyanmisaka common->reg013.cur_pic_is_idr = (pp->picture_type == 0 || pp->picture_type == 4 || pp->picture_type == 5);
426*437bfbebSnyanmisaka }
427*437bfbebSnyanmisaka
428*437bfbebSnyanmisaka // set current
429*437bfbebSnyanmisaka {
430*437bfbebSnyanmisaka RK_S32 fd = -1;
431*437bfbebSnyanmisaka p_regs->avs2d_param.reg65_cur_top_poc = mpp_frame_get_poc(mframe);
432*437bfbebSnyanmisaka p_regs->avs2d_param.reg66_cur_bot_poc = 0;
433*437bfbebSnyanmisaka fd = get_frame_fd(p_hal, task_dec->output);
434*437bfbebSnyanmisaka mpp_assert(fd >= 0);
435*437bfbebSnyanmisaka p_regs->common_addr.reg130_decout_base = fd;
436*437bfbebSnyanmisaka mv_buf = hal_bufs_get_buf(p_hal->cmv_bufs, task_dec->output);
437*437bfbebSnyanmisaka p_regs->common_addr.reg131_colmv_cur_base = mpp_buffer_get_fd(mv_buf->buf[0]);
438*437bfbebSnyanmisaka AVS2D_HAL_TRACE("cur frame index %d, fd %d, colmv fd %d", task_dec->output, fd, p_regs->common_addr.reg131_colmv_cur_base);
439*437bfbebSnyanmisaka }
440*437bfbebSnyanmisaka
441*437bfbebSnyanmisaka // set reference
442*437bfbebSnyanmisaka {
443*437bfbebSnyanmisaka RK_U64 ref_flag = 0;
444*437bfbebSnyanmisaka RK_S32 valid_slot = -1;
445*437bfbebSnyanmisaka RK_U32 *ref_low = (RK_U32 *)&p_regs->avs2d_param.reg99;
446*437bfbebSnyanmisaka RK_U32 *ref_hight = (RK_U32 *)&p_regs->avs2d_param.reg100;
447*437bfbebSnyanmisaka RK_U32 err_ref_base = 0;
448*437bfbebSnyanmisaka
449*437bfbebSnyanmisaka AVS2D_HAL_TRACE("num of ref %d", refp->ref_pic_num);
450*437bfbebSnyanmisaka
451*437bfbebSnyanmisaka for (i = 0; i < refp->ref_pic_num; i++) {
452*437bfbebSnyanmisaka if (task_dec->refer[i] < 0)
453*437bfbebSnyanmisaka continue;
454*437bfbebSnyanmisaka
455*437bfbebSnyanmisaka valid_slot = i;
456*437bfbebSnyanmisaka break;
457*437bfbebSnyanmisaka }
458*437bfbebSnyanmisaka
459*437bfbebSnyanmisaka for (i = 0; i < refp->ref_pic_num; i++) {
460*437bfbebSnyanmisaka MppFrame frame_ref = NULL;
461*437bfbebSnyanmisaka
462*437bfbebSnyanmisaka RK_S32 slot_idx = task_dec->refer[i] < 0 ? task_dec->refer[valid_slot] : task_dec->refer[i];
463*437bfbebSnyanmisaka
464*437bfbebSnyanmisaka if (slot_idx < 0) {
465*437bfbebSnyanmisaka AVS2D_HAL_DBG(AVS2D_HAL_DBG_ERROR, "missing ref, could not found valid ref");
466*437bfbebSnyanmisaka task->dec.flags.ref_err = 1;
467*437bfbebSnyanmisaka return ret = MPP_ERR_UNKNOW;
468*437bfbebSnyanmisaka }
469*437bfbebSnyanmisaka
470*437bfbebSnyanmisaka mpp_buf_slot_get_prop(p_hal->frame_slots, slot_idx, SLOT_FRAME_PTR, &frame_ref);
471*437bfbebSnyanmisaka
472*437bfbebSnyanmisaka if (frame_ref) {
473*437bfbebSnyanmisaka RK_U32 frm_flag = 1 << 3;
474*437bfbebSnyanmisaka
475*437bfbebSnyanmisaka if (pp->bottom_field_picture_flag)
476*437bfbebSnyanmisaka frm_flag |= 1 << 2;
477*437bfbebSnyanmisaka
478*437bfbebSnyanmisaka if (pp->field_coded_sequence)
479*437bfbebSnyanmisaka frm_flag |= 1;
480*437bfbebSnyanmisaka
481*437bfbebSnyanmisaka ref_flag |= frm_flag << (i * 8);
482*437bfbebSnyanmisaka
483*437bfbebSnyanmisaka p_regs->avs2d_addr.ref_base[i] = get_frame_fd(p_hal, slot_idx);
484*437bfbebSnyanmisaka mv_buf = hal_bufs_get_buf(p_hal->cmv_bufs, slot_idx);
485*437bfbebSnyanmisaka p_regs->avs2d_addr.colmv_base[i] = mpp_buffer_get_fd(mv_buf->buf[0]);
486*437bfbebSnyanmisaka
487*437bfbebSnyanmisaka p_regs->avs2d_param.reg67_098_ref_poc[i] = mpp_frame_get_poc(frame_ref);
488*437bfbebSnyanmisaka if (!err_ref_base && !mpp_frame_get_errinfo(frame_ref))
489*437bfbebSnyanmisaka err_ref_base = p_regs->avs2d_addr.ref_base[i];
490*437bfbebSnyanmisaka
491*437bfbebSnyanmisaka AVS2D_HAL_TRACE("ref_base[%d] index=%d, fd = %d, colmv %d, poc %d",
492*437bfbebSnyanmisaka i, slot_idx, p_regs->avs2d_addr.ref_base[i],
493*437bfbebSnyanmisaka p_regs->avs2d_addr.colmv_base[i], p_regs->avs2d_param.reg67_098_ref_poc[i]);
494*437bfbebSnyanmisaka }
495*437bfbebSnyanmisaka }
496*437bfbebSnyanmisaka
497*437bfbebSnyanmisaka if (p_hal->syntax.refp.scene_ref_enable && p_hal->syntax.refp.scene_ref_slot_idx >= 0) {
498*437bfbebSnyanmisaka MppFrame scene_ref = NULL;
499*437bfbebSnyanmisaka RK_S32 replace_idx = p_hal->syntax.refp.scene_ref_replace_pos;
500*437bfbebSnyanmisaka RK_S32 slot_idx = p_hal->syntax.refp.scene_ref_slot_idx;
501*437bfbebSnyanmisaka
502*437bfbebSnyanmisaka mpp_buf_slot_get_prop(p_hal->frame_slots, slot_idx, SLOT_FRAME_PTR, &scene_ref);
503*437bfbebSnyanmisaka
504*437bfbebSnyanmisaka if (scene_ref) {
505*437bfbebSnyanmisaka p_regs->avs2d_addr.ref_base[replace_idx] = get_frame_fd(p_hal, slot_idx);
506*437bfbebSnyanmisaka mv_buf = hal_bufs_get_buf(p_hal->cmv_bufs, slot_idx);
507*437bfbebSnyanmisaka p_regs->avs2d_addr.colmv_base[replace_idx] = mpp_buffer_get_fd(mv_buf->buf[0]);
508*437bfbebSnyanmisaka p_regs->avs2d_param.reg67_098_ref_poc[replace_idx] = mpp_frame_get_poc(scene_ref);
509*437bfbebSnyanmisaka }
510*437bfbebSnyanmisaka }
511*437bfbebSnyanmisaka
512*437bfbebSnyanmisaka *ref_low = (RK_U32) (ref_flag & 0xffffffff);
513*437bfbebSnyanmisaka *ref_hight = (RK_U32) ((ref_flag >> 32) & 0xffffffff);
514*437bfbebSnyanmisaka
515*437bfbebSnyanmisaka p_regs->common_addr.reg132_error_ref_base = err_ref_base;
516*437bfbebSnyanmisaka }
517*437bfbebSnyanmisaka
518*437bfbebSnyanmisaka // set rlc
519*437bfbebSnyanmisaka {
520*437bfbebSnyanmisaka p_regs->common_addr.reg128_rlc_base = get_packet_fd(p_hal, task_dec->input);
521*437bfbebSnyanmisaka AVS2D_HAL_TRACE("packet fd %d from slot %d", p_regs->common_addr.reg128_rlc_base, task_dec->input);
522*437bfbebSnyanmisaka p_regs->common_addr.reg129_rlcwrite_base = p_regs->common_addr.reg128_rlc_base;
523*437bfbebSnyanmisaka common->reg016_str_len = MPP_ALIGN(mpp_packet_get_length(task_dec->input_packet), 16) + 64;
524*437bfbebSnyanmisaka }
525*437bfbebSnyanmisaka
526*437bfbebSnyanmisaka /* set scale down info */
527*437bfbebSnyanmisaka if (mpp_frame_get_thumbnail_en(mframe)) {
528*437bfbebSnyanmisaka p_regs->avs2d_addr.scale_down_luma_base = p_regs->common_addr.reg130_decout_base;
529*437bfbebSnyanmisaka p_regs->avs2d_addr.scale_down_chorme_base = p_regs->common_addr.reg130_decout_base;
530*437bfbebSnyanmisaka vdpu382_setup_down_scale(mframe, p_hal->dev, &p_regs->common);
531*437bfbebSnyanmisaka } else {
532*437bfbebSnyanmisaka p_regs->avs2d_addr.scale_down_luma_base = 0;
533*437bfbebSnyanmisaka p_regs->avs2d_addr.scale_down_chorme_base = 0;
534*437bfbebSnyanmisaka p_regs->common.reg012.scale_down_en = 0;
535*437bfbebSnyanmisaka }
536*437bfbebSnyanmisaka
537*437bfbebSnyanmisaka return ret;
538*437bfbebSnyanmisaka }
539*437bfbebSnyanmisaka
hal_avs2d_vdpu382_deinit(void * hal)540*437bfbebSnyanmisaka MPP_RET hal_avs2d_vdpu382_deinit(void *hal)
541*437bfbebSnyanmisaka {
542*437bfbebSnyanmisaka MPP_RET ret = MPP_OK;
543*437bfbebSnyanmisaka RK_U32 i, loop;
544*437bfbebSnyanmisaka Avs2dHalCtx_t *p_hal = (Avs2dHalCtx_t *)hal;
545*437bfbebSnyanmisaka Avs2dVdpu382RegCtx_t *reg_ctx = (Avs2dVdpu382RegCtx_t *)p_hal->reg_ctx;
546*437bfbebSnyanmisaka
547*437bfbebSnyanmisaka AVS2D_HAL_TRACE("In.");
548*437bfbebSnyanmisaka
549*437bfbebSnyanmisaka INP_CHECK(ret, NULL == reg_ctx);
550*437bfbebSnyanmisaka
551*437bfbebSnyanmisaka //!< malloc buffers
552*437bfbebSnyanmisaka loop = p_hal->fast_mode ? MPP_ARRAY_ELEMS(reg_ctx->reg_buf) : 1;
553*437bfbebSnyanmisaka for (i = 0; i < loop; i++) {
554*437bfbebSnyanmisaka if (reg_ctx->rcb_buf[i]) {
555*437bfbebSnyanmisaka mpp_buffer_put(reg_ctx->rcb_buf[i]);
556*437bfbebSnyanmisaka reg_ctx->rcb_buf[i] = NULL;
557*437bfbebSnyanmisaka }
558*437bfbebSnyanmisaka
559*437bfbebSnyanmisaka MPP_FREE(reg_ctx->reg_buf[i].regs);
560*437bfbebSnyanmisaka }
561*437bfbebSnyanmisaka
562*437bfbebSnyanmisaka if (reg_ctx->bufs) {
563*437bfbebSnyanmisaka mpp_buffer_put(reg_ctx->bufs);
564*437bfbebSnyanmisaka reg_ctx->bufs = NULL;
565*437bfbebSnyanmisaka }
566*437bfbebSnyanmisaka
567*437bfbebSnyanmisaka if (p_hal->cmv_bufs) {
568*437bfbebSnyanmisaka hal_bufs_deinit(p_hal->cmv_bufs);
569*437bfbebSnyanmisaka p_hal->cmv_bufs = NULL;
570*437bfbebSnyanmisaka }
571*437bfbebSnyanmisaka
572*437bfbebSnyanmisaka MPP_FREE(p_hal->reg_ctx);
573*437bfbebSnyanmisaka
574*437bfbebSnyanmisaka __RETURN:
575*437bfbebSnyanmisaka AVS2D_HAL_TRACE("Out. ret %d", ret);
576*437bfbebSnyanmisaka return ret;
577*437bfbebSnyanmisaka }
578*437bfbebSnyanmisaka
hal_avs2d_vdpu382_init(void * hal,MppHalCfg * cfg)579*437bfbebSnyanmisaka MPP_RET hal_avs2d_vdpu382_init(void *hal, MppHalCfg *cfg)
580*437bfbebSnyanmisaka {
581*437bfbebSnyanmisaka MPP_RET ret = MPP_OK;
582*437bfbebSnyanmisaka RK_U32 i, loop;
583*437bfbebSnyanmisaka Avs2dVdpu382RegCtx_t *reg_ctx;
584*437bfbebSnyanmisaka Avs2dHalCtx_t *p_hal = (Avs2dHalCtx_t *)hal;
585*437bfbebSnyanmisaka
586*437bfbebSnyanmisaka AVS2D_HAL_TRACE("In.");
587*437bfbebSnyanmisaka
588*437bfbebSnyanmisaka INP_CHECK(ret, NULL == p_hal);
589*437bfbebSnyanmisaka
590*437bfbebSnyanmisaka MEM_CHECK(ret, p_hal->reg_ctx = mpp_calloc_size(void, sizeof(Avs2dVdpu382RegCtx_t)));
591*437bfbebSnyanmisaka reg_ctx = (Avs2dVdpu382RegCtx_t *)p_hal->reg_ctx;
592*437bfbebSnyanmisaka
593*437bfbebSnyanmisaka //!< malloc buffers
594*437bfbebSnyanmisaka loop = p_hal->fast_mode ? MPP_ARRAY_ELEMS(reg_ctx->reg_buf) : 1;
595*437bfbebSnyanmisaka FUN_CHECK(ret = mpp_buffer_get(p_hal->buf_group, ®_ctx->bufs, AVS2_ALL_TBL_BUF_SIZE(loop)));
596*437bfbebSnyanmisaka reg_ctx->bufs_fd = mpp_buffer_get_fd(reg_ctx->bufs);
597*437bfbebSnyanmisaka reg_ctx->bufs_ptr = mpp_buffer_get_ptr(reg_ctx->bufs);
598*437bfbebSnyanmisaka
599*437bfbebSnyanmisaka for (i = 0; i < loop; i++) {
600*437bfbebSnyanmisaka reg_ctx->reg_buf[i].regs = mpp_calloc(Vdpu382Avs2dRegSet, 1);
601*437bfbebSnyanmisaka init_common_regs(reg_ctx->reg_buf[i].regs);
602*437bfbebSnyanmisaka reg_ctx->reg_buf[i].offset_shph = AVS2_SHPH_OFFSET(i);
603*437bfbebSnyanmisaka reg_ctx->reg_buf[i].offset_sclst = AVS2_SCALIST_OFFSET(i);
604*437bfbebSnyanmisaka }
605*437bfbebSnyanmisaka
606*437bfbebSnyanmisaka if (!p_hal->fast_mode) {
607*437bfbebSnyanmisaka reg_ctx->regs = reg_ctx->reg_buf[0].regs;
608*437bfbebSnyanmisaka reg_ctx->shph_offset = reg_ctx->reg_buf[0].offset_shph;
609*437bfbebSnyanmisaka reg_ctx->sclst_offset = reg_ctx->reg_buf[0].offset_sclst;
610*437bfbebSnyanmisaka }
611*437bfbebSnyanmisaka
612*437bfbebSnyanmisaka if (MPP_FRAME_FMT_IS_FBC(cfg->cfg->base.out_fmt))
613*437bfbebSnyanmisaka mpp_slots_set_prop(p_hal->frame_slots, SLOTS_HOR_ALIGN, avs2d_hor_align_64);
614*437bfbebSnyanmisaka else
615*437bfbebSnyanmisaka mpp_slots_set_prop(p_hal->frame_slots, SLOTS_HOR_ALIGN, avs2d_hor_align);
616*437bfbebSnyanmisaka
617*437bfbebSnyanmisaka mpp_slots_set_prop(p_hal->frame_slots, SLOTS_HOR_ALIGN, avs2d_hor_align);
618*437bfbebSnyanmisaka mpp_slots_set_prop(p_hal->frame_slots, SLOTS_VER_ALIGN, avs2d_ver_align);
619*437bfbebSnyanmisaka mpp_slots_set_prop(p_hal->frame_slots, SLOTS_LEN_ALIGN, avs2d_len_align);
620*437bfbebSnyanmisaka
621*437bfbebSnyanmisaka __RETURN:
622*437bfbebSnyanmisaka AVS2D_HAL_TRACE("Out. ret %d", ret);
623*437bfbebSnyanmisaka (void)cfg;
624*437bfbebSnyanmisaka return ret;
625*437bfbebSnyanmisaka __FAILED:
626*437bfbebSnyanmisaka hal_avs2d_vdpu382_deinit(p_hal);
627*437bfbebSnyanmisaka AVS2D_HAL_TRACE("Out. ret %d", ret);
628*437bfbebSnyanmisaka return ret;
629*437bfbebSnyanmisaka }
630*437bfbebSnyanmisaka
set_up_colmv_buf(void * hal)631*437bfbebSnyanmisaka static MPP_RET set_up_colmv_buf(void *hal)
632*437bfbebSnyanmisaka {
633*437bfbebSnyanmisaka MPP_RET ret = MPP_OK;
634*437bfbebSnyanmisaka Avs2dHalCtx_t *p_hal = (Avs2dHalCtx_t *)hal;
635*437bfbebSnyanmisaka Avs2dSyntax_t *syntax = &p_hal->syntax;
636*437bfbebSnyanmisaka PicParams_Avs2d *pp = &syntax->pp;
637*437bfbebSnyanmisaka RK_U32 mv_size = 0;
638*437bfbebSnyanmisaka RK_U32 ctu_size = 1 << (p_hal->syntax.pp.lcu_size);
639*437bfbebSnyanmisaka RK_U32 width = p_hal->syntax.pp.pic_width_in_luma_samples;
640*437bfbebSnyanmisaka RK_U32 height = p_hal->syntax.pp.pic_height_in_luma_samples;
641*437bfbebSnyanmisaka
642*437bfbebSnyanmisaka mv_size = vdpu382_get_colmv_size(width, height, ctu_size, COLMV_BYTES,
643*437bfbebSnyanmisaka COLMV_BLOCK_SIZE, COLMV_COMPRESS_EN);
644*437bfbebSnyanmisaka if (pp->field_coded_sequence)
645*437bfbebSnyanmisaka mv_size *= 2;
646*437bfbebSnyanmisaka AVS2D_HAL_TRACE("mv_size %d", mv_size);
647*437bfbebSnyanmisaka
648*437bfbebSnyanmisaka if (p_hal->cmv_bufs == NULL || p_hal->mv_size < mv_size) {
649*437bfbebSnyanmisaka size_t size = mv_size;
650*437bfbebSnyanmisaka
651*437bfbebSnyanmisaka if (p_hal->cmv_bufs) {
652*437bfbebSnyanmisaka hal_bufs_deinit(p_hal->cmv_bufs);
653*437bfbebSnyanmisaka p_hal->cmv_bufs = NULL;
654*437bfbebSnyanmisaka }
655*437bfbebSnyanmisaka
656*437bfbebSnyanmisaka hal_bufs_init(&p_hal->cmv_bufs);
657*437bfbebSnyanmisaka if (p_hal->cmv_bufs == NULL) {
658*437bfbebSnyanmisaka mpp_err_f("colmv bufs init fail");
659*437bfbebSnyanmisaka ret = MPP_ERR_INIT;
660*437bfbebSnyanmisaka goto __RETURN;
661*437bfbebSnyanmisaka }
662*437bfbebSnyanmisaka
663*437bfbebSnyanmisaka p_hal->mv_size = mv_size;
664*437bfbebSnyanmisaka p_hal->mv_count = mpp_buf_slot_get_count(p_hal->frame_slots);
665*437bfbebSnyanmisaka hal_bufs_setup(p_hal->cmv_bufs, p_hal->mv_count, 1, &size);
666*437bfbebSnyanmisaka }
667*437bfbebSnyanmisaka
668*437bfbebSnyanmisaka __RETURN:
669*437bfbebSnyanmisaka return ret;
670*437bfbebSnyanmisaka }
671*437bfbebSnyanmisaka
hal_avs2d_vdpu382_gen_regs(void * hal,HalTaskInfo * task)672*437bfbebSnyanmisaka MPP_RET hal_avs2d_vdpu382_gen_regs(void *hal, HalTaskInfo *task)
673*437bfbebSnyanmisaka {
674*437bfbebSnyanmisaka MPP_RET ret = MPP_OK;
675*437bfbebSnyanmisaka Avs2dVdpu382RegCtx_t *reg_ctx;
676*437bfbebSnyanmisaka Avs2dHalCtx_t *p_hal = (Avs2dHalCtx_t *)hal;
677*437bfbebSnyanmisaka Vdpu382Avs2dRegSet *regs = NULL;
678*437bfbebSnyanmisaka
679*437bfbebSnyanmisaka AVS2D_HAL_TRACE("In.");
680*437bfbebSnyanmisaka
681*437bfbebSnyanmisaka INP_CHECK(ret, NULL == p_hal);
682*437bfbebSnyanmisaka
683*437bfbebSnyanmisaka if ((task->dec.flags.parse_err || task->dec.flags.ref_err) &&
684*437bfbebSnyanmisaka !p_hal->cfg->base.disable_error) {
685*437bfbebSnyanmisaka ret = MPP_NOK;
686*437bfbebSnyanmisaka goto __RETURN;
687*437bfbebSnyanmisaka }
688*437bfbebSnyanmisaka
689*437bfbebSnyanmisaka ret = set_up_colmv_buf(p_hal);
690*437bfbebSnyanmisaka if (ret)
691*437bfbebSnyanmisaka goto __RETURN;
692*437bfbebSnyanmisaka
693*437bfbebSnyanmisaka reg_ctx = (Avs2dVdpu382RegCtx_t *)p_hal->reg_ctx;
694*437bfbebSnyanmisaka
695*437bfbebSnyanmisaka if (p_hal->fast_mode) {
696*437bfbebSnyanmisaka RK_U32 i = 0;
697*437bfbebSnyanmisaka
698*437bfbebSnyanmisaka for (i = 0; i < MPP_ARRAY_ELEMS(reg_ctx->reg_buf); i++) {
699*437bfbebSnyanmisaka if (!reg_ctx->reg_buf[i].valid) {
700*437bfbebSnyanmisaka task->dec.reg_index = i;
701*437bfbebSnyanmisaka regs = reg_ctx->reg_buf[i].regs;
702*437bfbebSnyanmisaka reg_ctx->shph_offset = reg_ctx->reg_buf[i].offset_shph;
703*437bfbebSnyanmisaka reg_ctx->sclst_offset = reg_ctx->reg_buf[i].offset_sclst;
704*437bfbebSnyanmisaka reg_ctx->regs = reg_ctx->reg_buf[i].regs;
705*437bfbebSnyanmisaka reg_ctx->reg_buf[i].valid = 1;
706*437bfbebSnyanmisaka break;
707*437bfbebSnyanmisaka }
708*437bfbebSnyanmisaka }
709*437bfbebSnyanmisaka
710*437bfbebSnyanmisaka mpp_assert(regs);
711*437bfbebSnyanmisaka }
712*437bfbebSnyanmisaka
713*437bfbebSnyanmisaka regs = reg_ctx->regs;
714*437bfbebSnyanmisaka
715*437bfbebSnyanmisaka prepare_header(p_hal, reg_ctx->shph_dat, sizeof(reg_ctx->shph_dat));
716*437bfbebSnyanmisaka prepare_scalist(p_hal, reg_ctx->scalist_dat, sizeof(reg_ctx->scalist_dat));
717*437bfbebSnyanmisaka
718*437bfbebSnyanmisaka ret = fill_registers(p_hal, regs, task);
719*437bfbebSnyanmisaka
720*437bfbebSnyanmisaka if (ret)
721*437bfbebSnyanmisaka goto __RETURN;
722*437bfbebSnyanmisaka
723*437bfbebSnyanmisaka {
724*437bfbebSnyanmisaka memcpy(reg_ctx->bufs_ptr + reg_ctx->shph_offset, reg_ctx->shph_dat, sizeof(reg_ctx->shph_dat));
725*437bfbebSnyanmisaka memcpy(reg_ctx->bufs_ptr + reg_ctx->sclst_offset, reg_ctx->scalist_dat, sizeof(reg_ctx->scalist_dat));
726*437bfbebSnyanmisaka regs->common.reg012.scanlist_addr_valid_en = 1;
727*437bfbebSnyanmisaka
728*437bfbebSnyanmisaka regs->avs2d_addr.head_base = reg_ctx->bufs_fd;
729*437bfbebSnyanmisaka mpp_dev_set_reg_offset(p_hal->dev, 161, reg_ctx->shph_offset);
730*437bfbebSnyanmisaka
731*437bfbebSnyanmisaka regs->avs2d_param.reg105.head_len = AVS2_RKV_SHPH_SIZE / 16;
732*437bfbebSnyanmisaka regs->avs2d_param.reg105.head_len -= (regs->avs2d_param.reg105.head_len > 0) ? 1 : 0;
733*437bfbebSnyanmisaka
734*437bfbebSnyanmisaka regs->avs2d_addr.scanlist_addr = reg_ctx->bufs_fd;
735*437bfbebSnyanmisaka mpp_dev_set_reg_offset(p_hal->dev, 180, reg_ctx->sclst_offset);
736*437bfbebSnyanmisaka }
737*437bfbebSnyanmisaka
738*437bfbebSnyanmisaka if (avs2d_hal_debug & AVS2D_HAL_DBG_IN) {
739*437bfbebSnyanmisaka FILE *fp_shph = NULL;
740*437bfbebSnyanmisaka char name[50];
741*437bfbebSnyanmisaka snprintf(name, sizeof(name), "/data/tmp/rkv_shph_%03d.bin", p_hal->frame_no);
742*437bfbebSnyanmisaka fp_shph = fopen(name, "wb");
743*437bfbebSnyanmisaka fwrite(reg_ctx->bufs_ptr + reg_ctx->shph_offset, 1, sizeof(reg_ctx->shph_dat), fp_shph);
744*437bfbebSnyanmisaka fclose(fp_shph);
745*437bfbebSnyanmisaka }
746*437bfbebSnyanmisaka
747*437bfbebSnyanmisaka if (avs2d_hal_debug & AVS2D_HAL_DBG_IN) {
748*437bfbebSnyanmisaka FILE *fp_scalist = NULL;
749*437bfbebSnyanmisaka char name[50];
750*437bfbebSnyanmisaka snprintf(name, sizeof(name), "/data/tmp/rkv_scalist_%03d.bin", p_hal->frame_no);
751*437bfbebSnyanmisaka fp_scalist = fopen(name, "wb");
752*437bfbebSnyanmisaka fwrite(reg_ctx->bufs_ptr + reg_ctx->sclst_offset, 1, sizeof(reg_ctx->scalist_dat), fp_scalist);
753*437bfbebSnyanmisaka fclose(fp_scalist);
754*437bfbebSnyanmisaka }
755*437bfbebSnyanmisaka
756*437bfbebSnyanmisaka // set rcb
757*437bfbebSnyanmisaka {
758*437bfbebSnyanmisaka hal_avs2d_rcb_info_update(p_hal, regs);
759*437bfbebSnyanmisaka vdpu382_setup_rcb(®s->common_addr, p_hal->dev, p_hal->fast_mode ?
760*437bfbebSnyanmisaka reg_ctx->rcb_buf[task->dec.reg_index] : reg_ctx->rcb_buf[0],
761*437bfbebSnyanmisaka reg_ctx->rcb_info);
762*437bfbebSnyanmisaka
763*437bfbebSnyanmisaka }
764*437bfbebSnyanmisaka
765*437bfbebSnyanmisaka if (avs2d_hal_debug & AVS2D_HAL_DBG_IN) {
766*437bfbebSnyanmisaka FILE *fp_rcb = NULL;
767*437bfbebSnyanmisaka char name[50];
768*437bfbebSnyanmisaka void *base = NULL;
769*437bfbebSnyanmisaka snprintf(name, sizeof(name), "/data/tmp/rkv_rcb_%03d.bin", p_hal->frame_no);
770*437bfbebSnyanmisaka fp_rcb = fopen(name, "wb");
771*437bfbebSnyanmisaka base = mpp_buffer_get_ptr(reg_ctx->rcb_buf[0]);
772*437bfbebSnyanmisaka fwrite(base, 1, reg_ctx->rcb_buf_size, fp_rcb);
773*437bfbebSnyanmisaka fclose(fp_rcb);
774*437bfbebSnyanmisaka
775*437bfbebSnyanmisaka }
776*437bfbebSnyanmisaka
777*437bfbebSnyanmisaka vdpu382_setup_statistic(®s->common, ®s->statistic);
778*437bfbebSnyanmisaka mpp_buffer_sync_end(reg_ctx->bufs);
779*437bfbebSnyanmisaka
780*437bfbebSnyanmisaka /* enable reference frame usage feedback */
781*437bfbebSnyanmisaka regs->statistic.reg265.perf_cnt0_sel = 42;
782*437bfbebSnyanmisaka
783*437bfbebSnyanmisaka __RETURN:
784*437bfbebSnyanmisaka AVS2D_HAL_TRACE("Out. ret %d", ret);
785*437bfbebSnyanmisaka return ret;
786*437bfbebSnyanmisaka }
787*437bfbebSnyanmisaka
hal_avs2d_vdpu382_dump_reg_write(void * hal,Vdpu382Avs2dRegSet * regs)788*437bfbebSnyanmisaka static MPP_RET hal_avs2d_vdpu382_dump_reg_write(void *hal, Vdpu382Avs2dRegSet *regs)
789*437bfbebSnyanmisaka {
790*437bfbebSnyanmisaka MPP_RET ret = MPP_OK;
791*437bfbebSnyanmisaka Avs2dHalCtx_t *p_hal = (Avs2dHalCtx_t *)hal;
792*437bfbebSnyanmisaka FILE *fp_reg = NULL;
793*437bfbebSnyanmisaka RK_U32 i = 0;
794*437bfbebSnyanmisaka char name[50];
795*437bfbebSnyanmisaka snprintf(name, sizeof(name), "/data/tmp/rkv_reg_write_%03d.txt", p_hal->frame_no);
796*437bfbebSnyanmisaka fp_reg = fopen(name , "w+");
797*437bfbebSnyanmisaka
798*437bfbebSnyanmisaka fprintf(fp_reg, "********Frame num %d\n", p_hal->frame_no);
799*437bfbebSnyanmisaka for (i = 0; i < 8; i++)
800*437bfbebSnyanmisaka fprintf(fp_reg, "Write reg[%03d] : 0x%08x\n", i, 0);
801*437bfbebSnyanmisaka
802*437bfbebSnyanmisaka for (i = 0; i < sizeof(Vdpu382RegCommon) / sizeof(RK_U32); i++)
803*437bfbebSnyanmisaka fprintf(fp_reg, "Write reg[%03d] : 0x%08x\n", (RK_U32)(i + OFFSET_COMMON_REGS / sizeof(RK_U32)),
804*437bfbebSnyanmisaka ((RK_U32 *)®s->common)[i]);
805*437bfbebSnyanmisaka
806*437bfbebSnyanmisaka for (i = 0; i < 63 - 32; i++)
807*437bfbebSnyanmisaka fprintf(fp_reg, "Write reg[%03d] : 0x%08x\n", i + 33, 0);
808*437bfbebSnyanmisaka
809*437bfbebSnyanmisaka for (i = 0; i < sizeof(Vdpu382RegAvs2dParam) / sizeof(RK_U32); i++)
810*437bfbebSnyanmisaka fprintf(fp_reg, "Write reg[%03d] : 0x%08x\n", (RK_U32)(i + OFFSET_CODEC_PARAMS_REGS / sizeof(RK_U32)),
811*437bfbebSnyanmisaka ((RK_U32 *)®s->avs2d_param)[i]);
812*437bfbebSnyanmisaka
813*437bfbebSnyanmisaka for (i = 0; i < 127 - 112; i++)
814*437bfbebSnyanmisaka fprintf(fp_reg, "Write reg[%03d] : 0x%08x\n", i + 113, 0);
815*437bfbebSnyanmisaka
816*437bfbebSnyanmisaka for (i = 0; i < sizeof(Vdpu382RegCommonAddr) / sizeof(RK_U32); i++)
817*437bfbebSnyanmisaka fprintf(fp_reg, "Write reg[%03d] : 0x%08x\n", (RK_U32)(i + OFFSET_COMMON_ADDR_REGS / sizeof(RK_U32)),
818*437bfbebSnyanmisaka ((RK_U32 *)®s->common_addr)[i]);
819*437bfbebSnyanmisaka
820*437bfbebSnyanmisaka for (i = 0; i < 159 - 142; i++)
821*437bfbebSnyanmisaka fprintf(fp_reg, "Write reg[%03d] : 0x%08x\n", i + 143, 0);
822*437bfbebSnyanmisaka
823*437bfbebSnyanmisaka
824*437bfbebSnyanmisaka for (i = 0; i < sizeof(Vdpu382RegAvs2dAddr) / sizeof(RK_U32); i++ )
825*437bfbebSnyanmisaka fprintf(fp_reg, "Write reg[%03d] : 0x%08x\n", (RK_U32)(i + OFFSET_CODEC_ADDR_REGS / sizeof(RK_U32)),
826*437bfbebSnyanmisaka ((RK_U32 *)®s->avs2d_addr)[i]);
827*437bfbebSnyanmisaka
828*437bfbebSnyanmisaka for (i = 0; i < 223 - 197; i++)
829*437bfbebSnyanmisaka fprintf(fp_reg, "Write reg[%03d] : 0x%08x\n", i + 198, 0);
830*437bfbebSnyanmisaka
831*437bfbebSnyanmisaka for (i = 0; i < sizeof(Vdpu382RegIrqStatus) / sizeof(RK_U32); i++ )
832*437bfbebSnyanmisaka fprintf(fp_reg, "Write reg[%03d] : 0x%08x\n", (RK_U32)(i + OFFSET_INTERRUPT_REGS / sizeof(RK_U32)),
833*437bfbebSnyanmisaka ((RK_U32 *)®s->irq_status)[i]);
834*437bfbebSnyanmisaka
835*437bfbebSnyanmisaka for (i = 0; i < 255 - 237; i++)
836*437bfbebSnyanmisaka fprintf(fp_reg, "Write reg[%03d] : 0x%08x\n", i + 238, 0);
837*437bfbebSnyanmisaka
838*437bfbebSnyanmisaka for (i = 0; i < sizeof(Vdpu382RegStatistic) / sizeof(RK_U32); i++ )
839*437bfbebSnyanmisaka fprintf(fp_reg, "Write reg[%03d] : 0x%08x\n", (RK_U32)(i + OFFSET_STATISTIC_REGS / sizeof(RK_U32)),
840*437bfbebSnyanmisaka ((RK_U32 *)®s->statistic)[i]);
841*437bfbebSnyanmisaka
842*437bfbebSnyanmisaka fclose(fp_reg);
843*437bfbebSnyanmisaka return ret;
844*437bfbebSnyanmisaka }
845*437bfbebSnyanmisaka
hal_avs2d_vdpu382_dump_stream(void * hal,HalTaskInfo * task)846*437bfbebSnyanmisaka static MPP_RET hal_avs2d_vdpu382_dump_stream(void *hal, HalTaskInfo *task)
847*437bfbebSnyanmisaka {
848*437bfbebSnyanmisaka MPP_RET ret = MPP_OK;
849*437bfbebSnyanmisaka Avs2dHalCtx_t *p_hal = (Avs2dHalCtx_t *)hal;
850*437bfbebSnyanmisaka
851*437bfbebSnyanmisaka FILE *fp_stream = NULL;
852*437bfbebSnyanmisaka char name[50];
853*437bfbebSnyanmisaka MppBuffer buffer = NULL;
854*437bfbebSnyanmisaka void *base = NULL;
855*437bfbebSnyanmisaka mpp_buf_slot_get_prop(p_hal->packet_slots, task->dec.input, SLOT_BUFFER, &buffer);
856*437bfbebSnyanmisaka base = mpp_buffer_get_ptr(buffer);
857*437bfbebSnyanmisaka snprintf(name, sizeof(name), "/data/tmp/rkv_stream_in_%03d.bin", p_hal->frame_no);
858*437bfbebSnyanmisaka fp_stream = fopen(name, "wb");
859*437bfbebSnyanmisaka fwrite(base, 1, mpp_packet_get_length(task->dec.input_packet), fp_stream);
860*437bfbebSnyanmisaka fclose(fp_stream);
861*437bfbebSnyanmisaka
862*437bfbebSnyanmisaka return ret;
863*437bfbebSnyanmisaka }
864*437bfbebSnyanmisaka
hal_avs2d_vdpu382_start(void * hal,HalTaskInfo * task)865*437bfbebSnyanmisaka MPP_RET hal_avs2d_vdpu382_start(void *hal, HalTaskInfo *task)
866*437bfbebSnyanmisaka {
867*437bfbebSnyanmisaka MPP_RET ret = MPP_OK;
868*437bfbebSnyanmisaka Vdpu382Avs2dRegSet *regs = NULL;
869*437bfbebSnyanmisaka Avs2dVdpu382RegCtx_t *reg_ctx;
870*437bfbebSnyanmisaka MppDev dev = NULL;
871*437bfbebSnyanmisaka Avs2dHalCtx_t *p_hal = (Avs2dHalCtx_t *)hal;
872*437bfbebSnyanmisaka
873*437bfbebSnyanmisaka AVS2D_HAL_TRACE("In.");
874*437bfbebSnyanmisaka INP_CHECK(ret, NULL == p_hal);
875*437bfbebSnyanmisaka
876*437bfbebSnyanmisaka if ((task->dec.flags.parse_err || task->dec.flags.ref_err) &&
877*437bfbebSnyanmisaka !p_hal->cfg->base.disable_error) {
878*437bfbebSnyanmisaka ret = MPP_NOK;
879*437bfbebSnyanmisaka goto __RETURN;
880*437bfbebSnyanmisaka }
881*437bfbebSnyanmisaka
882*437bfbebSnyanmisaka reg_ctx = (Avs2dVdpu382RegCtx_t *)p_hal->reg_ctx;
883*437bfbebSnyanmisaka regs = p_hal->fast_mode ? reg_ctx->reg_buf[task->dec.reg_index].regs : reg_ctx->regs;
884*437bfbebSnyanmisaka dev = p_hal->dev;
885*437bfbebSnyanmisaka
886*437bfbebSnyanmisaka p_hal->frame_no++;
887*437bfbebSnyanmisaka
888*437bfbebSnyanmisaka do {
889*437bfbebSnyanmisaka MppDevRegWrCfg wr_cfg;
890*437bfbebSnyanmisaka MppDevRegRdCfg rd_cfg;
891*437bfbebSnyanmisaka
892*437bfbebSnyanmisaka wr_cfg.reg = ®s->common;
893*437bfbebSnyanmisaka wr_cfg.size = sizeof(regs->common);
894*437bfbebSnyanmisaka wr_cfg.offset = OFFSET_COMMON_REGS;
895*437bfbebSnyanmisaka
896*437bfbebSnyanmisaka ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &wr_cfg);
897*437bfbebSnyanmisaka
898*437bfbebSnyanmisaka if (ret) {
899*437bfbebSnyanmisaka mpp_err_f("set register write failed %d\n", ret);
900*437bfbebSnyanmisaka break;
901*437bfbebSnyanmisaka }
902*437bfbebSnyanmisaka
903*437bfbebSnyanmisaka wr_cfg.reg = ®s->avs2d_param;
904*437bfbebSnyanmisaka wr_cfg.size = sizeof(regs->avs2d_param);
905*437bfbebSnyanmisaka wr_cfg.offset = OFFSET_CODEC_PARAMS_REGS;
906*437bfbebSnyanmisaka
907*437bfbebSnyanmisaka ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &wr_cfg);
908*437bfbebSnyanmisaka
909*437bfbebSnyanmisaka if (ret) {
910*437bfbebSnyanmisaka mpp_err_f("set register write failed %d\n", ret);
911*437bfbebSnyanmisaka break;
912*437bfbebSnyanmisaka }
913*437bfbebSnyanmisaka
914*437bfbebSnyanmisaka wr_cfg.reg = ®s->common_addr;
915*437bfbebSnyanmisaka wr_cfg.size = sizeof(regs->common_addr);
916*437bfbebSnyanmisaka wr_cfg.offset = OFFSET_COMMON_ADDR_REGS;
917*437bfbebSnyanmisaka
918*437bfbebSnyanmisaka ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &wr_cfg);
919*437bfbebSnyanmisaka
920*437bfbebSnyanmisaka if (ret) {
921*437bfbebSnyanmisaka mpp_err_f("set register write failed %d\n", ret);
922*437bfbebSnyanmisaka break;
923*437bfbebSnyanmisaka }
924*437bfbebSnyanmisaka
925*437bfbebSnyanmisaka wr_cfg.reg = ®s->avs2d_addr;
926*437bfbebSnyanmisaka wr_cfg.size = sizeof(regs->avs2d_addr);
927*437bfbebSnyanmisaka wr_cfg.offset = OFFSET_CODEC_ADDR_REGS;
928*437bfbebSnyanmisaka
929*437bfbebSnyanmisaka ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &wr_cfg);
930*437bfbebSnyanmisaka
931*437bfbebSnyanmisaka if (ret) {
932*437bfbebSnyanmisaka mpp_err_f("set register write failed %d\n", ret);
933*437bfbebSnyanmisaka break;
934*437bfbebSnyanmisaka }
935*437bfbebSnyanmisaka
936*437bfbebSnyanmisaka wr_cfg.reg = ®s->statistic;
937*437bfbebSnyanmisaka wr_cfg.size = sizeof(regs->statistic);
938*437bfbebSnyanmisaka wr_cfg.offset = OFFSET_STATISTIC_REGS;
939*437bfbebSnyanmisaka ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &wr_cfg);
940*437bfbebSnyanmisaka
941*437bfbebSnyanmisaka if (ret) {
942*437bfbebSnyanmisaka mpp_err_f("set register write failed %d\n", ret);
943*437bfbebSnyanmisaka break;
944*437bfbebSnyanmisaka }
945*437bfbebSnyanmisaka
946*437bfbebSnyanmisaka rd_cfg.reg = ®s->irq_status;
947*437bfbebSnyanmisaka rd_cfg.size = sizeof(regs->irq_status);
948*437bfbebSnyanmisaka rd_cfg.offset = OFFSET_INTERRUPT_REGS;
949*437bfbebSnyanmisaka ret = mpp_dev_ioctl(dev, MPP_DEV_REG_RD, &rd_cfg);
950*437bfbebSnyanmisaka
951*437bfbebSnyanmisaka if (ret) {
952*437bfbebSnyanmisaka mpp_err_f("set register read failed %d\n", ret);
953*437bfbebSnyanmisaka break;
954*437bfbebSnyanmisaka }
955*437bfbebSnyanmisaka
956*437bfbebSnyanmisaka rd_cfg.reg = ®s->avs2d_param;
957*437bfbebSnyanmisaka rd_cfg.size = sizeof(regs->avs2d_param);
958*437bfbebSnyanmisaka rd_cfg.offset = OFFSET_CODEC_PARAMS_REGS;
959*437bfbebSnyanmisaka ret = mpp_dev_ioctl(dev, MPP_DEV_REG_RD, &rd_cfg);
960*437bfbebSnyanmisaka
961*437bfbebSnyanmisaka if (ret) {
962*437bfbebSnyanmisaka mpp_err_f("set register read failed %d\n", ret);
963*437bfbebSnyanmisaka break;
964*437bfbebSnyanmisaka }
965*437bfbebSnyanmisaka
966*437bfbebSnyanmisaka rd_cfg.reg = ®s->statistic;
967*437bfbebSnyanmisaka rd_cfg.size = sizeof(regs->statistic);
968*437bfbebSnyanmisaka rd_cfg.offset = OFFSET_STATISTIC_REGS;
969*437bfbebSnyanmisaka ret = mpp_dev_ioctl(dev, MPP_DEV_REG_RD, &rd_cfg);
970*437bfbebSnyanmisaka
971*437bfbebSnyanmisaka if (ret) {
972*437bfbebSnyanmisaka mpp_err_f("set register write failed %d\n", ret);
973*437bfbebSnyanmisaka break;
974*437bfbebSnyanmisaka }
975*437bfbebSnyanmisaka
976*437bfbebSnyanmisaka if (avs2d_hal_debug & AVS2D_HAL_DBG_REG) {
977*437bfbebSnyanmisaka memset(reg_ctx->reg_out, 0, sizeof(reg_ctx->reg_out));
978*437bfbebSnyanmisaka rd_cfg.reg = reg_ctx->reg_out;
979*437bfbebSnyanmisaka rd_cfg.size = sizeof(reg_ctx->reg_out);
980*437bfbebSnyanmisaka rd_cfg.offset = 0;
981*437bfbebSnyanmisaka ret = mpp_dev_ioctl(dev, MPP_DEV_REG_RD, &rd_cfg);
982*437bfbebSnyanmisaka }
983*437bfbebSnyanmisaka
984*437bfbebSnyanmisaka // rcb info for sram
985*437bfbebSnyanmisaka vdpu382_set_rcbinfo(dev, reg_ctx->rcb_info);
986*437bfbebSnyanmisaka
987*437bfbebSnyanmisaka if (avs2d_hal_debug & AVS2D_HAL_DBG_IN)
988*437bfbebSnyanmisaka hal_avs2d_vdpu382_dump_stream(hal, task);
989*437bfbebSnyanmisaka
990*437bfbebSnyanmisaka if (avs2d_hal_debug & AVS2D_HAL_DBG_REG)
991*437bfbebSnyanmisaka hal_avs2d_vdpu382_dump_reg_write(hal, regs);
992*437bfbebSnyanmisaka
993*437bfbebSnyanmisaka // send request to hardware
994*437bfbebSnyanmisaka ret = mpp_dev_ioctl(dev, MPP_DEV_CMD_SEND, NULL);
995*437bfbebSnyanmisaka if (ret) {
996*437bfbebSnyanmisaka mpp_err_f("send cmd failed %d\n", ret);
997*437bfbebSnyanmisaka break;
998*437bfbebSnyanmisaka }
999*437bfbebSnyanmisaka
1000*437bfbebSnyanmisaka } while (0);
1001*437bfbebSnyanmisaka
1002*437bfbebSnyanmisaka __RETURN:
1003*437bfbebSnyanmisaka AVS2D_HAL_TRACE("Out.");
1004*437bfbebSnyanmisaka return ret;
1005*437bfbebSnyanmisaka }
1006*437bfbebSnyanmisaka
1007*437bfbebSnyanmisaka
fetch_data(RK_U32 fmt,RK_U8 * line,RK_U32 num)1008*437bfbebSnyanmisaka static RK_U8 fetch_data(RK_U32 fmt, RK_U8 *line, RK_U32 num)
1009*437bfbebSnyanmisaka {
1010*437bfbebSnyanmisaka RK_U32 offset = 0;
1011*437bfbebSnyanmisaka RK_U32 value = 0;
1012*437bfbebSnyanmisaka
1013*437bfbebSnyanmisaka if (fmt == MPP_FMT_YUV420SP_10BIT) {
1014*437bfbebSnyanmisaka offset = (num * 2) & 7;
1015*437bfbebSnyanmisaka value = (line[num * 10 / 8] >> offset) |
1016*437bfbebSnyanmisaka (line[num * 10 / 8 + 1] << (8 - offset));
1017*437bfbebSnyanmisaka
1018*437bfbebSnyanmisaka value = (value & 0x3ff) >> 2;
1019*437bfbebSnyanmisaka } else if (fmt == MPP_FMT_YUV420SP) {
1020*437bfbebSnyanmisaka value = line[num];
1021*437bfbebSnyanmisaka }
1022*437bfbebSnyanmisaka
1023*437bfbebSnyanmisaka return value;
1024*437bfbebSnyanmisaka }
1025*437bfbebSnyanmisaka
hal_avs2d_vdpu382_dump_yuv(void * hal,HalTaskInfo * task)1026*437bfbebSnyanmisaka static MPP_RET hal_avs2d_vdpu382_dump_yuv(void *hal, HalTaskInfo *task)
1027*437bfbebSnyanmisaka {
1028*437bfbebSnyanmisaka MPP_RET ret = MPP_OK;
1029*437bfbebSnyanmisaka Avs2dHalCtx_t *p_hal = (Avs2dHalCtx_t *)hal;
1030*437bfbebSnyanmisaka
1031*437bfbebSnyanmisaka MppFrameFormat fmt = MPP_FMT_YUV420SP;
1032*437bfbebSnyanmisaka RK_U32 vir_w = 0;
1033*437bfbebSnyanmisaka RK_U32 vir_h = 0;
1034*437bfbebSnyanmisaka RK_U32 i = 0;
1035*437bfbebSnyanmisaka RK_U32 j = 0;
1036*437bfbebSnyanmisaka FILE *fp_stream = NULL;
1037*437bfbebSnyanmisaka char name[50];
1038*437bfbebSnyanmisaka MppBuffer buffer = NULL;
1039*437bfbebSnyanmisaka MppFrame frame;
1040*437bfbebSnyanmisaka void *base = NULL;
1041*437bfbebSnyanmisaka
1042*437bfbebSnyanmisaka ret = mpp_buf_slot_get_prop(p_hal->frame_slots, task->dec.output, SLOT_FRAME_PTR, &frame);
1043*437bfbebSnyanmisaka
1044*437bfbebSnyanmisaka if (ret != MPP_OK || frame == NULL)
1045*437bfbebSnyanmisaka mpp_log_f("failed to get frame slot %d", task->dec.output);
1046*437bfbebSnyanmisaka
1047*437bfbebSnyanmisaka ret = mpp_buf_slot_get_prop(p_hal->frame_slots, task->dec.output, SLOT_BUFFER, &buffer);
1048*437bfbebSnyanmisaka
1049*437bfbebSnyanmisaka if (ret != MPP_OK || buffer == NULL)
1050*437bfbebSnyanmisaka mpp_log_f("failed to get frame buffer slot %d", task->dec.output);
1051*437bfbebSnyanmisaka
1052*437bfbebSnyanmisaka AVS2D_HAL_TRACE("frame slot %d, fd %d\n", task->dec.output, mpp_buffer_get_fd(buffer));
1053*437bfbebSnyanmisaka base = mpp_buffer_get_ptr(buffer);
1054*437bfbebSnyanmisaka vir_w = mpp_frame_get_hor_stride(frame);
1055*437bfbebSnyanmisaka vir_h = mpp_frame_get_ver_stride(frame);
1056*437bfbebSnyanmisaka fmt = mpp_frame_get_fmt(frame);
1057*437bfbebSnyanmisaka snprintf(name, sizeof(name), "/data/tmp/rkv_out_%dx%d_nv12_%03d.yuv", vir_w, vir_h,
1058*437bfbebSnyanmisaka p_hal->frame_no);
1059*437bfbebSnyanmisaka fp_stream = fopen(name, "wb");
1060*437bfbebSnyanmisaka /* if format is fbc, write fbc header first */
1061*437bfbebSnyanmisaka if (MPP_FRAME_FMT_IS_FBC(fmt)) {
1062*437bfbebSnyanmisaka RK_U32 header_size = 0;
1063*437bfbebSnyanmisaka
1064*437bfbebSnyanmisaka header_size = vir_w * vir_h / 16;
1065*437bfbebSnyanmisaka fwrite(base, 1, header_size, fp_stream);
1066*437bfbebSnyanmisaka base += header_size;
1067*437bfbebSnyanmisaka }
1068*437bfbebSnyanmisaka
1069*437bfbebSnyanmisaka if (fmt != MPP_FMT_YUV420SP_10BIT) {
1070*437bfbebSnyanmisaka fwrite(base, 1, vir_w * vir_h * 3 / 2, fp_stream);
1071*437bfbebSnyanmisaka } else {
1072*437bfbebSnyanmisaka RK_U8 tmp = 0;
1073*437bfbebSnyanmisaka for (i = 0; i < vir_h; i++) {
1074*437bfbebSnyanmisaka for (j = 0; j < vir_w; j++) {
1075*437bfbebSnyanmisaka tmp = fetch_data(fmt, base, j);
1076*437bfbebSnyanmisaka fwrite(&tmp, 1, 1, fp_stream);
1077*437bfbebSnyanmisaka }
1078*437bfbebSnyanmisaka base += vir_w;
1079*437bfbebSnyanmisaka }
1080*437bfbebSnyanmisaka
1081*437bfbebSnyanmisaka for (i = 0; i < vir_h / 2; i++) {
1082*437bfbebSnyanmisaka for (j = 0; j < vir_w; j++) {
1083*437bfbebSnyanmisaka tmp = fetch_data(fmt, base, j);
1084*437bfbebSnyanmisaka fwrite(&tmp, 1, 1, fp_stream);
1085*437bfbebSnyanmisaka }
1086*437bfbebSnyanmisaka base += vir_w;
1087*437bfbebSnyanmisaka }
1088*437bfbebSnyanmisaka }
1089*437bfbebSnyanmisaka fclose(fp_stream);
1090*437bfbebSnyanmisaka
1091*437bfbebSnyanmisaka return ret;
1092*437bfbebSnyanmisaka }
1093*437bfbebSnyanmisaka
hal_avs2d_vdpu382_wait(void * hal,HalTaskInfo * task)1094*437bfbebSnyanmisaka MPP_RET hal_avs2d_vdpu382_wait(void *hal, HalTaskInfo *task)
1095*437bfbebSnyanmisaka {
1096*437bfbebSnyanmisaka MPP_RET ret = MPP_OK;
1097*437bfbebSnyanmisaka Avs2dHalCtx_t *p_hal = (Avs2dHalCtx_t *)hal;
1098*437bfbebSnyanmisaka Avs2dVdpu382RegCtx_t *reg_ctx;
1099*437bfbebSnyanmisaka Vdpu382Avs2dRegSet *p_regs;
1100*437bfbebSnyanmisaka
1101*437bfbebSnyanmisaka INP_CHECK(ret, NULL == p_hal);
1102*437bfbebSnyanmisaka reg_ctx = (Avs2dVdpu382RegCtx_t *)p_hal->reg_ctx;
1103*437bfbebSnyanmisaka p_regs = p_hal->fast_mode ? reg_ctx->reg_buf[task->dec.reg_index].regs : reg_ctx->regs;
1104*437bfbebSnyanmisaka
1105*437bfbebSnyanmisaka if ((task->dec.flags.parse_err || task->dec.flags.ref_err) &&
1106*437bfbebSnyanmisaka !p_hal->cfg->base.disable_error) {
1107*437bfbebSnyanmisaka AVS2D_HAL_DBG(AVS2D_HAL_DBG_ERROR, "found task error.\n");
1108*437bfbebSnyanmisaka ret = MPP_NOK;
1109*437bfbebSnyanmisaka goto __RETURN;
1110*437bfbebSnyanmisaka } else {
1111*437bfbebSnyanmisaka ret = mpp_dev_ioctl(p_hal->dev, MPP_DEV_CMD_POLL, NULL);
1112*437bfbebSnyanmisaka if (ret)
1113*437bfbebSnyanmisaka mpp_err_f("poll cmd failed %d\n", ret);
1114*437bfbebSnyanmisaka }
1115*437bfbebSnyanmisaka
1116*437bfbebSnyanmisaka if (avs2d_hal_debug & AVS2D_HAL_DBG_OUT)
1117*437bfbebSnyanmisaka hal_avs2d_vdpu382_dump_yuv(hal, task);
1118*437bfbebSnyanmisaka
1119*437bfbebSnyanmisaka if (avs2d_hal_debug & AVS2D_HAL_DBG_REG) {
1120*437bfbebSnyanmisaka FILE *fp_reg = NULL;
1121*437bfbebSnyanmisaka RK_U32 i = 0;
1122*437bfbebSnyanmisaka char name[50];
1123*437bfbebSnyanmisaka snprintf(name, sizeof(name), "/data/tmp/rkv_reg_read_%03d.txt", p_hal->frame_no);
1124*437bfbebSnyanmisaka fp_reg = fopen(name , "w+");
1125*437bfbebSnyanmisaka
1126*437bfbebSnyanmisaka for (i = 0; i < 278; i++)
1127*437bfbebSnyanmisaka fprintf(fp_reg, "%08x\n", reg_ctx->reg_out[i]);
1128*437bfbebSnyanmisaka
1129*437bfbebSnyanmisaka fclose(fp_reg);
1130*437bfbebSnyanmisaka }
1131*437bfbebSnyanmisaka
1132*437bfbebSnyanmisaka AVS2D_HAL_TRACE("read reg[224] 0x%08x\n", p_regs->irq_status.reg224);
1133*437bfbebSnyanmisaka
1134*437bfbebSnyanmisaka if (p_hal->dec_cb) {
1135*437bfbebSnyanmisaka DecCbHalDone param;
1136*437bfbebSnyanmisaka
1137*437bfbebSnyanmisaka param.task = (void *)&task->dec;
1138*437bfbebSnyanmisaka param.regs = (RK_U32 *)p_regs;
1139*437bfbebSnyanmisaka
1140*437bfbebSnyanmisaka if (p_regs->irq_status.reg224.dec_error_sta ||
1141*437bfbebSnyanmisaka (!p_regs->irq_status.reg224.dec_rdy_sta) ||
1142*437bfbebSnyanmisaka p_regs->irq_status.reg224.buf_empty_sta ||
1143*437bfbebSnyanmisaka p_regs->irq_status.reg226.strmd_error_status ||
1144*437bfbebSnyanmisaka p_regs->irq_status.reg227.colmv_error_ref_picidx ||
1145*437bfbebSnyanmisaka p_regs->irq_status.reg226.strmd_detect_error_flag)
1146*437bfbebSnyanmisaka param.hard_err = 1;
1147*437bfbebSnyanmisaka else
1148*437bfbebSnyanmisaka param.hard_err = 0;
1149*437bfbebSnyanmisaka
1150*437bfbebSnyanmisaka task->dec.flags.ref_used = p_regs->statistic.reg265.link_perf_cnt0;
1151*437bfbebSnyanmisaka task->dec.flags.ref_info_valid = 1;
1152*437bfbebSnyanmisaka
1153*437bfbebSnyanmisaka if (task->dec.flags.ref_miss) {
1154*437bfbebSnyanmisaka RK_U32 ref_hw_usage = p_regs->statistic.reg265.link_perf_cnt0;
1155*437bfbebSnyanmisaka
1156*437bfbebSnyanmisaka AVS2D_HAL_TRACE("hal frame %d ref miss %x hard_err %d hw_usage %x", p_hal->frame_no,
1157*437bfbebSnyanmisaka task->dec.flags.ref_miss, param.hard_err, ref_hw_usage);
1158*437bfbebSnyanmisaka }
1159*437bfbebSnyanmisaka
1160*437bfbebSnyanmisaka AVS2D_HAL_TRACE("hal frame %d hard_err= %d", p_hal->frame_no, param.hard_err);
1161*437bfbebSnyanmisaka
1162*437bfbebSnyanmisaka mpp_callback(p_hal->dec_cb, ¶m);
1163*437bfbebSnyanmisaka }
1164*437bfbebSnyanmisaka
1165*437bfbebSnyanmisaka memset(&p_regs->irq_status.reg224, 0, sizeof(RK_U32));
1166*437bfbebSnyanmisaka
1167*437bfbebSnyanmisaka if (p_hal->fast_mode)
1168*437bfbebSnyanmisaka reg_ctx->reg_buf[task->dec.reg_index].valid = 0;
1169*437bfbebSnyanmisaka
1170*437bfbebSnyanmisaka __RETURN:
1171*437bfbebSnyanmisaka AVS2D_HAL_TRACE("Out. ret %d", ret);
1172*437bfbebSnyanmisaka return ret;
1173*437bfbebSnyanmisaka }
1174*437bfbebSnyanmisaka
1175*437bfbebSnyanmisaka const MppHalApi hal_avs2d_vdpu382 = {
1176*437bfbebSnyanmisaka .name = "avs2d_vdpu382",
1177*437bfbebSnyanmisaka .type = MPP_CTX_DEC,
1178*437bfbebSnyanmisaka .coding = MPP_VIDEO_CodingAVS2,
1179*437bfbebSnyanmisaka .ctx_size = sizeof(Avs2dVdpu382RegCtx_t),
1180*437bfbebSnyanmisaka .flag = 0,
1181*437bfbebSnyanmisaka .init = hal_avs2d_vdpu382_init,
1182*437bfbebSnyanmisaka .deinit = hal_avs2d_vdpu382_deinit,
1183*437bfbebSnyanmisaka .reg_gen = hal_avs2d_vdpu382_gen_regs,
1184*437bfbebSnyanmisaka .start = hal_avs2d_vdpu382_start,
1185*437bfbebSnyanmisaka .wait = hal_avs2d_vdpu382_wait,
1186*437bfbebSnyanmisaka .reset = NULL,
1187*437bfbebSnyanmisaka .flush = NULL,
1188*437bfbebSnyanmisaka .control = NULL,
1189*437bfbebSnyanmisaka };
1190