1*437bfbebSnyanmisaka /* SPDX-License-Identifier: Apache-2.0 OR MIT */
2*437bfbebSnyanmisaka /*
3*437bfbebSnyanmisaka * Copyright (c) 2024 Rockchip Electronics Co., Ltd.
4*437bfbebSnyanmisaka */
5*437bfbebSnyanmisaka
6*437bfbebSnyanmisaka #define MODULE_TAG "hal_vp9d_vdpu383"
7*437bfbebSnyanmisaka
8*437bfbebSnyanmisaka #include <string.h>
9*437bfbebSnyanmisaka
10*437bfbebSnyanmisaka #include "mpp_debug.h"
11*437bfbebSnyanmisaka #include "mpp_env.h"
12*437bfbebSnyanmisaka #include "mpp_mem.h"
13*437bfbebSnyanmisaka #include "mpp_common.h"
14*437bfbebSnyanmisaka #include "mpp_buffer_impl.h"
15*437bfbebSnyanmisaka #include "mpp_bitput.h"
16*437bfbebSnyanmisaka #include "mpp_compat_impl.h"
17*437bfbebSnyanmisaka
18*437bfbebSnyanmisaka #include "hal_vp9d_debug.h"
19*437bfbebSnyanmisaka #include "hal_vp9d_com.h"
20*437bfbebSnyanmisaka #include "hal_vp9d_vdpu383.h"
21*437bfbebSnyanmisaka #include "hal_vp9d_ctx.h"
22*437bfbebSnyanmisaka #include "vdpu383_vp9d.h"
23*437bfbebSnyanmisaka #include "vp9d_syntax.h"
24*437bfbebSnyanmisaka
25*437bfbebSnyanmisaka #define HW_PROB 1
26*437bfbebSnyanmisaka #define VP9_CONTEXT 4
27*437bfbebSnyanmisaka #define VP9_CTU_SIZE 64
28*437bfbebSnyanmisaka
29*437bfbebSnyanmisaka #define GBL_SIZE 2 * (MPP_ALIGN(1299, 128) / 8)
30*437bfbebSnyanmisaka
31*437bfbebSnyanmisaka #define EIGHTTAP 0
32*437bfbebSnyanmisaka #define EIGHTTAP_SMOOTH 1
33*437bfbebSnyanmisaka #define EIGHTTAP_SHARP 2
34*437bfbebSnyanmisaka #define BILINEAR 3
35*437bfbebSnyanmisaka
36*437bfbebSnyanmisaka const RK_U8 literal_to_filter[] = { EIGHTTAP_SMOOTH, EIGHTTAP,
37*437bfbebSnyanmisaka EIGHTTAP_SHARP, BILINEAR
38*437bfbebSnyanmisaka };
39*437bfbebSnyanmisaka
40*437bfbebSnyanmisaka typedef struct Vdpu383Vp9dCtx_t {
41*437bfbebSnyanmisaka Vp9dRegBuf g_buf[MAX_GEN_REG];
42*437bfbebSnyanmisaka MppBuffer global_base;
43*437bfbebSnyanmisaka MppBuffer probe_base;
44*437bfbebSnyanmisaka MppBuffer count_base;
45*437bfbebSnyanmisaka MppBuffer segid_cur_base;
46*437bfbebSnyanmisaka MppBuffer segid_last_base;
47*437bfbebSnyanmisaka MppBuffer prob_default_base;
48*437bfbebSnyanmisaka void* hw_regs;
49*437bfbebSnyanmisaka RK_S32 mv_base_addr;
50*437bfbebSnyanmisaka RK_S32 pre_mv_base_addr;
51*437bfbebSnyanmisaka Vp9dLastInfo ls_info;
52*437bfbebSnyanmisaka /*
53*437bfbebSnyanmisaka * swap between segid_cur_base & segid_last_base
54*437bfbebSnyanmisaka * 0 used segid_cur_base as last
55*437bfbebSnyanmisaka * 1 used segid_last_base as
56*437bfbebSnyanmisaka */
57*437bfbebSnyanmisaka RK_U32 last_segid_flag;
58*437bfbebSnyanmisaka RK_S32 width;
59*437bfbebSnyanmisaka RK_S32 height;
60*437bfbebSnyanmisaka /* rcb buffers info */
61*437bfbebSnyanmisaka RK_S32 rcb_buf_size;
62*437bfbebSnyanmisaka Vdpu383RcbInfo rcb_info[RCB_BUF_COUNT];
63*437bfbebSnyanmisaka MppBuffer rcb_buf;
64*437bfbebSnyanmisaka RK_U32 num_row_tiles;
65*437bfbebSnyanmisaka RK_U32 bit_depth;
66*437bfbebSnyanmisaka /* colmv buffers info */
67*437bfbebSnyanmisaka HalBufs cmv_bufs;
68*437bfbebSnyanmisaka RK_S32 mv_size;
69*437bfbebSnyanmisaka RK_S32 mv_count;
70*437bfbebSnyanmisaka HalBufs origin_bufs;
71*437bfbebSnyanmisaka RK_U32 prob_ctx_valid[VP9_CONTEXT];
72*437bfbebSnyanmisaka MppBuffer prob_loop_base[VP9_CONTEXT];
73*437bfbebSnyanmisaka /* uncompress header data */
74*437bfbebSnyanmisaka RK_U8 header_data[168];
75*437bfbebSnyanmisaka } Vdpu383Vp9dCtx;
76*437bfbebSnyanmisaka
77*437bfbebSnyanmisaka #ifdef DUMP_VDPU383_DATAS
78*437bfbebSnyanmisaka static RK_U32 cur_last_segid_flag;
79*437bfbebSnyanmisaka static MppBuffer cur_last_prob_base;
80*437bfbebSnyanmisaka #endif
81*437bfbebSnyanmisaka
vdpu383_setup_scale_origin_bufs(Vdpu383Vp9dCtx * ctx,MppFrame mframe)82*437bfbebSnyanmisaka static MPP_RET vdpu383_setup_scale_origin_bufs(Vdpu383Vp9dCtx *ctx, MppFrame mframe)
83*437bfbebSnyanmisaka {
84*437bfbebSnyanmisaka /* for 8K FrameBuf scale mode */
85*437bfbebSnyanmisaka size_t origin_buf_size = 0;
86*437bfbebSnyanmisaka
87*437bfbebSnyanmisaka origin_buf_size = mpp_frame_get_buf_size(mframe);
88*437bfbebSnyanmisaka
89*437bfbebSnyanmisaka if (!origin_buf_size) {
90*437bfbebSnyanmisaka mpp_err_f("origin_bufs get buf size failed\n");
91*437bfbebSnyanmisaka return MPP_NOK;
92*437bfbebSnyanmisaka }
93*437bfbebSnyanmisaka if (ctx->origin_bufs) {
94*437bfbebSnyanmisaka hal_bufs_deinit(ctx->origin_bufs);
95*437bfbebSnyanmisaka ctx->origin_bufs = NULL;
96*437bfbebSnyanmisaka }
97*437bfbebSnyanmisaka hal_bufs_init(&ctx->origin_bufs);
98*437bfbebSnyanmisaka if (!ctx->origin_bufs) {
99*437bfbebSnyanmisaka mpp_err_f("origin_bufs thumb init fail\n");
100*437bfbebSnyanmisaka return MPP_ERR_NOMEM;
101*437bfbebSnyanmisaka }
102*437bfbebSnyanmisaka hal_bufs_setup(ctx->origin_bufs, 16, 1, &origin_buf_size);
103*437bfbebSnyanmisaka
104*437bfbebSnyanmisaka return MPP_OK;
105*437bfbebSnyanmisaka }
hal_vp9d_alloc_res(HalVp9dCtx * hal)106*437bfbebSnyanmisaka static MPP_RET hal_vp9d_alloc_res(HalVp9dCtx *hal)
107*437bfbebSnyanmisaka {
108*437bfbebSnyanmisaka HalVp9dCtx *p_hal = (HalVp9dCtx*)hal;
109*437bfbebSnyanmisaka Vdpu383Vp9dCtx *hw_ctx = (Vdpu383Vp9dCtx*)p_hal->hw_ctx;
110*437bfbebSnyanmisaka RK_S32 ret = 0;
111*437bfbebSnyanmisaka RK_S32 i = 0;
112*437bfbebSnyanmisaka
113*437bfbebSnyanmisaka /* alloc common buffer */
114*437bfbebSnyanmisaka for (i = 0; i < VP9_CONTEXT; i++) {
115*437bfbebSnyanmisaka ret = mpp_buffer_get(p_hal->group, &hw_ctx->prob_loop_base[i], PROB_SIZE);
116*437bfbebSnyanmisaka if (ret) {
117*437bfbebSnyanmisaka mpp_err("vp9 probe_loop_base get buffer failed\n");
118*437bfbebSnyanmisaka return ret;
119*437bfbebSnyanmisaka }
120*437bfbebSnyanmisaka mpp_buffer_attach_dev(hw_ctx->prob_loop_base[i], p_hal->dev);
121*437bfbebSnyanmisaka }
122*437bfbebSnyanmisaka ret = mpp_buffer_get(p_hal->group, &hw_ctx->prob_default_base, PROB_SIZE);
123*437bfbebSnyanmisaka if (ret) {
124*437bfbebSnyanmisaka mpp_err("vp9 probe_default_base get buffer failed\n");
125*437bfbebSnyanmisaka return ret;
126*437bfbebSnyanmisaka }
127*437bfbebSnyanmisaka mpp_buffer_attach_dev(hw_ctx->prob_default_base, p_hal->dev);
128*437bfbebSnyanmisaka
129*437bfbebSnyanmisaka ret = mpp_buffer_get(p_hal->group, &hw_ctx->segid_cur_base, MAX_SEGMAP_SIZE);
130*437bfbebSnyanmisaka if (ret) {
131*437bfbebSnyanmisaka mpp_err("vp9 segid_cur_base get buffer failed\n");
132*437bfbebSnyanmisaka return ret;
133*437bfbebSnyanmisaka }
134*437bfbebSnyanmisaka mpp_buffer_attach_dev(hw_ctx->segid_cur_base, p_hal->dev);
135*437bfbebSnyanmisaka ret = mpp_buffer_get(p_hal->group, &hw_ctx->segid_last_base, MAX_SEGMAP_SIZE);
136*437bfbebSnyanmisaka if (ret) {
137*437bfbebSnyanmisaka mpp_err("vp9 segid_last_base get buffer failed\n");
138*437bfbebSnyanmisaka return ret;
139*437bfbebSnyanmisaka }
140*437bfbebSnyanmisaka mpp_buffer_attach_dev(hw_ctx->segid_last_base, p_hal->dev);
141*437bfbebSnyanmisaka
142*437bfbebSnyanmisaka /* alloc buffer for fast mode or normal */
143*437bfbebSnyanmisaka if (p_hal->fast_mode) {
144*437bfbebSnyanmisaka for (i = 0; i < MAX_GEN_REG; i++) {
145*437bfbebSnyanmisaka hw_ctx->g_buf[i].hw_regs = mpp_calloc_size(void, sizeof(Vdpu383Vp9dRegSet));
146*437bfbebSnyanmisaka ret = mpp_buffer_get(p_hal->group,
147*437bfbebSnyanmisaka &hw_ctx->g_buf[i].global_base, GBL_SIZE);
148*437bfbebSnyanmisaka mpp_buffer_attach_dev(hw_ctx->g_buf[i].global_base, p_hal->dev);
149*437bfbebSnyanmisaka if (ret) {
150*437bfbebSnyanmisaka mpp_err("vp9 global_base get buffer failed\n");
151*437bfbebSnyanmisaka return ret;
152*437bfbebSnyanmisaka }
153*437bfbebSnyanmisaka ret = mpp_buffer_get(p_hal->group,
154*437bfbebSnyanmisaka &hw_ctx->g_buf[i].probe_base, PROB_KF_SIZE);
155*437bfbebSnyanmisaka if (ret) {
156*437bfbebSnyanmisaka mpp_err("vp9 probe_base get buffer failed\n");
157*437bfbebSnyanmisaka return ret;
158*437bfbebSnyanmisaka }
159*437bfbebSnyanmisaka mpp_buffer_attach_dev(hw_ctx->g_buf[i].probe_base, p_hal->dev);
160*437bfbebSnyanmisaka ret = mpp_buffer_get(p_hal->group,
161*437bfbebSnyanmisaka &hw_ctx->g_buf[i].count_base, COUNT_SIZE);
162*437bfbebSnyanmisaka if (ret) {
163*437bfbebSnyanmisaka mpp_err("vp9 count_base get buffer failed\n");
164*437bfbebSnyanmisaka return ret;
165*437bfbebSnyanmisaka }
166*437bfbebSnyanmisaka mpp_buffer_attach_dev(hw_ctx->g_buf[i].count_base, p_hal->dev);
167*437bfbebSnyanmisaka }
168*437bfbebSnyanmisaka } else {
169*437bfbebSnyanmisaka hw_ctx->hw_regs = mpp_calloc_size(void, sizeof(Vdpu383Vp9dRegSet));
170*437bfbebSnyanmisaka ret = mpp_buffer_get(p_hal->group, &hw_ctx->global_base, PROB_SIZE);
171*437bfbebSnyanmisaka if (ret) {
172*437bfbebSnyanmisaka mpp_err("vp9 global_base get buffer failed\n");
173*437bfbebSnyanmisaka return ret;
174*437bfbebSnyanmisaka }
175*437bfbebSnyanmisaka mpp_buffer_attach_dev(hw_ctx->global_base, p_hal->dev);
176*437bfbebSnyanmisaka
177*437bfbebSnyanmisaka ret = mpp_buffer_get(p_hal->group, &hw_ctx->probe_base, PROB_KF_SIZE);
178*437bfbebSnyanmisaka if (ret) {
179*437bfbebSnyanmisaka mpp_err("vp9 probe_base get buffer failed\n");
180*437bfbebSnyanmisaka return ret;
181*437bfbebSnyanmisaka }
182*437bfbebSnyanmisaka mpp_buffer_attach_dev(hw_ctx->probe_base, p_hal->dev);
183*437bfbebSnyanmisaka
184*437bfbebSnyanmisaka ret = mpp_buffer_get(p_hal->group, &hw_ctx->count_base, COUNT_SIZE);
185*437bfbebSnyanmisaka if (ret) {
186*437bfbebSnyanmisaka mpp_err("vp9 count_base get buffer failed\n");
187*437bfbebSnyanmisaka return ret;
188*437bfbebSnyanmisaka }
189*437bfbebSnyanmisaka mpp_buffer_attach_dev(hw_ctx->count_base, p_hal->dev);
190*437bfbebSnyanmisaka }
191*437bfbebSnyanmisaka return MPP_OK;
192*437bfbebSnyanmisaka }
193*437bfbebSnyanmisaka
hal_vp9d_release_res(HalVp9dCtx * hal)194*437bfbebSnyanmisaka static MPP_RET hal_vp9d_release_res(HalVp9dCtx *hal)
195*437bfbebSnyanmisaka {
196*437bfbebSnyanmisaka HalVp9dCtx *p_hal = (HalVp9dCtx*)hal;
197*437bfbebSnyanmisaka Vdpu383Vp9dCtx *hw_ctx = (Vdpu383Vp9dCtx*)p_hal->hw_ctx;
198*437bfbebSnyanmisaka RK_S32 ret = 0;
199*437bfbebSnyanmisaka RK_S32 i = 0;
200*437bfbebSnyanmisaka
201*437bfbebSnyanmisaka if (hw_ctx->prob_default_base) {
202*437bfbebSnyanmisaka ret = mpp_buffer_put(hw_ctx->prob_default_base);
203*437bfbebSnyanmisaka if (ret) {
204*437bfbebSnyanmisaka mpp_err("vp9 probe_wr_base get buffer failed\n");
205*437bfbebSnyanmisaka return ret;
206*437bfbebSnyanmisaka }
207*437bfbebSnyanmisaka }
208*437bfbebSnyanmisaka if (hw_ctx->segid_cur_base) {
209*437bfbebSnyanmisaka ret = mpp_buffer_put(hw_ctx->segid_cur_base);
210*437bfbebSnyanmisaka if (ret) {
211*437bfbebSnyanmisaka mpp_err("vp9 segid_cur_base put buffer failed\n");
212*437bfbebSnyanmisaka return ret;
213*437bfbebSnyanmisaka }
214*437bfbebSnyanmisaka }
215*437bfbebSnyanmisaka if (hw_ctx->segid_last_base) {
216*437bfbebSnyanmisaka ret = mpp_buffer_put(hw_ctx->segid_last_base);
217*437bfbebSnyanmisaka if (ret) {
218*437bfbebSnyanmisaka mpp_err("vp9 segid_last_base put buffer failed\n");
219*437bfbebSnyanmisaka return ret;
220*437bfbebSnyanmisaka }
221*437bfbebSnyanmisaka }
222*437bfbebSnyanmisaka for (i = 0; i < VP9_CONTEXT; i++) {
223*437bfbebSnyanmisaka if (hw_ctx->prob_loop_base[i]) {
224*437bfbebSnyanmisaka ret = mpp_buffer_put(hw_ctx->prob_loop_base[i]);
225*437bfbebSnyanmisaka if (ret) {
226*437bfbebSnyanmisaka mpp_err("vp9 prob_loop_base put buffer failed\n");
227*437bfbebSnyanmisaka return ret;
228*437bfbebSnyanmisaka }
229*437bfbebSnyanmisaka }
230*437bfbebSnyanmisaka }
231*437bfbebSnyanmisaka if (p_hal->fast_mode) {
232*437bfbebSnyanmisaka for (i = 0; i < MAX_GEN_REG; i++) {
233*437bfbebSnyanmisaka if (hw_ctx->g_buf[i].global_base) {
234*437bfbebSnyanmisaka ret = mpp_buffer_put(hw_ctx->g_buf[i].global_base);
235*437bfbebSnyanmisaka if (ret) {
236*437bfbebSnyanmisaka mpp_err("vp9 global_base put buffer failed\n");
237*437bfbebSnyanmisaka return ret;
238*437bfbebSnyanmisaka }
239*437bfbebSnyanmisaka }
240*437bfbebSnyanmisaka if (hw_ctx->g_buf[i].probe_base) {
241*437bfbebSnyanmisaka ret = mpp_buffer_put(hw_ctx->g_buf[i].probe_base);
242*437bfbebSnyanmisaka if (ret) {
243*437bfbebSnyanmisaka mpp_err("vp9 probe_base put buffer failed\n");
244*437bfbebSnyanmisaka return ret;
245*437bfbebSnyanmisaka }
246*437bfbebSnyanmisaka }
247*437bfbebSnyanmisaka if (hw_ctx->g_buf[i].count_base) {
248*437bfbebSnyanmisaka ret = mpp_buffer_put(hw_ctx->g_buf[i].count_base);
249*437bfbebSnyanmisaka if (ret) {
250*437bfbebSnyanmisaka mpp_err("vp9 count_base put buffer failed\n");
251*437bfbebSnyanmisaka return ret;
252*437bfbebSnyanmisaka }
253*437bfbebSnyanmisaka }
254*437bfbebSnyanmisaka if (hw_ctx->g_buf[i].hw_regs) {
255*437bfbebSnyanmisaka mpp_free(hw_ctx->g_buf[i].hw_regs);
256*437bfbebSnyanmisaka hw_ctx->g_buf[i].hw_regs = NULL;
257*437bfbebSnyanmisaka }
258*437bfbebSnyanmisaka if (hw_ctx->g_buf[i].rcb_buf) {
259*437bfbebSnyanmisaka ret = mpp_buffer_put(hw_ctx->g_buf[i].rcb_buf);
260*437bfbebSnyanmisaka if (ret) {
261*437bfbebSnyanmisaka mpp_err("vp9 rcb_buf[%d] put buffer failed\n", i);
262*437bfbebSnyanmisaka return ret;
263*437bfbebSnyanmisaka }
264*437bfbebSnyanmisaka }
265*437bfbebSnyanmisaka }
266*437bfbebSnyanmisaka } else {
267*437bfbebSnyanmisaka if (hw_ctx->global_base) {
268*437bfbebSnyanmisaka ret = mpp_buffer_put(hw_ctx->global_base);
269*437bfbebSnyanmisaka if (ret) {
270*437bfbebSnyanmisaka mpp_err("vp9 global_base get buffer failed\n");
271*437bfbebSnyanmisaka return ret;
272*437bfbebSnyanmisaka }
273*437bfbebSnyanmisaka }
274*437bfbebSnyanmisaka if (hw_ctx->probe_base) {
275*437bfbebSnyanmisaka ret = mpp_buffer_put(hw_ctx->probe_base);
276*437bfbebSnyanmisaka if (ret) {
277*437bfbebSnyanmisaka mpp_err("vp9 probe_base get buffer failed\n");
278*437bfbebSnyanmisaka return ret;
279*437bfbebSnyanmisaka }
280*437bfbebSnyanmisaka }
281*437bfbebSnyanmisaka if (hw_ctx->count_base) {
282*437bfbebSnyanmisaka ret = mpp_buffer_put(hw_ctx->count_base);
283*437bfbebSnyanmisaka if (ret) {
284*437bfbebSnyanmisaka mpp_err("vp9 count_base put buffer failed\n");
285*437bfbebSnyanmisaka return ret;
286*437bfbebSnyanmisaka }
287*437bfbebSnyanmisaka }
288*437bfbebSnyanmisaka if (hw_ctx->hw_regs) {
289*437bfbebSnyanmisaka mpp_free(hw_ctx->hw_regs);
290*437bfbebSnyanmisaka hw_ctx->hw_regs = NULL;
291*437bfbebSnyanmisaka }
292*437bfbebSnyanmisaka if (hw_ctx->rcb_buf) {
293*437bfbebSnyanmisaka ret = mpp_buffer_put(hw_ctx->rcb_buf);
294*437bfbebSnyanmisaka if (ret) {
295*437bfbebSnyanmisaka mpp_err("vp9 rcb_buf put buffer failed\n");
296*437bfbebSnyanmisaka return ret;
297*437bfbebSnyanmisaka }
298*437bfbebSnyanmisaka }
299*437bfbebSnyanmisaka }
300*437bfbebSnyanmisaka
301*437bfbebSnyanmisaka if (hw_ctx->cmv_bufs) {
302*437bfbebSnyanmisaka ret = hal_bufs_deinit(hw_ctx->cmv_bufs);
303*437bfbebSnyanmisaka if (ret) {
304*437bfbebSnyanmisaka mpp_err("vp9 cmv bufs deinit buffer failed\n");
305*437bfbebSnyanmisaka return ret;
306*437bfbebSnyanmisaka }
307*437bfbebSnyanmisaka }
308*437bfbebSnyanmisaka if (hw_ctx->origin_bufs) {
309*437bfbebSnyanmisaka ret = hal_bufs_deinit(hw_ctx->origin_bufs);
310*437bfbebSnyanmisaka if (ret) {
311*437bfbebSnyanmisaka mpp_err("thumb vp9 origin_bufs deinit buffer failed\n");
312*437bfbebSnyanmisaka return ret;
313*437bfbebSnyanmisaka }
314*437bfbebSnyanmisaka hw_ctx->origin_bufs = NULL;
315*437bfbebSnyanmisaka }
316*437bfbebSnyanmisaka
317*437bfbebSnyanmisaka return MPP_OK;
318*437bfbebSnyanmisaka }
319*437bfbebSnyanmisaka
hal_vp9d_vdpu383_deinit(void * hal)320*437bfbebSnyanmisaka static MPP_RET hal_vp9d_vdpu383_deinit(void *hal)
321*437bfbebSnyanmisaka {
322*437bfbebSnyanmisaka HalVp9dCtx *p_hal = (HalVp9dCtx *)hal;
323*437bfbebSnyanmisaka MPP_RET ret = MPP_OK;
324*437bfbebSnyanmisaka
325*437bfbebSnyanmisaka hal_vp9d_release_res(p_hal);
326*437bfbebSnyanmisaka
327*437bfbebSnyanmisaka if (p_hal->group) {
328*437bfbebSnyanmisaka ret = mpp_buffer_group_put(p_hal->group);
329*437bfbebSnyanmisaka if (ret) {
330*437bfbebSnyanmisaka mpp_err("vp9d group free buffer failed\n");
331*437bfbebSnyanmisaka return ret;
332*437bfbebSnyanmisaka }
333*437bfbebSnyanmisaka }
334*437bfbebSnyanmisaka MPP_FREE(p_hal->hw_ctx);
335*437bfbebSnyanmisaka
336*437bfbebSnyanmisaka return ret;
337*437bfbebSnyanmisaka }
338*437bfbebSnyanmisaka
hal_vp9d_vdpu383_init(void * hal,MppHalCfg * cfg)339*437bfbebSnyanmisaka static MPP_RET hal_vp9d_vdpu383_init(void *hal, MppHalCfg *cfg)
340*437bfbebSnyanmisaka {
341*437bfbebSnyanmisaka MPP_RET ret = MPP_OK;
342*437bfbebSnyanmisaka HalVp9dCtx *p_hal = (HalVp9dCtx*)hal;
343*437bfbebSnyanmisaka MEM_CHECK(ret, p_hal->hw_ctx = mpp_calloc_size(void, sizeof(Vdpu383Vp9dCtx)));
344*437bfbebSnyanmisaka Vdpu383Vp9dCtx *hw_ctx = (Vdpu383Vp9dCtx*)p_hal->hw_ctx;
345*437bfbebSnyanmisaka (void) cfg;
346*437bfbebSnyanmisaka
347*437bfbebSnyanmisaka hw_ctx->mv_base_addr = -1;
348*437bfbebSnyanmisaka hw_ctx->pre_mv_base_addr = -1;
349*437bfbebSnyanmisaka mpp_slots_set_prop(p_hal->slots, SLOTS_HOR_ALIGN, mpp_align_128_odd_plus_64);
350*437bfbebSnyanmisaka mpp_slots_set_prop(p_hal->slots, SLOTS_VER_ALIGN, vp9_ver_align);
351*437bfbebSnyanmisaka
352*437bfbebSnyanmisaka if (p_hal->group == NULL) {
353*437bfbebSnyanmisaka ret = mpp_buffer_group_get_internal(&p_hal->group, MPP_BUFFER_TYPE_ION);
354*437bfbebSnyanmisaka if (ret) {
355*437bfbebSnyanmisaka mpp_err("vp9 mpp_buffer_group_get failed\n");
356*437bfbebSnyanmisaka goto __FAILED;
357*437bfbebSnyanmisaka }
358*437bfbebSnyanmisaka }
359*437bfbebSnyanmisaka
360*437bfbebSnyanmisaka ret = hal_vp9d_alloc_res(p_hal);
361*437bfbebSnyanmisaka if (ret) {
362*437bfbebSnyanmisaka mpp_err("hal_vp9d_alloc_res failed\n");
363*437bfbebSnyanmisaka goto __FAILED;
364*437bfbebSnyanmisaka }
365*437bfbebSnyanmisaka
366*437bfbebSnyanmisaka hw_ctx->last_segid_flag = 1;
367*437bfbebSnyanmisaka
368*437bfbebSnyanmisaka if (cfg->hal_fbc_adj_cfg) {
369*437bfbebSnyanmisaka cfg->hal_fbc_adj_cfg->func = vdpu383_afbc_align_calc;
370*437bfbebSnyanmisaka cfg->hal_fbc_adj_cfg->expand = 0;
371*437bfbebSnyanmisaka }
372*437bfbebSnyanmisaka
373*437bfbebSnyanmisaka return ret;
374*437bfbebSnyanmisaka __FAILED:
375*437bfbebSnyanmisaka hal_vp9d_vdpu383_deinit(hal);
376*437bfbebSnyanmisaka return ret;
377*437bfbebSnyanmisaka }
378*437bfbebSnyanmisaka
vp9d_refine_rcb_size(Vdpu383RcbInfo * rcb_info,RK_S32 width,RK_S32 height,void * data)379*437bfbebSnyanmisaka static void vp9d_refine_rcb_size(Vdpu383RcbInfo *rcb_info,
380*437bfbebSnyanmisaka RK_S32 width, RK_S32 height, void* data)
381*437bfbebSnyanmisaka {
382*437bfbebSnyanmisaka RK_U32 rcb_bits = 0;
383*437bfbebSnyanmisaka DXVA_PicParams_VP9 *pic_param = (DXVA_PicParams_VP9*)data;
384*437bfbebSnyanmisaka RK_U32 tile_row_num = 1 << pic_param->log2_tile_rows;
385*437bfbebSnyanmisaka RK_U32 tile_col_num = 1 << pic_param->log2_tile_cols;
386*437bfbebSnyanmisaka RK_U32 bit_depth = pic_param->BitDepthMinus8Luma + 8;
387*437bfbebSnyanmisaka RK_U32 ext_row_align_size = tile_row_num * 64 * 8;
388*437bfbebSnyanmisaka RK_U32 ext_col_align_size = tile_col_num * 64 * 8;
389*437bfbebSnyanmisaka RK_U32 filterd_row_append = 8192;
390*437bfbebSnyanmisaka
391*437bfbebSnyanmisaka width = MPP_ALIGN(width, VP9_CTU_SIZE);
392*437bfbebSnyanmisaka height = MPP_ALIGN(height, VP9_CTU_SIZE);
393*437bfbebSnyanmisaka /* RCB_STRMD_ROW && RCB_STRMD_TILE_ROW*/
394*437bfbebSnyanmisaka if (width > 4096)
395*437bfbebSnyanmisaka rcb_bits = ((width + 63) / 64) * 250;
396*437bfbebSnyanmisaka else
397*437bfbebSnyanmisaka rcb_bits = 0;
398*437bfbebSnyanmisaka rcb_info[RCB_STRMD_ROW].size = 0;
399*437bfbebSnyanmisaka rcb_info[RCB_STRMD_TILE_ROW].size = MPP_RCB_BYTES(rcb_bits);
400*437bfbebSnyanmisaka
401*437bfbebSnyanmisaka /* RCB_INTER_ROW && RCB_INTER_TILE_ROW*/
402*437bfbebSnyanmisaka rcb_bits = ((width + 63) / 64) * 2368;
403*437bfbebSnyanmisaka rcb_info[RCB_INTER_ROW].size = MPP_RCB_BYTES(rcb_bits);
404*437bfbebSnyanmisaka rcb_bits += ext_row_align_size;
405*437bfbebSnyanmisaka if (tile_row_num > 1)
406*437bfbebSnyanmisaka rcb_info[RCB_INTER_TILE_ROW].size = MPP_RCB_BYTES(rcb_bits);
407*437bfbebSnyanmisaka else
408*437bfbebSnyanmisaka rcb_info[RCB_INTER_TILE_ROW].size = 0;
409*437bfbebSnyanmisaka
410*437bfbebSnyanmisaka /* RCB_INTRA_ROW && RCB_INTRA_TILE_ROW*/
411*437bfbebSnyanmisaka rcb_bits = MPP_ALIGN(width, 512) * (bit_depth + 2);
412*437bfbebSnyanmisaka rcb_bits = rcb_bits * 3; //TODO:
413*437bfbebSnyanmisaka rcb_info[RCB_INTRA_ROW].size = MPP_RCB_BYTES(rcb_bits);
414*437bfbebSnyanmisaka rcb_bits += ext_row_align_size;
415*437bfbebSnyanmisaka if (tile_row_num > 1)
416*437bfbebSnyanmisaka rcb_info[RCB_INTRA_TILE_ROW].size = MPP_RCB_BYTES(rcb_bits);
417*437bfbebSnyanmisaka else
418*437bfbebSnyanmisaka rcb_info[RCB_INTRA_TILE_ROW].size = 0;
419*437bfbebSnyanmisaka
420*437bfbebSnyanmisaka /* RCB_FILTERD_ROW && RCB_FILTERD_TILE_ROW*/
421*437bfbebSnyanmisaka // save space mode : half for RCB_FILTERD_ROW, half for RCB_FILTERD_PROTECT_ROW
422*437bfbebSnyanmisaka if (width > 4096)
423*437bfbebSnyanmisaka filterd_row_append = 27648;
424*437bfbebSnyanmisaka rcb_bits = (RK_U32)(MPP_ALIGN(width, 64) * (41 * bit_depth + 13));
425*437bfbebSnyanmisaka rcb_info[RCB_FILTERD_ROW].size = filterd_row_append + MPP_RCB_BYTES(rcb_bits / 2);
426*437bfbebSnyanmisaka rcb_info[RCB_FILTERD_PROTECT_ROW].size = filterd_row_append + MPP_RCB_BYTES(rcb_bits / 2);
427*437bfbebSnyanmisaka rcb_bits += ext_row_align_size;
428*437bfbebSnyanmisaka if (tile_row_num > 1)
429*437bfbebSnyanmisaka rcb_info[RCB_FILTERD_TILE_ROW].size = MPP_RCB_BYTES(rcb_bits);
430*437bfbebSnyanmisaka else
431*437bfbebSnyanmisaka rcb_info[RCB_FILTERD_TILE_ROW].size = 0;
432*437bfbebSnyanmisaka
433*437bfbebSnyanmisaka /* RCB_FILTERD_TILE_COL */
434*437bfbebSnyanmisaka if (tile_col_num > 1) {
435*437bfbebSnyanmisaka rcb_bits = (RK_U32)(MPP_ALIGN(height, 64) * (42 * bit_depth + 13)) + ext_col_align_size;
436*437bfbebSnyanmisaka rcb_info[RCB_FILTERD_TILE_COL].size = MPP_RCB_BYTES(rcb_bits);
437*437bfbebSnyanmisaka } else {
438*437bfbebSnyanmisaka rcb_info[RCB_FILTERD_TILE_COL].size = 0;
439*437bfbebSnyanmisaka }
440*437bfbebSnyanmisaka
441*437bfbebSnyanmisaka }
442*437bfbebSnyanmisaka
hal_vp9d_rcb_info_update(void * hal,Vdpu383Vp9dRegSet * hw_regs,void * data)443*437bfbebSnyanmisaka static void hal_vp9d_rcb_info_update(void *hal, Vdpu383Vp9dRegSet *hw_regs, void *data)
444*437bfbebSnyanmisaka {
445*437bfbebSnyanmisaka HalVp9dCtx *p_hal = (HalVp9dCtx*)hal;
446*437bfbebSnyanmisaka Vdpu383Vp9dCtx *hw_ctx = (Vdpu383Vp9dCtx*)p_hal->hw_ctx;
447*437bfbebSnyanmisaka DXVA_PicParams_VP9 *pic_param = (DXVA_PicParams_VP9*)data;
448*437bfbebSnyanmisaka RK_U32 num_tiles = pic_param->log2_tile_rows;
449*437bfbebSnyanmisaka RK_U32 bit_depth = pic_param->BitDepthMinus8Luma + 8;
450*437bfbebSnyanmisaka RK_S32 height = vp9_ver_align(pic_param->height);
451*437bfbebSnyanmisaka RK_S32 width = vp9_ver_align(pic_param->width);
452*437bfbebSnyanmisaka (void) hw_regs;
453*437bfbebSnyanmisaka
454*437bfbebSnyanmisaka if (hw_ctx->num_row_tiles != num_tiles ||
455*437bfbebSnyanmisaka hw_ctx->bit_depth != bit_depth ||
456*437bfbebSnyanmisaka hw_ctx->width != width ||
457*437bfbebSnyanmisaka hw_ctx->height != height) {
458*437bfbebSnyanmisaka
459*437bfbebSnyanmisaka hw_ctx->rcb_buf_size = vdpu383_get_rcb_buf_size(hw_ctx->rcb_info, width, height);
460*437bfbebSnyanmisaka // TODO: refine rcb buffer size
461*437bfbebSnyanmisaka vp9d_refine_rcb_size(hw_ctx->rcb_info, width, height, pic_param);
462*437bfbebSnyanmisaka
463*437bfbebSnyanmisaka if (p_hal->fast_mode) {
464*437bfbebSnyanmisaka RK_U32 i;
465*437bfbebSnyanmisaka
466*437bfbebSnyanmisaka for (i = 0; i < MPP_ARRAY_ELEMS(hw_ctx->g_buf); i++) {
467*437bfbebSnyanmisaka MppBuffer rcb_buf = hw_ctx->g_buf[i].rcb_buf;
468*437bfbebSnyanmisaka
469*437bfbebSnyanmisaka if (rcb_buf) {
470*437bfbebSnyanmisaka mpp_buffer_put(rcb_buf);
471*437bfbebSnyanmisaka hw_ctx->g_buf[i].rcb_buf = NULL;
472*437bfbebSnyanmisaka }
473*437bfbebSnyanmisaka mpp_buffer_get(p_hal->group, &rcb_buf, hw_ctx->rcb_buf_size);
474*437bfbebSnyanmisaka hw_ctx->g_buf[i].rcb_buf = rcb_buf;
475*437bfbebSnyanmisaka }
476*437bfbebSnyanmisaka } else {
477*437bfbebSnyanmisaka MppBuffer rcb_buf = hw_ctx->rcb_buf;
478*437bfbebSnyanmisaka
479*437bfbebSnyanmisaka if (rcb_buf) {
480*437bfbebSnyanmisaka mpp_buffer_put(rcb_buf);
481*437bfbebSnyanmisaka rcb_buf = NULL;
482*437bfbebSnyanmisaka }
483*437bfbebSnyanmisaka mpp_buffer_get(p_hal->group, &rcb_buf, hw_ctx->rcb_buf_size);
484*437bfbebSnyanmisaka hw_ctx->rcb_buf = rcb_buf;
485*437bfbebSnyanmisaka }
486*437bfbebSnyanmisaka
487*437bfbebSnyanmisaka hw_ctx->num_row_tiles = num_tiles;
488*437bfbebSnyanmisaka hw_ctx->bit_depth = bit_depth;
489*437bfbebSnyanmisaka hw_ctx->width = width;
490*437bfbebSnyanmisaka hw_ctx->height = height;
491*437bfbebSnyanmisaka }
492*437bfbebSnyanmisaka }
493*437bfbebSnyanmisaka
494*437bfbebSnyanmisaka static void
set_tile_offset(RK_S32 * start,RK_S32 * end,RK_S32 idx,RK_S32 log2_n,RK_S32 n)495*437bfbebSnyanmisaka set_tile_offset(RK_S32 *start, RK_S32 *end, RK_S32 idx, RK_S32 log2_n, RK_S32 n)
496*437bfbebSnyanmisaka {
497*437bfbebSnyanmisaka RK_S32 sb_start = ( idx * n) >> log2_n;
498*437bfbebSnyanmisaka RK_S32 sb_end = ((idx + 1) * n) >> log2_n;
499*437bfbebSnyanmisaka
500*437bfbebSnyanmisaka *start = MPP_MIN(sb_start, n) << 3;
501*437bfbebSnyanmisaka *end = MPP_MIN(sb_end, n) << 3;
502*437bfbebSnyanmisaka }
503*437bfbebSnyanmisaka
prepare_uncompress_header(HalVp9dCtx * p_hal,DXVA_PicParams_VP9 * pp,RK_U64 * data,RK_U32 len)504*437bfbebSnyanmisaka static MPP_RET prepare_uncompress_header(HalVp9dCtx *p_hal, DXVA_PicParams_VP9 *pp,
505*437bfbebSnyanmisaka RK_U64 *data, RK_U32 len)
506*437bfbebSnyanmisaka {
507*437bfbebSnyanmisaka Vdpu383Vp9dCtx *hw_ctx = (Vdpu383Vp9dCtx*)p_hal->hw_ctx;
508*437bfbebSnyanmisaka BitputCtx_t bp;
509*437bfbebSnyanmisaka RK_S32 i, j;
510*437bfbebSnyanmisaka
511*437bfbebSnyanmisaka mpp_set_bitput_ctx(&bp, data, len);
512*437bfbebSnyanmisaka
513*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->frame_type, 1);
514*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->error_resilient_mode, 1);
515*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->BitDepthMinus8Luma, 3);
516*437bfbebSnyanmisaka mpp_put_bits(&bp, 1, 2); // yuv420
517*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->width, 16);
518*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->height, 16);
519*437bfbebSnyanmisaka
520*437bfbebSnyanmisaka mpp_put_bits(&bp, (!pp->frame_type || pp->intra_only), 1);
521*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->ref_frame_sign_bias[1], 1);
522*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->ref_frame_sign_bias[2], 1);
523*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->ref_frame_sign_bias[3], 1);
524*437bfbebSnyanmisaka
525*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->allow_high_precision_mv, 1);
526*437bfbebSnyanmisaka /* sync with cmodel */
527*437bfbebSnyanmisaka if (!pp->frame_type || pp->intra_only)
528*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 3);
529*437bfbebSnyanmisaka else {
530*437bfbebSnyanmisaka if (pp->interp_filter == 4) /* FILTER_SWITCHABLE */
531*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->interp_filter, 3);
532*437bfbebSnyanmisaka else
533*437bfbebSnyanmisaka mpp_put_bits(&bp, literal_to_filter[pp->interp_filter], 3);
534*437bfbebSnyanmisaka }
535*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->parallelmode, 1);
536*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->refresh_frame_context, 1);
537*437bfbebSnyanmisaka
538*437bfbebSnyanmisaka /* loop filter */
539*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->filter_level, 6);
540*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->sharpness_level, 3);
541*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->mode_ref_delta_enabled, 1);
542*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->mode_ref_delta_update, 1);
543*437bfbebSnyanmisaka
544*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->ref_deltas[0], 7);
545*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->ref_deltas[1], 7);
546*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->ref_deltas[2], 7);
547*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->ref_deltas[3], 7);
548*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->mode_deltas[0], 7);
549*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->mode_deltas[1], 7);
550*437bfbebSnyanmisaka
551*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->base_qindex, 8);
552*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->y_dc_delta_q, 5);
553*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->uv_dc_delta_q, 5);
554*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->uv_ac_delta_q, 5);
555*437bfbebSnyanmisaka mpp_put_bits(&bp, (!pp->base_qindex && !pp->y_dc_delta_q && !pp->uv_dc_delta_q && !pp->uv_ac_delta_q), 1);
556*437bfbebSnyanmisaka
557*437bfbebSnyanmisaka for (i = 0; i < 3; i++) {
558*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->stVP9Segments.pred_probs[i], 8);
559*437bfbebSnyanmisaka }
560*437bfbebSnyanmisaka for (i = 0; i < 7; i++) {
561*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->stVP9Segments.tree_probs[i], 8);
562*437bfbebSnyanmisaka }
563*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->stVP9Segments.enabled, 1);
564*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->stVP9Segments.update_map, 1);
565*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->stVP9Segments.temporal_update, 1);
566*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->stVP9Segments.abs_delta, 1);
567*437bfbebSnyanmisaka
568*437bfbebSnyanmisaka {
569*437bfbebSnyanmisaka RK_U32 use_prev_frame_mvs = !pp->error_resilient_mode &&
570*437bfbebSnyanmisaka pp->width == hw_ctx->ls_info.last_width &&
571*437bfbebSnyanmisaka pp->height == hw_ctx->ls_info.last_height &&
572*437bfbebSnyanmisaka !hw_ctx->ls_info.last_intra_only &&
573*437bfbebSnyanmisaka hw_ctx->ls_info.last_show_frame;
574*437bfbebSnyanmisaka mpp_put_bits(&bp, use_prev_frame_mvs, 1);
575*437bfbebSnyanmisaka }
576*437bfbebSnyanmisaka
577*437bfbebSnyanmisaka for ( i = 0; i < 8; i++ )
578*437bfbebSnyanmisaka for ( j = 0; j < 4; j++ )
579*437bfbebSnyanmisaka mpp_put_bits(&bp, (pp->stVP9Segments.feature_mask[i] >> j) & 0x1, 1);
580*437bfbebSnyanmisaka
581*437bfbebSnyanmisaka for ( i = 0; i < 8; i++ ) {
582*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->stVP9Segments.feature_data[i][0], 9);
583*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->stVP9Segments.feature_data[i][1], 7);
584*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->stVP9Segments.feature_data[i][2], 2);
585*437bfbebSnyanmisaka }
586*437bfbebSnyanmisaka
587*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->first_partition_size, 16);
588*437bfbebSnyanmisaka
589*437bfbebSnyanmisaka /* refer frame width and height */
590*437bfbebSnyanmisaka {
591*437bfbebSnyanmisaka RK_S32 ref_idx = pp->frame_refs[0].Index7Bits;
592*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->ref_frame_coded_width[ref_idx], 16);
593*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->ref_frame_coded_height[ref_idx], 16);
594*437bfbebSnyanmisaka ref_idx = pp->frame_refs[1].Index7Bits;
595*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->ref_frame_coded_width[ref_idx], 16);
596*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->ref_frame_coded_height[ref_idx], 16);
597*437bfbebSnyanmisaka ref_idx = pp->frame_refs[2].Index7Bits;
598*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->ref_frame_coded_width[ref_idx], 16);
599*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->ref_frame_coded_height[ref_idx], 16);
600*437bfbebSnyanmisaka }
601*437bfbebSnyanmisaka
602*437bfbebSnyanmisaka /* last frame info */
603*437bfbebSnyanmisaka mpp_put_bits(&bp, hw_ctx->ls_info.last_mode_deltas[0], 7);
604*437bfbebSnyanmisaka mpp_put_bits(&bp, hw_ctx->ls_info.last_mode_deltas[1], 7);
605*437bfbebSnyanmisaka mpp_put_bits(&bp, hw_ctx->ls_info.last_ref_deltas[0], 7);
606*437bfbebSnyanmisaka mpp_put_bits(&bp, hw_ctx->ls_info.last_ref_deltas[1], 7);
607*437bfbebSnyanmisaka mpp_put_bits(&bp, hw_ctx->ls_info.last_ref_deltas[2], 7);
608*437bfbebSnyanmisaka mpp_put_bits(&bp, hw_ctx->ls_info.last_ref_deltas[3], 7);
609*437bfbebSnyanmisaka mpp_put_bits(&bp, hw_ctx->ls_info.segmentation_enable_flag_last, 1);
610*437bfbebSnyanmisaka
611*437bfbebSnyanmisaka mpp_put_bits(&bp, hw_ctx->ls_info.last_show_frame, 1);
612*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->intra_only, 1);
613*437bfbebSnyanmisaka {
614*437bfbebSnyanmisaka RK_U32 last_widthheight_eqcur = pp->width == hw_ctx->ls_info.last_width &&
615*437bfbebSnyanmisaka pp->height == hw_ctx->ls_info.last_height;
616*437bfbebSnyanmisaka
617*437bfbebSnyanmisaka mpp_put_bits(&bp, last_widthheight_eqcur, 1);
618*437bfbebSnyanmisaka }
619*437bfbebSnyanmisaka mpp_put_bits(&bp, hw_ctx->ls_info.color_space_last, 3);
620*437bfbebSnyanmisaka
621*437bfbebSnyanmisaka mpp_put_bits(&bp, !hw_ctx->ls_info.last_frame_type, 1);
622*437bfbebSnyanmisaka mpp_put_bits(&bp, 0, 1);
623*437bfbebSnyanmisaka mpp_put_bits(&bp, 1, 1);
624*437bfbebSnyanmisaka mpp_put_bits(&bp, 1, 1);
625*437bfbebSnyanmisaka mpp_put_bits(&bp, 1, 1);
626*437bfbebSnyanmisaka
627*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->mvscale[0][0], 16);
628*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->mvscale[0][1], 16);
629*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->mvscale[1][0], 16);
630*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->mvscale[1][1], 16);
631*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->mvscale[2][0], 16);
632*437bfbebSnyanmisaka mpp_put_bits(&bp, pp->mvscale[2][1], 16);
633*437bfbebSnyanmisaka
634*437bfbebSnyanmisaka /* tile cols and rows */
635*437bfbebSnyanmisaka {
636*437bfbebSnyanmisaka RK_S32 tile_width[64] = {0};
637*437bfbebSnyanmisaka RK_S32 tile_height[4] = {0};
638*437bfbebSnyanmisaka RK_S32 tile_cols = 1 << pp->log2_tile_cols;
639*437bfbebSnyanmisaka RK_S32 tile_rows = 1 << pp->log2_tile_rows;
640*437bfbebSnyanmisaka
641*437bfbebSnyanmisaka mpp_put_bits(&bp, tile_cols, 7);
642*437bfbebSnyanmisaka mpp_put_bits(&bp, tile_rows, 3);
643*437bfbebSnyanmisaka
644*437bfbebSnyanmisaka for (i = 0; i < tile_cols; ++i) { // tile_col
645*437bfbebSnyanmisaka RK_S32 tile_col_start = 0;
646*437bfbebSnyanmisaka RK_S32 tile_col_end = 0;
647*437bfbebSnyanmisaka
648*437bfbebSnyanmisaka set_tile_offset(&tile_col_start, &tile_col_end,
649*437bfbebSnyanmisaka i, pp->log2_tile_cols, MPP_ALIGN(pp->width, 64) / 64);
650*437bfbebSnyanmisaka tile_width[i] = (tile_col_end - tile_col_start + 7) / 8;
651*437bfbebSnyanmisaka }
652*437bfbebSnyanmisaka
653*437bfbebSnyanmisaka for (j = 0; j < tile_rows; ++j) { // tile_row
654*437bfbebSnyanmisaka RK_S32 tile_row_start = 0;
655*437bfbebSnyanmisaka RK_S32 tile_row_end = 0;
656*437bfbebSnyanmisaka
657*437bfbebSnyanmisaka set_tile_offset(&tile_row_start, &tile_row_end,
658*437bfbebSnyanmisaka j, pp->log2_tile_rows, MPP_ALIGN(pp->height, 64) / 64);
659*437bfbebSnyanmisaka tile_height[j] = (tile_row_end - tile_row_start + 7) / 8;
660*437bfbebSnyanmisaka }
661*437bfbebSnyanmisaka
662*437bfbebSnyanmisaka for (i = 0; i < 64; i++)
663*437bfbebSnyanmisaka mpp_put_bits(&bp, tile_width[i], 10);
664*437bfbebSnyanmisaka
665*437bfbebSnyanmisaka for (j = 0; j < 4; j++)
666*437bfbebSnyanmisaka mpp_put_bits(&bp, tile_height[j], 10);
667*437bfbebSnyanmisaka }
668*437bfbebSnyanmisaka
669*437bfbebSnyanmisaka mpp_put_align(&bp, 64, 0);//128
670*437bfbebSnyanmisaka
671*437bfbebSnyanmisaka #ifdef DUMP_VDPU383_DATAS
672*437bfbebSnyanmisaka {
673*437bfbebSnyanmisaka char *cur_fname = "global_cfg.dat";
674*437bfbebSnyanmisaka memset(dump_cur_fname_path, 0, sizeof(dump_cur_fname_path));
675*437bfbebSnyanmisaka sprintf(dump_cur_fname_path, "%s/%s", dump_cur_dir, cur_fname);
676*437bfbebSnyanmisaka dump_data_to_file(dump_cur_fname_path, (void *)bp.pbuf, 64 * (bp.index - 1) + bp.bitpos, 64, 0);
677*437bfbebSnyanmisaka }
678*437bfbebSnyanmisaka #endif
679*437bfbebSnyanmisaka
680*437bfbebSnyanmisaka return MPP_OK;
681*437bfbebSnyanmisaka }
682*437bfbebSnyanmisaka
hal_vp9d_vdpu383_gen_regs(void * hal,HalTaskInfo * task)683*437bfbebSnyanmisaka static MPP_RET hal_vp9d_vdpu383_gen_regs(void *hal, HalTaskInfo *task)
684*437bfbebSnyanmisaka {
685*437bfbebSnyanmisaka RK_S32 i;
686*437bfbebSnyanmisaka RK_U8 bit_depth = 0;
687*437bfbebSnyanmisaka RK_U32 ref_frame_width_y;
688*437bfbebSnyanmisaka RK_U32 ref_frame_height_y;
689*437bfbebSnyanmisaka RK_S32 stream_len = 0, aglin_offset = 0;
690*437bfbebSnyanmisaka RK_U32 y_hor_virstride, uv_hor_virstride, y_virstride;
691*437bfbebSnyanmisaka RK_U8 *bitstream = NULL;
692*437bfbebSnyanmisaka MppBuffer streambuf = NULL;
693*437bfbebSnyanmisaka RK_U32 sw_y_hor_virstride;
694*437bfbebSnyanmisaka RK_U32 sw_uv_hor_virstride;
695*437bfbebSnyanmisaka RK_U32 sw_y_virstride;
696*437bfbebSnyanmisaka RK_U32 sw_uv_virstride;
697*437bfbebSnyanmisaka RK_U8 ref_idx = 0;
698*437bfbebSnyanmisaka RK_U8 ref_frame_idx = 0;
699*437bfbebSnyanmisaka RK_U32 *reg_ref_base = NULL;
700*437bfbebSnyanmisaka RK_U32 *reg_payload_ref_base = NULL;
701*437bfbebSnyanmisaka RK_S32 intraFlag = 0;
702*437bfbebSnyanmisaka MppBuffer framebuf = NULL;
703*437bfbebSnyanmisaka HalBuf *mv_buf = NULL;
704*437bfbebSnyanmisaka RK_U32 fbc_en = 0;
705*437bfbebSnyanmisaka HalBuf *origin_buf = NULL;
706*437bfbebSnyanmisaka
707*437bfbebSnyanmisaka HalVp9dCtx *p_hal = (HalVp9dCtx*)hal;
708*437bfbebSnyanmisaka Vdpu383Vp9dCtx *hw_ctx = (Vdpu383Vp9dCtx*)p_hal->hw_ctx;
709*437bfbebSnyanmisaka DXVA_PicParams_VP9 *pic_param = (DXVA_PicParams_VP9*)task->dec.syntax.data;
710*437bfbebSnyanmisaka Vdpu383Vp9dRegSet *vp9_hw_regs = NULL;
711*437bfbebSnyanmisaka RK_S32 mv_size = pic_param->width * pic_param->height / 2;
712*437bfbebSnyanmisaka RK_U32 frame_ctx_id = pic_param->frame_context_idx;
713*437bfbebSnyanmisaka MppFrame mframe;
714*437bfbebSnyanmisaka MppFrame ref_frame = NULL;
715*437bfbebSnyanmisaka
716*437bfbebSnyanmisaka if (p_hal->fast_mode) {
717*437bfbebSnyanmisaka for (i = 0; i < MAX_GEN_REG; i++) {
718*437bfbebSnyanmisaka if (!hw_ctx->g_buf[i].use_flag) {
719*437bfbebSnyanmisaka task->dec.reg_index = i;
720*437bfbebSnyanmisaka hw_ctx->global_base = hw_ctx->g_buf[i].global_base;
721*437bfbebSnyanmisaka hw_ctx->probe_base = hw_ctx->g_buf[i].probe_base;
722*437bfbebSnyanmisaka hw_ctx->count_base = hw_ctx->g_buf[i].count_base;
723*437bfbebSnyanmisaka hw_ctx->hw_regs = hw_ctx->g_buf[i].hw_regs;
724*437bfbebSnyanmisaka hw_ctx->g_buf[i].use_flag = 1;
725*437bfbebSnyanmisaka break;
726*437bfbebSnyanmisaka }
727*437bfbebSnyanmisaka }
728*437bfbebSnyanmisaka if (i == MAX_GEN_REG) {
729*437bfbebSnyanmisaka mpp_err("vp9 fast mode buf all used\n");
730*437bfbebSnyanmisaka return MPP_ERR_NOMEM;
731*437bfbebSnyanmisaka }
732*437bfbebSnyanmisaka }
733*437bfbebSnyanmisaka vp9_hw_regs = (Vdpu383Vp9dRegSet*)hw_ctx->hw_regs;
734*437bfbebSnyanmisaka memset(vp9_hw_regs, 0, sizeof(Vdpu383Vp9dRegSet));
735*437bfbebSnyanmisaka
736*437bfbebSnyanmisaka #ifdef DUMP_VDPU383_DATAS
737*437bfbebSnyanmisaka {
738*437bfbebSnyanmisaka memset(dump_cur_dir, 0, sizeof(dump_cur_dir));
739*437bfbebSnyanmisaka sprintf(dump_cur_dir, "vp9/Frame%04d", dump_cur_frame);
740*437bfbebSnyanmisaka if (access(dump_cur_dir, 0)) {
741*437bfbebSnyanmisaka if (mkdir(dump_cur_dir))
742*437bfbebSnyanmisaka mpp_err_f("error: mkdir %s\n", dump_cur_dir);
743*437bfbebSnyanmisaka }
744*437bfbebSnyanmisaka dump_cur_frame++;
745*437bfbebSnyanmisaka }
746*437bfbebSnyanmisaka #endif
747*437bfbebSnyanmisaka
748*437bfbebSnyanmisaka /* uncompress header data */
749*437bfbebSnyanmisaka prepare_uncompress_header(p_hal, pic_param, (RK_U64 *)hw_ctx->header_data, sizeof(hw_ctx->header_data) / 8);
750*437bfbebSnyanmisaka memcpy(mpp_buffer_get_ptr(hw_ctx->global_base), hw_ctx->header_data, sizeof(hw_ctx->header_data));
751*437bfbebSnyanmisaka mpp_buffer_sync_end(hw_ctx->global_base);
752*437bfbebSnyanmisaka vp9_hw_regs->vp9d_paras.reg67_global_len = GBL_SIZE / 16;
753*437bfbebSnyanmisaka vp9_hw_regs->common_addr.reg131_gbl_base = mpp_buffer_get_fd(hw_ctx->global_base);
754*437bfbebSnyanmisaka
755*437bfbebSnyanmisaka if (hw_ctx->cmv_bufs == NULL || hw_ctx->mv_size < mv_size) {
756*437bfbebSnyanmisaka size_t size = mv_size;
757*437bfbebSnyanmisaka
758*437bfbebSnyanmisaka if (hw_ctx->cmv_bufs) {
759*437bfbebSnyanmisaka hal_bufs_deinit(hw_ctx->cmv_bufs);
760*437bfbebSnyanmisaka hw_ctx->cmv_bufs = NULL;
761*437bfbebSnyanmisaka }
762*437bfbebSnyanmisaka
763*437bfbebSnyanmisaka hal_bufs_init(&hw_ctx->cmv_bufs);
764*437bfbebSnyanmisaka if (hw_ctx->cmv_bufs == NULL) {
765*437bfbebSnyanmisaka mpp_err_f("colmv bufs init fail");
766*437bfbebSnyanmisaka return MPP_NOK;
767*437bfbebSnyanmisaka }
768*437bfbebSnyanmisaka hw_ctx->mv_size = mv_size;
769*437bfbebSnyanmisaka hw_ctx->mv_count = mpp_buf_slot_get_count(p_hal ->slots);
770*437bfbebSnyanmisaka hal_bufs_setup(hw_ctx->cmv_bufs, hw_ctx->mv_count, 1, &size);
771*437bfbebSnyanmisaka }
772*437bfbebSnyanmisaka
773*437bfbebSnyanmisaka mpp_buf_slot_get_prop(p_hal->slots, task->dec.output, SLOT_FRAME_PTR, &mframe);
774*437bfbebSnyanmisaka if (mpp_frame_get_thumbnail_en(mframe) == MPP_FRAME_THUMBNAIL_ONLY &&
775*437bfbebSnyanmisaka hw_ctx->origin_bufs == NULL) {
776*437bfbebSnyanmisaka vdpu383_setup_scale_origin_bufs(hw_ctx, mframe);
777*437bfbebSnyanmisaka }
778*437bfbebSnyanmisaka
779*437bfbebSnyanmisaka stream_len = (RK_S32)mpp_packet_get_length(task->dec.input_packet);
780*437bfbebSnyanmisaka
781*437bfbebSnyanmisaka intraFlag = (!pic_param->frame_type || pic_param->intra_only);
782*437bfbebSnyanmisaka #if HW_PROB
783*437bfbebSnyanmisaka // hal_vp9d_prob_flag_delta(mpp_buffer_get_ptr(hw_ctx->probe_base), task->dec.syntax.data);
784*437bfbebSnyanmisaka /* init kf_probe */
785*437bfbebSnyanmisaka hal_vp9d_prob_kf(mpp_buffer_get_ptr(hw_ctx->probe_base));
786*437bfbebSnyanmisaka mpp_buffer_sync_end(hw_ctx->probe_base);
787*437bfbebSnyanmisaka if (intraFlag) {
788*437bfbebSnyanmisaka hal_vp9d_prob_default(mpp_buffer_get_ptr(hw_ctx->prob_default_base), task->dec.syntax.data);
789*437bfbebSnyanmisaka mpp_buffer_sync_end(hw_ctx->prob_default_base);
790*437bfbebSnyanmisaka }
791*437bfbebSnyanmisaka
792*437bfbebSnyanmisaka /* config last prob base and update write base */
793*437bfbebSnyanmisaka {
794*437bfbebSnyanmisaka if (intraFlag || pic_param->error_resilient_mode) {
795*437bfbebSnyanmisaka if (intraFlag
796*437bfbebSnyanmisaka || pic_param->error_resilient_mode
797*437bfbebSnyanmisaka || (pic_param->reset_frame_context == 3)) {
798*437bfbebSnyanmisaka memset(hw_ctx->prob_ctx_valid, 0, sizeof(hw_ctx->prob_ctx_valid));
799*437bfbebSnyanmisaka } else if (pic_param->reset_frame_context == 2) {
800*437bfbebSnyanmisaka hw_ctx->prob_ctx_valid[frame_ctx_id] = 0;
801*437bfbebSnyanmisaka }
802*437bfbebSnyanmisaka }
803*437bfbebSnyanmisaka
804*437bfbebSnyanmisaka if (hw_ctx->prob_ctx_valid[frame_ctx_id]) {
805*437bfbebSnyanmisaka vp9_hw_regs->vp9d_addrs.reg184_lastprob_base =
806*437bfbebSnyanmisaka mpp_buffer_get_fd(hw_ctx->prob_loop_base[frame_ctx_id]);
807*437bfbebSnyanmisaka #ifdef DUMP_VDPU383_DATAS
808*437bfbebSnyanmisaka { cur_last_prob_base = hw_ctx->prob_loop_base[frame_ctx_id]; }
809*437bfbebSnyanmisaka #endif
810*437bfbebSnyanmisaka } else {
811*437bfbebSnyanmisaka vp9_hw_regs->vp9d_addrs.reg184_lastprob_base = mpp_buffer_get_fd(hw_ctx->prob_default_base);
812*437bfbebSnyanmisaka hw_ctx->prob_ctx_valid[frame_ctx_id] |= pic_param->refresh_frame_context;
813*437bfbebSnyanmisaka #ifdef DUMP_VDPU383_DATAS
814*437bfbebSnyanmisaka { cur_last_prob_base = hw_ctx->prob_default_base; }
815*437bfbebSnyanmisaka #endif
816*437bfbebSnyanmisaka }
817*437bfbebSnyanmisaka vp9_hw_regs->vp9d_addrs.reg185_updateprob_base =
818*437bfbebSnyanmisaka mpp_buffer_get_fd(hw_ctx->prob_loop_base[frame_ctx_id]);
819*437bfbebSnyanmisaka }
820*437bfbebSnyanmisaka vp9_hw_regs->vp9d_addrs.reg183_kfprob_base = mpp_buffer_get_fd(hw_ctx->probe_base);
821*437bfbebSnyanmisaka #ifdef DUMP_VDPU383_DATAS
822*437bfbebSnyanmisaka {
823*437bfbebSnyanmisaka char *cur_fname = "cabac_last_probe.dat";
824*437bfbebSnyanmisaka memset(dump_cur_fname_path, 0, sizeof(dump_cur_fname_path));
825*437bfbebSnyanmisaka sprintf(dump_cur_fname_path, "%s/%s", dump_cur_dir, cur_fname);
826*437bfbebSnyanmisaka dump_data_to_file(dump_cur_fname_path, (void *)mpp_buffer_get_ptr(cur_last_prob_base),
827*437bfbebSnyanmisaka 8 * 152 * 16, 128, 0);
828*437bfbebSnyanmisaka }
829*437bfbebSnyanmisaka {
830*437bfbebSnyanmisaka char *cur_fname = "cabac_kf_probe.dat";
831*437bfbebSnyanmisaka memset(dump_cur_fname_path, 0, sizeof(dump_cur_fname_path));
832*437bfbebSnyanmisaka sprintf(dump_cur_fname_path, "%s/%s", dump_cur_dir, cur_fname);
833*437bfbebSnyanmisaka dump_data_to_file(dump_cur_fname_path, (void *)mpp_buffer_get_ptr(hw_ctx->probe_base),
834*437bfbebSnyanmisaka 8 * PROB_KF_SIZE, 128, 0);
835*437bfbebSnyanmisaka }
836*437bfbebSnyanmisaka #endif
837*437bfbebSnyanmisaka #else
838*437bfbebSnyanmisaka #endif
839*437bfbebSnyanmisaka
840*437bfbebSnyanmisaka vp9_hw_regs->vp9d_paras.reg66_stream_len = ((stream_len + 15) & (~15)) + 0x80;
841*437bfbebSnyanmisaka
842*437bfbebSnyanmisaka mpp_buf_slot_get_prop(p_hal->packet_slots, task->dec.input, SLOT_BUFFER, &streambuf);
843*437bfbebSnyanmisaka bitstream = mpp_buffer_get_ptr(streambuf);
844*437bfbebSnyanmisaka aglin_offset = vp9_hw_regs->vp9d_paras.reg66_stream_len - stream_len;
845*437bfbebSnyanmisaka if (aglin_offset > 0) {
846*437bfbebSnyanmisaka memset((void *)(bitstream + stream_len), 0, aglin_offset);
847*437bfbebSnyanmisaka }
848*437bfbebSnyanmisaka
849*437bfbebSnyanmisaka //--- caculate the yuv_frame_size and mv_size
850*437bfbebSnyanmisaka bit_depth = pic_param->BitDepthMinus8Luma + 8;
851*437bfbebSnyanmisaka
852*437bfbebSnyanmisaka {
853*437bfbebSnyanmisaka mpp_buf_slot_get_prop(p_hal->slots, task->dec.output, SLOT_FRAME_PTR, &mframe);
854*437bfbebSnyanmisaka fbc_en = MPP_FRAME_FMT_IS_FBC(mpp_frame_get_fmt(mframe));
855*437bfbebSnyanmisaka
856*437bfbebSnyanmisaka if (fbc_en) {
857*437bfbebSnyanmisaka RK_U32 fbc_hdr_stride = mpp_frame_get_fbc_hdr_stride(mframe);
858*437bfbebSnyanmisaka RK_U32 h = MPP_ALIGN(mpp_frame_get_height(mframe), 64);
859*437bfbebSnyanmisaka RK_U32 fbd_offset;
860*437bfbebSnyanmisaka
861*437bfbebSnyanmisaka vp9_hw_regs->ctrl_regs.reg9.fbc_e = 1;
862*437bfbebSnyanmisaka vp9_hw_regs->vp9d_paras.reg68_hor_virstride = fbc_hdr_stride / 64;
863*437bfbebSnyanmisaka fbd_offset = vp9_hw_regs->vp9d_paras.reg68_hor_virstride * h * 4;
864*437bfbebSnyanmisaka vp9_hw_regs->vp9d_addrs.reg193_fbc_payload_offset = fbd_offset;
865*437bfbebSnyanmisaka /* error stride */
866*437bfbebSnyanmisaka vp9_hw_regs->vp9d_paras.reg80_error_ref_hor_virstride = fbc_hdr_stride / 64;
867*437bfbebSnyanmisaka } else {
868*437bfbebSnyanmisaka sw_y_hor_virstride = mpp_frame_get_hor_stride(mframe) >> 4;
869*437bfbebSnyanmisaka sw_uv_hor_virstride = sw_y_hor_virstride;
870*437bfbebSnyanmisaka sw_y_virstride = mpp_frame_get_ver_stride(mframe) * sw_y_hor_virstride;
871*437bfbebSnyanmisaka sw_uv_virstride = sw_y_virstride / 2;
872*437bfbebSnyanmisaka
873*437bfbebSnyanmisaka vp9_hw_regs->ctrl_regs.reg9.fbc_e = 0;
874*437bfbebSnyanmisaka if (MPP_FRAME_FMT_IS_TILE(mpp_frame_get_fmt(mframe))) {
875*437bfbebSnyanmisaka vp9_hw_regs->ctrl_regs.reg9.tile_e = 1;
876*437bfbebSnyanmisaka vp9_hw_regs->vp9d_paras.reg68_hor_virstride = sw_y_hor_virstride * 6;
877*437bfbebSnyanmisaka vp9_hw_regs->vp9d_paras.reg70_y_virstride = sw_y_virstride + sw_uv_virstride;
878*437bfbebSnyanmisaka } else {
879*437bfbebSnyanmisaka vp9_hw_regs->ctrl_regs.reg9.tile_e = 0;
880*437bfbebSnyanmisaka vp9_hw_regs->vp9d_paras.reg68_hor_virstride = sw_y_hor_virstride;
881*437bfbebSnyanmisaka vp9_hw_regs->vp9d_paras.reg69_raster_uv_hor_virstride = sw_uv_hor_virstride;
882*437bfbebSnyanmisaka vp9_hw_regs->vp9d_paras.reg70_y_virstride = sw_y_virstride;
883*437bfbebSnyanmisaka }
884*437bfbebSnyanmisaka /* error stride */
885*437bfbebSnyanmisaka vp9_hw_regs->vp9d_paras.reg80_error_ref_hor_virstride = sw_y_hor_virstride;
886*437bfbebSnyanmisaka vp9_hw_regs->vp9d_paras.reg81_error_ref_raster_uv_hor_virstride = sw_uv_hor_virstride;
887*437bfbebSnyanmisaka vp9_hw_regs->vp9d_paras.reg82_error_ref_virstride = sw_y_virstride;
888*437bfbebSnyanmisaka }
889*437bfbebSnyanmisaka }
890*437bfbebSnyanmisaka if (!pic_param->intra_only && pic_param->frame_type &&
891*437bfbebSnyanmisaka !pic_param->error_resilient_mode && hw_ctx->ls_info.last_show_frame) {
892*437bfbebSnyanmisaka hw_ctx->pre_mv_base_addr = hw_ctx->mv_base_addr;
893*437bfbebSnyanmisaka }
894*437bfbebSnyanmisaka
895*437bfbebSnyanmisaka mpp_buf_slot_get_prop(p_hal->slots, task->dec.output, SLOT_FRAME_PTR, &mframe);
896*437bfbebSnyanmisaka mpp_buf_slot_get_prop(p_hal ->slots, task->dec.output, SLOT_BUFFER, &framebuf);
897*437bfbebSnyanmisaka if (mpp_frame_get_thumbnail_en(mframe) == MPP_FRAME_THUMBNAIL_ONLY) {
898*437bfbebSnyanmisaka origin_buf = hal_bufs_get_buf(hw_ctx->origin_bufs, task->dec.output);
899*437bfbebSnyanmisaka framebuf = origin_buf->buf[0];
900*437bfbebSnyanmisaka }
901*437bfbebSnyanmisaka vp9_hw_regs->vp9d_addrs.reg168_decout_base = mpp_buffer_get_fd(framebuf);
902*437bfbebSnyanmisaka vp9_hw_regs->vp9d_addrs.reg169_error_ref_base = mpp_buffer_get_fd(framebuf);
903*437bfbebSnyanmisaka vp9_hw_regs->vp9d_addrs.reg192_payload_st_cur_base = mpp_buffer_get_fd(framebuf);
904*437bfbebSnyanmisaka vp9_hw_regs->vp9d_addrs.reg194_payload_st_error_ref_base = mpp_buffer_get_fd(framebuf);
905*437bfbebSnyanmisaka vp9_hw_regs->common_addr.reg128_strm_base = mpp_buffer_get_fd(streambuf);
906*437bfbebSnyanmisaka
907*437bfbebSnyanmisaka {
908*437bfbebSnyanmisaka RK_U32 strm_offset = pic_param->uncompressed_header_size_byte_aligned;
909*437bfbebSnyanmisaka
910*437bfbebSnyanmisaka vp9_hw_regs->vp9d_paras.reg65_strm_start_bit = 8 * (strm_offset & 0xf);
911*437bfbebSnyanmisaka mpp_dev_set_reg_offset(p_hal->dev, 128, strm_offset & 0xfffffff0);
912*437bfbebSnyanmisaka }
913*437bfbebSnyanmisaka
914*437bfbebSnyanmisaka if (hw_ctx->last_segid_flag) {
915*437bfbebSnyanmisaka vp9_hw_regs->vp9d_addrs.reg181_segidlast_base = mpp_buffer_get_fd(hw_ctx->segid_last_base);
916*437bfbebSnyanmisaka vp9_hw_regs->vp9d_addrs.reg182_segidcur_base = mpp_buffer_get_fd(hw_ctx->segid_cur_base);
917*437bfbebSnyanmisaka } else {
918*437bfbebSnyanmisaka vp9_hw_regs->vp9d_addrs.reg181_segidlast_base = mpp_buffer_get_fd(hw_ctx->segid_cur_base);
919*437bfbebSnyanmisaka vp9_hw_regs->vp9d_addrs.reg182_segidcur_base = mpp_buffer_get_fd(hw_ctx->segid_last_base);
920*437bfbebSnyanmisaka }
921*437bfbebSnyanmisaka #ifdef DUMP_VDPU383_DATAS
922*437bfbebSnyanmisaka cur_last_segid_flag = hw_ctx->last_segid_flag;
923*437bfbebSnyanmisaka {
924*437bfbebSnyanmisaka char *cur_fname = "stream_in.dat";
925*437bfbebSnyanmisaka memset(dump_cur_fname_path, 0, sizeof(dump_cur_fname_path));
926*437bfbebSnyanmisaka sprintf(dump_cur_fname_path, "%s/%s", dump_cur_dir, cur_fname);
927*437bfbebSnyanmisaka dump_data_to_file(dump_cur_fname_path, (void *)mpp_buffer_get_ptr(streambuf)
928*437bfbebSnyanmisaka + pic_param->uncompressed_header_size_byte_aligned,
929*437bfbebSnyanmisaka 8 * (((stream_len + 15) & (~15)) + 0x80), 128, 0);
930*437bfbebSnyanmisaka }
931*437bfbebSnyanmisaka #endif
932*437bfbebSnyanmisaka /* set last segid flag */
933*437bfbebSnyanmisaka if ((pic_param->stVP9Segments.enabled && pic_param->stVP9Segments.update_map) ||
934*437bfbebSnyanmisaka (pic_param->width != hw_ctx->ls_info.last_width || pic_param->height != hw_ctx->ls_info.last_height) ||
935*437bfbebSnyanmisaka intraFlag || pic_param->error_resilient_mode) {
936*437bfbebSnyanmisaka hw_ctx->last_segid_flag = !hw_ctx->last_segid_flag;
937*437bfbebSnyanmisaka }
938*437bfbebSnyanmisaka //set cur colmv base
939*437bfbebSnyanmisaka mv_buf = hal_bufs_get_buf(hw_ctx->cmv_bufs, task->dec.output);
940*437bfbebSnyanmisaka
941*437bfbebSnyanmisaka vp9_hw_regs->vp9d_addrs.reg216_colmv_cur_base = mpp_buffer_get_fd(mv_buf->buf[0]);
942*437bfbebSnyanmisaka
943*437bfbebSnyanmisaka hw_ctx->mv_base_addr = vp9_hw_regs->vp9d_addrs.reg216_colmv_cur_base;
944*437bfbebSnyanmisaka if (hw_ctx->pre_mv_base_addr < 0)
945*437bfbebSnyanmisaka hw_ctx->pre_mv_base_addr = hw_ctx->mv_base_addr;
946*437bfbebSnyanmisaka
947*437bfbebSnyanmisaka // vp9 only one colmv
948*437bfbebSnyanmisaka vp9_hw_regs->vp9d_addrs.reg217_232_colmv_ref_base[0] = hw_ctx->pre_mv_base_addr;
949*437bfbebSnyanmisaka
950*437bfbebSnyanmisaka reg_ref_base = vp9_hw_regs->vp9d_addrs.reg170_185_ref_base;
951*437bfbebSnyanmisaka reg_payload_ref_base = vp9_hw_regs->vp9d_addrs.reg195_210_payload_st_ref_base;
952*437bfbebSnyanmisaka for (i = 0; i < 3; i++) {
953*437bfbebSnyanmisaka ref_idx = pic_param->frame_refs[i].Index7Bits;
954*437bfbebSnyanmisaka ref_frame_idx = pic_param->ref_frame_map[ref_idx].Index7Bits;
955*437bfbebSnyanmisaka ref_frame_width_y = pic_param->ref_frame_coded_width[ref_idx];
956*437bfbebSnyanmisaka ref_frame_height_y = pic_param->ref_frame_coded_height[ref_idx];
957*437bfbebSnyanmisaka if (ref_frame_idx < 0x7f)
958*437bfbebSnyanmisaka mpp_buf_slot_get_prop(p_hal ->slots, ref_frame_idx, SLOT_FRAME_PTR, &ref_frame);
959*437bfbebSnyanmisaka if (fbc_en) {
960*437bfbebSnyanmisaka y_hor_virstride = uv_hor_virstride = MPP_ALIGN(ref_frame_width_y, 64) / 64;
961*437bfbebSnyanmisaka if (*compat_ext_fbc_hdr_256_odd)
962*437bfbebSnyanmisaka y_hor_virstride = uv_hor_virstride = (MPP_ALIGN(ref_frame_width_y, 256) | 256) / 64;
963*437bfbebSnyanmisaka } else {
964*437bfbebSnyanmisaka if (ref_frame)
965*437bfbebSnyanmisaka y_hor_virstride = uv_hor_virstride = (mpp_frame_get_hor_stride(ref_frame) >> 4);
966*437bfbebSnyanmisaka else
967*437bfbebSnyanmisaka y_hor_virstride = uv_hor_virstride = (mpp_align_128_odd_plus_64((ref_frame_width_y * bit_depth) >> 3) >> 4);
968*437bfbebSnyanmisaka }
969*437bfbebSnyanmisaka if (ref_frame)
970*437bfbebSnyanmisaka y_virstride = y_hor_virstride * mpp_frame_get_ver_stride(ref_frame);
971*437bfbebSnyanmisaka else
972*437bfbebSnyanmisaka y_virstride = y_hor_virstride * vp9_ver_align(ref_frame_height_y);
973*437bfbebSnyanmisaka
974*437bfbebSnyanmisaka if (ref_frame_idx < 0x7f) {
975*437bfbebSnyanmisaka mpp_buf_slot_get_prop(p_hal ->slots, ref_frame_idx, SLOT_BUFFER, &framebuf);
976*437bfbebSnyanmisaka if (hw_ctx->origin_bufs && mpp_frame_get_thumbnail_en(mframe) == MPP_FRAME_THUMBNAIL_ONLY) {
977*437bfbebSnyanmisaka origin_buf = hal_bufs_get_buf(hw_ctx->origin_bufs, ref_frame_idx);
978*437bfbebSnyanmisaka framebuf = origin_buf->buf[0];
979*437bfbebSnyanmisaka }
980*437bfbebSnyanmisaka
981*437bfbebSnyanmisaka switch (i) {
982*437bfbebSnyanmisaka case 0: {
983*437bfbebSnyanmisaka vp9_hw_regs->vp9d_paras.reg83_ref0_hor_virstride = y_hor_virstride;
984*437bfbebSnyanmisaka vp9_hw_regs->vp9d_paras.reg84_ref0_raster_uv_hor_virstride = uv_hor_virstride;
985*437bfbebSnyanmisaka vp9_hw_regs->vp9d_paras.reg85_ref0_virstride = y_virstride;
986*437bfbebSnyanmisaka } break;
987*437bfbebSnyanmisaka case 1: {
988*437bfbebSnyanmisaka vp9_hw_regs->vp9d_paras.reg86_ref1_hor_virstride = y_hor_virstride;
989*437bfbebSnyanmisaka vp9_hw_regs->vp9d_paras.reg87_ref1_raster_uv_hor_virstride = uv_hor_virstride;
990*437bfbebSnyanmisaka vp9_hw_regs->vp9d_paras.reg88_ref1_virstride = y_virstride;
991*437bfbebSnyanmisaka } break;
992*437bfbebSnyanmisaka case 2: {
993*437bfbebSnyanmisaka vp9_hw_regs->vp9d_paras.reg89_ref2_hor_virstride = y_hor_virstride;
994*437bfbebSnyanmisaka vp9_hw_regs->vp9d_paras.reg90_ref2_raster_uv_hor_virstride = uv_hor_virstride;
995*437bfbebSnyanmisaka vp9_hw_regs->vp9d_paras.reg91_ref2_virstride = y_virstride;
996*437bfbebSnyanmisaka } break;
997*437bfbebSnyanmisaka default:
998*437bfbebSnyanmisaka break;
999*437bfbebSnyanmisaka }
1000*437bfbebSnyanmisaka
1001*437bfbebSnyanmisaka /*0 map to 11*/
1002*437bfbebSnyanmisaka /*1 map to 12*/
1003*437bfbebSnyanmisaka /*2 map to 13*/
1004*437bfbebSnyanmisaka if (framebuf != NULL) {
1005*437bfbebSnyanmisaka reg_ref_base[i] = mpp_buffer_get_fd(framebuf);
1006*437bfbebSnyanmisaka reg_payload_ref_base[i] = mpp_buffer_get_fd(framebuf);
1007*437bfbebSnyanmisaka } else {
1008*437bfbebSnyanmisaka mpp_log("ref buff address is no valid used out as base slot index 0x%x", ref_frame_idx);
1009*437bfbebSnyanmisaka reg_ref_base[i] = vp9_hw_regs->vp9d_addrs.reg168_decout_base;
1010*437bfbebSnyanmisaka reg_payload_ref_base[i] = vp9_hw_regs->vp9d_addrs.reg168_decout_base;
1011*437bfbebSnyanmisaka }
1012*437bfbebSnyanmisaka mv_buf = hal_bufs_get_buf(hw_ctx->cmv_bufs, ref_frame_idx);
1013*437bfbebSnyanmisaka } else {
1014*437bfbebSnyanmisaka reg_ref_base[i] = vp9_hw_regs->vp9d_addrs.reg168_decout_base;
1015*437bfbebSnyanmisaka reg_payload_ref_base[i] = vp9_hw_regs->vp9d_addrs.reg168_decout_base;
1016*437bfbebSnyanmisaka }
1017*437bfbebSnyanmisaka }
1018*437bfbebSnyanmisaka
1019*437bfbebSnyanmisaka /* common register setting */
1020*437bfbebSnyanmisaka vp9_hw_regs->ctrl_regs.reg8_dec_mode = 2; //set as vp9 dec
1021*437bfbebSnyanmisaka vp9_hw_regs->ctrl_regs.reg9.buf_empty_en = 0;
1022*437bfbebSnyanmisaka
1023*437bfbebSnyanmisaka vp9_hw_regs->ctrl_regs.reg10.strmd_auto_gating_e = 1;
1024*437bfbebSnyanmisaka vp9_hw_regs->ctrl_regs.reg10.inter_auto_gating_e = 1;
1025*437bfbebSnyanmisaka vp9_hw_regs->ctrl_regs.reg10.intra_auto_gating_e = 1;
1026*437bfbebSnyanmisaka vp9_hw_regs->ctrl_regs.reg10.transd_auto_gating_e = 1;
1027*437bfbebSnyanmisaka vp9_hw_regs->ctrl_regs.reg10.recon_auto_gating_e = 1;
1028*437bfbebSnyanmisaka vp9_hw_regs->ctrl_regs.reg10.filterd_auto_gating_e = 1;
1029*437bfbebSnyanmisaka vp9_hw_regs->ctrl_regs.reg10.bus_auto_gating_e = 1;
1030*437bfbebSnyanmisaka vp9_hw_regs->ctrl_regs.reg10.ctrl_auto_gating_e = 1;
1031*437bfbebSnyanmisaka vp9_hw_regs->ctrl_regs.reg10.rcb_auto_gating_e = 1;
1032*437bfbebSnyanmisaka vp9_hw_regs->ctrl_regs.reg10.err_prc_auto_gating_e = 1;
1033*437bfbebSnyanmisaka
1034*437bfbebSnyanmisaka vp9_hw_regs->ctrl_regs.reg16.error_proc_disable = 1;
1035*437bfbebSnyanmisaka vp9_hw_regs->ctrl_regs.reg16.error_spread_disable = 0;
1036*437bfbebSnyanmisaka vp9_hw_regs->ctrl_regs.reg16.roi_error_ctu_cal_en = 0;
1037*437bfbebSnyanmisaka
1038*437bfbebSnyanmisaka vp9_hw_regs->ctrl_regs.reg20_cabac_error_en_lowbits = 0xffffffdf;
1039*437bfbebSnyanmisaka vp9_hw_regs->ctrl_regs.reg21_cabac_error_en_highbits = 0x3fffffff;
1040*437bfbebSnyanmisaka
1041*437bfbebSnyanmisaka vp9_hw_regs->ctrl_regs.reg13_core_timeout_threshold = 0x3ffff;
1042*437bfbebSnyanmisaka
1043*437bfbebSnyanmisaka //last info update
1044*437bfbebSnyanmisaka hw_ctx->ls_info.abs_delta_last = pic_param->stVP9Segments.abs_delta;
1045*437bfbebSnyanmisaka for (i = 0 ; i < 4; i ++) {
1046*437bfbebSnyanmisaka hw_ctx->ls_info.last_ref_deltas[i] = pic_param->ref_deltas[i];
1047*437bfbebSnyanmisaka }
1048*437bfbebSnyanmisaka
1049*437bfbebSnyanmisaka for (i = 0 ; i < 2; i ++) {
1050*437bfbebSnyanmisaka hw_ctx->ls_info.last_mode_deltas[i] = pic_param->mode_deltas[i];
1051*437bfbebSnyanmisaka }
1052*437bfbebSnyanmisaka
1053*437bfbebSnyanmisaka for (i = 0; i < 8; i++) {
1054*437bfbebSnyanmisaka hw_ctx->ls_info.feature_data[i][0] = pic_param->stVP9Segments.feature_data[i][0];
1055*437bfbebSnyanmisaka hw_ctx->ls_info.feature_data[i][1] = pic_param->stVP9Segments.feature_data[i][1];
1056*437bfbebSnyanmisaka hw_ctx->ls_info.feature_data[i][2] = pic_param->stVP9Segments.feature_data[i][2];
1057*437bfbebSnyanmisaka hw_ctx->ls_info.feature_data[i][3] = pic_param->stVP9Segments.feature_data[i][3];
1058*437bfbebSnyanmisaka hw_ctx->ls_info.feature_mask[i] = pic_param->stVP9Segments.feature_mask[i];
1059*437bfbebSnyanmisaka }
1060*437bfbebSnyanmisaka if (!hw_ctx->ls_info.segmentation_enable_flag_last)
1061*437bfbebSnyanmisaka hw_ctx->ls_info.segmentation_enable_flag_last = pic_param->stVP9Segments.enabled;
1062*437bfbebSnyanmisaka
1063*437bfbebSnyanmisaka hw_ctx->ls_info.last_show_frame = pic_param->show_frame;
1064*437bfbebSnyanmisaka hw_ctx->ls_info.last_width = pic_param->width;
1065*437bfbebSnyanmisaka hw_ctx->ls_info.last_height = pic_param->height;
1066*437bfbebSnyanmisaka hw_ctx->ls_info.last_frame_type = pic_param->frame_type;
1067*437bfbebSnyanmisaka
1068*437bfbebSnyanmisaka if (intraFlag)
1069*437bfbebSnyanmisaka hw_ctx->ls_info.last_intra_only = 1;
1070*437bfbebSnyanmisaka
1071*437bfbebSnyanmisaka hw_ctx->ls_info.last_intra_only = (!pic_param->frame_type || pic_param->intra_only);
1072*437bfbebSnyanmisaka hal_vp9d_dbg_par("stVP9Segments.enabled %d show_frame %d width %d height %d last_intra_only %d",
1073*437bfbebSnyanmisaka pic_param->stVP9Segments.enabled, pic_param->show_frame,
1074*437bfbebSnyanmisaka pic_param->width, pic_param->height,
1075*437bfbebSnyanmisaka hw_ctx->ls_info.last_intra_only);
1076*437bfbebSnyanmisaka
1077*437bfbebSnyanmisaka hal_vp9d_rcb_info_update(hal, vp9_hw_regs, pic_param);
1078*437bfbebSnyanmisaka {
1079*437bfbebSnyanmisaka MppBuffer rcb_buf = NULL;
1080*437bfbebSnyanmisaka
1081*437bfbebSnyanmisaka rcb_buf = p_hal->fast_mode ? hw_ctx->g_buf[task->dec.reg_index].rcb_buf : hw_ctx->rcb_buf;
1082*437bfbebSnyanmisaka vdpu383_setup_rcb(&vp9_hw_regs->common_addr, p_hal->dev, rcb_buf, hw_ctx->rcb_info);
1083*437bfbebSnyanmisaka }
1084*437bfbebSnyanmisaka vdpu383_setup_statistic(&vp9_hw_regs->ctrl_regs);
1085*437bfbebSnyanmisaka // whether need update counts
1086*437bfbebSnyanmisaka if (pic_param->refresh_frame_context && !pic_param->parallelmode) {
1087*437bfbebSnyanmisaka task->dec.flags.wait_done = 1;
1088*437bfbebSnyanmisaka }
1089*437bfbebSnyanmisaka
1090*437bfbebSnyanmisaka {
1091*437bfbebSnyanmisaka //scale down config
1092*437bfbebSnyanmisaka MppBuffer mbuffer = NULL;
1093*437bfbebSnyanmisaka RK_S32 fd = -1;
1094*437bfbebSnyanmisaka MppFrameThumbnailMode thumbnail_mode;
1095*437bfbebSnyanmisaka
1096*437bfbebSnyanmisaka mpp_buf_slot_get_prop(p_hal->slots, task->dec.output,
1097*437bfbebSnyanmisaka SLOT_BUFFER, &mbuffer);
1098*437bfbebSnyanmisaka mpp_buf_slot_get_prop(p_hal->slots, task->dec.output,
1099*437bfbebSnyanmisaka SLOT_FRAME_PTR, &mframe);
1100*437bfbebSnyanmisaka thumbnail_mode = mpp_frame_get_thumbnail_en(mframe);
1101*437bfbebSnyanmisaka switch (thumbnail_mode) {
1102*437bfbebSnyanmisaka case MPP_FRAME_THUMBNAIL_ONLY:
1103*437bfbebSnyanmisaka vp9_hw_regs->common_addr.reg133_scale_down_base = mpp_buffer_get_fd(mbuffer);
1104*437bfbebSnyanmisaka origin_buf = hal_bufs_get_buf(hw_ctx->origin_bufs, task->dec.output);
1105*437bfbebSnyanmisaka fd = mpp_buffer_get_fd(origin_buf->buf[0]);
1106*437bfbebSnyanmisaka vp9_hw_regs->vp9d_addrs.reg168_decout_base = fd;
1107*437bfbebSnyanmisaka vp9_hw_regs->vp9d_addrs.reg169_error_ref_base = fd;
1108*437bfbebSnyanmisaka vp9_hw_regs->vp9d_addrs.reg192_payload_st_cur_base = fd;
1109*437bfbebSnyanmisaka vp9_hw_regs->vp9d_addrs.reg194_payload_st_error_ref_base = fd;
1110*437bfbebSnyanmisaka vdpu383_setup_down_scale(mframe, p_hal->dev, &vp9_hw_regs->ctrl_regs,
1111*437bfbebSnyanmisaka (void *)&vp9_hw_regs->vp9d_paras);
1112*437bfbebSnyanmisaka break;
1113*437bfbebSnyanmisaka case MPP_FRAME_THUMBNAIL_MIXED:
1114*437bfbebSnyanmisaka vp9_hw_regs->common_addr.reg133_scale_down_base = mpp_buffer_get_fd(mbuffer);
1115*437bfbebSnyanmisaka vdpu383_setup_down_scale(mframe, p_hal->dev, &vp9_hw_regs->ctrl_regs,
1116*437bfbebSnyanmisaka (void *)&vp9_hw_regs->vp9d_paras);
1117*437bfbebSnyanmisaka break;
1118*437bfbebSnyanmisaka case MPP_FRAME_THUMBNAIL_NONE:
1119*437bfbebSnyanmisaka default:
1120*437bfbebSnyanmisaka vp9_hw_regs->ctrl_regs.reg9.scale_down_en = 0;
1121*437bfbebSnyanmisaka break;
1122*437bfbebSnyanmisaka }
1123*437bfbebSnyanmisaka }
1124*437bfbebSnyanmisaka
1125*437bfbebSnyanmisaka return MPP_OK;
1126*437bfbebSnyanmisaka }
1127*437bfbebSnyanmisaka
hal_vp9d_vdpu383_start(void * hal,HalTaskInfo * task)1128*437bfbebSnyanmisaka static MPP_RET hal_vp9d_vdpu383_start(void *hal, HalTaskInfo *task)
1129*437bfbebSnyanmisaka {
1130*437bfbebSnyanmisaka MPP_RET ret = MPP_OK;
1131*437bfbebSnyanmisaka HalVp9dCtx *p_hal = (HalVp9dCtx*)hal;
1132*437bfbebSnyanmisaka Vdpu383Vp9dCtx *hw_ctx = (Vdpu383Vp9dCtx*)p_hal->hw_ctx;
1133*437bfbebSnyanmisaka Vdpu383Vp9dRegSet *hw_regs = (Vdpu383Vp9dRegSet *)hw_ctx->hw_regs;
1134*437bfbebSnyanmisaka MppDev dev = p_hal->dev;
1135*437bfbebSnyanmisaka
1136*437bfbebSnyanmisaka if (p_hal->fast_mode) {
1137*437bfbebSnyanmisaka RK_S32 index = task->dec.reg_index;
1138*437bfbebSnyanmisaka
1139*437bfbebSnyanmisaka hw_regs = (Vdpu383Vp9dRegSet *)hw_ctx->g_buf[index].hw_regs;
1140*437bfbebSnyanmisaka }
1141*437bfbebSnyanmisaka
1142*437bfbebSnyanmisaka mpp_assert(hw_regs);
1143*437bfbebSnyanmisaka
1144*437bfbebSnyanmisaka do {
1145*437bfbebSnyanmisaka MppDevRegWrCfg wr_cfg;
1146*437bfbebSnyanmisaka MppDevRegRdCfg rd_cfg;
1147*437bfbebSnyanmisaka
1148*437bfbebSnyanmisaka wr_cfg.reg = &hw_regs->ctrl_regs;
1149*437bfbebSnyanmisaka wr_cfg.size = sizeof(hw_regs->ctrl_regs);
1150*437bfbebSnyanmisaka wr_cfg.offset = OFFSET_CTRL_REGS;
1151*437bfbebSnyanmisaka ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &wr_cfg);
1152*437bfbebSnyanmisaka if (ret) {
1153*437bfbebSnyanmisaka mpp_err_f("set register write failed %d\n", ret);
1154*437bfbebSnyanmisaka break;
1155*437bfbebSnyanmisaka }
1156*437bfbebSnyanmisaka
1157*437bfbebSnyanmisaka wr_cfg.reg = &hw_regs->common_addr;
1158*437bfbebSnyanmisaka wr_cfg.size = sizeof(hw_regs->common_addr);
1159*437bfbebSnyanmisaka wr_cfg.offset = OFFSET_COMMON_ADDR_REGS;
1160*437bfbebSnyanmisaka ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &wr_cfg);
1161*437bfbebSnyanmisaka if (ret) {
1162*437bfbebSnyanmisaka mpp_err_f("set register write failed %d\n", ret);
1163*437bfbebSnyanmisaka break;
1164*437bfbebSnyanmisaka }
1165*437bfbebSnyanmisaka
1166*437bfbebSnyanmisaka wr_cfg.reg = &hw_regs->vp9d_paras;
1167*437bfbebSnyanmisaka wr_cfg.size = sizeof(hw_regs->vp9d_paras);
1168*437bfbebSnyanmisaka wr_cfg.offset = OFFSET_CODEC_PARAS_REGS;
1169*437bfbebSnyanmisaka ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &wr_cfg);
1170*437bfbebSnyanmisaka if (ret) {
1171*437bfbebSnyanmisaka mpp_err_f("set register write failed %d\n", ret);
1172*437bfbebSnyanmisaka break;
1173*437bfbebSnyanmisaka }
1174*437bfbebSnyanmisaka
1175*437bfbebSnyanmisaka wr_cfg.reg = &hw_regs->vp9d_addrs;
1176*437bfbebSnyanmisaka wr_cfg.size = sizeof(hw_regs->vp9d_addrs);
1177*437bfbebSnyanmisaka wr_cfg.offset = OFFSET_CODEC_ADDR_REGS;
1178*437bfbebSnyanmisaka ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &wr_cfg);
1179*437bfbebSnyanmisaka if (ret) {
1180*437bfbebSnyanmisaka mpp_err_f("set register write failed %d\n", ret);
1181*437bfbebSnyanmisaka break;
1182*437bfbebSnyanmisaka }
1183*437bfbebSnyanmisaka
1184*437bfbebSnyanmisaka rd_cfg.reg = &hw_regs->ctrl_regs.reg15;
1185*437bfbebSnyanmisaka rd_cfg.size = sizeof(hw_regs->ctrl_regs.reg15);
1186*437bfbebSnyanmisaka rd_cfg.offset = OFFSET_INTERRUPT_REGS;
1187*437bfbebSnyanmisaka ret = mpp_dev_ioctl(dev, MPP_DEV_REG_RD, &rd_cfg);
1188*437bfbebSnyanmisaka if (ret) {
1189*437bfbebSnyanmisaka mpp_err_f("set register read failed %d\n", ret);
1190*437bfbebSnyanmisaka break;
1191*437bfbebSnyanmisaka }
1192*437bfbebSnyanmisaka
1193*437bfbebSnyanmisaka // rcb info for sram
1194*437bfbebSnyanmisaka vdpu383_set_rcbinfo(dev, hw_ctx->rcb_info);
1195*437bfbebSnyanmisaka
1196*437bfbebSnyanmisaka ret = mpp_dev_ioctl(dev, MPP_DEV_CMD_SEND, NULL);
1197*437bfbebSnyanmisaka if (ret) {
1198*437bfbebSnyanmisaka mpp_err_f("send cmd failed %d\n", ret);
1199*437bfbebSnyanmisaka break;
1200*437bfbebSnyanmisaka }
1201*437bfbebSnyanmisaka } while (0);
1202*437bfbebSnyanmisaka
1203*437bfbebSnyanmisaka return ret;
1204*437bfbebSnyanmisaka }
1205*437bfbebSnyanmisaka
hal_vp9d_vdpu383_wait(void * hal,HalTaskInfo * task)1206*437bfbebSnyanmisaka static MPP_RET hal_vp9d_vdpu383_wait(void *hal, HalTaskInfo *task)
1207*437bfbebSnyanmisaka {
1208*437bfbebSnyanmisaka MPP_RET ret = MPP_OK;
1209*437bfbebSnyanmisaka HalVp9dCtx *p_hal = (HalVp9dCtx*)hal;
1210*437bfbebSnyanmisaka Vdpu383Vp9dCtx *hw_ctx = (Vdpu383Vp9dCtx*)p_hal->hw_ctx;
1211*437bfbebSnyanmisaka Vdpu383Vp9dRegSet *hw_regs = (Vdpu383Vp9dRegSet *)hw_ctx->hw_regs;
1212*437bfbebSnyanmisaka
1213*437bfbebSnyanmisaka if (p_hal->fast_mode)
1214*437bfbebSnyanmisaka hw_regs = (Vdpu383Vp9dRegSet *)hw_ctx->g_buf[task->dec.reg_index].hw_regs;
1215*437bfbebSnyanmisaka
1216*437bfbebSnyanmisaka mpp_assert(hw_regs);
1217*437bfbebSnyanmisaka
1218*437bfbebSnyanmisaka ret = mpp_dev_ioctl(p_hal->dev, MPP_DEV_CMD_POLL, NULL);
1219*437bfbebSnyanmisaka if (ret)
1220*437bfbebSnyanmisaka mpp_err_f("poll cmd failed %d\n", ret);
1221*437bfbebSnyanmisaka #ifdef DUMP_VDPU383_DATAS
1222*437bfbebSnyanmisaka {
1223*437bfbebSnyanmisaka char *cur_fname = "cabac_update_probe.dat";
1224*437bfbebSnyanmisaka DXVA_PicParams_VP9 *pic_param = (DXVA_PicParams_VP9*)task->dec.syntax.data;
1225*437bfbebSnyanmisaka RK_U32 frame_ctx_id = pic_param->frame_context_idx;
1226*437bfbebSnyanmisaka memset(dump_cur_fname_path, 0, sizeof(dump_cur_fname_path));
1227*437bfbebSnyanmisaka sprintf(dump_cur_fname_path, "%s/%s", dump_cur_dir, cur_fname);
1228*437bfbebSnyanmisaka dump_data_to_file(dump_cur_fname_path,
1229*437bfbebSnyanmisaka (void *)mpp_buffer_get_ptr(hw_ctx->prob_loop_base[frame_ctx_id]),
1230*437bfbebSnyanmisaka 8 * 152 * 16, 128, 0);
1231*437bfbebSnyanmisaka }
1232*437bfbebSnyanmisaka {
1233*437bfbebSnyanmisaka char *cur_fname = "segid_last.dat";
1234*437bfbebSnyanmisaka memset(dump_cur_fname_path, 0, sizeof(dump_cur_fname_path));
1235*437bfbebSnyanmisaka sprintf(dump_cur_fname_path, "%s/%s", dump_cur_dir, cur_fname);
1236*437bfbebSnyanmisaka if (!cur_last_segid_flag)
1237*437bfbebSnyanmisaka dump_data_to_file(dump_cur_fname_path,
1238*437bfbebSnyanmisaka (void *)mpp_buffer_get_ptr(hw_ctx->segid_cur_base),
1239*437bfbebSnyanmisaka 8 * 1559 * 8, 64, 0);
1240*437bfbebSnyanmisaka else
1241*437bfbebSnyanmisaka dump_data_to_file(dump_cur_fname_path,
1242*437bfbebSnyanmisaka (void *)mpp_buffer_get_ptr(hw_ctx->segid_last_base),
1243*437bfbebSnyanmisaka 8 * 1559 * 8, 64, 0);
1244*437bfbebSnyanmisaka }
1245*437bfbebSnyanmisaka {
1246*437bfbebSnyanmisaka char *cur_fname = "segid_cur.dat";
1247*437bfbebSnyanmisaka memset(dump_cur_fname_path, 0, sizeof(dump_cur_fname_path));
1248*437bfbebSnyanmisaka sprintf(dump_cur_fname_path, "%s/%s", dump_cur_dir, cur_fname);
1249*437bfbebSnyanmisaka if (cur_last_segid_flag)
1250*437bfbebSnyanmisaka dump_data_to_file(dump_cur_fname_path,
1251*437bfbebSnyanmisaka (void *)mpp_buffer_get_ptr(hw_ctx->segid_cur_base),
1252*437bfbebSnyanmisaka 8 * 1559 * 8, 64, 0);
1253*437bfbebSnyanmisaka else
1254*437bfbebSnyanmisaka dump_data_to_file(dump_cur_fname_path,
1255*437bfbebSnyanmisaka (void *)mpp_buffer_get_ptr(hw_ctx->segid_last_base),
1256*437bfbebSnyanmisaka 8 * 1559 * 8, 64, 0);
1257*437bfbebSnyanmisaka }
1258*437bfbebSnyanmisaka #endif
1259*437bfbebSnyanmisaka
1260*437bfbebSnyanmisaka if (hal_vp9d_debug & HAL_VP9D_DBG_REG) {
1261*437bfbebSnyanmisaka RK_U32 *p = (RK_U32 *)hw_regs;
1262*437bfbebSnyanmisaka RK_U32 i = 0;
1263*437bfbebSnyanmisaka
1264*437bfbebSnyanmisaka for (i = 0; i < sizeof(Vdpu383Vp9dRegSet) / 4; i++)
1265*437bfbebSnyanmisaka mpp_log("get regs[%02d]: %08X\n", i, *p++);
1266*437bfbebSnyanmisaka }
1267*437bfbebSnyanmisaka
1268*437bfbebSnyanmisaka if (task->dec.flags.parse_err ||
1269*437bfbebSnyanmisaka task->dec.flags.ref_err ||
1270*437bfbebSnyanmisaka (!hw_regs->ctrl_regs.reg15.rkvdec_frame_rdy_sta) ||
1271*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg15.rkvdec_strm_error_sta ||
1272*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg15.rkvdec_core_timeout_sta ||
1273*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg15.rkvdec_ip_timeout_sta ||
1274*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg15.rkvdec_bus_error_sta ||
1275*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg15.rkvdec_buffer_empty_sta ||
1276*437bfbebSnyanmisaka hw_regs->ctrl_regs.reg15.rkvdec_colmv_ref_error_sta) {
1277*437bfbebSnyanmisaka MppFrame mframe = NULL;
1278*437bfbebSnyanmisaka
1279*437bfbebSnyanmisaka mpp_buf_slot_get_prop(p_hal->slots, task->dec.output, SLOT_FRAME_PTR, &mframe);
1280*437bfbebSnyanmisaka mpp_frame_set_errinfo(mframe, 1);
1281*437bfbebSnyanmisaka }
1282*437bfbebSnyanmisaka
1283*437bfbebSnyanmisaka #if !HW_PROB
1284*437bfbebSnyanmisaka if (p_hal->dec_cb && task->dec.flags.wait_done) {
1285*437bfbebSnyanmisaka DXVA_PicParams_VP9 *pic_param = (DXVA_PicParams_VP9*)task->dec.syntax.data;
1286*437bfbebSnyanmisaka hal_vp9d_update_counts(mpp_buffer_get_ptr(hw_ctx->count_base), task->dec.syntax.data);
1287*437bfbebSnyanmisaka mpp_callback(p_hal->dec_cb, &pic_param->counts);
1288*437bfbebSnyanmisaka }
1289*437bfbebSnyanmisaka #endif
1290*437bfbebSnyanmisaka if (p_hal->fast_mode) {
1291*437bfbebSnyanmisaka hw_ctx->g_buf[task->dec.reg_index].use_flag = 0;
1292*437bfbebSnyanmisaka }
1293*437bfbebSnyanmisaka
1294*437bfbebSnyanmisaka (void)task;
1295*437bfbebSnyanmisaka return ret;
1296*437bfbebSnyanmisaka }
1297*437bfbebSnyanmisaka
hal_vp9d_vdpu383_reset(void * hal)1298*437bfbebSnyanmisaka static MPP_RET hal_vp9d_vdpu383_reset(void *hal)
1299*437bfbebSnyanmisaka {
1300*437bfbebSnyanmisaka HalVp9dCtx *p_hal = (HalVp9dCtx*)hal;
1301*437bfbebSnyanmisaka Vdpu383Vp9dCtx *hw_ctx = (Vdpu383Vp9dCtx*)p_hal->hw_ctx;
1302*437bfbebSnyanmisaka
1303*437bfbebSnyanmisaka hal_vp9d_enter();
1304*437bfbebSnyanmisaka
1305*437bfbebSnyanmisaka memset(&hw_ctx->ls_info, 0, sizeof(hw_ctx->ls_info));
1306*437bfbebSnyanmisaka hw_ctx->mv_base_addr = -1;
1307*437bfbebSnyanmisaka hw_ctx->pre_mv_base_addr = -1;
1308*437bfbebSnyanmisaka hw_ctx->last_segid_flag = 1;
1309*437bfbebSnyanmisaka
1310*437bfbebSnyanmisaka hal_vp9d_leave();
1311*437bfbebSnyanmisaka
1312*437bfbebSnyanmisaka return MPP_OK;
1313*437bfbebSnyanmisaka }
1314*437bfbebSnyanmisaka
hal_vp9d_vdpu383_flush(void * hal)1315*437bfbebSnyanmisaka static MPP_RET hal_vp9d_vdpu383_flush(void *hal)
1316*437bfbebSnyanmisaka {
1317*437bfbebSnyanmisaka HalVp9dCtx *p_hal = (HalVp9dCtx*)hal;
1318*437bfbebSnyanmisaka Vdpu383Vp9dCtx *hw_ctx = (Vdpu383Vp9dCtx*)p_hal->hw_ctx;
1319*437bfbebSnyanmisaka
1320*437bfbebSnyanmisaka hal_vp9d_enter();
1321*437bfbebSnyanmisaka
1322*437bfbebSnyanmisaka hw_ctx->mv_base_addr = -1;
1323*437bfbebSnyanmisaka hw_ctx->pre_mv_base_addr = -1;
1324*437bfbebSnyanmisaka
1325*437bfbebSnyanmisaka hal_vp9d_leave();
1326*437bfbebSnyanmisaka
1327*437bfbebSnyanmisaka return MPP_OK;
1328*437bfbebSnyanmisaka }
1329*437bfbebSnyanmisaka
hal_vp9d_vdpu383_control(void * hal,MpiCmd cmd_type,void * param)1330*437bfbebSnyanmisaka static MPP_RET hal_vp9d_vdpu383_control(void *hal, MpiCmd cmd_type, void *param)
1331*437bfbebSnyanmisaka {
1332*437bfbebSnyanmisaka HalVp9dCtx *p_hal = (HalVp9dCtx*)hal;
1333*437bfbebSnyanmisaka
1334*437bfbebSnyanmisaka switch ((MpiCmd)cmd_type) {
1335*437bfbebSnyanmisaka case MPP_DEC_SET_FRAME_INFO : {
1336*437bfbebSnyanmisaka MppFrameFormat fmt = mpp_frame_get_fmt((MppFrame)param);
1337*437bfbebSnyanmisaka
1338*437bfbebSnyanmisaka if (MPP_FRAME_FMT_IS_FBC(fmt)) {
1339*437bfbebSnyanmisaka vdpu383_afbc_align_calc(p_hal->slots, (MppFrame)param, 0);
1340*437bfbebSnyanmisaka } else {
1341*437bfbebSnyanmisaka mpp_slots_set_prop(p_hal->slots, SLOTS_HOR_ALIGN, mpp_align_128_odd_plus_64);
1342*437bfbebSnyanmisaka }
1343*437bfbebSnyanmisaka } break;
1344*437bfbebSnyanmisaka case MPP_DEC_GET_THUMBNAIL_FRAME_INFO: {
1345*437bfbebSnyanmisaka vdpu383_update_thumbnail_frame_info((MppFrame)param);
1346*437bfbebSnyanmisaka } break;
1347*437bfbebSnyanmisaka default : {
1348*437bfbebSnyanmisaka } break;
1349*437bfbebSnyanmisaka }
1350*437bfbebSnyanmisaka
1351*437bfbebSnyanmisaka return MPP_OK;
1352*437bfbebSnyanmisaka }
1353*437bfbebSnyanmisaka
1354*437bfbebSnyanmisaka const MppHalApi hal_vp9d_vdpu383 = {
1355*437bfbebSnyanmisaka .name = "vp9d_vdpu383",
1356*437bfbebSnyanmisaka .type = MPP_CTX_DEC,
1357*437bfbebSnyanmisaka .coding = MPP_VIDEO_CodingVP9,
1358*437bfbebSnyanmisaka .ctx_size = sizeof(Vdpu383Vp9dCtx),
1359*437bfbebSnyanmisaka .flag = 0,
1360*437bfbebSnyanmisaka .init = hal_vp9d_vdpu383_init,
1361*437bfbebSnyanmisaka .deinit = hal_vp9d_vdpu383_deinit,
1362*437bfbebSnyanmisaka .reg_gen = hal_vp9d_vdpu383_gen_regs,
1363*437bfbebSnyanmisaka .start = hal_vp9d_vdpu383_start,
1364*437bfbebSnyanmisaka .wait = hal_vp9d_vdpu383_wait,
1365*437bfbebSnyanmisaka .reset = hal_vp9d_vdpu383_reset,
1366*437bfbebSnyanmisaka .flush = hal_vp9d_vdpu383_flush,
1367*437bfbebSnyanmisaka .control = hal_vp9d_vdpu383_control,
1368*437bfbebSnyanmisaka };
1369