xref: /rockchip-linux_mpp/mpp/hal/rkdec/vp9d/hal_vp9d_vdpu34x.c (revision 437bfbeb9567cca9cd9080e3f6954aa9d6a94f18)
1*437bfbebSnyanmisaka /*
2*437bfbebSnyanmisaka  * Copyright 2020 Rockchip Electronics Co. LTD
3*437bfbebSnyanmisaka  *
4*437bfbebSnyanmisaka  * Licensed under the Apache License, Version 2.0 (the "License");
5*437bfbebSnyanmisaka  * you may not use this file except in compliance with the License.
6*437bfbebSnyanmisaka  * You may obtain a copy of the License at
7*437bfbebSnyanmisaka  *
8*437bfbebSnyanmisaka  *      http://www.apache.org/licenses/LICENSE-2.0
9*437bfbebSnyanmisaka  *
10*437bfbebSnyanmisaka  * Unless required by applicable law or agreed to in writing, software
11*437bfbebSnyanmisaka  * distributed under the License is distributed on an "AS IS" BASIS,
12*437bfbebSnyanmisaka  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13*437bfbebSnyanmisaka  * See the License for the specific language governing permissions and
14*437bfbebSnyanmisaka  * limitations under the License.
15*437bfbebSnyanmisaka  */
16*437bfbebSnyanmisaka 
17*437bfbebSnyanmisaka #define MODULE_TAG "hal_vp9d_vdpu34x"
18*437bfbebSnyanmisaka 
19*437bfbebSnyanmisaka #include <stdio.h>
20*437bfbebSnyanmisaka #include <string.h>
21*437bfbebSnyanmisaka 
22*437bfbebSnyanmisaka #include "mpp_env.h"
23*437bfbebSnyanmisaka #include "mpp_mem.h"
24*437bfbebSnyanmisaka #include "mpp_common.h"
25*437bfbebSnyanmisaka #include "mpp_device.h"
26*437bfbebSnyanmisaka #include "mpp_hal.h"
27*437bfbebSnyanmisaka 
28*437bfbebSnyanmisaka #include "hal_bufs.h"
29*437bfbebSnyanmisaka #include "hal_vp9d_debug.h"
30*437bfbebSnyanmisaka #include "hal_vp9d_com.h"
31*437bfbebSnyanmisaka #include "hal_vp9d_vdpu34x.h"
32*437bfbebSnyanmisaka #include "hal_vp9d_ctx.h"
33*437bfbebSnyanmisaka #include "vdpu34x_vp9d.h"
34*437bfbebSnyanmisaka #include "vp9d_syntax.h"
35*437bfbebSnyanmisaka 
36*437bfbebSnyanmisaka #define HW_PROB 1
37*437bfbebSnyanmisaka #define VP9_CONTEXT 4
38*437bfbebSnyanmisaka #define VP9_CTU_SIZE 64
39*437bfbebSnyanmisaka #define PROB_SIZE_ALIGN_TO_4K MPP_ALIGN(PROB_SIZE, SZ_4K)
40*437bfbebSnyanmisaka #define COUNT_SIZE_ALIGN_TO_4K MPP_ALIGN(COUNT_SIZE, SZ_4K)
41*437bfbebSnyanmisaka #define MAX_SEGMAP_SIZE_ALIGN_TO_4K MPP_ALIGN(MAX_SEGMAP_SIZE, SZ_4K)
42*437bfbebSnyanmisaka 
43*437bfbebSnyanmisaka #define VDPU34X_OFFSET_COUNT (PROB_SIZE_ALIGN_TO_4K)
44*437bfbebSnyanmisaka #define VDPU34X_PROBE_BUFFER_SIZE (PROB_SIZE_ALIGN_TO_4K + COUNT_SIZE_ALIGN_TO_4K)
45*437bfbebSnyanmisaka 
46*437bfbebSnyanmisaka typedef struct Vdpu34xVp9dCtx_t {
47*437bfbebSnyanmisaka     Vp9dRegBuf      g_buf[MAX_GEN_REG];
48*437bfbebSnyanmisaka     MppBuffer       probe_base;
49*437bfbebSnyanmisaka     MppBuffer       seg_base;
50*437bfbebSnyanmisaka     RK_U32          offset_count;
51*437bfbebSnyanmisaka     RK_U32          offset_segid_cur;
52*437bfbebSnyanmisaka     RK_U32          offset_segid_last;
53*437bfbebSnyanmisaka     MppBuffer       prob_default_base;
54*437bfbebSnyanmisaka     void*           hw_regs;
55*437bfbebSnyanmisaka     RK_S32          mv_base_addr;
56*437bfbebSnyanmisaka     RK_S32          pre_mv_base_addr;
57*437bfbebSnyanmisaka     Vp9dLastInfo    ls_info;
58*437bfbebSnyanmisaka     /*
59*437bfbebSnyanmisaka      * swap between segid_cur_base & segid_last_base
60*437bfbebSnyanmisaka      * 0  used segid_cur_base as last
61*437bfbebSnyanmisaka      * 1  used segid_last_base as
62*437bfbebSnyanmisaka      */
63*437bfbebSnyanmisaka     RK_U32          last_segid_flag;
64*437bfbebSnyanmisaka     RK_S32          width;
65*437bfbebSnyanmisaka     RK_S32          height;
66*437bfbebSnyanmisaka     /* rcb buffers info */
67*437bfbebSnyanmisaka     RK_S32          rcb_buf_size;
68*437bfbebSnyanmisaka     Vdpu34xRcbInfo  rcb_info[RCB_BUF_COUNT];
69*437bfbebSnyanmisaka     MppBuffer       rcb_buf;
70*437bfbebSnyanmisaka     RK_U32          num_row_tiles;
71*437bfbebSnyanmisaka     RK_U32          bit_depth;
72*437bfbebSnyanmisaka     /* colmv buffers info */
73*437bfbebSnyanmisaka     HalBufs         cmv_bufs;
74*437bfbebSnyanmisaka     RK_S32          mv_size;
75*437bfbebSnyanmisaka     RK_S32          mv_count;
76*437bfbebSnyanmisaka     RK_U32          prob_ctx_valid[VP9_CONTEXT];
77*437bfbebSnyanmisaka     MppBuffer       prob_loop_base[VP9_CONTEXT];
78*437bfbebSnyanmisaka     RK_U32          prob_ref_poc[VP9_CONTEXT];
79*437bfbebSnyanmisaka     RK_U32          col_ref_poc;
80*437bfbebSnyanmisaka     RK_U32          segid_ref_poc;
81*437bfbebSnyanmisaka } Vdpu34xVp9dCtx;
82*437bfbebSnyanmisaka 
hal_vp9d_alloc_res(HalVp9dCtx * hal)83*437bfbebSnyanmisaka static MPP_RET hal_vp9d_alloc_res(HalVp9dCtx *hal)
84*437bfbebSnyanmisaka {
85*437bfbebSnyanmisaka     RK_S32 i = 0;
86*437bfbebSnyanmisaka     RK_S32 ret = 0;
87*437bfbebSnyanmisaka     HalVp9dCtx *p_hal = (HalVp9dCtx*)hal;
88*437bfbebSnyanmisaka     Vdpu34xVp9dCtx *hw_ctx = (Vdpu34xVp9dCtx*)p_hal->hw_ctx;
89*437bfbebSnyanmisaka     hw_ctx->offset_count = VDPU34X_OFFSET_COUNT;
90*437bfbebSnyanmisaka     hw_ctx->offset_segid_cur = 0;
91*437bfbebSnyanmisaka     hw_ctx->offset_segid_last = MAX_SEGMAP_SIZE_ALIGN_TO_4K;
92*437bfbebSnyanmisaka     /* alloc common buffer */
93*437bfbebSnyanmisaka     for (i = 0; i < VP9_CONTEXT; i++) {
94*437bfbebSnyanmisaka         ret = mpp_buffer_get(p_hal->group, &hw_ctx->prob_loop_base[i], PROB_SIZE);
95*437bfbebSnyanmisaka         if (ret) {
96*437bfbebSnyanmisaka             mpp_err("vp9 probe_loop_base get buffer failed\n");
97*437bfbebSnyanmisaka             return ret;
98*437bfbebSnyanmisaka         }
99*437bfbebSnyanmisaka     }
100*437bfbebSnyanmisaka     ret = mpp_buffer_get(p_hal->group, &hw_ctx->prob_default_base, PROB_SIZE);
101*437bfbebSnyanmisaka     if (ret) {
102*437bfbebSnyanmisaka         mpp_err("vp9 probe_default_base get buffer failed\n");
103*437bfbebSnyanmisaka         return ret;
104*437bfbebSnyanmisaka     }
105*437bfbebSnyanmisaka     /* alloc buffer for fast mode or normal */
106*437bfbebSnyanmisaka     if (p_hal->fast_mode) {
107*437bfbebSnyanmisaka         for (i = 0; i < MAX_GEN_REG; i++) {
108*437bfbebSnyanmisaka             hw_ctx->g_buf[i].hw_regs = mpp_calloc_size(void, sizeof(Vdpu34xVp9dRegSet));
109*437bfbebSnyanmisaka             ret = mpp_buffer_get(p_hal->group, &hw_ctx->g_buf[i].probe_base, VDPU34X_PROBE_BUFFER_SIZE);
110*437bfbebSnyanmisaka             if (ret) {
111*437bfbebSnyanmisaka                 mpp_err("vp9 probe_base get buffer failed\n");
112*437bfbebSnyanmisaka                 return ret;
113*437bfbebSnyanmisaka             }
114*437bfbebSnyanmisaka         }
115*437bfbebSnyanmisaka     } else {
116*437bfbebSnyanmisaka         hw_ctx->hw_regs = mpp_calloc_size(void, sizeof(Vdpu34xVp9dRegSet));
117*437bfbebSnyanmisaka         ret = mpp_buffer_get(p_hal->group, &hw_ctx->probe_base, VDPU34X_PROBE_BUFFER_SIZE);
118*437bfbebSnyanmisaka         if (ret) {
119*437bfbebSnyanmisaka             mpp_err("vp9 probe_base get buffer failed\n");
120*437bfbebSnyanmisaka             return ret;
121*437bfbebSnyanmisaka         }
122*437bfbebSnyanmisaka     }
123*437bfbebSnyanmisaka     ret = mpp_buffer_get(p_hal->group, &hw_ctx->seg_base, MAX_SEGMAP_SIZE_ALIGN_TO_4K * 2);
124*437bfbebSnyanmisaka     if (ret) {
125*437bfbebSnyanmisaka         mpp_err("vp9 segid_base get buffer failed\n");
126*437bfbebSnyanmisaka         return ret;
127*437bfbebSnyanmisaka     }
128*437bfbebSnyanmisaka     return MPP_OK;
129*437bfbebSnyanmisaka }
130*437bfbebSnyanmisaka 
hal_vp9d_release_res(HalVp9dCtx * hal)131*437bfbebSnyanmisaka static MPP_RET hal_vp9d_release_res(HalVp9dCtx *hal)
132*437bfbebSnyanmisaka {
133*437bfbebSnyanmisaka     RK_S32 i = 0;
134*437bfbebSnyanmisaka     RK_S32 ret = 0;
135*437bfbebSnyanmisaka     HalVp9dCtx *p_hal = (HalVp9dCtx*)hal;
136*437bfbebSnyanmisaka     Vdpu34xVp9dCtx *hw_ctx = (Vdpu34xVp9dCtx*)p_hal->hw_ctx;
137*437bfbebSnyanmisaka 
138*437bfbebSnyanmisaka     if (hw_ctx->prob_default_base) {
139*437bfbebSnyanmisaka         ret = mpp_buffer_put(hw_ctx->prob_default_base);
140*437bfbebSnyanmisaka         if (ret) {
141*437bfbebSnyanmisaka             mpp_err("vp9 probe_wr_base put buffer failed\n");
142*437bfbebSnyanmisaka             return ret;
143*437bfbebSnyanmisaka         }
144*437bfbebSnyanmisaka     }
145*437bfbebSnyanmisaka     for (i = 0; i < VP9_CONTEXT; i++) {
146*437bfbebSnyanmisaka         if (hw_ctx->prob_loop_base[i]) {
147*437bfbebSnyanmisaka             ret = mpp_buffer_put(hw_ctx->prob_loop_base[i]);
148*437bfbebSnyanmisaka             if (ret) {
149*437bfbebSnyanmisaka                 mpp_err("vp9 probe_base put buffer failed\n");
150*437bfbebSnyanmisaka                 return ret;
151*437bfbebSnyanmisaka             }
152*437bfbebSnyanmisaka         }
153*437bfbebSnyanmisaka     }
154*437bfbebSnyanmisaka     if (p_hal->fast_mode) {
155*437bfbebSnyanmisaka         for (i = 0; i < MAX_GEN_REG; i++) {
156*437bfbebSnyanmisaka             if (hw_ctx->g_buf[i].probe_base) {
157*437bfbebSnyanmisaka                 ret = mpp_buffer_put(hw_ctx->g_buf[i].probe_base);
158*437bfbebSnyanmisaka                 if (ret) {
159*437bfbebSnyanmisaka                     mpp_err("vp9 probe_base put buffer failed\n");
160*437bfbebSnyanmisaka                     return ret;
161*437bfbebSnyanmisaka                 }
162*437bfbebSnyanmisaka             }
163*437bfbebSnyanmisaka             if (hw_ctx->g_buf[i].hw_regs) {
164*437bfbebSnyanmisaka                 mpp_free(hw_ctx->g_buf[i].hw_regs);
165*437bfbebSnyanmisaka                 hw_ctx->g_buf[i].hw_regs = NULL;
166*437bfbebSnyanmisaka             }
167*437bfbebSnyanmisaka             if (hw_ctx->g_buf[i].rcb_buf) {
168*437bfbebSnyanmisaka                 ret = mpp_buffer_put(hw_ctx->g_buf[i].rcb_buf);
169*437bfbebSnyanmisaka                 if (ret) {
170*437bfbebSnyanmisaka                     mpp_err("vp9 rcb_buf[%d] put buffer failed\n", i);
171*437bfbebSnyanmisaka                     return ret;
172*437bfbebSnyanmisaka                 }
173*437bfbebSnyanmisaka             }
174*437bfbebSnyanmisaka         }
175*437bfbebSnyanmisaka     } else {
176*437bfbebSnyanmisaka         if (hw_ctx->probe_base) {
177*437bfbebSnyanmisaka             ret = mpp_buffer_put(hw_ctx->probe_base);
178*437bfbebSnyanmisaka             if (ret) {
179*437bfbebSnyanmisaka                 mpp_err("vp9 probe_base put buffer failed\n");
180*437bfbebSnyanmisaka                 return ret;
181*437bfbebSnyanmisaka             }
182*437bfbebSnyanmisaka         }
183*437bfbebSnyanmisaka 
184*437bfbebSnyanmisaka         if (hw_ctx->hw_regs) {
185*437bfbebSnyanmisaka             mpp_free(hw_ctx->hw_regs);
186*437bfbebSnyanmisaka             hw_ctx->hw_regs = NULL;
187*437bfbebSnyanmisaka         }
188*437bfbebSnyanmisaka         if (hw_ctx->rcb_buf) {
189*437bfbebSnyanmisaka             ret = mpp_buffer_put(hw_ctx->rcb_buf);
190*437bfbebSnyanmisaka             if (ret) {
191*437bfbebSnyanmisaka                 mpp_err("vp9 rcb_buf put buffer failed\n");
192*437bfbebSnyanmisaka                 return ret;
193*437bfbebSnyanmisaka             }
194*437bfbebSnyanmisaka         }
195*437bfbebSnyanmisaka     }
196*437bfbebSnyanmisaka 
197*437bfbebSnyanmisaka     if (hw_ctx->cmv_bufs) {
198*437bfbebSnyanmisaka         ret = hal_bufs_deinit(hw_ctx->cmv_bufs);
199*437bfbebSnyanmisaka         if (ret) {
200*437bfbebSnyanmisaka             mpp_err("vp9 cmv bufs deinit buffer failed\n");
201*437bfbebSnyanmisaka             return ret;
202*437bfbebSnyanmisaka         }
203*437bfbebSnyanmisaka     }
204*437bfbebSnyanmisaka 
205*437bfbebSnyanmisaka     if (hw_ctx->seg_base) {
206*437bfbebSnyanmisaka         ret = mpp_buffer_put(hw_ctx->seg_base);
207*437bfbebSnyanmisaka         if (ret) {
208*437bfbebSnyanmisaka             mpp_err("vp9 seg_base put buffer failed\n");
209*437bfbebSnyanmisaka             return ret;
210*437bfbebSnyanmisaka         }
211*437bfbebSnyanmisaka     }
212*437bfbebSnyanmisaka 
213*437bfbebSnyanmisaka     return MPP_OK;
214*437bfbebSnyanmisaka }
215*437bfbebSnyanmisaka 
hal_vp9d_vdpu34x_deinit(void * hal)216*437bfbebSnyanmisaka static MPP_RET hal_vp9d_vdpu34x_deinit(void *hal)
217*437bfbebSnyanmisaka {
218*437bfbebSnyanmisaka     MPP_RET ret = MPP_OK;
219*437bfbebSnyanmisaka     HalVp9dCtx *p_hal = (HalVp9dCtx *)hal;
220*437bfbebSnyanmisaka 
221*437bfbebSnyanmisaka     hal_vp9d_release_res(p_hal);
222*437bfbebSnyanmisaka 
223*437bfbebSnyanmisaka     if (p_hal->group) {
224*437bfbebSnyanmisaka         ret = mpp_buffer_group_put(p_hal->group);
225*437bfbebSnyanmisaka         if (ret) {
226*437bfbebSnyanmisaka             mpp_err("vp9d group free buffer failed\n");
227*437bfbebSnyanmisaka             return ret;
228*437bfbebSnyanmisaka         }
229*437bfbebSnyanmisaka     }
230*437bfbebSnyanmisaka     MPP_FREE(p_hal->hw_ctx);
231*437bfbebSnyanmisaka     return ret = MPP_OK;
232*437bfbebSnyanmisaka }
233*437bfbebSnyanmisaka 
hal_vp9d_vdpu34x_init(void * hal,MppHalCfg * cfg)234*437bfbebSnyanmisaka static MPP_RET hal_vp9d_vdpu34x_init(void *hal, MppHalCfg *cfg)
235*437bfbebSnyanmisaka {
236*437bfbebSnyanmisaka     MPP_RET ret = MPP_OK;
237*437bfbebSnyanmisaka     HalVp9dCtx *p_hal = (HalVp9dCtx*)hal;
238*437bfbebSnyanmisaka     MEM_CHECK(ret, p_hal->hw_ctx = mpp_calloc_size(void, sizeof(Vdpu34xVp9dCtx)));
239*437bfbebSnyanmisaka     Vdpu34xVp9dCtx *hw_ctx = (Vdpu34xVp9dCtx*)p_hal->hw_ctx;
240*437bfbebSnyanmisaka 
241*437bfbebSnyanmisaka     hw_ctx->mv_base_addr = -1;
242*437bfbebSnyanmisaka     hw_ctx->pre_mv_base_addr = -1;
243*437bfbebSnyanmisaka     mpp_slots_set_prop(p_hal->slots, SLOTS_HOR_ALIGN, vp9_hor_align);
244*437bfbebSnyanmisaka     mpp_slots_set_prop(p_hal->slots, SLOTS_VER_ALIGN, vp9_ver_align);
245*437bfbebSnyanmisaka 
246*437bfbebSnyanmisaka     if (p_hal->group == NULL) {
247*437bfbebSnyanmisaka         ret = mpp_buffer_group_get_internal(&p_hal->group, MPP_BUFFER_TYPE_ION);
248*437bfbebSnyanmisaka         if (ret) {
249*437bfbebSnyanmisaka             mpp_err("vp9 mpp_buffer_group_get failed\n");
250*437bfbebSnyanmisaka             goto __FAILED;
251*437bfbebSnyanmisaka         }
252*437bfbebSnyanmisaka     }
253*437bfbebSnyanmisaka 
254*437bfbebSnyanmisaka     ret = hal_vp9d_alloc_res(p_hal);
255*437bfbebSnyanmisaka     if (ret) {
256*437bfbebSnyanmisaka         mpp_err("hal_vp9d_alloc_res failed\n");
257*437bfbebSnyanmisaka         goto __FAILED;
258*437bfbebSnyanmisaka     }
259*437bfbebSnyanmisaka 
260*437bfbebSnyanmisaka     hw_ctx->last_segid_flag = 1;
261*437bfbebSnyanmisaka 
262*437bfbebSnyanmisaka     if (cfg->hal_fbc_adj_cfg) {
263*437bfbebSnyanmisaka         cfg->hal_fbc_adj_cfg->func = vdpu34x_afbc_align_calc;
264*437bfbebSnyanmisaka         cfg->hal_fbc_adj_cfg->expand = 0;
265*437bfbebSnyanmisaka     }
266*437bfbebSnyanmisaka 
267*437bfbebSnyanmisaka     return ret;
268*437bfbebSnyanmisaka __FAILED:
269*437bfbebSnyanmisaka     hal_vp9d_vdpu34x_deinit(hal);
270*437bfbebSnyanmisaka     return ret;
271*437bfbebSnyanmisaka }
272*437bfbebSnyanmisaka 
vp9d_refine_rcb_size(Vdpu34xRcbInfo * rcb_info,Vdpu34xVp9dRegSet * vp9_hw_regs,RK_S32 width,RK_S32 height,void * data)273*437bfbebSnyanmisaka static void vp9d_refine_rcb_size(Vdpu34xRcbInfo *rcb_info,
274*437bfbebSnyanmisaka                                  Vdpu34xVp9dRegSet *vp9_hw_regs,
275*437bfbebSnyanmisaka                                  RK_S32 width, RK_S32 height, void* data)
276*437bfbebSnyanmisaka {
277*437bfbebSnyanmisaka     RK_U32 rcb_bits = 0;
278*437bfbebSnyanmisaka     DXVA_PicParams_VP9 *pic_param = (DXVA_PicParams_VP9*)data;
279*437bfbebSnyanmisaka     RK_U32 num_tiles = pic_param->log2_tile_rows;
280*437bfbebSnyanmisaka     RK_U32 bit_depth = pic_param->BitDepthMinus8Luma + 8;
281*437bfbebSnyanmisaka     RK_U32 ext_align_size = num_tiles * 64 * 8;
282*437bfbebSnyanmisaka 
283*437bfbebSnyanmisaka     width = MPP_ALIGN(width, VP9_CTU_SIZE);
284*437bfbebSnyanmisaka     height = MPP_ALIGN(height, VP9_CTU_SIZE);
285*437bfbebSnyanmisaka     /* RCB_STRMD_ROW */
286*437bfbebSnyanmisaka     if (width > 4096)
287*437bfbebSnyanmisaka         rcb_bits = MPP_ALIGN(width, 64) * 232 + ext_align_size;
288*437bfbebSnyanmisaka     else
289*437bfbebSnyanmisaka         rcb_bits = 0;
290*437bfbebSnyanmisaka     rcb_info[RCB_STRMD_ROW].size = MPP_RCB_BYTES(rcb_bits);
291*437bfbebSnyanmisaka     /* RCB_TRANSD_ROW */
292*437bfbebSnyanmisaka     if (width > 8192)
293*437bfbebSnyanmisaka         rcb_bits = (MPP_ALIGN(width - 8192, 4) << 1) + ext_align_size;
294*437bfbebSnyanmisaka     else
295*437bfbebSnyanmisaka         rcb_bits = 0;
296*437bfbebSnyanmisaka     rcb_info[RCB_TRANSD_ROW].size = MPP_RCB_BYTES(rcb_bits);
297*437bfbebSnyanmisaka     /* RCB_TRANSD_COL */
298*437bfbebSnyanmisaka     if (height > 8192)
299*437bfbebSnyanmisaka         rcb_bits = (MPP_ALIGN(height - 8192, 4) << 1) + ext_align_size;
300*437bfbebSnyanmisaka     else
301*437bfbebSnyanmisaka         rcb_bits = 0;
302*437bfbebSnyanmisaka     rcb_info[RCB_TRANSD_COL].size = MPP_RCB_BYTES(rcb_bits);
303*437bfbebSnyanmisaka     /* RCB_INTER_ROW */
304*437bfbebSnyanmisaka     rcb_bits = width * 36 + ext_align_size;
305*437bfbebSnyanmisaka     rcb_info[RCB_INTER_ROW].size = MPP_RCB_BYTES(rcb_bits);
306*437bfbebSnyanmisaka     /* RCB_INTER_COL */
307*437bfbebSnyanmisaka     rcb_info[RCB_INTER_COL].size = 0;
308*437bfbebSnyanmisaka     /* RCB_INTRA_ROW */
309*437bfbebSnyanmisaka     rcb_bits = width * 48 + ext_align_size;
310*437bfbebSnyanmisaka     rcb_info[RCB_INTRA_ROW].size = MPP_RCB_BYTES(rcb_bits);
311*437bfbebSnyanmisaka     /* RCB_DBLK_ROW */
312*437bfbebSnyanmisaka     rcb_bits = width * (1 + 16 * bit_depth) + num_tiles * 192 * bit_depth + ext_align_size;
313*437bfbebSnyanmisaka     rcb_info[RCB_DBLK_ROW].size = MPP_RCB_BYTES(rcb_bits);
314*437bfbebSnyanmisaka     /* RCB_SAO_ROW */
315*437bfbebSnyanmisaka     rcb_info[RCB_SAO_ROW].size = 0;
316*437bfbebSnyanmisaka     /* RCB_FBC_ROW */
317*437bfbebSnyanmisaka     if (vp9_hw_regs->common.reg012.fbc_e) {
318*437bfbebSnyanmisaka         rcb_bits = 8 * width * bit_depth + ext_align_size;
319*437bfbebSnyanmisaka     } else
320*437bfbebSnyanmisaka         rcb_bits = 0;
321*437bfbebSnyanmisaka     rcb_info[RCB_FBC_ROW].size = MPP_RCB_BYTES(rcb_bits);
322*437bfbebSnyanmisaka     /* RCB_FILT_COL */
323*437bfbebSnyanmisaka     if (vp9_hw_regs->common.reg012.fbc_e) {
324*437bfbebSnyanmisaka         rcb_bits = height * (4 + 24 *  bit_depth);
325*437bfbebSnyanmisaka     } else
326*437bfbebSnyanmisaka         rcb_bits = height * (4 + 16 *  bit_depth);
327*437bfbebSnyanmisaka     rcb_bits += ext_align_size;
328*437bfbebSnyanmisaka     rcb_info[RCB_FILT_COL].size = MPP_RCB_BYTES(rcb_bits);
329*437bfbebSnyanmisaka }
330*437bfbebSnyanmisaka 
hal_vp9d_rcb_info_update(void * hal,Vdpu34xVp9dRegSet * hw_regs,void * data)331*437bfbebSnyanmisaka static void hal_vp9d_rcb_info_update(void *hal,  Vdpu34xVp9dRegSet *hw_regs, void *data)
332*437bfbebSnyanmisaka {
333*437bfbebSnyanmisaka     HalVp9dCtx *p_hal = (HalVp9dCtx*)hal;
334*437bfbebSnyanmisaka     Vdpu34xVp9dCtx *hw_ctx = (Vdpu34xVp9dCtx*)p_hal->hw_ctx;
335*437bfbebSnyanmisaka     DXVA_PicParams_VP9 *pic_param = (DXVA_PicParams_VP9*)data;
336*437bfbebSnyanmisaka     RK_U32 num_tiles = pic_param->log2_tile_rows;
337*437bfbebSnyanmisaka     RK_U32 bit_depth = pic_param->BitDepthMinus8Luma + 8;
338*437bfbebSnyanmisaka     RK_S32 height = vp9_ver_align(pic_param->height);
339*437bfbebSnyanmisaka     RK_S32 width  = vp9_ver_align(pic_param->width);
340*437bfbebSnyanmisaka 
341*437bfbebSnyanmisaka     if (hw_ctx->num_row_tiles != num_tiles ||
342*437bfbebSnyanmisaka         hw_ctx->bit_depth != bit_depth ||
343*437bfbebSnyanmisaka         hw_ctx->width != width ||
344*437bfbebSnyanmisaka         hw_ctx->height != height) {
345*437bfbebSnyanmisaka 
346*437bfbebSnyanmisaka         hw_ctx->rcb_buf_size = vdpu34x_get_rcb_buf_size(hw_ctx->rcb_info, width, height);
347*437bfbebSnyanmisaka         vp9d_refine_rcb_size(hw_ctx->rcb_info, hw_regs, width, height, pic_param);
348*437bfbebSnyanmisaka 
349*437bfbebSnyanmisaka         if (p_hal->fast_mode) {
350*437bfbebSnyanmisaka             RK_U32 i;
351*437bfbebSnyanmisaka 
352*437bfbebSnyanmisaka             for (i = 0; i < MPP_ARRAY_ELEMS(hw_ctx->g_buf); i++) {
353*437bfbebSnyanmisaka                 MppBuffer rcb_buf = hw_ctx->g_buf[i].rcb_buf;
354*437bfbebSnyanmisaka 
355*437bfbebSnyanmisaka                 if (rcb_buf) {
356*437bfbebSnyanmisaka                     mpp_buffer_put(rcb_buf);
357*437bfbebSnyanmisaka                     hw_ctx->g_buf[i].rcb_buf = NULL;
358*437bfbebSnyanmisaka                 }
359*437bfbebSnyanmisaka                 mpp_buffer_get(p_hal->group, &rcb_buf, hw_ctx->rcb_buf_size);
360*437bfbebSnyanmisaka                 hw_ctx->g_buf[i].rcb_buf = rcb_buf;
361*437bfbebSnyanmisaka             }
362*437bfbebSnyanmisaka         } else {
363*437bfbebSnyanmisaka             MppBuffer rcb_buf = hw_ctx->rcb_buf;
364*437bfbebSnyanmisaka 
365*437bfbebSnyanmisaka             if (rcb_buf) {
366*437bfbebSnyanmisaka                 mpp_buffer_put(rcb_buf);
367*437bfbebSnyanmisaka                 rcb_buf = NULL;
368*437bfbebSnyanmisaka             }
369*437bfbebSnyanmisaka             mpp_buffer_get(p_hal->group, &rcb_buf, hw_ctx->rcb_buf_size);
370*437bfbebSnyanmisaka             hw_ctx->rcb_buf = rcb_buf;
371*437bfbebSnyanmisaka         }
372*437bfbebSnyanmisaka 
373*437bfbebSnyanmisaka         hw_ctx->num_row_tiles  = num_tiles;
374*437bfbebSnyanmisaka         hw_ctx->bit_depth      = bit_depth;
375*437bfbebSnyanmisaka         hw_ctx->width          = width;
376*437bfbebSnyanmisaka         hw_ctx->height         = height;
377*437bfbebSnyanmisaka     }
378*437bfbebSnyanmisaka }
379*437bfbebSnyanmisaka 
hal_vp9d_vdpu34x_setup_colmv_buf(void * hal,HalTaskInfo * task)380*437bfbebSnyanmisaka static MPP_RET hal_vp9d_vdpu34x_setup_colmv_buf(void *hal, HalTaskInfo *task)
381*437bfbebSnyanmisaka {
382*437bfbebSnyanmisaka     HalVp9dCtx *p_hal = (HalVp9dCtx*)hal;
383*437bfbebSnyanmisaka     Vdpu34xVp9dCtx *hw_ctx = (Vdpu34xVp9dCtx*)p_hal->hw_ctx;
384*437bfbebSnyanmisaka     DXVA_PicParams_VP9 *pic_param = (DXVA_PicParams_VP9*)task->dec.syntax.data;
385*437bfbebSnyanmisaka     RK_U32 width = pic_param->width;
386*437bfbebSnyanmisaka     RK_U32 height = pic_param->height;
387*437bfbebSnyanmisaka     RK_S32 mv_size = 0, colmv_size = 8, colmv_byte = 16;
388*437bfbebSnyanmisaka     RK_U32 compress = p_hal->hw_info ? p_hal->hw_info->cap_colmv_compress : 1;
389*437bfbebSnyanmisaka 
390*437bfbebSnyanmisaka     mv_size = vdpu34x_get_colmv_size(width, height, VP9_CTU_SIZE, colmv_byte, colmv_size, compress);
391*437bfbebSnyanmisaka     if (hw_ctx->cmv_bufs == NULL || hw_ctx->mv_size < mv_size) {
392*437bfbebSnyanmisaka         size_t size = mv_size;
393*437bfbebSnyanmisaka 
394*437bfbebSnyanmisaka         if (hw_ctx->cmv_bufs) {
395*437bfbebSnyanmisaka             hal_bufs_deinit(hw_ctx->cmv_bufs);
396*437bfbebSnyanmisaka             hw_ctx->cmv_bufs = NULL;
397*437bfbebSnyanmisaka         }
398*437bfbebSnyanmisaka 
399*437bfbebSnyanmisaka         hal_bufs_init(&hw_ctx->cmv_bufs);
400*437bfbebSnyanmisaka         if (hw_ctx->cmv_bufs == NULL) {
401*437bfbebSnyanmisaka             mpp_err_f("colmv bufs init fail");
402*437bfbebSnyanmisaka             return MPP_ERR_NOMEM;
403*437bfbebSnyanmisaka         }
404*437bfbebSnyanmisaka         hw_ctx->mv_size = mv_size;
405*437bfbebSnyanmisaka         hw_ctx->mv_count = mpp_buf_slot_get_count(p_hal ->slots);
406*437bfbebSnyanmisaka         hal_bufs_setup(hw_ctx->cmv_bufs, hw_ctx->mv_count, 1, &size);
407*437bfbebSnyanmisaka     }
408*437bfbebSnyanmisaka 
409*437bfbebSnyanmisaka     return MPP_OK;
410*437bfbebSnyanmisaka }
411*437bfbebSnyanmisaka 
hal_vp9d_vdpu34x_gen_regs(void * hal,HalTaskInfo * task)412*437bfbebSnyanmisaka static MPP_RET hal_vp9d_vdpu34x_gen_regs(void *hal, HalTaskInfo *task)
413*437bfbebSnyanmisaka {
414*437bfbebSnyanmisaka     RK_S32   i;
415*437bfbebSnyanmisaka     RK_U8    bit_depth = 0;
416*437bfbebSnyanmisaka     RK_U32   ref_frame_width_y;
417*437bfbebSnyanmisaka     RK_U32   ref_frame_height_y;
418*437bfbebSnyanmisaka     RK_S32   stream_len = 0, aglin_offset = 0;
419*437bfbebSnyanmisaka     RK_U32   y_hor_virstride, uv_hor_virstride, y_virstride;
420*437bfbebSnyanmisaka     RK_U8   *bitstream = NULL;
421*437bfbebSnyanmisaka     MppBuffer streambuf = NULL;
422*437bfbebSnyanmisaka     RK_U32 sw_y_hor_virstride;
423*437bfbebSnyanmisaka     RK_U32 sw_uv_hor_virstride;
424*437bfbebSnyanmisaka     RK_U32 sw_y_virstride;
425*437bfbebSnyanmisaka     RK_U8  ref_idx = 0;
426*437bfbebSnyanmisaka     RK_U8  ref_frame_idx = 0;
427*437bfbebSnyanmisaka     RK_U32 *reg_ref_base = 0;
428*437bfbebSnyanmisaka     RK_S32 intraFlag = 0;
429*437bfbebSnyanmisaka     MppBuffer framebuf = NULL;
430*437bfbebSnyanmisaka     HalBuf *mv_buf = NULL;
431*437bfbebSnyanmisaka     RK_U32 fbc_en = 0;
432*437bfbebSnyanmisaka 
433*437bfbebSnyanmisaka     HalVp9dCtx *p_hal = (HalVp9dCtx*)hal;
434*437bfbebSnyanmisaka     Vdpu34xVp9dCtx *hw_ctx = (Vdpu34xVp9dCtx*)p_hal->hw_ctx;
435*437bfbebSnyanmisaka     DXVA_PicParams_VP9 *pic_param = (DXVA_PicParams_VP9*)task->dec.syntax.data;
436*437bfbebSnyanmisaka     RK_U32 frame_ctx_id = pic_param->frame_context_idx;
437*437bfbebSnyanmisaka 
438*437bfbebSnyanmisaka     if (p_hal->fast_mode) {
439*437bfbebSnyanmisaka         for (i = 0; i < MAX_GEN_REG; i++) {
440*437bfbebSnyanmisaka             if (!hw_ctx->g_buf[i].use_flag) {
441*437bfbebSnyanmisaka                 task->dec.reg_index = i;
442*437bfbebSnyanmisaka                 hw_ctx->probe_base = hw_ctx->g_buf[i].probe_base;
443*437bfbebSnyanmisaka 
444*437bfbebSnyanmisaka                 hw_ctx->hw_regs = hw_ctx->g_buf[i].hw_regs;
445*437bfbebSnyanmisaka                 hw_ctx->g_buf[i].use_flag = 1;
446*437bfbebSnyanmisaka                 break;
447*437bfbebSnyanmisaka             }
448*437bfbebSnyanmisaka         }
449*437bfbebSnyanmisaka         if (i == MAX_GEN_REG) {
450*437bfbebSnyanmisaka             mpp_err("vp9 fast mode buf all used\n");
451*437bfbebSnyanmisaka             return MPP_ERR_NOMEM;
452*437bfbebSnyanmisaka         }
453*437bfbebSnyanmisaka     }
454*437bfbebSnyanmisaka 
455*437bfbebSnyanmisaka     if (hal_vp9d_vdpu34x_setup_colmv_buf(hal, task))
456*437bfbebSnyanmisaka         return MPP_ERR_NOMEM;
457*437bfbebSnyanmisaka 
458*437bfbebSnyanmisaka     Vdpu34xVp9dRegSet *vp9_hw_regs = (Vdpu34xVp9dRegSet*)hw_ctx->hw_regs;
459*437bfbebSnyanmisaka     intraFlag = (!pic_param->frame_type || pic_param->intra_only);
460*437bfbebSnyanmisaka     stream_len = (RK_S32)mpp_packet_get_length(task->dec.input_packet);
461*437bfbebSnyanmisaka     memset(hw_ctx->hw_regs, 0, sizeof(Vdpu34xVp9dRegSet));
462*437bfbebSnyanmisaka #if HW_PROB
463*437bfbebSnyanmisaka     hal_vp9d_prob_flag_delta(mpp_buffer_get_ptr(hw_ctx->probe_base), task->dec.syntax.data);
464*437bfbebSnyanmisaka     mpp_buffer_sync_end(hw_ctx->probe_base);
465*437bfbebSnyanmisaka     if (intraFlag) {
466*437bfbebSnyanmisaka         hal_vp9d_prob_default(mpp_buffer_get_ptr(hw_ctx->prob_default_base), task->dec.syntax.data);
467*437bfbebSnyanmisaka         mpp_buffer_sync_end(hw_ctx->prob_default_base);
468*437bfbebSnyanmisaka     }
469*437bfbebSnyanmisaka 
470*437bfbebSnyanmisaka     /* config reg103 */
471*437bfbebSnyanmisaka     vp9_hw_regs->vp9d_param.reg103.prob_update_en   = 1;
472*437bfbebSnyanmisaka     vp9_hw_regs->vp9d_param.reg103.intra_only_flag  = intraFlag;
473*437bfbebSnyanmisaka     if (!intraFlag) {
474*437bfbebSnyanmisaka         vp9_hw_regs->vp9d_param.reg103.txfmmode_rfsh_en = (pic_param->txmode == 4) ? 1 : 0;
475*437bfbebSnyanmisaka         vp9_hw_regs->vp9d_param.reg103.interp_filter_switch_en = pic_param->interp_filter == 4 ? 1 : 0;
476*437bfbebSnyanmisaka     }
477*437bfbebSnyanmisaka     vp9_hw_regs->vp9d_param.reg103.ref_mode_rfsh_en     = 1;
478*437bfbebSnyanmisaka     vp9_hw_regs->vp9d_param.reg103.single_ref_rfsh_en   = 1;
479*437bfbebSnyanmisaka     vp9_hw_regs->vp9d_param.reg103.comp_ref_rfsh_en     = 1;
480*437bfbebSnyanmisaka     vp9_hw_regs->vp9d_param.reg103.inter_coef_rfsh_flag = 0;
481*437bfbebSnyanmisaka     vp9_hw_regs->vp9d_param.reg103.refresh_en           =
482*437bfbebSnyanmisaka         !pic_param->error_resilient_mode && !pic_param->parallelmode;
483*437bfbebSnyanmisaka     vp9_hw_regs->vp9d_param.reg103.prob_save_en             = pic_param->refresh_frame_context;
484*437bfbebSnyanmisaka     vp9_hw_regs->vp9d_param.reg103.allow_high_precision_mv  = pic_param->allow_high_precision_mv;
485*437bfbebSnyanmisaka     vp9_hw_regs->vp9d_param.reg103.last_key_frame_flag      = hw_ctx->ls_info.last_intra_only;
486*437bfbebSnyanmisaka 
487*437bfbebSnyanmisaka     /* set info for multi core */
488*437bfbebSnyanmisaka     {
489*437bfbebSnyanmisaka         MppFrame mframe = NULL;
490*437bfbebSnyanmisaka 
491*437bfbebSnyanmisaka         mpp_buf_slot_get_prop(p_hal->slots, task->dec.output, SLOT_FRAME_PTR, &mframe);
492*437bfbebSnyanmisaka         vp9_hw_regs->vp9d_param.reg65.cur_poc = mframe ? mpp_frame_get_poc(mframe) : 0;
493*437bfbebSnyanmisaka         // last poc
494*437bfbebSnyanmisaka         ref_idx = pic_param->frame_refs[0].Index7Bits;
495*437bfbebSnyanmisaka         ref_frame_idx = pic_param->ref_frame_map[ref_idx].Index7Bits;
496*437bfbebSnyanmisaka         if (ref_frame_idx < 0x7f) {
497*437bfbebSnyanmisaka             mframe = NULL;
498*437bfbebSnyanmisaka             mpp_buf_slot_get_prop(p_hal ->slots, ref_frame_idx, SLOT_FRAME_PTR, &mframe);
499*437bfbebSnyanmisaka             vp9_hw_regs->vp9d_param.reg95.last_poc = mframe ? mpp_frame_get_poc(mframe) : 0;
500*437bfbebSnyanmisaka         }
501*437bfbebSnyanmisaka         // golden poc
502*437bfbebSnyanmisaka         ref_idx = pic_param->frame_refs[1].Index7Bits;
503*437bfbebSnyanmisaka         ref_frame_idx = pic_param->ref_frame_map[ref_idx].Index7Bits;
504*437bfbebSnyanmisaka         if (ref_frame_idx < 0x7f) {
505*437bfbebSnyanmisaka             mframe = NULL;
506*437bfbebSnyanmisaka             mpp_buf_slot_get_prop(p_hal ->slots, ref_frame_idx, SLOT_FRAME_PTR, &mframe);
507*437bfbebSnyanmisaka             vp9_hw_regs->vp9d_param.reg96.golden_poc = mframe ? mpp_frame_get_poc(mframe) : 0;
508*437bfbebSnyanmisaka         }
509*437bfbebSnyanmisaka         // altref poc
510*437bfbebSnyanmisaka         ref_idx = pic_param->frame_refs[2].Index7Bits;
511*437bfbebSnyanmisaka         ref_frame_idx = pic_param->ref_frame_map[ref_idx].Index7Bits;
512*437bfbebSnyanmisaka         if (ref_frame_idx < 0x7f) {
513*437bfbebSnyanmisaka             mframe = NULL;
514*437bfbebSnyanmisaka             mpp_buf_slot_get_prop(p_hal ->slots, ref_frame_idx, SLOT_FRAME_PTR, &mframe);
515*437bfbebSnyanmisaka             vp9_hw_regs->vp9d_param.reg97.altref_poc = mframe ? mpp_frame_get_poc(mframe) : 0;
516*437bfbebSnyanmisaka         }
517*437bfbebSnyanmisaka         // colref poc
518*437bfbebSnyanmisaka         vp9_hw_regs->vp9d_param.reg98.col_ref_poc =
519*437bfbebSnyanmisaka             hw_ctx->col_ref_poc ? hw_ctx->col_ref_poc : vp9_hw_regs->vp9d_param.reg65.cur_poc;
520*437bfbebSnyanmisaka         if (pic_param->show_frame && !pic_param->show_existing_frame)
521*437bfbebSnyanmisaka             hw_ctx->col_ref_poc = vp9_hw_regs->vp9d_param.reg65.cur_poc;
522*437bfbebSnyanmisaka         // segment id ref poc
523*437bfbebSnyanmisaka         vp9_hw_regs->vp9d_param.reg100.segid_ref_poc = hw_ctx->segid_ref_poc;
524*437bfbebSnyanmisaka 
525*437bfbebSnyanmisaka         vp9_hw_regs->vp9d_addr.reg169_segidcur_base = mpp_buffer_get_fd(hw_ctx->seg_base);
526*437bfbebSnyanmisaka         vp9_hw_regs->vp9d_addr.reg168_segidlast_base = mpp_buffer_get_fd(hw_ctx->seg_base);
527*437bfbebSnyanmisaka         if (hw_ctx->last_segid_flag) {
528*437bfbebSnyanmisaka             mpp_dev_set_reg_offset(p_hal->dev, 168, hw_ctx->offset_segid_last);
529*437bfbebSnyanmisaka             mpp_dev_set_reg_offset(p_hal->dev, 169, hw_ctx->offset_segid_cur);
530*437bfbebSnyanmisaka         } else {
531*437bfbebSnyanmisaka             mpp_dev_set_reg_offset(p_hal->dev, 168, hw_ctx->offset_segid_cur);
532*437bfbebSnyanmisaka             mpp_dev_set_reg_offset(p_hal->dev, 169, hw_ctx->offset_segid_last);
533*437bfbebSnyanmisaka         }
534*437bfbebSnyanmisaka 
535*437bfbebSnyanmisaka         if ((pic_param->stVP9Segments.enabled && pic_param->stVP9Segments.update_map) ||
536*437bfbebSnyanmisaka             (hw_ctx->ls_info.last_width != pic_param->width) ||
537*437bfbebSnyanmisaka             (hw_ctx->ls_info.last_height != pic_param->height) ||
538*437bfbebSnyanmisaka             intraFlag || pic_param->error_resilient_mode) {
539*437bfbebSnyanmisaka             hw_ctx->segid_ref_poc = vp9_hw_regs->vp9d_param.reg65.cur_poc;
540*437bfbebSnyanmisaka             hw_ctx->last_segid_flag = !hw_ctx->last_segid_flag;
541*437bfbebSnyanmisaka             vp9_hw_regs->vp9d_param.reg100.segid_ref_poc = 0;
542*437bfbebSnyanmisaka             vp9_hw_regs->vp9d_param.reg75.vp9_segment_id_update = 1;
543*437bfbebSnyanmisaka         } else
544*437bfbebSnyanmisaka             vp9_hw_regs->vp9d_param.reg75.vp9_segment_id_update = 0;
545*437bfbebSnyanmisaka     }
546*437bfbebSnyanmisaka 
547*437bfbebSnyanmisaka     /* config last prob base and update write base */
548*437bfbebSnyanmisaka     {
549*437bfbebSnyanmisaka 
550*437bfbebSnyanmisaka         if (intraFlag || pic_param->error_resilient_mode) {
551*437bfbebSnyanmisaka             if (intraFlag
552*437bfbebSnyanmisaka                 || pic_param->error_resilient_mode
553*437bfbebSnyanmisaka                 || (pic_param->reset_frame_context == 3)) {
554*437bfbebSnyanmisaka                 memset(hw_ctx->prob_ctx_valid, 0, sizeof(hw_ctx->prob_ctx_valid));
555*437bfbebSnyanmisaka             } else if (pic_param->reset_frame_context == 2) {
556*437bfbebSnyanmisaka                 hw_ctx->prob_ctx_valid[frame_ctx_id] = 0;
557*437bfbebSnyanmisaka             }
558*437bfbebSnyanmisaka         }
559*437bfbebSnyanmisaka 
560*437bfbebSnyanmisaka #if VP9_DUMP
561*437bfbebSnyanmisaka         {
562*437bfbebSnyanmisaka             static RK_U32 file_cnt = 0;
563*437bfbebSnyanmisaka             char file_name[128];
564*437bfbebSnyanmisaka             RK_U32 i = 0;
565*437bfbebSnyanmisaka             sprintf(file_name, "/data/vp9/prob_last_%d.txt", file_cnt);
566*437bfbebSnyanmisaka             FILE *fp = fopen(file_name, "wb");
567*437bfbebSnyanmisaka             RK_U32 *tmp = NULL;
568*437bfbebSnyanmisaka             if (hw_ctx->prob_ctx_valid[frame_ctx_id]) {
569*437bfbebSnyanmisaka                 tmp = (RK_U32 *)mpp_buffer_get_ptr(hw_ctx->prob_loop_base[pic_param->frame_context_idx]);
570*437bfbebSnyanmisaka             } else {
571*437bfbebSnyanmisaka                 tmp = (RK_U32 *)mpp_buffer_get_ptr(hw_ctx->prob_default_base);
572*437bfbebSnyanmisaka             }
573*437bfbebSnyanmisaka             for (i = 0; i < PROB_SIZE / 4; i += 2) {
574*437bfbebSnyanmisaka                 fprintf(fp, "%08x%08x\n", tmp[i + 1], tmp[i]);
575*437bfbebSnyanmisaka             }
576*437bfbebSnyanmisaka             file_cnt++;
577*437bfbebSnyanmisaka             fflush(fp);
578*437bfbebSnyanmisaka             fclose(fp);
579*437bfbebSnyanmisaka         }
580*437bfbebSnyanmisaka #endif
581*437bfbebSnyanmisaka 
582*437bfbebSnyanmisaka         if (hw_ctx->prob_ctx_valid[frame_ctx_id]) {
583*437bfbebSnyanmisaka             vp9_hw_regs->vp9d_addr.reg162_last_prob_base =
584*437bfbebSnyanmisaka                 mpp_buffer_get_fd(hw_ctx->prob_loop_base[frame_ctx_id]);
585*437bfbebSnyanmisaka             vp9_hw_regs->common.reg028.swreg_vp9_rd_prob_idx = frame_ctx_id + 1;
586*437bfbebSnyanmisaka             vp9_hw_regs->vp9d_param.reg99.prob_ref_poc = hw_ctx->prob_ref_poc[frame_ctx_id];
587*437bfbebSnyanmisaka         } else {
588*437bfbebSnyanmisaka             vp9_hw_regs->vp9d_addr.reg162_last_prob_base = mpp_buffer_get_fd(hw_ctx->prob_default_base);
589*437bfbebSnyanmisaka             hw_ctx->prob_ctx_valid[frame_ctx_id] |= pic_param->refresh_frame_context;
590*437bfbebSnyanmisaka             vp9_hw_regs->common.reg028.swreg_vp9_rd_prob_idx = 0;
591*437bfbebSnyanmisaka             vp9_hw_regs->vp9d_param.reg99.prob_ref_poc = 0;
592*437bfbebSnyanmisaka             hw_ctx->prob_ref_poc[frame_ctx_id] = vp9_hw_regs->vp9d_param.reg65.cur_poc;
593*437bfbebSnyanmisaka         }
594*437bfbebSnyanmisaka         hal_vp9d_dbg_par("vp9d intra %d parallelmode %d frame_ctx_id %d refresh %d err %d\n",
595*437bfbebSnyanmisaka                          intraFlag, pic_param->parallelmode, frame_ctx_id,
596*437bfbebSnyanmisaka                          pic_param->refresh_frame_context, pic_param->error_resilient_mode);
597*437bfbebSnyanmisaka         if (!pic_param->parallelmode)
598*437bfbebSnyanmisaka             hw_ctx->prob_ref_poc[frame_ctx_id] = vp9_hw_regs->vp9d_param.reg65.cur_poc;
599*437bfbebSnyanmisaka         vp9_hw_regs->vp9d_addr.reg172_update_prob_wr_base =
600*437bfbebSnyanmisaka             mpp_buffer_get_fd(hw_ctx->prob_loop_base[frame_ctx_id]);
601*437bfbebSnyanmisaka         vp9_hw_regs->common.reg028.swreg_vp9_wr_prob_idx = frame_ctx_id + 1;
602*437bfbebSnyanmisaka 
603*437bfbebSnyanmisaka     }
604*437bfbebSnyanmisaka     vp9_hw_regs->vp9d_addr.reg160_delta_prob_base = mpp_buffer_get_fd(hw_ctx->probe_base);
605*437bfbebSnyanmisaka #else
606*437bfbebSnyanmisaka     hal_vp9d_output_probe(mpp_buffer_get_ptr(hw_ctx->probe_base), task->dec.syntax.data);
607*437bfbebSnyanmisaka     mpp_buffer_sync_end(hw_ctx->probe_base);
608*437bfbebSnyanmisaka #endif
609*437bfbebSnyanmisaka     vp9_hw_regs->common.reg012.colmv_compress_en = p_hal->hw_info ? p_hal->hw_info->cap_colmv_compress : 1;
610*437bfbebSnyanmisaka     vp9_hw_regs->common.reg013.cur_pic_is_idr = !pic_param->frame_type;
611*437bfbebSnyanmisaka     vp9_hw_regs->common.reg009.dec_mode = 2; //set as vp9 dec
612*437bfbebSnyanmisaka     vp9_hw_regs->common.reg016_str_len = ((stream_len + 15) & (~15)) + 0x80;
613*437bfbebSnyanmisaka 
614*437bfbebSnyanmisaka     mpp_buf_slot_get_prop(p_hal ->packet_slots, task->dec.input, SLOT_BUFFER, &streambuf);
615*437bfbebSnyanmisaka     bitstream = mpp_buffer_get_ptr(streambuf);
616*437bfbebSnyanmisaka     aglin_offset = vp9_hw_regs->common.reg016_str_len - stream_len;
617*437bfbebSnyanmisaka     if (aglin_offset > 0) {
618*437bfbebSnyanmisaka         memset((void *)(bitstream + stream_len), 0, aglin_offset);
619*437bfbebSnyanmisaka     }
620*437bfbebSnyanmisaka 
621*437bfbebSnyanmisaka     //--- caculate the yuv_frame_size and mv_size
622*437bfbebSnyanmisaka     bit_depth = pic_param->BitDepthMinus8Luma + 8;
623*437bfbebSnyanmisaka 
624*437bfbebSnyanmisaka     {
625*437bfbebSnyanmisaka         MppFrame mframe = NULL;
626*437bfbebSnyanmisaka 
627*437bfbebSnyanmisaka         mpp_buf_slot_get_prop(p_hal->slots, task->dec.output, SLOT_FRAME_PTR, &mframe);
628*437bfbebSnyanmisaka         fbc_en = MPP_FRAME_FMT_IS_FBC(mpp_frame_get_fmt(mframe));
629*437bfbebSnyanmisaka 
630*437bfbebSnyanmisaka         if (fbc_en) {
631*437bfbebSnyanmisaka             RK_U32 fbc_hdr_stride = mpp_frame_get_fbc_hdr_stride(mframe);
632*437bfbebSnyanmisaka             RK_U32 h = MPP_ALIGN(mpp_frame_get_height(mframe), 64);
633*437bfbebSnyanmisaka             RK_U32 fbd_offset = MPP_ALIGN(fbc_hdr_stride * (h + 16) / 16, SZ_4K);
634*437bfbebSnyanmisaka 
635*437bfbebSnyanmisaka             vp9_hw_regs->common.reg012.fbc_e = 1;
636*437bfbebSnyanmisaka             vp9_hw_regs->common.reg018.y_hor_virstride = fbc_hdr_stride >> 4;
637*437bfbebSnyanmisaka             vp9_hw_regs->common.reg019.uv_hor_virstride = fbc_hdr_stride >> 4;
638*437bfbebSnyanmisaka             vp9_hw_regs->common.reg020_fbc_payload_off.payload_st_offset = fbd_offset >> 4;
639*437bfbebSnyanmisaka         } else {
640*437bfbebSnyanmisaka             sw_y_hor_virstride = mpp_frame_get_hor_stride(mframe) >> 4;
641*437bfbebSnyanmisaka             sw_uv_hor_virstride = sw_y_hor_virstride;
642*437bfbebSnyanmisaka             sw_y_virstride = mpp_frame_get_ver_stride(mframe) * sw_y_hor_virstride;
643*437bfbebSnyanmisaka 
644*437bfbebSnyanmisaka             vp9_hw_regs->common.reg012.fbc_e = 0;
645*437bfbebSnyanmisaka             vp9_hw_regs->common.reg018.y_hor_virstride = sw_y_hor_virstride;
646*437bfbebSnyanmisaka             vp9_hw_regs->common.reg019.uv_hor_virstride = sw_uv_hor_virstride;
647*437bfbebSnyanmisaka             vp9_hw_regs->common.reg020_y_virstride.y_virstride = sw_y_virstride;
648*437bfbebSnyanmisaka         }
649*437bfbebSnyanmisaka     }
650*437bfbebSnyanmisaka     if (!pic_param->intra_only && pic_param->frame_type &&
651*437bfbebSnyanmisaka         !pic_param->error_resilient_mode && hw_ctx->ls_info.last_show_frame) {
652*437bfbebSnyanmisaka         hw_ctx->pre_mv_base_addr = hw_ctx->mv_base_addr;
653*437bfbebSnyanmisaka     }
654*437bfbebSnyanmisaka 
655*437bfbebSnyanmisaka     mpp_buf_slot_get_prop(p_hal ->slots, task->dec.output, SLOT_BUFFER, &framebuf);
656*437bfbebSnyanmisaka     vp9_hw_regs->common_addr.reg130_decout_base =  mpp_buffer_get_fd(framebuf);
657*437bfbebSnyanmisaka     vp9_hw_regs->common_addr.reg128_rlc_base = mpp_buffer_get_fd(streambuf);
658*437bfbebSnyanmisaka     vp9_hw_regs->common_addr.reg129_rlcwrite_base = mpp_buffer_get_fd(streambuf);
659*437bfbebSnyanmisaka 
660*437bfbebSnyanmisaka     vp9_hw_regs->vp9d_addr.reg167_count_prob_base = mpp_buffer_get_fd(hw_ctx->probe_base);
661*437bfbebSnyanmisaka     mpp_dev_set_reg_offset(p_hal->dev, 167, hw_ctx->offset_count);
662*437bfbebSnyanmisaka 
663*437bfbebSnyanmisaka     //set cur colmv base
664*437bfbebSnyanmisaka     mv_buf = hal_bufs_get_buf(hw_ctx->cmv_bufs, task->dec.output);
665*437bfbebSnyanmisaka     vp9_hw_regs->common_addr.reg131_colmv_cur_base = mpp_buffer_get_fd(mv_buf->buf[0]);
666*437bfbebSnyanmisaka     hw_ctx->mv_base_addr = vp9_hw_regs->common_addr.reg131_colmv_cur_base;
667*437bfbebSnyanmisaka     if (hw_ctx->pre_mv_base_addr < 0) {
668*437bfbebSnyanmisaka         hw_ctx->pre_mv_base_addr = hw_ctx->mv_base_addr;
669*437bfbebSnyanmisaka     }
670*437bfbebSnyanmisaka     vp9_hw_regs->vp9d_addr.reg170_ref_colmv_base = hw_ctx->pre_mv_base_addr;
671*437bfbebSnyanmisaka 
672*437bfbebSnyanmisaka     vp9_hw_regs->vp9d_param.reg64.cprheader_offset = 0;
673*437bfbebSnyanmisaka     reg_ref_base = (RK_U32*)&vp9_hw_regs->vp9d_addr.reg164_ref_last_base;
674*437bfbebSnyanmisaka     for (i = 0; i < 3; i++) {
675*437bfbebSnyanmisaka         MppFrame frame = NULL;
676*437bfbebSnyanmisaka 
677*437bfbebSnyanmisaka         ref_idx = pic_param->frame_refs[i].Index7Bits;
678*437bfbebSnyanmisaka         ref_frame_idx = pic_param->ref_frame_map[ref_idx].Index7Bits;
679*437bfbebSnyanmisaka         ref_frame_width_y = pic_param->ref_frame_coded_width[ref_idx];
680*437bfbebSnyanmisaka         ref_frame_height_y = pic_param->ref_frame_coded_height[ref_idx];
681*437bfbebSnyanmisaka 
682*437bfbebSnyanmisaka         if (ref_frame_idx < 0x7f)
683*437bfbebSnyanmisaka             mpp_buf_slot_get_prop(p_hal ->slots, ref_frame_idx, SLOT_FRAME_PTR, &frame);
684*437bfbebSnyanmisaka 
685*437bfbebSnyanmisaka         if (fbc_en && frame) {
686*437bfbebSnyanmisaka             RK_U32 fbc_hdr_stride = mpp_frame_get_fbc_hdr_stride(frame);
687*437bfbebSnyanmisaka             RK_U32 h = MPP_ALIGN(mpp_frame_get_height(frame), 64);
688*437bfbebSnyanmisaka             RK_U32 fbd_offset = MPP_ALIGN(fbc_hdr_stride * (h + 16) / 16, SZ_4K);
689*437bfbebSnyanmisaka 
690*437bfbebSnyanmisaka             y_hor_virstride = uv_hor_virstride = fbc_hdr_stride >> 4;
691*437bfbebSnyanmisaka             y_virstride = fbd_offset;
692*437bfbebSnyanmisaka         } else {
693*437bfbebSnyanmisaka             if (frame) {
694*437bfbebSnyanmisaka                 y_hor_virstride = uv_hor_virstride = mpp_frame_get_hor_stride(frame) >> 4;
695*437bfbebSnyanmisaka                 y_virstride = y_hor_virstride * mpp_frame_get_ver_stride(frame);
696*437bfbebSnyanmisaka             } else {
697*437bfbebSnyanmisaka                 y_hor_virstride = uv_hor_virstride = (vp9_hor_align((ref_frame_width_y * bit_depth) >> 3) >> 4);
698*437bfbebSnyanmisaka                 y_virstride = y_hor_virstride * vp9_ver_align(ref_frame_height_y);
699*437bfbebSnyanmisaka             }
700*437bfbebSnyanmisaka         }
701*437bfbebSnyanmisaka 
702*437bfbebSnyanmisaka         if (pic_param->ref_frame_map[ref_idx].Index7Bits < 0x7f) {
703*437bfbebSnyanmisaka             mpp_buf_slot_get_prop(p_hal ->slots, pic_param->ref_frame_map[ref_idx].Index7Bits, SLOT_BUFFER, &framebuf);
704*437bfbebSnyanmisaka         }
705*437bfbebSnyanmisaka 
706*437bfbebSnyanmisaka         if (pic_param->ref_frame_map[ref_idx].Index7Bits < 0x7f) {
707*437bfbebSnyanmisaka             switch (i) {
708*437bfbebSnyanmisaka             case 0: {
709*437bfbebSnyanmisaka                 vp9_hw_regs->vp9d_param.reg106.framewidth_last = ref_frame_width_y;
710*437bfbebSnyanmisaka                 vp9_hw_regs->vp9d_param.reg107.frameheight_last = ref_frame_height_y;
711*437bfbebSnyanmisaka                 vp9_hw_regs->vp9d_param.reg79.lastfy_hor_virstride = y_hor_virstride;
712*437bfbebSnyanmisaka                 vp9_hw_regs->vp9d_param.reg80.lastfuv_hor_virstride = uv_hor_virstride;
713*437bfbebSnyanmisaka                 vp9_hw_regs->vp9d_param.reg85.lastfy_virstride = y_virstride;
714*437bfbebSnyanmisaka             } break;
715*437bfbebSnyanmisaka             case 1: {
716*437bfbebSnyanmisaka                 vp9_hw_regs->vp9d_param.reg108.framewidth_golden = ref_frame_width_y;
717*437bfbebSnyanmisaka                 vp9_hw_regs->vp9d_param.reg109.frameheight_golden = ref_frame_height_y;
718*437bfbebSnyanmisaka                 vp9_hw_regs->vp9d_param.reg81.goldenfy_hor_virstride = y_hor_virstride;
719*437bfbebSnyanmisaka                 vp9_hw_regs->vp9d_param.reg82.goldenfuv_hor_virstride = uv_hor_virstride;
720*437bfbebSnyanmisaka                 vp9_hw_regs->vp9d_param.reg86.goldeny_virstride = y_virstride;
721*437bfbebSnyanmisaka             } break;
722*437bfbebSnyanmisaka             case 2: {
723*437bfbebSnyanmisaka                 vp9_hw_regs->vp9d_param.reg110.framewidth_alfter = ref_frame_width_y;
724*437bfbebSnyanmisaka                 vp9_hw_regs->vp9d_param.reg111.frameheight_alfter = ref_frame_height_y;
725*437bfbebSnyanmisaka                 vp9_hw_regs->vp9d_param.reg83.altreffy_hor_virstride = y_hor_virstride;
726*437bfbebSnyanmisaka                 vp9_hw_regs->vp9d_param.reg84.altreffuv_hor_virstride = uv_hor_virstride;
727*437bfbebSnyanmisaka                 vp9_hw_regs->vp9d_param.reg87.altrefy_virstride = y_virstride;
728*437bfbebSnyanmisaka             } break;
729*437bfbebSnyanmisaka             default:
730*437bfbebSnyanmisaka                 break;
731*437bfbebSnyanmisaka             }
732*437bfbebSnyanmisaka 
733*437bfbebSnyanmisaka             /*0 map to 11*/
734*437bfbebSnyanmisaka             /*1 map to 12*/
735*437bfbebSnyanmisaka             /*2 map to 13*/
736*437bfbebSnyanmisaka             if (framebuf != NULL) {
737*437bfbebSnyanmisaka                 reg_ref_base[i] = mpp_buffer_get_fd(framebuf);
738*437bfbebSnyanmisaka             } else {
739*437bfbebSnyanmisaka                 mpp_log("ref buff address is no valid used out as base slot index 0x%x", pic_param->ref_frame_map[ref_idx].Index7Bits);
740*437bfbebSnyanmisaka                 reg_ref_base[i] = vp9_hw_regs->common_addr.reg130_decout_base;
741*437bfbebSnyanmisaka             }
742*437bfbebSnyanmisaka             mv_buf = hal_bufs_get_buf(hw_ctx->cmv_bufs, pic_param->ref_frame_map[ref_idx].Index7Bits);
743*437bfbebSnyanmisaka             vp9_hw_regs->vp9d_addr.reg181_196_ref_colmv_base[i] = mpp_buffer_get_fd(mv_buf->buf[0]);
744*437bfbebSnyanmisaka         } else {
745*437bfbebSnyanmisaka             reg_ref_base[i] = vp9_hw_regs->common_addr.reg130_decout_base;
746*437bfbebSnyanmisaka             vp9_hw_regs->vp9d_addr.reg181_196_ref_colmv_base[i] = vp9_hw_regs->common_addr.reg131_colmv_cur_base;
747*437bfbebSnyanmisaka         }
748*437bfbebSnyanmisaka     }
749*437bfbebSnyanmisaka 
750*437bfbebSnyanmisaka     for (i = 0; i < 8; i++) {
751*437bfbebSnyanmisaka         vp9_hw_regs->vp9d_param.reg67_74[i].segid_frame_qp_delta_en         = (hw_ctx->ls_info.feature_mask[i]) & 0x1;
752*437bfbebSnyanmisaka         vp9_hw_regs->vp9d_param.reg67_74[i].segid_frame_qp_delta            = hw_ctx->ls_info.feature_data[i][0];
753*437bfbebSnyanmisaka         vp9_hw_regs->vp9d_param.reg67_74[i].segid_frame_loopfitler_value_en = (hw_ctx->ls_info.feature_mask[i] >> 1) & 0x1;
754*437bfbebSnyanmisaka         vp9_hw_regs->vp9d_param.reg67_74[i].segid_frame_loopfilter_value    = hw_ctx->ls_info.feature_data[i][1];
755*437bfbebSnyanmisaka         vp9_hw_regs->vp9d_param.reg67_74[i].segid_referinfo_en              = (hw_ctx->ls_info.feature_mask[i] >> 2) & 0x1;
756*437bfbebSnyanmisaka         vp9_hw_regs->vp9d_param.reg67_74[i].segid_referinfo                 = hw_ctx->ls_info.feature_data[i][2];
757*437bfbebSnyanmisaka         vp9_hw_regs->vp9d_param.reg67_74[i].segid_frame_skip_en             = (hw_ctx->ls_info.feature_mask[i] >> 3) & 0x1;
758*437bfbebSnyanmisaka     }
759*437bfbebSnyanmisaka 
760*437bfbebSnyanmisaka     vp9_hw_regs->vp9d_param.reg67_74[0].segid_abs_delta = hw_ctx->ls_info.abs_delta_last;
761*437bfbebSnyanmisaka     vp9_hw_regs->vp9d_param.reg76.tx_mode               = pic_param->txmode;
762*437bfbebSnyanmisaka     vp9_hw_regs->vp9d_param.reg76.frame_reference_mode  = pic_param->refmode;
763*437bfbebSnyanmisaka     vp9_hw_regs->vp9d_param.reg94.ref_deltas_lastframe  = 0;
764*437bfbebSnyanmisaka 
765*437bfbebSnyanmisaka     if (!intraFlag) {
766*437bfbebSnyanmisaka         for (i = 0; i < 4; i++)
767*437bfbebSnyanmisaka             vp9_hw_regs->vp9d_param.reg94.ref_deltas_lastframe   |= (hw_ctx->ls_info.last_ref_deltas[i] & 0x7f) << (7 * i);
768*437bfbebSnyanmisaka 
769*437bfbebSnyanmisaka         for (i = 0; i < 2; i++)
770*437bfbebSnyanmisaka             vp9_hw_regs->vp9d_param.reg75.mode_deltas_lastframe  |= (hw_ctx->ls_info.last_mode_deltas[i] & 0x7f) << (7 * i);
771*437bfbebSnyanmisaka     } else {
772*437bfbebSnyanmisaka         hw_ctx->ls_info.segmentation_enable_flag_last = 0;
773*437bfbebSnyanmisaka         hw_ctx->ls_info.last_intra_only = 1;
774*437bfbebSnyanmisaka     }
775*437bfbebSnyanmisaka 
776*437bfbebSnyanmisaka     vp9_hw_regs->vp9d_param.reg75.segmentation_enable_lstframe     = hw_ctx->ls_info.segmentation_enable_flag_last;
777*437bfbebSnyanmisaka     vp9_hw_regs->vp9d_param.reg75.last_show_frame                  = hw_ctx->ls_info.last_show_frame;
778*437bfbebSnyanmisaka     vp9_hw_regs->vp9d_param.reg75.last_intra_only                  = hw_ctx->ls_info.last_intra_only;
779*437bfbebSnyanmisaka     vp9_hw_regs->vp9d_param.reg75.last_widthheight_eqcur           = (pic_param->width == hw_ctx->ls_info.last_width) && (pic_param->height == hw_ctx->ls_info.last_height);
780*437bfbebSnyanmisaka     vp9_hw_regs->vp9d_param.reg78.lasttile_size                    = stream_len - pic_param->first_partition_size;
781*437bfbebSnyanmisaka 
782*437bfbebSnyanmisaka 
783*437bfbebSnyanmisaka     if (!intraFlag) {
784*437bfbebSnyanmisaka         vp9_hw_regs->vp9d_param.reg88.lref_hor_scale = pic_param->mvscale[0][0];
785*437bfbebSnyanmisaka         vp9_hw_regs->vp9d_param.reg89.lref_ver_scale = pic_param->mvscale[0][1];
786*437bfbebSnyanmisaka         vp9_hw_regs->vp9d_param.reg90.gref_hor_scale = pic_param->mvscale[1][0];
787*437bfbebSnyanmisaka         vp9_hw_regs->vp9d_param.reg91.gref_ver_scale = pic_param->mvscale[1][1];
788*437bfbebSnyanmisaka         vp9_hw_regs->vp9d_param.reg92.aref_hor_scale = pic_param->mvscale[2][0];
789*437bfbebSnyanmisaka         vp9_hw_regs->vp9d_param.reg93.aref_ver_scale = pic_param->mvscale[2][1];
790*437bfbebSnyanmisaka     }
791*437bfbebSnyanmisaka 
792*437bfbebSnyanmisaka     vp9_hw_regs->common.reg010.dec_e            = 1;
793*437bfbebSnyanmisaka     vp9_hw_regs->common.reg011.dec_timeout_e    = 1;
794*437bfbebSnyanmisaka     vp9_hw_regs->common.reg011.buf_empty_en     = 1;
795*437bfbebSnyanmisaka     vp9_hw_regs->common.reg011.dec_clkgate_e    = 1;
796*437bfbebSnyanmisaka     vp9_hw_regs->common.reg011.dec_e_strmd_clkgate_dis = 0;
797*437bfbebSnyanmisaka 
798*437bfbebSnyanmisaka     vp9_hw_regs->common.reg012.wait_reset_en    = 1;
799*437bfbebSnyanmisaka     vp9_hw_regs->common.reg013.timeout_mode     = 1;
800*437bfbebSnyanmisaka 
801*437bfbebSnyanmisaka     vp9_hw_regs->common.reg026.swreg_block_gating_e =
802*437bfbebSnyanmisaka         (mpp_get_soc_type() == ROCKCHIP_SOC_RK3588) ? 0xfffef : 0xfffff;
803*437bfbebSnyanmisaka     vp9_hw_regs->common.reg026.reg_cfg_gating_en = 1;
804*437bfbebSnyanmisaka     vp9_hw_regs->common.reg032_timeout_threshold = 0x3ffff;
805*437bfbebSnyanmisaka 
806*437bfbebSnyanmisaka     //last info  update
807*437bfbebSnyanmisaka     hw_ctx->ls_info.abs_delta_last = pic_param->stVP9Segments.abs_delta;
808*437bfbebSnyanmisaka     for (i = 0 ; i < 4; i ++) {
809*437bfbebSnyanmisaka         hw_ctx->ls_info.last_ref_deltas[i] = pic_param->ref_deltas[i];
810*437bfbebSnyanmisaka     }
811*437bfbebSnyanmisaka 
812*437bfbebSnyanmisaka     for (i = 0 ; i < 2; i ++) {
813*437bfbebSnyanmisaka         hw_ctx->ls_info.last_mode_deltas[i] = pic_param->mode_deltas[i];
814*437bfbebSnyanmisaka     }
815*437bfbebSnyanmisaka 
816*437bfbebSnyanmisaka     for (i = 0; i < 8; i++) {
817*437bfbebSnyanmisaka         hw_ctx->ls_info.feature_data[i][0] = pic_param->stVP9Segments.feature_data[i][0];
818*437bfbebSnyanmisaka         hw_ctx->ls_info.feature_data[i][1] = pic_param->stVP9Segments.feature_data[i][1];
819*437bfbebSnyanmisaka         hw_ctx->ls_info.feature_data[i][2] = pic_param->stVP9Segments.feature_data[i][2];
820*437bfbebSnyanmisaka         hw_ctx->ls_info.feature_data[i][3] = pic_param->stVP9Segments.feature_data[i][3];
821*437bfbebSnyanmisaka         hw_ctx->ls_info.feature_mask[i]  = pic_param->stVP9Segments.feature_mask[i];
822*437bfbebSnyanmisaka     }
823*437bfbebSnyanmisaka     if (!hw_ctx->ls_info.segmentation_enable_flag_last)
824*437bfbebSnyanmisaka         hw_ctx->ls_info.segmentation_enable_flag_last = pic_param->stVP9Segments.enabled;
825*437bfbebSnyanmisaka 
826*437bfbebSnyanmisaka     hw_ctx->ls_info.last_show_frame = pic_param->show_frame;
827*437bfbebSnyanmisaka     hw_ctx->ls_info.last_width = pic_param->width;
828*437bfbebSnyanmisaka     hw_ctx->ls_info.last_height = pic_param->height;
829*437bfbebSnyanmisaka     hw_ctx->ls_info.last_intra_only = (!pic_param->frame_type || pic_param->intra_only);
830*437bfbebSnyanmisaka     hal_vp9d_dbg_par("stVP9Segments.enabled %d show_frame %d  width %d  height %d last_intra_only %d",
831*437bfbebSnyanmisaka                      pic_param->stVP9Segments.enabled, pic_param->show_frame,
832*437bfbebSnyanmisaka                      pic_param->width, pic_param->height,
833*437bfbebSnyanmisaka                      hw_ctx->ls_info.last_intra_only);
834*437bfbebSnyanmisaka 
835*437bfbebSnyanmisaka     hal_vp9d_rcb_info_update(hal, vp9_hw_regs, pic_param);
836*437bfbebSnyanmisaka     {
837*437bfbebSnyanmisaka         MppBuffer rcb_buf = NULL;
838*437bfbebSnyanmisaka 
839*437bfbebSnyanmisaka         rcb_buf = p_hal->fast_mode ? hw_ctx->g_buf[task->dec.reg_index].rcb_buf : hw_ctx->rcb_buf;
840*437bfbebSnyanmisaka         vdpu34x_setup_rcb(&vp9_hw_regs->common_addr, p_hal->dev, rcb_buf, hw_ctx->rcb_info);
841*437bfbebSnyanmisaka     }
842*437bfbebSnyanmisaka     vdpu34x_setup_statistic(&vp9_hw_regs->common, &vp9_hw_regs->statistic);
843*437bfbebSnyanmisaka 
844*437bfbebSnyanmisaka     // whether need update counts
845*437bfbebSnyanmisaka     if (pic_param->refresh_frame_context && !pic_param->parallelmode) {
846*437bfbebSnyanmisaka         task->dec.flags.wait_done = 1;
847*437bfbebSnyanmisaka     }
848*437bfbebSnyanmisaka 
849*437bfbebSnyanmisaka     return MPP_OK;
850*437bfbebSnyanmisaka }
851*437bfbebSnyanmisaka 
hal_vp9d_vdpu34x_start(void * hal,HalTaskInfo * task)852*437bfbebSnyanmisaka static MPP_RET hal_vp9d_vdpu34x_start(void *hal, HalTaskInfo *task)
853*437bfbebSnyanmisaka {
854*437bfbebSnyanmisaka     MPP_RET ret = MPP_OK;
855*437bfbebSnyanmisaka     HalVp9dCtx *p_hal = (HalVp9dCtx*)hal;
856*437bfbebSnyanmisaka     Vdpu34xVp9dCtx *hw_ctx = (Vdpu34xVp9dCtx*)p_hal->hw_ctx;
857*437bfbebSnyanmisaka     Vdpu34xVp9dRegSet *hw_regs = (Vdpu34xVp9dRegSet *)hw_ctx->hw_regs;
858*437bfbebSnyanmisaka     MppDev dev = p_hal->dev;
859*437bfbebSnyanmisaka 
860*437bfbebSnyanmisaka     if (p_hal->fast_mode) {
861*437bfbebSnyanmisaka         RK_S32 index =  task->dec.reg_index;
862*437bfbebSnyanmisaka         hw_regs = (Vdpu34xVp9dRegSet *)hw_ctx->g_buf[index].hw_regs;
863*437bfbebSnyanmisaka     }
864*437bfbebSnyanmisaka 
865*437bfbebSnyanmisaka     mpp_assert(hw_regs);
866*437bfbebSnyanmisaka 
867*437bfbebSnyanmisaka 
868*437bfbebSnyanmisaka #if VP9_DUMP
869*437bfbebSnyanmisaka     {
870*437bfbebSnyanmisaka         static RK_U32 file_cnt = 0;
871*437bfbebSnyanmisaka         char file_name[128];
872*437bfbebSnyanmisaka         sprintf(file_name, "/data/vp9_regs/reg_%d.txt", file_cnt);
873*437bfbebSnyanmisaka         FILE *fp = fopen(file_name, "wb");
874*437bfbebSnyanmisaka         RK_U32 i = 0;
875*437bfbebSnyanmisaka         RK_U32 *tmp = NULL;
876*437bfbebSnyanmisaka         tmp = (RK_U32 *)&hw_regs->common;
877*437bfbebSnyanmisaka         for (i = 0; i < sizeof(hw_regs->common) / 4; i++) {
878*437bfbebSnyanmisaka             fprintf(fp, "reg[%d] 0x%08x\n", i + 8, tmp[i]);
879*437bfbebSnyanmisaka         }
880*437bfbebSnyanmisaka         fprintf(fp, "\n");
881*437bfbebSnyanmisaka         tmp = (RK_U32 *)&hw_regs->vp9d_param;
882*437bfbebSnyanmisaka         for (i = 0; i < sizeof(hw_regs->vp9d_param) / 4; i++) {
883*437bfbebSnyanmisaka             fprintf(fp, "reg[%d] 0x%08x\n", i + 64, tmp[i]);
884*437bfbebSnyanmisaka         }
885*437bfbebSnyanmisaka         fprintf(fp, "\n");
886*437bfbebSnyanmisaka         tmp = (RK_U32 *)&hw_regs->common_addr;
887*437bfbebSnyanmisaka         for (i = 0; i < sizeof(hw_regs->common_addr) / 4; i++) {
888*437bfbebSnyanmisaka             fprintf(fp, "reg[%d] 0x%08x\n", i + 128, tmp[i]);
889*437bfbebSnyanmisaka         }
890*437bfbebSnyanmisaka         fprintf(fp, "\n");
891*437bfbebSnyanmisaka         tmp = (RK_U32 *)&hw_regs->vp9d_addr;
892*437bfbebSnyanmisaka         for (i = 0; i < sizeof(hw_regs->vp9d_addr) / 4; i++) {
893*437bfbebSnyanmisaka             fprintf(fp, "reg[%d] 0x%08x\n", i + 160, tmp[i]);
894*437bfbebSnyanmisaka         }
895*437bfbebSnyanmisaka         file_cnt++;
896*437bfbebSnyanmisaka         fflush(fp);
897*437bfbebSnyanmisaka         fclose(fp);
898*437bfbebSnyanmisaka     }
899*437bfbebSnyanmisaka #endif
900*437bfbebSnyanmisaka 
901*437bfbebSnyanmisaka     do {
902*437bfbebSnyanmisaka         MppDevRegWrCfg wr_cfg;
903*437bfbebSnyanmisaka         MppDevRegRdCfg rd_cfg;
904*437bfbebSnyanmisaka 
905*437bfbebSnyanmisaka         wr_cfg.reg = &hw_regs->common;
906*437bfbebSnyanmisaka         wr_cfg.size = sizeof(hw_regs->common);
907*437bfbebSnyanmisaka         wr_cfg.offset = OFFSET_COMMON_REGS;
908*437bfbebSnyanmisaka 
909*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &wr_cfg);
910*437bfbebSnyanmisaka         if (ret) {
911*437bfbebSnyanmisaka             mpp_err_f("set register write failed %d\n", ret);
912*437bfbebSnyanmisaka             break;
913*437bfbebSnyanmisaka         }
914*437bfbebSnyanmisaka 
915*437bfbebSnyanmisaka         wr_cfg.reg = &hw_regs->vp9d_param;
916*437bfbebSnyanmisaka         wr_cfg.size = sizeof(hw_regs->vp9d_param);
917*437bfbebSnyanmisaka         wr_cfg.offset = OFFSET_CODEC_PARAMS_REGS;
918*437bfbebSnyanmisaka 
919*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &wr_cfg);
920*437bfbebSnyanmisaka         if (ret) {
921*437bfbebSnyanmisaka             mpp_err_f("set register write failed %d\n", ret);
922*437bfbebSnyanmisaka             break;
923*437bfbebSnyanmisaka         }
924*437bfbebSnyanmisaka 
925*437bfbebSnyanmisaka         wr_cfg.reg = &hw_regs->common_addr;
926*437bfbebSnyanmisaka         wr_cfg.size = sizeof(hw_regs->common_addr);
927*437bfbebSnyanmisaka         wr_cfg.offset = OFFSET_COMMON_ADDR_REGS;
928*437bfbebSnyanmisaka 
929*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &wr_cfg);
930*437bfbebSnyanmisaka         if (ret) {
931*437bfbebSnyanmisaka             mpp_err_f("set register write failed %d\n", ret);
932*437bfbebSnyanmisaka             break;
933*437bfbebSnyanmisaka         }
934*437bfbebSnyanmisaka 
935*437bfbebSnyanmisaka         wr_cfg.reg = &hw_regs->vp9d_addr;
936*437bfbebSnyanmisaka         wr_cfg.size = sizeof(hw_regs->vp9d_addr);
937*437bfbebSnyanmisaka         wr_cfg.offset = OFFSET_CODEC_ADDR_REGS;
938*437bfbebSnyanmisaka 
939*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &wr_cfg);
940*437bfbebSnyanmisaka         if (ret) {
941*437bfbebSnyanmisaka             mpp_err_f("set register write failed %d\n", ret);
942*437bfbebSnyanmisaka             break;
943*437bfbebSnyanmisaka         }
944*437bfbebSnyanmisaka 
945*437bfbebSnyanmisaka         wr_cfg.reg = &hw_regs->statistic;
946*437bfbebSnyanmisaka         wr_cfg.size = sizeof(hw_regs->statistic);
947*437bfbebSnyanmisaka         wr_cfg.offset = OFFSET_STATISTIC_REGS;
948*437bfbebSnyanmisaka 
949*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &wr_cfg);
950*437bfbebSnyanmisaka         if (ret) {
951*437bfbebSnyanmisaka             mpp_err_f("set register write failed %d\n", ret);
952*437bfbebSnyanmisaka             break;
953*437bfbebSnyanmisaka         }
954*437bfbebSnyanmisaka 
955*437bfbebSnyanmisaka         rd_cfg.reg = &hw_regs->irq_status;
956*437bfbebSnyanmisaka         rd_cfg.size = sizeof(hw_regs->irq_status);
957*437bfbebSnyanmisaka         rd_cfg.offset = OFFSET_INTERRUPT_REGS;
958*437bfbebSnyanmisaka 
959*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(dev, MPP_DEV_REG_RD, &rd_cfg);
960*437bfbebSnyanmisaka         if (ret) {
961*437bfbebSnyanmisaka             mpp_err_f("set register read failed %d\n", ret);
962*437bfbebSnyanmisaka             break;
963*437bfbebSnyanmisaka         }
964*437bfbebSnyanmisaka 
965*437bfbebSnyanmisaka         /* rcb info for sram */
966*437bfbebSnyanmisaka         vdpu34x_set_rcbinfo(dev, hw_ctx->rcb_info);
967*437bfbebSnyanmisaka 
968*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(dev, MPP_DEV_CMD_SEND, NULL);
969*437bfbebSnyanmisaka         if (ret) {
970*437bfbebSnyanmisaka             mpp_err_f("send cmd failed %d\n", ret);
971*437bfbebSnyanmisaka             break;
972*437bfbebSnyanmisaka         }
973*437bfbebSnyanmisaka     } while (0);
974*437bfbebSnyanmisaka 
975*437bfbebSnyanmisaka     (void)task;
976*437bfbebSnyanmisaka     return ret;
977*437bfbebSnyanmisaka }
978*437bfbebSnyanmisaka 
hal_vp9d_vdpu34x_wait(void * hal,HalTaskInfo * task)979*437bfbebSnyanmisaka static MPP_RET hal_vp9d_vdpu34x_wait(void *hal, HalTaskInfo *task)
980*437bfbebSnyanmisaka {
981*437bfbebSnyanmisaka     MPP_RET ret = MPP_OK;
982*437bfbebSnyanmisaka     HalVp9dCtx *p_hal = (HalVp9dCtx*)hal;
983*437bfbebSnyanmisaka     Vdpu34xVp9dCtx *hw_ctx = (Vdpu34xVp9dCtx*)p_hal->hw_ctx;
984*437bfbebSnyanmisaka     Vdpu34xVp9dRegSet *hw_regs = (Vdpu34xVp9dRegSet *)hw_ctx->hw_regs;
985*437bfbebSnyanmisaka 
986*437bfbebSnyanmisaka     if (p_hal->fast_mode)
987*437bfbebSnyanmisaka         hw_regs = (Vdpu34xVp9dRegSet *)hw_ctx->g_buf[task->dec.reg_index].hw_regs;
988*437bfbebSnyanmisaka 
989*437bfbebSnyanmisaka     mpp_assert(hw_regs);
990*437bfbebSnyanmisaka 
991*437bfbebSnyanmisaka     ret = mpp_dev_ioctl(p_hal->dev, MPP_DEV_CMD_POLL, NULL);
992*437bfbebSnyanmisaka     if (ret)
993*437bfbebSnyanmisaka         mpp_err_f("poll cmd failed %d\n", ret);
994*437bfbebSnyanmisaka 
995*437bfbebSnyanmisaka     if (hal_vp9d_debug & HAL_VP9D_DBG_REG) {
996*437bfbebSnyanmisaka         RK_U32 *p = (RK_U32 *)hw_regs;
997*437bfbebSnyanmisaka         RK_U32 i = 0;
998*437bfbebSnyanmisaka 
999*437bfbebSnyanmisaka         for (i = 0; i < sizeof(Vdpu34xVp9dRegSet) / 4; i++)
1000*437bfbebSnyanmisaka             mpp_log("get regs[%02d]: %08X\n", i, *p++);
1001*437bfbebSnyanmisaka     }
1002*437bfbebSnyanmisaka 
1003*437bfbebSnyanmisaka     if (task->dec.flags.parse_err ||
1004*437bfbebSnyanmisaka         task->dec.flags.ref_err ||
1005*437bfbebSnyanmisaka         !hw_regs->irq_status.reg224.dec_rdy_sta) {
1006*437bfbebSnyanmisaka         MppFrame mframe = NULL;
1007*437bfbebSnyanmisaka         mpp_buf_slot_get_prop(p_hal->slots, task->dec.output, SLOT_FRAME_PTR, &mframe);
1008*437bfbebSnyanmisaka         mpp_frame_set_errinfo(mframe, 1);
1009*437bfbebSnyanmisaka     }
1010*437bfbebSnyanmisaka #if !HW_PROB
1011*437bfbebSnyanmisaka     if (p_hal->dec_cb && task->dec.flags.wait_done) {
1012*437bfbebSnyanmisaka         DXVA_PicParams_VP9 *pic_param = (DXVA_PicParams_VP9*)task->dec.syntax.data;
1013*437bfbebSnyanmisaka 
1014*437bfbebSnyanmisaka         mpp_buffer_sync_end(hw_ctx->count_base);
1015*437bfbebSnyanmisaka         hal_vp9d_update_counts(mpp_buffer_get_ptr(hw_ctx->count_base), task->dec.syntax.data);
1016*437bfbebSnyanmisaka         mpp_callback(p_hal->dec_cb, &pic_param->counts);
1017*437bfbebSnyanmisaka     }
1018*437bfbebSnyanmisaka #endif
1019*437bfbebSnyanmisaka     if (p_hal->fast_mode) {
1020*437bfbebSnyanmisaka         hw_ctx->g_buf[task->dec.reg_index].use_flag = 0;
1021*437bfbebSnyanmisaka     }
1022*437bfbebSnyanmisaka 
1023*437bfbebSnyanmisaka     (void)task;
1024*437bfbebSnyanmisaka     return ret;
1025*437bfbebSnyanmisaka }
1026*437bfbebSnyanmisaka 
hal_vp9d_vdpu34x_reset(void * hal)1027*437bfbebSnyanmisaka static MPP_RET hal_vp9d_vdpu34x_reset(void *hal)
1028*437bfbebSnyanmisaka {
1029*437bfbebSnyanmisaka     HalVp9dCtx *p_hal = (HalVp9dCtx*)hal;
1030*437bfbebSnyanmisaka     Vdpu34xVp9dCtx *hw_ctx = (Vdpu34xVp9dCtx*)p_hal->hw_ctx;
1031*437bfbebSnyanmisaka 
1032*437bfbebSnyanmisaka     hal_vp9d_enter();
1033*437bfbebSnyanmisaka 
1034*437bfbebSnyanmisaka     memset(&hw_ctx->ls_info, 0, sizeof(hw_ctx->ls_info));
1035*437bfbebSnyanmisaka     hw_ctx->mv_base_addr = -1;
1036*437bfbebSnyanmisaka     hw_ctx->pre_mv_base_addr = -1;
1037*437bfbebSnyanmisaka     hw_ctx->last_segid_flag = 1;
1038*437bfbebSnyanmisaka     memset(&hw_ctx->prob_ref_poc, 0, sizeof(hw_ctx->prob_ref_poc));
1039*437bfbebSnyanmisaka     hw_ctx->col_ref_poc = 0;
1040*437bfbebSnyanmisaka     hw_ctx->segid_ref_poc = 0;
1041*437bfbebSnyanmisaka 
1042*437bfbebSnyanmisaka     hal_vp9d_leave();
1043*437bfbebSnyanmisaka 
1044*437bfbebSnyanmisaka     return MPP_OK;
1045*437bfbebSnyanmisaka }
1046*437bfbebSnyanmisaka 
hal_vp9d_vdpu34x_flush(void * hal)1047*437bfbebSnyanmisaka static MPP_RET hal_vp9d_vdpu34x_flush(void *hal)
1048*437bfbebSnyanmisaka {
1049*437bfbebSnyanmisaka     HalVp9dCtx *p_hal = (HalVp9dCtx*)hal;
1050*437bfbebSnyanmisaka     Vdpu34xVp9dCtx *hw_ctx = (Vdpu34xVp9dCtx*)p_hal->hw_ctx;
1051*437bfbebSnyanmisaka 
1052*437bfbebSnyanmisaka     hal_vp9d_enter();
1053*437bfbebSnyanmisaka 
1054*437bfbebSnyanmisaka     hw_ctx->mv_base_addr = -1;
1055*437bfbebSnyanmisaka     hw_ctx->pre_mv_base_addr = -1;
1056*437bfbebSnyanmisaka 
1057*437bfbebSnyanmisaka     hal_vp9d_leave();
1058*437bfbebSnyanmisaka 
1059*437bfbebSnyanmisaka     return MPP_OK;
1060*437bfbebSnyanmisaka }
1061*437bfbebSnyanmisaka 
hal_vp9d_vdpu34x_control(void * hal,MpiCmd cmd_type,void * param)1062*437bfbebSnyanmisaka static MPP_RET hal_vp9d_vdpu34x_control(void *hal, MpiCmd cmd_type, void *param)
1063*437bfbebSnyanmisaka {
1064*437bfbebSnyanmisaka     HalVp9dCtx *p_hal = (HalVp9dCtx*)hal;
1065*437bfbebSnyanmisaka 
1066*437bfbebSnyanmisaka     switch ((MpiCmd)cmd_type) {
1067*437bfbebSnyanmisaka     case MPP_DEC_SET_FRAME_INFO : {
1068*437bfbebSnyanmisaka         MppFrameFormat fmt = mpp_frame_get_fmt((MppFrame)param);
1069*437bfbebSnyanmisaka 
1070*437bfbebSnyanmisaka         if (MPP_FRAME_FMT_IS_FBC(fmt)) {
1071*437bfbebSnyanmisaka             vdpu34x_afbc_align_calc(p_hal->slots, (MppFrame)param, 0);
1072*437bfbebSnyanmisaka         } else {
1073*437bfbebSnyanmisaka             mpp_slots_set_prop(p_hal->slots, SLOTS_HOR_ALIGN, vp9_hor_align);
1074*437bfbebSnyanmisaka         }
1075*437bfbebSnyanmisaka     } break;
1076*437bfbebSnyanmisaka     default : {
1077*437bfbebSnyanmisaka     } break;
1078*437bfbebSnyanmisaka     }
1079*437bfbebSnyanmisaka 
1080*437bfbebSnyanmisaka     return MPP_OK;
1081*437bfbebSnyanmisaka }
1082*437bfbebSnyanmisaka 
1083*437bfbebSnyanmisaka const MppHalApi hal_vp9d_vdpu34x = {
1084*437bfbebSnyanmisaka     .name = "vp9d_vdpu34x",
1085*437bfbebSnyanmisaka     .type = MPP_CTX_DEC,
1086*437bfbebSnyanmisaka     .coding = MPP_VIDEO_CodingVP9,
1087*437bfbebSnyanmisaka     .ctx_size = sizeof(Vdpu34xVp9dCtx),
1088*437bfbebSnyanmisaka     .flag = 0,
1089*437bfbebSnyanmisaka     .init = hal_vp9d_vdpu34x_init,
1090*437bfbebSnyanmisaka     .deinit = hal_vp9d_vdpu34x_deinit,
1091*437bfbebSnyanmisaka     .reg_gen = hal_vp9d_vdpu34x_gen_regs,
1092*437bfbebSnyanmisaka     .start = hal_vp9d_vdpu34x_start,
1093*437bfbebSnyanmisaka     .wait = hal_vp9d_vdpu34x_wait,
1094*437bfbebSnyanmisaka     .reset = hal_vp9d_vdpu34x_reset,
1095*437bfbebSnyanmisaka     .flush = hal_vp9d_vdpu34x_flush,
1096*437bfbebSnyanmisaka     .control = hal_vp9d_vdpu34x_control,
1097*437bfbebSnyanmisaka };
1098