xref: /rockchip-linux_mpp/mpp/hal/rkdec/vp9d/hal_vp9d_rkv.c (revision 437bfbeb9567cca9cd9080e3f6954aa9d6a94f18)
1*437bfbebSnyanmisaka /*
2*437bfbebSnyanmisaka  * Copyright 2020 Rockchip Electronics Co. LTD
3*437bfbebSnyanmisaka  *
4*437bfbebSnyanmisaka  * Licensed under the Apache License, Version 2.0 (the "License");
5*437bfbebSnyanmisaka  * you may not use this file except in compliance with the License.
6*437bfbebSnyanmisaka  * You may obtain a copy of the License at
7*437bfbebSnyanmisaka  *
8*437bfbebSnyanmisaka  *      http://www.apache.org/licenses/LICENSE-2.0
9*437bfbebSnyanmisaka  *
10*437bfbebSnyanmisaka  * Unless required by applicable law or agreed to in writing, software
11*437bfbebSnyanmisaka  * distributed under the License is distributed on an "AS IS" BASIS,
12*437bfbebSnyanmisaka  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13*437bfbebSnyanmisaka  * See the License for the specific language governing permissions and
14*437bfbebSnyanmisaka  * limitations under the License.
15*437bfbebSnyanmisaka  */
16*437bfbebSnyanmisaka 
17*437bfbebSnyanmisaka #define MODULE_TAG "hal_vp9d_rkv"
18*437bfbebSnyanmisaka 
19*437bfbebSnyanmisaka #include <stdio.h>
20*437bfbebSnyanmisaka #include <string.h>
21*437bfbebSnyanmisaka 
22*437bfbebSnyanmisaka #include "mpp_env.h"
23*437bfbebSnyanmisaka #include "mpp_mem.h"
24*437bfbebSnyanmisaka #include "mpp_common.h"
25*437bfbebSnyanmisaka 
26*437bfbebSnyanmisaka #include "hal_vp9d_debug.h"
27*437bfbebSnyanmisaka #include "hal_vp9d_ctx.h"
28*437bfbebSnyanmisaka #include "hal_vp9d_com.h"
29*437bfbebSnyanmisaka #include "hal_vp9d_rkv.h"
30*437bfbebSnyanmisaka #include "hal_vp9d_rkv_reg.h"
31*437bfbebSnyanmisaka #include "vp9d_syntax.h"
32*437bfbebSnyanmisaka 
33*437bfbebSnyanmisaka 
34*437bfbebSnyanmisaka typedef struct Vp9dRkvCtx_t {
35*437bfbebSnyanmisaka     Vp9dRegBuf      g_buf[MAX_GEN_REG];
36*437bfbebSnyanmisaka     MppBuffer       probe_base;
37*437bfbebSnyanmisaka     MppBuffer       count_base;
38*437bfbebSnyanmisaka     MppBuffer       segid_cur_base;
39*437bfbebSnyanmisaka     MppBuffer       segid_last_base;
40*437bfbebSnyanmisaka     void*           hw_regs;
41*437bfbebSnyanmisaka     RK_S32          mv_base_addr;
42*437bfbebSnyanmisaka     RK_U32          mv_base_offset;
43*437bfbebSnyanmisaka     RK_S32          pre_mv_base_addr;
44*437bfbebSnyanmisaka     RK_U32          pre_mv_base_offset;
45*437bfbebSnyanmisaka     Vp9dLastInfo    ls_info;
46*437bfbebSnyanmisaka     /*
47*437bfbebSnyanmisaka      * swap between segid_cur_base & segid_last_base
48*437bfbebSnyanmisaka      * 0  used segid_cur_base as last
49*437bfbebSnyanmisaka      * 1  used segid_last_base as
50*437bfbebSnyanmisaka      */
51*437bfbebSnyanmisaka     RK_U32          last_segid_flag;
52*437bfbebSnyanmisaka } Vp9dRkvCtx;
53*437bfbebSnyanmisaka 
hal_vp9d_alloc_res(HalVp9dCtx * hal)54*437bfbebSnyanmisaka static MPP_RET hal_vp9d_alloc_res(HalVp9dCtx *hal)
55*437bfbebSnyanmisaka {
56*437bfbebSnyanmisaka     RK_S32 i = 0;
57*437bfbebSnyanmisaka     RK_S32 ret = 0;
58*437bfbebSnyanmisaka     HalVp9dCtx *p_hal = (HalVp9dCtx*)hal;
59*437bfbebSnyanmisaka     Vp9dRkvCtx *hw_ctx = (Vp9dRkvCtx*)p_hal->hw_ctx;
60*437bfbebSnyanmisaka 
61*437bfbebSnyanmisaka     if (p_hal->fast_mode) {
62*437bfbebSnyanmisaka         for (i = 0; i < MAX_GEN_REG; i++) {
63*437bfbebSnyanmisaka             hw_ctx->g_buf[i].hw_regs = mpp_calloc_size(void, sizeof(VP9_REGS));
64*437bfbebSnyanmisaka             ret = mpp_buffer_get(p_hal->group,
65*437bfbebSnyanmisaka                                  &hw_ctx->g_buf[i].probe_base, PROB_SIZE);
66*437bfbebSnyanmisaka             if (ret) {
67*437bfbebSnyanmisaka                 mpp_err("vp9 probe_base get buffer failed\n");
68*437bfbebSnyanmisaka                 return ret;
69*437bfbebSnyanmisaka             }
70*437bfbebSnyanmisaka             ret = mpp_buffer_get(p_hal->group,
71*437bfbebSnyanmisaka                                  &hw_ctx->g_buf[i].count_base, COUNT_SIZE);
72*437bfbebSnyanmisaka             if (ret) {
73*437bfbebSnyanmisaka                 mpp_err("vp9 count_base get buffer failed\n");
74*437bfbebSnyanmisaka                 return ret;
75*437bfbebSnyanmisaka             }
76*437bfbebSnyanmisaka             ret = mpp_buffer_get(p_hal->group,
77*437bfbebSnyanmisaka                                  &hw_ctx->g_buf[i].segid_cur_base, MAX_SEGMAP_SIZE);
78*437bfbebSnyanmisaka             if (ret) {
79*437bfbebSnyanmisaka                 mpp_err("vp9 segid_cur_base get buffer failed\n");
80*437bfbebSnyanmisaka                 return ret;
81*437bfbebSnyanmisaka             }
82*437bfbebSnyanmisaka             ret = mpp_buffer_get(p_hal->group,
83*437bfbebSnyanmisaka                                  &hw_ctx->g_buf[i].segid_last_base, MAX_SEGMAP_SIZE);
84*437bfbebSnyanmisaka             if (ret) {
85*437bfbebSnyanmisaka                 mpp_err("vp9 segid_last_base get buffer failed\n");
86*437bfbebSnyanmisaka                 return ret;
87*437bfbebSnyanmisaka             }
88*437bfbebSnyanmisaka         }
89*437bfbebSnyanmisaka     } else {
90*437bfbebSnyanmisaka         hw_ctx->hw_regs = mpp_calloc_size(void, sizeof(VP9_REGS));
91*437bfbebSnyanmisaka         ret = mpp_buffer_get(p_hal->group, &hw_ctx->probe_base, PROB_SIZE);
92*437bfbebSnyanmisaka         if (ret) {
93*437bfbebSnyanmisaka             mpp_err("vp9 probe_base get buffer failed\n");
94*437bfbebSnyanmisaka             return ret;
95*437bfbebSnyanmisaka         }
96*437bfbebSnyanmisaka         ret = mpp_buffer_get(p_hal->group, &hw_ctx->count_base, COUNT_SIZE);
97*437bfbebSnyanmisaka         if (ret) {
98*437bfbebSnyanmisaka             mpp_err("vp9 count_base get buffer failed\n");
99*437bfbebSnyanmisaka             return ret;
100*437bfbebSnyanmisaka         }
101*437bfbebSnyanmisaka         ret = mpp_buffer_get(p_hal->group, &hw_ctx->segid_cur_base, MAX_SEGMAP_SIZE);
102*437bfbebSnyanmisaka         if (ret) {
103*437bfbebSnyanmisaka             mpp_err("vp9 segid_cur_base get buffer failed\n");
104*437bfbebSnyanmisaka             return ret;
105*437bfbebSnyanmisaka         }
106*437bfbebSnyanmisaka         ret = mpp_buffer_get(p_hal->group, &hw_ctx->segid_last_base, MAX_SEGMAP_SIZE);
107*437bfbebSnyanmisaka         if (ret) {
108*437bfbebSnyanmisaka             mpp_err("vp9 segid_last_base get buffer failed\n");
109*437bfbebSnyanmisaka             return ret;
110*437bfbebSnyanmisaka         }
111*437bfbebSnyanmisaka     }
112*437bfbebSnyanmisaka     return MPP_OK;
113*437bfbebSnyanmisaka }
114*437bfbebSnyanmisaka 
hal_vp9d_release_res(HalVp9dCtx * hal)115*437bfbebSnyanmisaka static MPP_RET hal_vp9d_release_res(HalVp9dCtx *hal)
116*437bfbebSnyanmisaka {
117*437bfbebSnyanmisaka     RK_S32 i = 0;
118*437bfbebSnyanmisaka     RK_S32 ret = 0;
119*437bfbebSnyanmisaka     HalVp9dCtx *p_hal = hal;
120*437bfbebSnyanmisaka     Vp9dRkvCtx *hw_ctx = (Vp9dRkvCtx*)p_hal->hw_ctx;
121*437bfbebSnyanmisaka 
122*437bfbebSnyanmisaka     if (p_hal->fast_mode) {
123*437bfbebSnyanmisaka         for (i = 0; i < MAX_GEN_REG; i++) {
124*437bfbebSnyanmisaka             if (hw_ctx->g_buf[i].probe_base) {
125*437bfbebSnyanmisaka                 ret = mpp_buffer_put(hw_ctx->g_buf[i].probe_base);
126*437bfbebSnyanmisaka                 if (ret) {
127*437bfbebSnyanmisaka                     mpp_err("vp9 probe_base put buffer failed\n");
128*437bfbebSnyanmisaka                     return ret;
129*437bfbebSnyanmisaka                 }
130*437bfbebSnyanmisaka             }
131*437bfbebSnyanmisaka             if (hw_ctx->g_buf[i].count_base) {
132*437bfbebSnyanmisaka                 ret = mpp_buffer_put(hw_ctx->g_buf[i].count_base);
133*437bfbebSnyanmisaka                 if (ret) {
134*437bfbebSnyanmisaka                     mpp_err("vp9 count_base put buffer failed\n");
135*437bfbebSnyanmisaka                     return ret;
136*437bfbebSnyanmisaka                 }
137*437bfbebSnyanmisaka             }
138*437bfbebSnyanmisaka             if (hw_ctx->g_buf[i].segid_cur_base) {
139*437bfbebSnyanmisaka                 ret = mpp_buffer_put(hw_ctx->g_buf[i].segid_cur_base);
140*437bfbebSnyanmisaka                 if (ret) {
141*437bfbebSnyanmisaka                     mpp_err("vp9 segid_cur_base put buffer failed\n");
142*437bfbebSnyanmisaka                     return ret;
143*437bfbebSnyanmisaka                 }
144*437bfbebSnyanmisaka             }
145*437bfbebSnyanmisaka             if (hw_ctx->g_buf[i].segid_last_base) {
146*437bfbebSnyanmisaka                 ret = mpp_buffer_put(hw_ctx->g_buf[i].segid_last_base);
147*437bfbebSnyanmisaka                 if (ret) {
148*437bfbebSnyanmisaka                     mpp_err("vp9 segid_last_base put buffer failed\n");
149*437bfbebSnyanmisaka                     return ret;
150*437bfbebSnyanmisaka                 }
151*437bfbebSnyanmisaka             }
152*437bfbebSnyanmisaka             if (hw_ctx->g_buf[i].hw_regs) {
153*437bfbebSnyanmisaka                 mpp_free(hw_ctx->g_buf[i].hw_regs);
154*437bfbebSnyanmisaka                 hw_ctx->g_buf[i].hw_regs = NULL;
155*437bfbebSnyanmisaka             }
156*437bfbebSnyanmisaka         }
157*437bfbebSnyanmisaka     } else {
158*437bfbebSnyanmisaka         if (hw_ctx->probe_base) {
159*437bfbebSnyanmisaka             ret = mpp_buffer_put(hw_ctx->probe_base);
160*437bfbebSnyanmisaka             if (ret) {
161*437bfbebSnyanmisaka                 mpp_err("vp9 probe_base get buffer failed\n");
162*437bfbebSnyanmisaka                 return ret;
163*437bfbebSnyanmisaka             }
164*437bfbebSnyanmisaka         }
165*437bfbebSnyanmisaka         if (hw_ctx->count_base) {
166*437bfbebSnyanmisaka             ret = mpp_buffer_put(hw_ctx->count_base);
167*437bfbebSnyanmisaka             if (ret) {
168*437bfbebSnyanmisaka                 mpp_err("vp9 count_base put buffer failed\n");
169*437bfbebSnyanmisaka                 return ret;
170*437bfbebSnyanmisaka             }
171*437bfbebSnyanmisaka         }
172*437bfbebSnyanmisaka         if (hw_ctx->segid_cur_base) {
173*437bfbebSnyanmisaka             ret = mpp_buffer_put(hw_ctx->segid_cur_base);
174*437bfbebSnyanmisaka             if (ret) {
175*437bfbebSnyanmisaka                 mpp_err("vp9 segid_cur_base put buffer failed\n");
176*437bfbebSnyanmisaka                 return ret;
177*437bfbebSnyanmisaka             }
178*437bfbebSnyanmisaka         }
179*437bfbebSnyanmisaka         if (hw_ctx->segid_last_base) {
180*437bfbebSnyanmisaka             ret = mpp_buffer_put(hw_ctx->segid_last_base);
181*437bfbebSnyanmisaka             if (ret) {
182*437bfbebSnyanmisaka                 mpp_err("vp9 segid_last_base put buffer failed\n");
183*437bfbebSnyanmisaka                 return ret;
184*437bfbebSnyanmisaka             }
185*437bfbebSnyanmisaka         }
186*437bfbebSnyanmisaka         if (hw_ctx->hw_regs) {
187*437bfbebSnyanmisaka             mpp_free(hw_ctx->hw_regs);
188*437bfbebSnyanmisaka             hw_ctx->hw_regs = NULL;
189*437bfbebSnyanmisaka         }
190*437bfbebSnyanmisaka     }
191*437bfbebSnyanmisaka     return MPP_OK;
192*437bfbebSnyanmisaka }
193*437bfbebSnyanmisaka 
hal_vp9d_rkv_init(void * hal,MppHalCfg * cfg)194*437bfbebSnyanmisaka MPP_RET hal_vp9d_rkv_init(void *hal, MppHalCfg *cfg)
195*437bfbebSnyanmisaka {
196*437bfbebSnyanmisaka     MPP_RET ret = MPP_OK;
197*437bfbebSnyanmisaka     HalVp9dCtx *p_hal = (HalVp9dCtx *)hal;
198*437bfbebSnyanmisaka     MEM_CHECK(ret, p_hal->hw_ctx = mpp_calloc_size(void, sizeof(Vp9dRkvCtx)));
199*437bfbebSnyanmisaka     Vp9dRkvCtx *ctx = (Vp9dRkvCtx *)p_hal->hw_ctx;
200*437bfbebSnyanmisaka 
201*437bfbebSnyanmisaka     mpp_log("hal_vp9d_rkv_init in");
202*437bfbebSnyanmisaka     ctx->mv_base_addr = -1;
203*437bfbebSnyanmisaka     ctx->pre_mv_base_addr = -1;
204*437bfbebSnyanmisaka     mpp_slots_set_prop(p_hal->slots, SLOTS_HOR_ALIGN, vp9_hor_align);
205*437bfbebSnyanmisaka     mpp_slots_set_prop(p_hal->slots, SLOTS_VER_ALIGN, vp9_ver_align);
206*437bfbebSnyanmisaka 
207*437bfbebSnyanmisaka     if (p_hal->group == NULL) {
208*437bfbebSnyanmisaka         ret = mpp_buffer_group_get_internal(&p_hal->group, MPP_BUFFER_TYPE_ION);
209*437bfbebSnyanmisaka         if (ret) {
210*437bfbebSnyanmisaka             mpp_err("vp9 mpp_buffer_group_get failed\n");
211*437bfbebSnyanmisaka             return ret;
212*437bfbebSnyanmisaka         }
213*437bfbebSnyanmisaka     }
214*437bfbebSnyanmisaka 
215*437bfbebSnyanmisaka     ret = hal_vp9d_alloc_res(p_hal);
216*437bfbebSnyanmisaka     if (ret) {
217*437bfbebSnyanmisaka         mpp_err("hal_vp9d_alloc_res failed\n");
218*437bfbebSnyanmisaka         return ret;
219*437bfbebSnyanmisaka     }
220*437bfbebSnyanmisaka 
221*437bfbebSnyanmisaka     ctx->last_segid_flag = 1;
222*437bfbebSnyanmisaka 
223*437bfbebSnyanmisaka     (void) cfg;
224*437bfbebSnyanmisaka     return ret = MPP_OK;
225*437bfbebSnyanmisaka __FAILED:
226*437bfbebSnyanmisaka     return ret = MPP_NOK;
227*437bfbebSnyanmisaka }
228*437bfbebSnyanmisaka 
hal_vp9d_rkv_deinit(void * hal)229*437bfbebSnyanmisaka MPP_RET hal_vp9d_rkv_deinit(void *hal)
230*437bfbebSnyanmisaka {
231*437bfbebSnyanmisaka     MPP_RET ret = MPP_OK;
232*437bfbebSnyanmisaka     HalVp9dCtx *p_hal = (HalVp9dCtx *)hal;
233*437bfbebSnyanmisaka 
234*437bfbebSnyanmisaka     hal_vp9d_release_res(p_hal);
235*437bfbebSnyanmisaka 
236*437bfbebSnyanmisaka     if (p_hal->group) {
237*437bfbebSnyanmisaka         ret = mpp_buffer_group_put(p_hal->group);
238*437bfbebSnyanmisaka         if (ret) {
239*437bfbebSnyanmisaka             mpp_err("vp9d group free buffer failed\n");
240*437bfbebSnyanmisaka             return ret;
241*437bfbebSnyanmisaka         }
242*437bfbebSnyanmisaka     }
243*437bfbebSnyanmisaka     MPP_FREE(p_hal->hw_ctx);
244*437bfbebSnyanmisaka     return ret = MPP_OK;
245*437bfbebSnyanmisaka }
246*437bfbebSnyanmisaka 
hal_vp9d_rkv_gen_regs(void * hal,HalTaskInfo * task)247*437bfbebSnyanmisaka MPP_RET hal_vp9d_rkv_gen_regs(void *hal, HalTaskInfo *task)
248*437bfbebSnyanmisaka {
249*437bfbebSnyanmisaka     RK_S32   i;
250*437bfbebSnyanmisaka     RK_U8    bit_depth = 0;
251*437bfbebSnyanmisaka     RK_U32   ref_frame_width_y;
252*437bfbebSnyanmisaka     RK_U32   ref_frame_height_y;
253*437bfbebSnyanmisaka     RK_S32   stream_len = 0, aglin_offset = 0;
254*437bfbebSnyanmisaka     RK_U32   y_hor_virstride, uv_hor_virstride, y_virstride, uv_virstride, yuv_virstride;
255*437bfbebSnyanmisaka     RK_U8   *bitstream = NULL;
256*437bfbebSnyanmisaka     MppBuffer streambuf = NULL;
257*437bfbebSnyanmisaka     RK_U32 sw_y_hor_virstride;
258*437bfbebSnyanmisaka     RK_U32 sw_uv_hor_virstride;
259*437bfbebSnyanmisaka     RK_U32 sw_y_virstride;
260*437bfbebSnyanmisaka     RK_U32 sw_uv_virstride;
261*437bfbebSnyanmisaka     RK_U32 sw_yuv_virstride ;
262*437bfbebSnyanmisaka     RK_U8  ref_idx = 0;
263*437bfbebSnyanmisaka     RK_U8  ref_frame_idx = 0;
264*437bfbebSnyanmisaka     RK_U32 *reg_ref_base = 0;
265*437bfbebSnyanmisaka     RK_S32 intraFlag = 0;
266*437bfbebSnyanmisaka     MppBuffer framebuf = NULL;
267*437bfbebSnyanmisaka     HalVp9dCtx *p_hal = (HalVp9dCtx*)hal;
268*437bfbebSnyanmisaka     Vp9dRkvCtx *hw_ctx = (Vp9dRkvCtx*)p_hal->hw_ctx;
269*437bfbebSnyanmisaka     DXVA_PicParams_VP9 *pic_param = (DXVA_PicParams_VP9*)task->dec.syntax.data;
270*437bfbebSnyanmisaka     MppFrame mframe = NULL;
271*437bfbebSnyanmisaka 
272*437bfbebSnyanmisaka     mpp_buf_slot_get_prop(p_hal->slots, task->dec.output, SLOT_FRAME_PTR, &mframe);
273*437bfbebSnyanmisaka 
274*437bfbebSnyanmisaka     if (p_hal->fast_mode) {
275*437bfbebSnyanmisaka         for (i = 0; i < MAX_GEN_REG; i++) {
276*437bfbebSnyanmisaka             if (!hw_ctx->g_buf[i].use_flag) {
277*437bfbebSnyanmisaka                 task->dec.reg_index = i;
278*437bfbebSnyanmisaka                 hw_ctx->probe_base = hw_ctx->g_buf[i].probe_base;
279*437bfbebSnyanmisaka                 hw_ctx->count_base = hw_ctx->g_buf[i].count_base;
280*437bfbebSnyanmisaka                 hw_ctx->segid_cur_base = hw_ctx->g_buf[i].segid_cur_base;
281*437bfbebSnyanmisaka                 hw_ctx->segid_last_base = hw_ctx->g_buf[i].segid_last_base;
282*437bfbebSnyanmisaka                 hw_ctx->hw_regs = hw_ctx->g_buf[i].hw_regs;
283*437bfbebSnyanmisaka                 hw_ctx->g_buf[i].use_flag = 1;
284*437bfbebSnyanmisaka                 break;
285*437bfbebSnyanmisaka             }
286*437bfbebSnyanmisaka         }
287*437bfbebSnyanmisaka         if (i == MAX_GEN_REG) {
288*437bfbebSnyanmisaka             mpp_err("vp9 fast mode buf all used\n");
289*437bfbebSnyanmisaka             return MPP_ERR_NOMEM;
290*437bfbebSnyanmisaka         }
291*437bfbebSnyanmisaka     }
292*437bfbebSnyanmisaka     VP9_REGS *vp9_hw_regs = (VP9_REGS*)hw_ctx->hw_regs;
293*437bfbebSnyanmisaka     intraFlag = (!pic_param->frame_type || pic_param->intra_only);
294*437bfbebSnyanmisaka     hal_vp9d_output_probe(mpp_buffer_get_ptr(hw_ctx->probe_base), task->dec.syntax.data);
295*437bfbebSnyanmisaka     mpp_buffer_sync_end(hw_ctx->count_base);
296*437bfbebSnyanmisaka     stream_len = (RK_S32)mpp_packet_get_length(task->dec.input_packet);
297*437bfbebSnyanmisaka     memset(hw_ctx->hw_regs, 0, sizeof(VP9_REGS));
298*437bfbebSnyanmisaka     vp9_hw_regs->swreg2_sysctrl.sw_dec_mode = 2; //set as vp9 dec
299*437bfbebSnyanmisaka     vp9_hw_regs->swreg5_stream_len = ((stream_len + 15) & (~15)) + 0x80;
300*437bfbebSnyanmisaka 
301*437bfbebSnyanmisaka     mpp_buf_slot_get_prop(p_hal->packet_slots, task->dec.input, SLOT_BUFFER, &streambuf);
302*437bfbebSnyanmisaka     bitstream = mpp_buffer_get_ptr(streambuf);
303*437bfbebSnyanmisaka     aglin_offset = vp9_hw_regs->swreg5_stream_len - stream_len;
304*437bfbebSnyanmisaka     if (aglin_offset > 0) {
305*437bfbebSnyanmisaka         memset((void *)(bitstream + stream_len), 0, aglin_offset);
306*437bfbebSnyanmisaka     }
307*437bfbebSnyanmisaka 
308*437bfbebSnyanmisaka     //--- caculate the yuv_frame_size and mv_size
309*437bfbebSnyanmisaka     bit_depth = pic_param->BitDepthMinus8Luma + 8;
310*437bfbebSnyanmisaka 
311*437bfbebSnyanmisaka     sw_y_hor_virstride = mpp_frame_get_hor_stride(mframe) >> 4;
312*437bfbebSnyanmisaka     sw_uv_hor_virstride = mpp_frame_get_hor_stride(mframe) >> 4;
313*437bfbebSnyanmisaka     sw_y_virstride = sw_y_hor_virstride * mpp_frame_get_ver_stride(mframe);
314*437bfbebSnyanmisaka 
315*437bfbebSnyanmisaka     sw_uv_virstride = sw_uv_hor_virstride * mpp_frame_get_ver_stride(mframe) / 2;
316*437bfbebSnyanmisaka     sw_yuv_virstride = sw_y_virstride + sw_uv_virstride;
317*437bfbebSnyanmisaka 
318*437bfbebSnyanmisaka     vp9_hw_regs->swreg3_picpar.sw_y_hor_virstride = sw_y_hor_virstride;
319*437bfbebSnyanmisaka     vp9_hw_regs->swreg3_picpar.sw_uv_hor_virstride = sw_uv_hor_virstride;
320*437bfbebSnyanmisaka     vp9_hw_regs->swreg8_y_virstride.sw_y_virstride = sw_y_virstride;
321*437bfbebSnyanmisaka     vp9_hw_regs->swreg9_yuv_virstride.sw_yuv_virstride = sw_yuv_virstride;
322*437bfbebSnyanmisaka 
323*437bfbebSnyanmisaka     if (!pic_param->intra_only && pic_param->frame_type &&
324*437bfbebSnyanmisaka         !pic_param->error_resilient_mode && hw_ctx->ls_info.last_show_frame) {
325*437bfbebSnyanmisaka         hw_ctx->pre_mv_base_addr = hw_ctx->mv_base_addr;
326*437bfbebSnyanmisaka         hw_ctx->pre_mv_base_offset = hw_ctx->mv_base_offset;
327*437bfbebSnyanmisaka     }
328*437bfbebSnyanmisaka 
329*437bfbebSnyanmisaka 
330*437bfbebSnyanmisaka     mpp_buf_slot_get_prop(p_hal->slots, task->dec.output, SLOT_BUFFER, &framebuf);
331*437bfbebSnyanmisaka     vp9_hw_regs->swreg7_decout_base =  mpp_buffer_get_fd(framebuf);
332*437bfbebSnyanmisaka     vp9_hw_regs->swreg4_strm_rlc_base = mpp_buffer_get_fd(streambuf);
333*437bfbebSnyanmisaka 
334*437bfbebSnyanmisaka     vp9_hw_regs->swreg6_cabactbl_prob_base = mpp_buffer_get_fd(hw_ctx->probe_base);
335*437bfbebSnyanmisaka     vp9_hw_regs->swreg14_vp9_count_base  = mpp_buffer_get_fd(hw_ctx->count_base);
336*437bfbebSnyanmisaka 
337*437bfbebSnyanmisaka     if (hw_ctx->last_segid_flag) {
338*437bfbebSnyanmisaka         vp9_hw_regs->swreg15_vp9_segidlast_base = mpp_buffer_get_fd(hw_ctx->segid_last_base);
339*437bfbebSnyanmisaka         vp9_hw_regs->swreg16_vp9_segidcur_base = mpp_buffer_get_fd(hw_ctx->segid_cur_base);
340*437bfbebSnyanmisaka     } else {
341*437bfbebSnyanmisaka         vp9_hw_regs->swreg15_vp9_segidlast_base = mpp_buffer_get_fd(hw_ctx->segid_cur_base);
342*437bfbebSnyanmisaka         vp9_hw_regs->swreg16_vp9_segidcur_base = mpp_buffer_get_fd(hw_ctx->segid_last_base);
343*437bfbebSnyanmisaka     }
344*437bfbebSnyanmisaka 
345*437bfbebSnyanmisaka     if (pic_param->stVP9Segments.enabled && pic_param->stVP9Segments.update_map) {
346*437bfbebSnyanmisaka         hw_ctx->last_segid_flag = !hw_ctx->last_segid_flag;
347*437bfbebSnyanmisaka     }
348*437bfbebSnyanmisaka 
349*437bfbebSnyanmisaka     hw_ctx->mv_base_addr = vp9_hw_regs->swreg7_decout_base;
350*437bfbebSnyanmisaka     hw_ctx->mv_base_offset = mpp_get_ioctl_version() ? sw_yuv_virstride << 4 : sw_yuv_virstride;
351*437bfbebSnyanmisaka     if (hw_ctx->pre_mv_base_addr < 0) {
352*437bfbebSnyanmisaka         hw_ctx->pre_mv_base_addr = hw_ctx->mv_base_addr;
353*437bfbebSnyanmisaka         hw_ctx->pre_mv_base_offset = hw_ctx->mv_base_offset;
354*437bfbebSnyanmisaka     }
355*437bfbebSnyanmisaka     vp9_hw_regs->swreg52_vp9_refcolmv_base = hw_ctx->pre_mv_base_addr;
356*437bfbebSnyanmisaka     mpp_dev_set_reg_offset(p_hal->dev, 52, hw_ctx->pre_mv_base_offset);
357*437bfbebSnyanmisaka 
358*437bfbebSnyanmisaka     vp9_hw_regs->swreg10_vp9_cprheader_offset.sw_vp9_cprheader_offset = 0; //no use now.
359*437bfbebSnyanmisaka     reg_ref_base = &vp9_hw_regs->swreg11_vp9_referlast_base;
360*437bfbebSnyanmisaka     for (i = 0; i < 3; i++) {
361*437bfbebSnyanmisaka         ref_idx = pic_param->frame_refs[i].Index7Bits;
362*437bfbebSnyanmisaka         ref_frame_idx = pic_param->ref_frame_map[ref_idx].Index7Bits;
363*437bfbebSnyanmisaka         ref_frame_width_y = pic_param->ref_frame_coded_width[ref_idx];
364*437bfbebSnyanmisaka         ref_frame_height_y = pic_param->ref_frame_coded_height[ref_idx];
365*437bfbebSnyanmisaka         if (ref_frame_idx < 0x7f) {
366*437bfbebSnyanmisaka             mpp_buf_slot_get_prop(p_hal->slots, ref_frame_idx, SLOT_FRAME_PTR, &mframe);
367*437bfbebSnyanmisaka             y_hor_virstride = mpp_frame_get_hor_stride(mframe) >> 4;
368*437bfbebSnyanmisaka             uv_hor_virstride = mpp_frame_get_hor_stride(mframe) >> 4;
369*437bfbebSnyanmisaka             y_virstride = y_hor_virstride * mpp_frame_get_ver_stride(mframe);
370*437bfbebSnyanmisaka             uv_virstride = uv_hor_virstride * mpp_frame_get_ver_stride(mframe) / 2;
371*437bfbebSnyanmisaka         } else {
372*437bfbebSnyanmisaka             y_hor_virstride = (vp9_hor_align((ref_frame_width_y * bit_depth) >> 3) >> 4);
373*437bfbebSnyanmisaka             uv_hor_virstride = (vp9_hor_align((ref_frame_width_y * bit_depth) >> 3) >> 4);
374*437bfbebSnyanmisaka             y_virstride = y_hor_virstride * vp9_ver_align(ref_frame_height_y);
375*437bfbebSnyanmisaka             uv_virstride = uv_hor_virstride * vp9_ver_align(ref_frame_height_y) / 2;
376*437bfbebSnyanmisaka         }
377*437bfbebSnyanmisaka         yuv_virstride = y_virstride + uv_virstride;
378*437bfbebSnyanmisaka 
379*437bfbebSnyanmisaka         if (ref_frame_idx < 0x7f)
380*437bfbebSnyanmisaka             mpp_buf_slot_get_prop(p_hal->slots, ref_frame_idx, SLOT_BUFFER, &framebuf);
381*437bfbebSnyanmisaka 
382*437bfbebSnyanmisaka         if (ref_frame_idx < 0x7f) {
383*437bfbebSnyanmisaka             switch (i) {
384*437bfbebSnyanmisaka             case 0: {
385*437bfbebSnyanmisaka                 vp9_hw_regs->swreg17_vp9_frame_size_last.sw_framewidth_last = ref_frame_width_y;
386*437bfbebSnyanmisaka                 vp9_hw_regs->swreg17_vp9_frame_size_last.sw_frameheight_last = ref_frame_height_y;
387*437bfbebSnyanmisaka                 vp9_hw_regs->swreg37_vp9_lastf_hor_virstride.sw_vp9_lastfy_hor_virstride = y_hor_virstride;
388*437bfbebSnyanmisaka                 vp9_hw_regs->swreg37_vp9_lastf_hor_virstride.sw_vp9_lastfuv_hor_virstride = uv_hor_virstride;
389*437bfbebSnyanmisaka                 vp9_hw_regs->swreg48_vp9_last_ystride.sw_vp9_lastfy_virstride = y_virstride;
390*437bfbebSnyanmisaka                 vp9_hw_regs->swreg51_vp9_lastref_yuvstride.sw_vp9_lastref_yuv_virstride = yuv_virstride;
391*437bfbebSnyanmisaka                 break;
392*437bfbebSnyanmisaka             }
393*437bfbebSnyanmisaka             case 1: {
394*437bfbebSnyanmisaka                 vp9_hw_regs->swreg18_vp9_frame_size_golden.sw_framewidth_golden = ref_frame_width_y;
395*437bfbebSnyanmisaka                 vp9_hw_regs->swreg18_vp9_frame_size_golden.sw_frameheight_golden = ref_frame_height_y;
396*437bfbebSnyanmisaka                 vp9_hw_regs->swreg38_vp9_goldenf_hor_virstride.sw_vp9_goldenfy_hor_virstride = y_hor_virstride;
397*437bfbebSnyanmisaka                 vp9_hw_regs->swreg38_vp9_goldenf_hor_virstride.sw_vp9_goldenuv_hor_virstride = uv_hor_virstride;
398*437bfbebSnyanmisaka                 vp9_hw_regs->swreg49_vp9_golden_ystride.sw_vp9_goldeny_virstride = y_virstride;
399*437bfbebSnyanmisaka                 break;
400*437bfbebSnyanmisaka             }
401*437bfbebSnyanmisaka             case 2: {
402*437bfbebSnyanmisaka                 vp9_hw_regs->swreg19_vp9_frame_size_altref.sw_framewidth_alfter = ref_frame_width_y;
403*437bfbebSnyanmisaka                 vp9_hw_regs->swreg19_vp9_frame_size_altref.sw_frameheight_alfter = ref_frame_height_y;
404*437bfbebSnyanmisaka                 vp9_hw_regs->swreg39_vp9_altreff_hor_virstride.sw_vp9_altreffy_hor_virstride = y_hor_virstride;
405*437bfbebSnyanmisaka                 vp9_hw_regs->swreg39_vp9_altreff_hor_virstride.sw_vp9_altreffuv_hor_virstride = uv_hor_virstride;
406*437bfbebSnyanmisaka                 vp9_hw_regs->swreg50_vp9_altrefy_ystride.sw_vp9_altrefy_virstride = y_virstride;
407*437bfbebSnyanmisaka                 break;
408*437bfbebSnyanmisaka             }
409*437bfbebSnyanmisaka             default:
410*437bfbebSnyanmisaka                 break;
411*437bfbebSnyanmisaka             }
412*437bfbebSnyanmisaka 
413*437bfbebSnyanmisaka             /*0 map to 11*/
414*437bfbebSnyanmisaka             /*1 map to 12*/
415*437bfbebSnyanmisaka             /*2 map to 13*/
416*437bfbebSnyanmisaka             if (framebuf != NULL) {
417*437bfbebSnyanmisaka                 reg_ref_base[i] = mpp_buffer_get_fd(framebuf);
418*437bfbebSnyanmisaka             } else {
419*437bfbebSnyanmisaka                 mpp_log("ref buff address is no valid used out as base slot index 0x%x", ref_frame_idx);
420*437bfbebSnyanmisaka                 reg_ref_base[i] = vp9_hw_regs->swreg7_decout_base; //set
421*437bfbebSnyanmisaka             }
422*437bfbebSnyanmisaka         } else {
423*437bfbebSnyanmisaka             reg_ref_base[i] = vp9_hw_regs->swreg7_decout_base; //set
424*437bfbebSnyanmisaka         }
425*437bfbebSnyanmisaka     }
426*437bfbebSnyanmisaka 
427*437bfbebSnyanmisaka     for (i = 0; i < 8; i++) {
428*437bfbebSnyanmisaka         vp9_hw_regs->swreg20_27_vp9_segid_grp[i].sw_vp9segid_frame_qp_delta_en              = (hw_ctx->ls_info.feature_mask[i]) & 0x1;
429*437bfbebSnyanmisaka         vp9_hw_regs->swreg20_27_vp9_segid_grp[i].sw_vp9segid_frame_qp_delta                 = hw_ctx->ls_info.feature_data[i][0];
430*437bfbebSnyanmisaka         vp9_hw_regs->swreg20_27_vp9_segid_grp[i].sw_vp9segid_frame_loopfitler_value_en      = (hw_ctx->ls_info.feature_mask[i] >> 1) & 0x1;
431*437bfbebSnyanmisaka         vp9_hw_regs->swreg20_27_vp9_segid_grp[i].sw_vp9segid_frame_loopfilter_value         = hw_ctx->ls_info.feature_data[i][1];
432*437bfbebSnyanmisaka         vp9_hw_regs->swreg20_27_vp9_segid_grp[i].sw_vp9segid_referinfo_en                   = (hw_ctx->ls_info.feature_mask[i] >> 2) & 0x1;
433*437bfbebSnyanmisaka         vp9_hw_regs->swreg20_27_vp9_segid_grp[i].sw_vp9segid_referinfo                      = hw_ctx->ls_info.feature_data[i][2];
434*437bfbebSnyanmisaka         vp9_hw_regs->swreg20_27_vp9_segid_grp[i].sw_vp9segid_frame_skip_en                  = (hw_ctx->ls_info.feature_mask[i] >> 3) & 0x1;
435*437bfbebSnyanmisaka     }
436*437bfbebSnyanmisaka 
437*437bfbebSnyanmisaka 
438*437bfbebSnyanmisaka     vp9_hw_regs->swreg20_27_vp9_segid_grp[0].sw_vp9segid_abs_delta                              = hw_ctx->ls_info.abs_delta_last;
439*437bfbebSnyanmisaka 
440*437bfbebSnyanmisaka     vp9_hw_regs->swreg28_vp9_cprheader_config.sw_vp9_tx_mode                                    = pic_param->txmode;
441*437bfbebSnyanmisaka 
442*437bfbebSnyanmisaka     vp9_hw_regs->swreg28_vp9_cprheader_config.sw_vp9_frame_reference_mode                   = pic_param->refmode;
443*437bfbebSnyanmisaka 
444*437bfbebSnyanmisaka     vp9_hw_regs->swreg32_vp9_ref_deltas_lastframe.sw_vp9_ref_deltas_lastframe               = 0;
445*437bfbebSnyanmisaka 
446*437bfbebSnyanmisaka     if (!intraFlag) {
447*437bfbebSnyanmisaka         for (i = 0; i < 4; i++)
448*437bfbebSnyanmisaka             vp9_hw_regs->swreg32_vp9_ref_deltas_lastframe.sw_vp9_ref_deltas_lastframe           |= (hw_ctx->ls_info.last_ref_deltas[i] & 0x7f) << (7 * i);
449*437bfbebSnyanmisaka 
450*437bfbebSnyanmisaka         for (i = 0; i < 2; i++)
451*437bfbebSnyanmisaka             vp9_hw_regs->swreg33_vp9_info_lastframe.sw_vp9_mode_deltas_lastframe                |= (hw_ctx->ls_info.last_mode_deltas[i] & 0x7f) << (7 * i);
452*437bfbebSnyanmisaka 
453*437bfbebSnyanmisaka 
454*437bfbebSnyanmisaka     } else {
455*437bfbebSnyanmisaka         hw_ctx->ls_info.segmentation_enable_flag_last = 0;
456*437bfbebSnyanmisaka         hw_ctx->ls_info.last_intra_only = 1;
457*437bfbebSnyanmisaka     }
458*437bfbebSnyanmisaka 
459*437bfbebSnyanmisaka     vp9_hw_regs->swreg33_vp9_info_lastframe.sw_vp9_mode_deltas_lastframe                        = 0;
460*437bfbebSnyanmisaka 
461*437bfbebSnyanmisaka     vp9_hw_regs->swreg33_vp9_info_lastframe.sw_segmentation_enable_lstframe                  = hw_ctx->ls_info.segmentation_enable_flag_last;
462*437bfbebSnyanmisaka     vp9_hw_regs->swreg33_vp9_info_lastframe.sw_vp9_last_show_frame                          = hw_ctx->ls_info.last_show_frame;
463*437bfbebSnyanmisaka     vp9_hw_regs->swreg33_vp9_info_lastframe.sw_vp9_last_intra_only                          = hw_ctx->ls_info.last_intra_only;
464*437bfbebSnyanmisaka     vp9_hw_regs->swreg33_vp9_info_lastframe.sw_vp9_last_widthheight_eqcur                   = (pic_param->width == hw_ctx->ls_info.last_width) && (pic_param->height == hw_ctx->ls_info.last_height);
465*437bfbebSnyanmisaka 
466*437bfbebSnyanmisaka     vp9_hw_regs->swreg36_vp9_lasttile_size.sw_vp9_lasttile_size                             =  stream_len - pic_param->first_partition_size;
467*437bfbebSnyanmisaka 
468*437bfbebSnyanmisaka 
469*437bfbebSnyanmisaka     if (!intraFlag) {
470*437bfbebSnyanmisaka         vp9_hw_regs->swreg29_vp9_lref_scale.sw_vp9_lref_hor_scale = pic_param->mvscale[0][0];
471*437bfbebSnyanmisaka         vp9_hw_regs->swreg29_vp9_lref_scale.sw_vp9_lref_ver_scale = pic_param->mvscale[0][1];
472*437bfbebSnyanmisaka         vp9_hw_regs->swreg30_vp9_gref_scale.sw_vp9_gref_hor_scale = pic_param->mvscale[1][0];
473*437bfbebSnyanmisaka         vp9_hw_regs->swreg30_vp9_gref_scale.sw_vp9_gref_ver_scale = pic_param->mvscale[1][1];
474*437bfbebSnyanmisaka         vp9_hw_regs->swreg31_vp9_aref_scale.sw_vp9_aref_hor_scale = pic_param->mvscale[2][0];
475*437bfbebSnyanmisaka         vp9_hw_regs->swreg31_vp9_aref_scale.sw_vp9_aref_ver_scale = pic_param->mvscale[2][1];
476*437bfbebSnyanmisaka         // vp9_hw_regs.swreg33_vp9_info_lastframe.sw_vp9_color_space_lastkeyframe = p_cm->color_space_last;
477*437bfbebSnyanmisaka     }
478*437bfbebSnyanmisaka 
479*437bfbebSnyanmisaka 
480*437bfbebSnyanmisaka     //reuse reg64, and it will be written by hardware to show performance.
481*437bfbebSnyanmisaka     vp9_hw_regs->swreg64_performance_cycle.sw_performance_cycle = 0;
482*437bfbebSnyanmisaka     vp9_hw_regs->swreg64_performance_cycle.sw_performance_cycle |= pic_param->width;
483*437bfbebSnyanmisaka     vp9_hw_regs->swreg64_performance_cycle.sw_performance_cycle |= pic_param->height << 16;
484*437bfbebSnyanmisaka 
485*437bfbebSnyanmisaka     vp9_hw_regs->swreg1_int.sw_dec_e         = 1;
486*437bfbebSnyanmisaka     vp9_hw_regs->swreg1_int.sw_dec_timeout_e = 1;
487*437bfbebSnyanmisaka 
488*437bfbebSnyanmisaka     //last info  update
489*437bfbebSnyanmisaka     hw_ctx->ls_info.abs_delta_last = pic_param->stVP9Segments.abs_delta;
490*437bfbebSnyanmisaka     for (i = 0 ; i < 4; i ++) {
491*437bfbebSnyanmisaka         hw_ctx->ls_info.last_ref_deltas[i] = pic_param->ref_deltas[i];
492*437bfbebSnyanmisaka     }
493*437bfbebSnyanmisaka 
494*437bfbebSnyanmisaka     for (i = 0 ; i < 2; i ++) {
495*437bfbebSnyanmisaka         hw_ctx->ls_info.last_mode_deltas[i] = pic_param->mode_deltas[i];
496*437bfbebSnyanmisaka     }
497*437bfbebSnyanmisaka 
498*437bfbebSnyanmisaka     for (i = 0; i < 8; i++) {
499*437bfbebSnyanmisaka         hw_ctx->ls_info.feature_data[i][0] = pic_param->stVP9Segments.feature_data[i][0];
500*437bfbebSnyanmisaka         hw_ctx->ls_info.feature_data[i][1] = pic_param->stVP9Segments.feature_data[i][1];
501*437bfbebSnyanmisaka         hw_ctx->ls_info.feature_data[i][2] = pic_param->stVP9Segments.feature_data[i][2];
502*437bfbebSnyanmisaka         hw_ctx->ls_info.feature_data[i][3] = pic_param->stVP9Segments.feature_data[i][3];
503*437bfbebSnyanmisaka         hw_ctx->ls_info.feature_mask[i]  = pic_param->stVP9Segments.feature_mask[i];
504*437bfbebSnyanmisaka     }
505*437bfbebSnyanmisaka     if (!hw_ctx->ls_info.segmentation_enable_flag_last)
506*437bfbebSnyanmisaka         hw_ctx->ls_info.segmentation_enable_flag_last = pic_param->stVP9Segments.enabled;
507*437bfbebSnyanmisaka 
508*437bfbebSnyanmisaka     hw_ctx->ls_info.last_show_frame = pic_param->show_frame;
509*437bfbebSnyanmisaka     hw_ctx->ls_info.last_width = pic_param->width;
510*437bfbebSnyanmisaka     hw_ctx->ls_info.last_height = pic_param->height;
511*437bfbebSnyanmisaka     hw_ctx->ls_info.last_intra_only = (!pic_param->frame_type || pic_param->intra_only);
512*437bfbebSnyanmisaka     hal_vp9d_dbg_par("stVP9Segments.enabled %d show_frame %d  width %d  height %d last_intra_only %d",
513*437bfbebSnyanmisaka                      pic_param->stVP9Segments.enabled, pic_param->show_frame,
514*437bfbebSnyanmisaka                      pic_param->width, pic_param->height,
515*437bfbebSnyanmisaka                      hw_ctx->ls_info.last_intra_only);
516*437bfbebSnyanmisaka 
517*437bfbebSnyanmisaka     // whether need update counts
518*437bfbebSnyanmisaka     if (pic_param->refresh_frame_context && !pic_param->parallelmode) {
519*437bfbebSnyanmisaka         task->dec.flags.wait_done = 1;
520*437bfbebSnyanmisaka     }
521*437bfbebSnyanmisaka 
522*437bfbebSnyanmisaka     return MPP_OK;
523*437bfbebSnyanmisaka }
524*437bfbebSnyanmisaka 
hal_vp9d_rkv_start(void * hal,HalTaskInfo * task)525*437bfbebSnyanmisaka MPP_RET hal_vp9d_rkv_start(void *hal, HalTaskInfo *task)
526*437bfbebSnyanmisaka {
527*437bfbebSnyanmisaka     MPP_RET ret = MPP_OK;
528*437bfbebSnyanmisaka     HalVp9dCtx *p_hal = (HalVp9dCtx *)hal;
529*437bfbebSnyanmisaka     Vp9dRkvCtx *hw_ctx = (Vp9dRkvCtx*)p_hal->hw_ctx;
530*437bfbebSnyanmisaka     VP9_REGS *hw_regs = (VP9_REGS *)hw_ctx->hw_regs;
531*437bfbebSnyanmisaka     MppDev dev = p_hal->dev;
532*437bfbebSnyanmisaka 
533*437bfbebSnyanmisaka     if (p_hal->fast_mode) {
534*437bfbebSnyanmisaka         RK_S32 index =  task->dec.reg_index;
535*437bfbebSnyanmisaka         hw_regs = (VP9_REGS *)hw_ctx->g_buf[index].hw_regs;
536*437bfbebSnyanmisaka     }
537*437bfbebSnyanmisaka 
538*437bfbebSnyanmisaka     mpp_assert(hw_regs);
539*437bfbebSnyanmisaka 
540*437bfbebSnyanmisaka     if (hal_vp9d_debug & HAL_VP9D_DBG_REG) {
541*437bfbebSnyanmisaka         RK_U32 *p = (RK_U32 *)hw_regs;
542*437bfbebSnyanmisaka         RK_U32 i = 0;
543*437bfbebSnyanmisaka 
544*437bfbebSnyanmisaka         for (i = 0; i < sizeof(VP9_REGS) / 4; i++)
545*437bfbebSnyanmisaka             mpp_log("set regs[%02d]: %08X\n", i, *p++);
546*437bfbebSnyanmisaka     }
547*437bfbebSnyanmisaka 
548*437bfbebSnyanmisaka     do {
549*437bfbebSnyanmisaka         MppDevRegWrCfg wr_cfg;
550*437bfbebSnyanmisaka         MppDevRegRdCfg rd_cfg;
551*437bfbebSnyanmisaka         RK_U32 reg_size = sizeof(VP9_REGS);
552*437bfbebSnyanmisaka 
553*437bfbebSnyanmisaka         wr_cfg.reg = hw_ctx->hw_regs;
554*437bfbebSnyanmisaka         wr_cfg.size = reg_size;
555*437bfbebSnyanmisaka         wr_cfg.offset = 0;
556*437bfbebSnyanmisaka 
557*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(dev, MPP_DEV_REG_WR, &wr_cfg);
558*437bfbebSnyanmisaka         if (ret) {
559*437bfbebSnyanmisaka             mpp_err_f("set register write failed %d\n", ret);
560*437bfbebSnyanmisaka             break;
561*437bfbebSnyanmisaka         }
562*437bfbebSnyanmisaka 
563*437bfbebSnyanmisaka         rd_cfg.reg = hw_ctx->hw_regs;
564*437bfbebSnyanmisaka         rd_cfg.size = reg_size;
565*437bfbebSnyanmisaka         rd_cfg.offset = 0;
566*437bfbebSnyanmisaka 
567*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(dev, MPP_DEV_REG_RD, &rd_cfg);
568*437bfbebSnyanmisaka         if (ret) {
569*437bfbebSnyanmisaka             mpp_err_f("set register read failed %d\n", ret);
570*437bfbebSnyanmisaka             break;
571*437bfbebSnyanmisaka         }
572*437bfbebSnyanmisaka 
573*437bfbebSnyanmisaka         ret = mpp_dev_ioctl(dev, MPP_DEV_CMD_SEND, NULL);
574*437bfbebSnyanmisaka         if (ret) {
575*437bfbebSnyanmisaka             mpp_err_f("send cmd failed %d\n", ret);
576*437bfbebSnyanmisaka             break;
577*437bfbebSnyanmisaka         }
578*437bfbebSnyanmisaka     } while (0);
579*437bfbebSnyanmisaka 
580*437bfbebSnyanmisaka     (void)task;
581*437bfbebSnyanmisaka     return ret;
582*437bfbebSnyanmisaka }
583*437bfbebSnyanmisaka 
hal_vp9d_rkv_wait(void * hal,HalTaskInfo * task)584*437bfbebSnyanmisaka MPP_RET hal_vp9d_rkv_wait(void *hal, HalTaskInfo *task)
585*437bfbebSnyanmisaka {
586*437bfbebSnyanmisaka     MPP_RET ret = MPP_OK;
587*437bfbebSnyanmisaka     HalVp9dCtx *p_hal = (HalVp9dCtx *)hal;
588*437bfbebSnyanmisaka     Vp9dRkvCtx *hw_ctx = (Vp9dRkvCtx*)p_hal->hw_ctx;
589*437bfbebSnyanmisaka     VP9_REGS *hw_regs = (VP9_REGS *)hw_ctx->hw_regs;
590*437bfbebSnyanmisaka 
591*437bfbebSnyanmisaka     if (p_hal->fast_mode)
592*437bfbebSnyanmisaka         hw_regs = (VP9_REGS *)hw_ctx->g_buf[task->dec.reg_index].hw_regs;
593*437bfbebSnyanmisaka 
594*437bfbebSnyanmisaka     mpp_assert(hw_regs);
595*437bfbebSnyanmisaka 
596*437bfbebSnyanmisaka     ret = mpp_dev_ioctl(p_hal->dev, MPP_DEV_CMD_POLL, NULL);
597*437bfbebSnyanmisaka     if (ret)
598*437bfbebSnyanmisaka         mpp_err_f("poll cmd failed %d\n", ret);
599*437bfbebSnyanmisaka 
600*437bfbebSnyanmisaka     if (hal_vp9d_debug & HAL_VP9D_DBG_REG) {
601*437bfbebSnyanmisaka         RK_U32 *p = (RK_U32 *)hw_regs;
602*437bfbebSnyanmisaka         RK_U32 i = 0;
603*437bfbebSnyanmisaka 
604*437bfbebSnyanmisaka         for (i = 0; i < sizeof(VP9_REGS) / 4; i++)
605*437bfbebSnyanmisaka             mpp_log("get regs[%02d]: %08X\n", i, *p++);
606*437bfbebSnyanmisaka     }
607*437bfbebSnyanmisaka 
608*437bfbebSnyanmisaka     if (task->dec.flags.parse_err ||
609*437bfbebSnyanmisaka         task->dec.flags.ref_err ||
610*437bfbebSnyanmisaka         !hw_regs->swreg1_int.sw_dec_rdy_sta) {
611*437bfbebSnyanmisaka         MppFrame mframe = NULL;
612*437bfbebSnyanmisaka         mpp_buf_slot_get_prop(p_hal->slots, task->dec.output, SLOT_FRAME_PTR, &mframe);
613*437bfbebSnyanmisaka         mpp_frame_set_errinfo(mframe, 1);
614*437bfbebSnyanmisaka     }
615*437bfbebSnyanmisaka 
616*437bfbebSnyanmisaka     if (p_hal->dec_cb && task->dec.flags.wait_done) {
617*437bfbebSnyanmisaka         DXVA_PicParams_VP9 *pic_param = (DXVA_PicParams_VP9*)task->dec.syntax.data;
618*437bfbebSnyanmisaka 
619*437bfbebSnyanmisaka         mpp_buffer_sync_ro_begin(hw_ctx->count_base);
620*437bfbebSnyanmisaka         hal_vp9d_update_counts(mpp_buffer_get_ptr(hw_ctx->count_base), task->dec.syntax.data);
621*437bfbebSnyanmisaka 
622*437bfbebSnyanmisaka         mpp_callback(p_hal->dec_cb, &pic_param->counts);
623*437bfbebSnyanmisaka     }
624*437bfbebSnyanmisaka     if (p_hal->fast_mode) {
625*437bfbebSnyanmisaka         hw_ctx->g_buf[task->dec.reg_index].use_flag = 0;
626*437bfbebSnyanmisaka     }
627*437bfbebSnyanmisaka 
628*437bfbebSnyanmisaka     (void)task;
629*437bfbebSnyanmisaka     return ret;
630*437bfbebSnyanmisaka }
631*437bfbebSnyanmisaka 
hal_vp9d_rkv_reset(void * hal)632*437bfbebSnyanmisaka MPP_RET hal_vp9d_rkv_reset(void *hal)
633*437bfbebSnyanmisaka {
634*437bfbebSnyanmisaka     HalVp9dCtx *p_hal = (HalVp9dCtx *)hal;
635*437bfbebSnyanmisaka     Vp9dRkvCtx *hw_ctx = (Vp9dRkvCtx*)p_hal->hw_ctx;
636*437bfbebSnyanmisaka 
637*437bfbebSnyanmisaka     hal_vp9d_enter();
638*437bfbebSnyanmisaka 
639*437bfbebSnyanmisaka     memset(&hw_ctx->ls_info, 0, sizeof(hw_ctx->ls_info));
640*437bfbebSnyanmisaka     hw_ctx->mv_base_addr = -1;
641*437bfbebSnyanmisaka     hw_ctx->pre_mv_base_addr = -1;
642*437bfbebSnyanmisaka     hw_ctx->last_segid_flag = 1;
643*437bfbebSnyanmisaka 
644*437bfbebSnyanmisaka     hal_vp9d_leave();
645*437bfbebSnyanmisaka 
646*437bfbebSnyanmisaka     return MPP_OK;
647*437bfbebSnyanmisaka }
648*437bfbebSnyanmisaka 
hal_vp9d_rkv_flush(void * hal)649*437bfbebSnyanmisaka MPP_RET hal_vp9d_rkv_flush(void *hal)
650*437bfbebSnyanmisaka {
651*437bfbebSnyanmisaka     HalVp9dCtx *p_hal = (HalVp9dCtx *)hal;
652*437bfbebSnyanmisaka     Vp9dRkvCtx *hw_ctx = p_hal->hw_ctx;
653*437bfbebSnyanmisaka 
654*437bfbebSnyanmisaka     hal_vp9d_enter();
655*437bfbebSnyanmisaka 
656*437bfbebSnyanmisaka     hw_ctx->mv_base_addr = -1;
657*437bfbebSnyanmisaka     hw_ctx->pre_mv_base_addr = -1;
658*437bfbebSnyanmisaka 
659*437bfbebSnyanmisaka     hal_vp9d_leave();
660*437bfbebSnyanmisaka 
661*437bfbebSnyanmisaka     return MPP_OK;
662*437bfbebSnyanmisaka }
663*437bfbebSnyanmisaka 
hal_vp9d_rkv_control(void * hal,MpiCmd cmd_type,void * param)664*437bfbebSnyanmisaka MPP_RET hal_vp9d_rkv_control(void *hal, MpiCmd cmd_type, void *param)
665*437bfbebSnyanmisaka {
666*437bfbebSnyanmisaka     switch ((MpiCmd)cmd_type) {
667*437bfbebSnyanmisaka     case MPP_DEC_SET_FRAME_INFO: {
668*437bfbebSnyanmisaka         /* commit buffer stride */
669*437bfbebSnyanmisaka         RK_U32 width = mpp_frame_get_width((MppFrame)param);
670*437bfbebSnyanmisaka         RK_U32 height = mpp_frame_get_height((MppFrame)param);
671*437bfbebSnyanmisaka 
672*437bfbebSnyanmisaka         mpp_frame_set_hor_stride((MppFrame)param, vp9_hor_align(width));
673*437bfbebSnyanmisaka         mpp_frame_set_ver_stride((MppFrame)param, vp9_ver_align(height));
674*437bfbebSnyanmisaka     } break;
675*437bfbebSnyanmisaka     default: {
676*437bfbebSnyanmisaka     } break;
677*437bfbebSnyanmisaka     }
678*437bfbebSnyanmisaka     (void)hal;
679*437bfbebSnyanmisaka 
680*437bfbebSnyanmisaka     return MPP_OK;
681*437bfbebSnyanmisaka }
682*437bfbebSnyanmisaka 
683*437bfbebSnyanmisaka const MppHalApi hal_vp9d_rkv = {
684*437bfbebSnyanmisaka     .name = "vp9d_rkdec",
685*437bfbebSnyanmisaka     .type = MPP_CTX_DEC,
686*437bfbebSnyanmisaka     .coding = MPP_VIDEO_CodingVP9,
687*437bfbebSnyanmisaka     .ctx_size = sizeof(HalVp9dCtx),
688*437bfbebSnyanmisaka     .flag = 0,
689*437bfbebSnyanmisaka     .init = hal_vp9d_rkv_init,
690*437bfbebSnyanmisaka     .deinit = hal_vp9d_rkv_deinit,
691*437bfbebSnyanmisaka     .reg_gen = hal_vp9d_rkv_gen_regs,
692*437bfbebSnyanmisaka     .start = hal_vp9d_rkv_start,
693*437bfbebSnyanmisaka     .wait = hal_vp9d_rkv_wait,
694*437bfbebSnyanmisaka     .reset = hal_vp9d_rkv_reset,
695*437bfbebSnyanmisaka     .flush = hal_vp9d_rkv_flush,
696*437bfbebSnyanmisaka     .control = hal_vp9d_rkv_control,
697*437bfbebSnyanmisaka };
698