1*4882a593Smuzhiyun /*
2*4882a593Smuzhiyun * Copyright(c) 2011-2016 Intel Corporation. All rights reserved.
3*4882a593Smuzhiyun *
4*4882a593Smuzhiyun * Permission is hereby granted, free of charge, to any person obtaining a
5*4882a593Smuzhiyun * copy of this software and associated documentation files (the "Software"),
6*4882a593Smuzhiyun * to deal in the Software without restriction, including without limitation
7*4882a593Smuzhiyun * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8*4882a593Smuzhiyun * and/or sell copies of the Software, and to permit persons to whom the
9*4882a593Smuzhiyun * Software is furnished to do so, subject to the following conditions:
10*4882a593Smuzhiyun *
11*4882a593Smuzhiyun * The above copyright notice and this permission notice (including the next
12*4882a593Smuzhiyun * paragraph) shall be included in all copies or substantial portions of the
13*4882a593Smuzhiyun * Software.
14*4882a593Smuzhiyun *
15*4882a593Smuzhiyun * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16*4882a593Smuzhiyun * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17*4882a593Smuzhiyun * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18*4882a593Smuzhiyun * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19*4882a593Smuzhiyun * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
20*4882a593Smuzhiyun * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
21*4882a593Smuzhiyun * SOFTWARE.
22*4882a593Smuzhiyun *
23*4882a593Smuzhiyun * Authors:
24*4882a593Smuzhiyun * Ke Yu
25*4882a593Smuzhiyun * Kevin Tian <kevin.tian@intel.com>
26*4882a593Smuzhiyun * Zhiyuan Lv <zhiyuan.lv@intel.com>
27*4882a593Smuzhiyun *
28*4882a593Smuzhiyun * Contributors:
29*4882a593Smuzhiyun * Min He <min.he@intel.com>
30*4882a593Smuzhiyun * Ping Gao <ping.a.gao@intel.com>
31*4882a593Smuzhiyun * Tina Zhang <tina.zhang@intel.com>
32*4882a593Smuzhiyun * Yulei Zhang <yulei.zhang@intel.com>
33*4882a593Smuzhiyun * Zhi Wang <zhi.a.wang@intel.com>
34*4882a593Smuzhiyun *
35*4882a593Smuzhiyun */
36*4882a593Smuzhiyun
37*4882a593Smuzhiyun #include <linux/slab.h>
38*4882a593Smuzhiyun
39*4882a593Smuzhiyun #include "i915_drv.h"
40*4882a593Smuzhiyun #include "gt/intel_ring.h"
41*4882a593Smuzhiyun #include "gvt.h"
42*4882a593Smuzhiyun #include "i915_pvinfo.h"
43*4882a593Smuzhiyun #include "trace.h"
44*4882a593Smuzhiyun
45*4882a593Smuzhiyun #define INVALID_OP (~0U)
46*4882a593Smuzhiyun
47*4882a593Smuzhiyun #define OP_LEN_MI 9
48*4882a593Smuzhiyun #define OP_LEN_2D 10
49*4882a593Smuzhiyun #define OP_LEN_3D_MEDIA 16
50*4882a593Smuzhiyun #define OP_LEN_MFX_VC 16
51*4882a593Smuzhiyun #define OP_LEN_VEBOX 16
52*4882a593Smuzhiyun
53*4882a593Smuzhiyun #define CMD_TYPE(cmd) (((cmd) >> 29) & 7)
54*4882a593Smuzhiyun
55*4882a593Smuzhiyun struct sub_op_bits {
56*4882a593Smuzhiyun int hi;
57*4882a593Smuzhiyun int low;
58*4882a593Smuzhiyun };
59*4882a593Smuzhiyun struct decode_info {
60*4882a593Smuzhiyun const char *name;
61*4882a593Smuzhiyun int op_len;
62*4882a593Smuzhiyun int nr_sub_op;
63*4882a593Smuzhiyun const struct sub_op_bits *sub_op;
64*4882a593Smuzhiyun };
65*4882a593Smuzhiyun
66*4882a593Smuzhiyun #define MAX_CMD_BUDGET 0x7fffffff
67*4882a593Smuzhiyun #define MI_WAIT_FOR_PLANE_C_FLIP_PENDING (1<<15)
68*4882a593Smuzhiyun #define MI_WAIT_FOR_PLANE_B_FLIP_PENDING (1<<9)
69*4882a593Smuzhiyun #define MI_WAIT_FOR_PLANE_A_FLIP_PENDING (1<<1)
70*4882a593Smuzhiyun
71*4882a593Smuzhiyun #define MI_WAIT_FOR_SPRITE_C_FLIP_PENDING (1<<20)
72*4882a593Smuzhiyun #define MI_WAIT_FOR_SPRITE_B_FLIP_PENDING (1<<10)
73*4882a593Smuzhiyun #define MI_WAIT_FOR_SPRITE_A_FLIP_PENDING (1<<2)
74*4882a593Smuzhiyun
75*4882a593Smuzhiyun /* Render Command Map */
76*4882a593Smuzhiyun
77*4882a593Smuzhiyun /* MI_* command Opcode (28:23) */
78*4882a593Smuzhiyun #define OP_MI_NOOP 0x0
79*4882a593Smuzhiyun #define OP_MI_SET_PREDICATE 0x1 /* HSW+ */
80*4882a593Smuzhiyun #define OP_MI_USER_INTERRUPT 0x2
81*4882a593Smuzhiyun #define OP_MI_WAIT_FOR_EVENT 0x3
82*4882a593Smuzhiyun #define OP_MI_FLUSH 0x4
83*4882a593Smuzhiyun #define OP_MI_ARB_CHECK 0x5
84*4882a593Smuzhiyun #define OP_MI_RS_CONTROL 0x6 /* HSW+ */
85*4882a593Smuzhiyun #define OP_MI_REPORT_HEAD 0x7
86*4882a593Smuzhiyun #define OP_MI_ARB_ON_OFF 0x8
87*4882a593Smuzhiyun #define OP_MI_URB_ATOMIC_ALLOC 0x9 /* HSW+ */
88*4882a593Smuzhiyun #define OP_MI_BATCH_BUFFER_END 0xA
89*4882a593Smuzhiyun #define OP_MI_SUSPEND_FLUSH 0xB
90*4882a593Smuzhiyun #define OP_MI_PREDICATE 0xC /* IVB+ */
91*4882a593Smuzhiyun #define OP_MI_TOPOLOGY_FILTER 0xD /* IVB+ */
92*4882a593Smuzhiyun #define OP_MI_SET_APPID 0xE /* IVB+ */
93*4882a593Smuzhiyun #define OP_MI_RS_CONTEXT 0xF /* HSW+ */
94*4882a593Smuzhiyun #define OP_MI_LOAD_SCAN_LINES_INCL 0x12 /* HSW+ */
95*4882a593Smuzhiyun #define OP_MI_DISPLAY_FLIP 0x14
96*4882a593Smuzhiyun #define OP_MI_SEMAPHORE_MBOX 0x16
97*4882a593Smuzhiyun #define OP_MI_SET_CONTEXT 0x18
98*4882a593Smuzhiyun #define OP_MI_MATH 0x1A
99*4882a593Smuzhiyun #define OP_MI_URB_CLEAR 0x19
100*4882a593Smuzhiyun #define OP_MI_SEMAPHORE_SIGNAL 0x1B /* BDW+ */
101*4882a593Smuzhiyun #define OP_MI_SEMAPHORE_WAIT 0x1C /* BDW+ */
102*4882a593Smuzhiyun
103*4882a593Smuzhiyun #define OP_MI_STORE_DATA_IMM 0x20
104*4882a593Smuzhiyun #define OP_MI_STORE_DATA_INDEX 0x21
105*4882a593Smuzhiyun #define OP_MI_LOAD_REGISTER_IMM 0x22
106*4882a593Smuzhiyun #define OP_MI_UPDATE_GTT 0x23
107*4882a593Smuzhiyun #define OP_MI_STORE_REGISTER_MEM 0x24
108*4882a593Smuzhiyun #define OP_MI_FLUSH_DW 0x26
109*4882a593Smuzhiyun #define OP_MI_CLFLUSH 0x27
110*4882a593Smuzhiyun #define OP_MI_REPORT_PERF_COUNT 0x28
111*4882a593Smuzhiyun #define OP_MI_LOAD_REGISTER_MEM 0x29 /* HSW+ */
112*4882a593Smuzhiyun #define OP_MI_LOAD_REGISTER_REG 0x2A /* HSW+ */
113*4882a593Smuzhiyun #define OP_MI_RS_STORE_DATA_IMM 0x2B /* HSW+ */
114*4882a593Smuzhiyun #define OP_MI_LOAD_URB_MEM 0x2C /* HSW+ */
115*4882a593Smuzhiyun #define OP_MI_STORE_URM_MEM 0x2D /* HSW+ */
116*4882a593Smuzhiyun #define OP_MI_2E 0x2E /* BDW+ */
117*4882a593Smuzhiyun #define OP_MI_2F 0x2F /* BDW+ */
118*4882a593Smuzhiyun #define OP_MI_BATCH_BUFFER_START 0x31
119*4882a593Smuzhiyun
120*4882a593Smuzhiyun /* Bit definition for dword 0 */
121*4882a593Smuzhiyun #define _CMDBIT_BB_START_IN_PPGTT (1UL << 8)
122*4882a593Smuzhiyun
123*4882a593Smuzhiyun #define OP_MI_CONDITIONAL_BATCH_BUFFER_END 0x36
124*4882a593Smuzhiyun
125*4882a593Smuzhiyun #define BATCH_BUFFER_ADDR_MASK ((1UL << 32) - (1U << 2))
126*4882a593Smuzhiyun #define BATCH_BUFFER_ADDR_HIGH_MASK ((1UL << 16) - (1U))
127*4882a593Smuzhiyun #define BATCH_BUFFER_ADR_SPACE_BIT(x) (((x) >> 8) & 1U)
128*4882a593Smuzhiyun #define BATCH_BUFFER_2ND_LEVEL_BIT(x) ((x) >> 22 & 1U)
129*4882a593Smuzhiyun
130*4882a593Smuzhiyun /* 2D command: Opcode (28:22) */
131*4882a593Smuzhiyun #define OP_2D(x) ((2<<7) | x)
132*4882a593Smuzhiyun
133*4882a593Smuzhiyun #define OP_XY_SETUP_BLT OP_2D(0x1)
134*4882a593Smuzhiyun #define OP_XY_SETUP_CLIP_BLT OP_2D(0x3)
135*4882a593Smuzhiyun #define OP_XY_SETUP_MONO_PATTERN_SL_BLT OP_2D(0x11)
136*4882a593Smuzhiyun #define OP_XY_PIXEL_BLT OP_2D(0x24)
137*4882a593Smuzhiyun #define OP_XY_SCANLINES_BLT OP_2D(0x25)
138*4882a593Smuzhiyun #define OP_XY_TEXT_BLT OP_2D(0x26)
139*4882a593Smuzhiyun #define OP_XY_TEXT_IMMEDIATE_BLT OP_2D(0x31)
140*4882a593Smuzhiyun #define OP_XY_COLOR_BLT OP_2D(0x50)
141*4882a593Smuzhiyun #define OP_XY_PAT_BLT OP_2D(0x51)
142*4882a593Smuzhiyun #define OP_XY_MONO_PAT_BLT OP_2D(0x52)
143*4882a593Smuzhiyun #define OP_XY_SRC_COPY_BLT OP_2D(0x53)
144*4882a593Smuzhiyun #define OP_XY_MONO_SRC_COPY_BLT OP_2D(0x54)
145*4882a593Smuzhiyun #define OP_XY_FULL_BLT OP_2D(0x55)
146*4882a593Smuzhiyun #define OP_XY_FULL_MONO_SRC_BLT OP_2D(0x56)
147*4882a593Smuzhiyun #define OP_XY_FULL_MONO_PATTERN_BLT OP_2D(0x57)
148*4882a593Smuzhiyun #define OP_XY_FULL_MONO_PATTERN_MONO_SRC_BLT OP_2D(0x58)
149*4882a593Smuzhiyun #define OP_XY_MONO_PAT_FIXED_BLT OP_2D(0x59)
150*4882a593Smuzhiyun #define OP_XY_MONO_SRC_COPY_IMMEDIATE_BLT OP_2D(0x71)
151*4882a593Smuzhiyun #define OP_XY_PAT_BLT_IMMEDIATE OP_2D(0x72)
152*4882a593Smuzhiyun #define OP_XY_SRC_COPY_CHROMA_BLT OP_2D(0x73)
153*4882a593Smuzhiyun #define OP_XY_FULL_IMMEDIATE_PATTERN_BLT OP_2D(0x74)
154*4882a593Smuzhiyun #define OP_XY_FULL_MONO_SRC_IMMEDIATE_PATTERN_BLT OP_2D(0x75)
155*4882a593Smuzhiyun #define OP_XY_PAT_CHROMA_BLT OP_2D(0x76)
156*4882a593Smuzhiyun #define OP_XY_PAT_CHROMA_BLT_IMMEDIATE OP_2D(0x77)
157*4882a593Smuzhiyun
158*4882a593Smuzhiyun /* 3D/Media Command: Pipeline Type(28:27) Opcode(26:24) Sub Opcode(23:16) */
159*4882a593Smuzhiyun #define OP_3D_MEDIA(sub_type, opcode, sub_opcode) \
160*4882a593Smuzhiyun ((3 << 13) | ((sub_type) << 11) | ((opcode) << 8) | (sub_opcode))
161*4882a593Smuzhiyun
162*4882a593Smuzhiyun #define OP_STATE_PREFETCH OP_3D_MEDIA(0x0, 0x0, 0x03)
163*4882a593Smuzhiyun
164*4882a593Smuzhiyun #define OP_STATE_BASE_ADDRESS OP_3D_MEDIA(0x0, 0x1, 0x01)
165*4882a593Smuzhiyun #define OP_STATE_SIP OP_3D_MEDIA(0x0, 0x1, 0x02)
166*4882a593Smuzhiyun #define OP_3D_MEDIA_0_1_4 OP_3D_MEDIA(0x0, 0x1, 0x04)
167*4882a593Smuzhiyun #define OP_SWTESS_BASE_ADDRESS OP_3D_MEDIA(0x0, 0x1, 0x03)
168*4882a593Smuzhiyun
169*4882a593Smuzhiyun #define OP_3DSTATE_VF_STATISTICS_GM45 OP_3D_MEDIA(0x1, 0x0, 0x0B)
170*4882a593Smuzhiyun
171*4882a593Smuzhiyun #define OP_PIPELINE_SELECT OP_3D_MEDIA(0x1, 0x1, 0x04)
172*4882a593Smuzhiyun
173*4882a593Smuzhiyun #define OP_MEDIA_VFE_STATE OP_3D_MEDIA(0x2, 0x0, 0x0)
174*4882a593Smuzhiyun #define OP_MEDIA_CURBE_LOAD OP_3D_MEDIA(0x2, 0x0, 0x1)
175*4882a593Smuzhiyun #define OP_MEDIA_INTERFACE_DESCRIPTOR_LOAD OP_3D_MEDIA(0x2, 0x0, 0x2)
176*4882a593Smuzhiyun #define OP_MEDIA_GATEWAY_STATE OP_3D_MEDIA(0x2, 0x0, 0x3)
177*4882a593Smuzhiyun #define OP_MEDIA_STATE_FLUSH OP_3D_MEDIA(0x2, 0x0, 0x4)
178*4882a593Smuzhiyun #define OP_MEDIA_POOL_STATE OP_3D_MEDIA(0x2, 0x0, 0x5)
179*4882a593Smuzhiyun
180*4882a593Smuzhiyun #define OP_MEDIA_OBJECT OP_3D_MEDIA(0x2, 0x1, 0x0)
181*4882a593Smuzhiyun #define OP_MEDIA_OBJECT_PRT OP_3D_MEDIA(0x2, 0x1, 0x2)
182*4882a593Smuzhiyun #define OP_MEDIA_OBJECT_WALKER OP_3D_MEDIA(0x2, 0x1, 0x3)
183*4882a593Smuzhiyun #define OP_GPGPU_WALKER OP_3D_MEDIA(0x2, 0x1, 0x5)
184*4882a593Smuzhiyun
185*4882a593Smuzhiyun #define OP_3DSTATE_CLEAR_PARAMS OP_3D_MEDIA(0x3, 0x0, 0x04) /* IVB+ */
186*4882a593Smuzhiyun #define OP_3DSTATE_DEPTH_BUFFER OP_3D_MEDIA(0x3, 0x0, 0x05) /* IVB+ */
187*4882a593Smuzhiyun #define OP_3DSTATE_STENCIL_BUFFER OP_3D_MEDIA(0x3, 0x0, 0x06) /* IVB+ */
188*4882a593Smuzhiyun #define OP_3DSTATE_HIER_DEPTH_BUFFER OP_3D_MEDIA(0x3, 0x0, 0x07) /* IVB+ */
189*4882a593Smuzhiyun #define OP_3DSTATE_VERTEX_BUFFERS OP_3D_MEDIA(0x3, 0x0, 0x08)
190*4882a593Smuzhiyun #define OP_3DSTATE_VERTEX_ELEMENTS OP_3D_MEDIA(0x3, 0x0, 0x09)
191*4882a593Smuzhiyun #define OP_3DSTATE_INDEX_BUFFER OP_3D_MEDIA(0x3, 0x0, 0x0A)
192*4882a593Smuzhiyun #define OP_3DSTATE_VF_STATISTICS OP_3D_MEDIA(0x3, 0x0, 0x0B)
193*4882a593Smuzhiyun #define OP_3DSTATE_VF OP_3D_MEDIA(0x3, 0x0, 0x0C) /* HSW+ */
194*4882a593Smuzhiyun #define OP_3DSTATE_CC_STATE_POINTERS OP_3D_MEDIA(0x3, 0x0, 0x0E)
195*4882a593Smuzhiyun #define OP_3DSTATE_SCISSOR_STATE_POINTERS OP_3D_MEDIA(0x3, 0x0, 0x0F)
196*4882a593Smuzhiyun #define OP_3DSTATE_VS OP_3D_MEDIA(0x3, 0x0, 0x10)
197*4882a593Smuzhiyun #define OP_3DSTATE_GS OP_3D_MEDIA(0x3, 0x0, 0x11)
198*4882a593Smuzhiyun #define OP_3DSTATE_CLIP OP_3D_MEDIA(0x3, 0x0, 0x12)
199*4882a593Smuzhiyun #define OP_3DSTATE_SF OP_3D_MEDIA(0x3, 0x0, 0x13)
200*4882a593Smuzhiyun #define OP_3DSTATE_WM OP_3D_MEDIA(0x3, 0x0, 0x14)
201*4882a593Smuzhiyun #define OP_3DSTATE_CONSTANT_VS OP_3D_MEDIA(0x3, 0x0, 0x15)
202*4882a593Smuzhiyun #define OP_3DSTATE_CONSTANT_GS OP_3D_MEDIA(0x3, 0x0, 0x16)
203*4882a593Smuzhiyun #define OP_3DSTATE_CONSTANT_PS OP_3D_MEDIA(0x3, 0x0, 0x17)
204*4882a593Smuzhiyun #define OP_3DSTATE_SAMPLE_MASK OP_3D_MEDIA(0x3, 0x0, 0x18)
205*4882a593Smuzhiyun #define OP_3DSTATE_CONSTANT_HS OP_3D_MEDIA(0x3, 0x0, 0x19) /* IVB+ */
206*4882a593Smuzhiyun #define OP_3DSTATE_CONSTANT_DS OP_3D_MEDIA(0x3, 0x0, 0x1A) /* IVB+ */
207*4882a593Smuzhiyun #define OP_3DSTATE_HS OP_3D_MEDIA(0x3, 0x0, 0x1B) /* IVB+ */
208*4882a593Smuzhiyun #define OP_3DSTATE_TE OP_3D_MEDIA(0x3, 0x0, 0x1C) /* IVB+ */
209*4882a593Smuzhiyun #define OP_3DSTATE_DS OP_3D_MEDIA(0x3, 0x0, 0x1D) /* IVB+ */
210*4882a593Smuzhiyun #define OP_3DSTATE_STREAMOUT OP_3D_MEDIA(0x3, 0x0, 0x1E) /* IVB+ */
211*4882a593Smuzhiyun #define OP_3DSTATE_SBE OP_3D_MEDIA(0x3, 0x0, 0x1F) /* IVB+ */
212*4882a593Smuzhiyun #define OP_3DSTATE_PS OP_3D_MEDIA(0x3, 0x0, 0x20) /* IVB+ */
213*4882a593Smuzhiyun #define OP_3DSTATE_VIEWPORT_STATE_POINTERS_SF_CLIP OP_3D_MEDIA(0x3, 0x0, 0x21) /* IVB+ */
214*4882a593Smuzhiyun #define OP_3DSTATE_VIEWPORT_STATE_POINTERS_CC OP_3D_MEDIA(0x3, 0x0, 0x23) /* IVB+ */
215*4882a593Smuzhiyun #define OP_3DSTATE_BLEND_STATE_POINTERS OP_3D_MEDIA(0x3, 0x0, 0x24) /* IVB+ */
216*4882a593Smuzhiyun #define OP_3DSTATE_DEPTH_STENCIL_STATE_POINTERS OP_3D_MEDIA(0x3, 0x0, 0x25) /* IVB+ */
217*4882a593Smuzhiyun #define OP_3DSTATE_BINDING_TABLE_POINTERS_VS OP_3D_MEDIA(0x3, 0x0, 0x26) /* IVB+ */
218*4882a593Smuzhiyun #define OP_3DSTATE_BINDING_TABLE_POINTERS_HS OP_3D_MEDIA(0x3, 0x0, 0x27) /* IVB+ */
219*4882a593Smuzhiyun #define OP_3DSTATE_BINDING_TABLE_POINTERS_DS OP_3D_MEDIA(0x3, 0x0, 0x28) /* IVB+ */
220*4882a593Smuzhiyun #define OP_3DSTATE_BINDING_TABLE_POINTERS_GS OP_3D_MEDIA(0x3, 0x0, 0x29) /* IVB+ */
221*4882a593Smuzhiyun #define OP_3DSTATE_BINDING_TABLE_POINTERS_PS OP_3D_MEDIA(0x3, 0x0, 0x2A) /* IVB+ */
222*4882a593Smuzhiyun #define OP_3DSTATE_SAMPLER_STATE_POINTERS_VS OP_3D_MEDIA(0x3, 0x0, 0x2B) /* IVB+ */
223*4882a593Smuzhiyun #define OP_3DSTATE_SAMPLER_STATE_POINTERS_HS OP_3D_MEDIA(0x3, 0x0, 0x2C) /* IVB+ */
224*4882a593Smuzhiyun #define OP_3DSTATE_SAMPLER_STATE_POINTERS_DS OP_3D_MEDIA(0x3, 0x0, 0x2D) /* IVB+ */
225*4882a593Smuzhiyun #define OP_3DSTATE_SAMPLER_STATE_POINTERS_GS OP_3D_MEDIA(0x3, 0x0, 0x2E) /* IVB+ */
226*4882a593Smuzhiyun #define OP_3DSTATE_SAMPLER_STATE_POINTERS_PS OP_3D_MEDIA(0x3, 0x0, 0x2F) /* IVB+ */
227*4882a593Smuzhiyun #define OP_3DSTATE_URB_VS OP_3D_MEDIA(0x3, 0x0, 0x30) /* IVB+ */
228*4882a593Smuzhiyun #define OP_3DSTATE_URB_HS OP_3D_MEDIA(0x3, 0x0, 0x31) /* IVB+ */
229*4882a593Smuzhiyun #define OP_3DSTATE_URB_DS OP_3D_MEDIA(0x3, 0x0, 0x32) /* IVB+ */
230*4882a593Smuzhiyun #define OP_3DSTATE_URB_GS OP_3D_MEDIA(0x3, 0x0, 0x33) /* IVB+ */
231*4882a593Smuzhiyun #define OP_3DSTATE_GATHER_CONSTANT_VS OP_3D_MEDIA(0x3, 0x0, 0x34) /* HSW+ */
232*4882a593Smuzhiyun #define OP_3DSTATE_GATHER_CONSTANT_GS OP_3D_MEDIA(0x3, 0x0, 0x35) /* HSW+ */
233*4882a593Smuzhiyun #define OP_3DSTATE_GATHER_CONSTANT_HS OP_3D_MEDIA(0x3, 0x0, 0x36) /* HSW+ */
234*4882a593Smuzhiyun #define OP_3DSTATE_GATHER_CONSTANT_DS OP_3D_MEDIA(0x3, 0x0, 0x37) /* HSW+ */
235*4882a593Smuzhiyun #define OP_3DSTATE_GATHER_CONSTANT_PS OP_3D_MEDIA(0x3, 0x0, 0x38) /* HSW+ */
236*4882a593Smuzhiyun #define OP_3DSTATE_DX9_CONSTANTF_VS OP_3D_MEDIA(0x3, 0x0, 0x39) /* HSW+ */
237*4882a593Smuzhiyun #define OP_3DSTATE_DX9_CONSTANTF_PS OP_3D_MEDIA(0x3, 0x0, 0x3A) /* HSW+ */
238*4882a593Smuzhiyun #define OP_3DSTATE_DX9_CONSTANTI_VS OP_3D_MEDIA(0x3, 0x0, 0x3B) /* HSW+ */
239*4882a593Smuzhiyun #define OP_3DSTATE_DX9_CONSTANTI_PS OP_3D_MEDIA(0x3, 0x0, 0x3C) /* HSW+ */
240*4882a593Smuzhiyun #define OP_3DSTATE_DX9_CONSTANTB_VS OP_3D_MEDIA(0x3, 0x0, 0x3D) /* HSW+ */
241*4882a593Smuzhiyun #define OP_3DSTATE_DX9_CONSTANTB_PS OP_3D_MEDIA(0x3, 0x0, 0x3E) /* HSW+ */
242*4882a593Smuzhiyun #define OP_3DSTATE_DX9_LOCAL_VALID_VS OP_3D_MEDIA(0x3, 0x0, 0x3F) /* HSW+ */
243*4882a593Smuzhiyun #define OP_3DSTATE_DX9_LOCAL_VALID_PS OP_3D_MEDIA(0x3, 0x0, 0x40) /* HSW+ */
244*4882a593Smuzhiyun #define OP_3DSTATE_DX9_GENERATE_ACTIVE_VS OP_3D_MEDIA(0x3, 0x0, 0x41) /* HSW+ */
245*4882a593Smuzhiyun #define OP_3DSTATE_DX9_GENERATE_ACTIVE_PS OP_3D_MEDIA(0x3, 0x0, 0x42) /* HSW+ */
246*4882a593Smuzhiyun #define OP_3DSTATE_BINDING_TABLE_EDIT_VS OP_3D_MEDIA(0x3, 0x0, 0x43) /* HSW+ */
247*4882a593Smuzhiyun #define OP_3DSTATE_BINDING_TABLE_EDIT_GS OP_3D_MEDIA(0x3, 0x0, 0x44) /* HSW+ */
248*4882a593Smuzhiyun #define OP_3DSTATE_BINDING_TABLE_EDIT_HS OP_3D_MEDIA(0x3, 0x0, 0x45) /* HSW+ */
249*4882a593Smuzhiyun #define OP_3DSTATE_BINDING_TABLE_EDIT_DS OP_3D_MEDIA(0x3, 0x0, 0x46) /* HSW+ */
250*4882a593Smuzhiyun #define OP_3DSTATE_BINDING_TABLE_EDIT_PS OP_3D_MEDIA(0x3, 0x0, 0x47) /* HSW+ */
251*4882a593Smuzhiyun
252*4882a593Smuzhiyun #define OP_3DSTATE_VF_INSTANCING OP_3D_MEDIA(0x3, 0x0, 0x49) /* BDW+ */
253*4882a593Smuzhiyun #define OP_3DSTATE_VF_SGVS OP_3D_MEDIA(0x3, 0x0, 0x4A) /* BDW+ */
254*4882a593Smuzhiyun #define OP_3DSTATE_VF_TOPOLOGY OP_3D_MEDIA(0x3, 0x0, 0x4B) /* BDW+ */
255*4882a593Smuzhiyun #define OP_3DSTATE_WM_CHROMAKEY OP_3D_MEDIA(0x3, 0x0, 0x4C) /* BDW+ */
256*4882a593Smuzhiyun #define OP_3DSTATE_PS_BLEND OP_3D_MEDIA(0x3, 0x0, 0x4D) /* BDW+ */
257*4882a593Smuzhiyun #define OP_3DSTATE_WM_DEPTH_STENCIL OP_3D_MEDIA(0x3, 0x0, 0x4E) /* BDW+ */
258*4882a593Smuzhiyun #define OP_3DSTATE_PS_EXTRA OP_3D_MEDIA(0x3, 0x0, 0x4F) /* BDW+ */
259*4882a593Smuzhiyun #define OP_3DSTATE_RASTER OP_3D_MEDIA(0x3, 0x0, 0x50) /* BDW+ */
260*4882a593Smuzhiyun #define OP_3DSTATE_SBE_SWIZ OP_3D_MEDIA(0x3, 0x0, 0x51) /* BDW+ */
261*4882a593Smuzhiyun #define OP_3DSTATE_WM_HZ_OP OP_3D_MEDIA(0x3, 0x0, 0x52) /* BDW+ */
262*4882a593Smuzhiyun #define OP_3DSTATE_COMPONENT_PACKING OP_3D_MEDIA(0x3, 0x0, 0x55) /* SKL+ */
263*4882a593Smuzhiyun
264*4882a593Smuzhiyun #define OP_3DSTATE_DRAWING_RECTANGLE OP_3D_MEDIA(0x3, 0x1, 0x00)
265*4882a593Smuzhiyun #define OP_3DSTATE_SAMPLER_PALETTE_LOAD0 OP_3D_MEDIA(0x3, 0x1, 0x02)
266*4882a593Smuzhiyun #define OP_3DSTATE_CHROMA_KEY OP_3D_MEDIA(0x3, 0x1, 0x04)
267*4882a593Smuzhiyun #define OP_SNB_3DSTATE_DEPTH_BUFFER OP_3D_MEDIA(0x3, 0x1, 0x05)
268*4882a593Smuzhiyun #define OP_3DSTATE_POLY_STIPPLE_OFFSET OP_3D_MEDIA(0x3, 0x1, 0x06)
269*4882a593Smuzhiyun #define OP_3DSTATE_POLY_STIPPLE_PATTERN OP_3D_MEDIA(0x3, 0x1, 0x07)
270*4882a593Smuzhiyun #define OP_3DSTATE_LINE_STIPPLE OP_3D_MEDIA(0x3, 0x1, 0x08)
271*4882a593Smuzhiyun #define OP_3DSTATE_AA_LINE_PARAMS OP_3D_MEDIA(0x3, 0x1, 0x0A)
272*4882a593Smuzhiyun #define OP_3DSTATE_GS_SVB_INDEX OP_3D_MEDIA(0x3, 0x1, 0x0B)
273*4882a593Smuzhiyun #define OP_3DSTATE_SAMPLER_PALETTE_LOAD1 OP_3D_MEDIA(0x3, 0x1, 0x0C)
274*4882a593Smuzhiyun #define OP_3DSTATE_MULTISAMPLE_BDW OP_3D_MEDIA(0x3, 0x0, 0x0D)
275*4882a593Smuzhiyun #define OP_SNB_3DSTATE_STENCIL_BUFFER OP_3D_MEDIA(0x3, 0x1, 0x0E)
276*4882a593Smuzhiyun #define OP_SNB_3DSTATE_HIER_DEPTH_BUFFER OP_3D_MEDIA(0x3, 0x1, 0x0F)
277*4882a593Smuzhiyun #define OP_SNB_3DSTATE_CLEAR_PARAMS OP_3D_MEDIA(0x3, 0x1, 0x10)
278*4882a593Smuzhiyun #define OP_3DSTATE_MONOFILTER_SIZE OP_3D_MEDIA(0x3, 0x1, 0x11)
279*4882a593Smuzhiyun #define OP_3DSTATE_PUSH_CONSTANT_ALLOC_VS OP_3D_MEDIA(0x3, 0x1, 0x12) /* IVB+ */
280*4882a593Smuzhiyun #define OP_3DSTATE_PUSH_CONSTANT_ALLOC_HS OP_3D_MEDIA(0x3, 0x1, 0x13) /* IVB+ */
281*4882a593Smuzhiyun #define OP_3DSTATE_PUSH_CONSTANT_ALLOC_DS OP_3D_MEDIA(0x3, 0x1, 0x14) /* IVB+ */
282*4882a593Smuzhiyun #define OP_3DSTATE_PUSH_CONSTANT_ALLOC_GS OP_3D_MEDIA(0x3, 0x1, 0x15) /* IVB+ */
283*4882a593Smuzhiyun #define OP_3DSTATE_PUSH_CONSTANT_ALLOC_PS OP_3D_MEDIA(0x3, 0x1, 0x16) /* IVB+ */
284*4882a593Smuzhiyun #define OP_3DSTATE_SO_DECL_LIST OP_3D_MEDIA(0x3, 0x1, 0x17)
285*4882a593Smuzhiyun #define OP_3DSTATE_SO_BUFFER OP_3D_MEDIA(0x3, 0x1, 0x18)
286*4882a593Smuzhiyun #define OP_3DSTATE_BINDING_TABLE_POOL_ALLOC OP_3D_MEDIA(0x3, 0x1, 0x19) /* HSW+ */
287*4882a593Smuzhiyun #define OP_3DSTATE_GATHER_POOL_ALLOC OP_3D_MEDIA(0x3, 0x1, 0x1A) /* HSW+ */
288*4882a593Smuzhiyun #define OP_3DSTATE_DX9_CONSTANT_BUFFER_POOL_ALLOC OP_3D_MEDIA(0x3, 0x1, 0x1B) /* HSW+ */
289*4882a593Smuzhiyun #define OP_3DSTATE_SAMPLE_PATTERN OP_3D_MEDIA(0x3, 0x1, 0x1C)
290*4882a593Smuzhiyun #define OP_PIPE_CONTROL OP_3D_MEDIA(0x3, 0x2, 0x00)
291*4882a593Smuzhiyun #define OP_3DPRIMITIVE OP_3D_MEDIA(0x3, 0x3, 0x00)
292*4882a593Smuzhiyun
293*4882a593Smuzhiyun /* VCCP Command Parser */
294*4882a593Smuzhiyun
295*4882a593Smuzhiyun /*
296*4882a593Smuzhiyun * Below MFX and VBE cmd definition is from vaapi intel driver project (BSD License)
297*4882a593Smuzhiyun * git://anongit.freedesktop.org/vaapi/intel-driver
298*4882a593Smuzhiyun * src/i965_defines.h
299*4882a593Smuzhiyun *
300*4882a593Smuzhiyun */
301*4882a593Smuzhiyun
302*4882a593Smuzhiyun #define OP_MFX(pipeline, op, sub_opa, sub_opb) \
303*4882a593Smuzhiyun (3 << 13 | \
304*4882a593Smuzhiyun (pipeline) << 11 | \
305*4882a593Smuzhiyun (op) << 8 | \
306*4882a593Smuzhiyun (sub_opa) << 5 | \
307*4882a593Smuzhiyun (sub_opb))
308*4882a593Smuzhiyun
309*4882a593Smuzhiyun #define OP_MFX_PIPE_MODE_SELECT OP_MFX(2, 0, 0, 0) /* ALL */
310*4882a593Smuzhiyun #define OP_MFX_SURFACE_STATE OP_MFX(2, 0, 0, 1) /* ALL */
311*4882a593Smuzhiyun #define OP_MFX_PIPE_BUF_ADDR_STATE OP_MFX(2, 0, 0, 2) /* ALL */
312*4882a593Smuzhiyun #define OP_MFX_IND_OBJ_BASE_ADDR_STATE OP_MFX(2, 0, 0, 3) /* ALL */
313*4882a593Smuzhiyun #define OP_MFX_BSP_BUF_BASE_ADDR_STATE OP_MFX(2, 0, 0, 4) /* ALL */
314*4882a593Smuzhiyun #define OP_2_0_0_5 OP_MFX(2, 0, 0, 5) /* ALL */
315*4882a593Smuzhiyun #define OP_MFX_STATE_POINTER OP_MFX(2, 0, 0, 6) /* ALL */
316*4882a593Smuzhiyun #define OP_MFX_QM_STATE OP_MFX(2, 0, 0, 7) /* IVB+ */
317*4882a593Smuzhiyun #define OP_MFX_FQM_STATE OP_MFX(2, 0, 0, 8) /* IVB+ */
318*4882a593Smuzhiyun #define OP_MFX_PAK_INSERT_OBJECT OP_MFX(2, 0, 2, 8) /* IVB+ */
319*4882a593Smuzhiyun #define OP_MFX_STITCH_OBJECT OP_MFX(2, 0, 2, 0xA) /* IVB+ */
320*4882a593Smuzhiyun
321*4882a593Smuzhiyun #define OP_MFD_IT_OBJECT OP_MFX(2, 0, 1, 9) /* ALL */
322*4882a593Smuzhiyun
323*4882a593Smuzhiyun #define OP_MFX_WAIT OP_MFX(1, 0, 0, 0) /* IVB+ */
324*4882a593Smuzhiyun #define OP_MFX_AVC_IMG_STATE OP_MFX(2, 1, 0, 0) /* ALL */
325*4882a593Smuzhiyun #define OP_MFX_AVC_QM_STATE OP_MFX(2, 1, 0, 1) /* ALL */
326*4882a593Smuzhiyun #define OP_MFX_AVC_DIRECTMODE_STATE OP_MFX(2, 1, 0, 2) /* ALL */
327*4882a593Smuzhiyun #define OP_MFX_AVC_SLICE_STATE OP_MFX(2, 1, 0, 3) /* ALL */
328*4882a593Smuzhiyun #define OP_MFX_AVC_REF_IDX_STATE OP_MFX(2, 1, 0, 4) /* ALL */
329*4882a593Smuzhiyun #define OP_MFX_AVC_WEIGHTOFFSET_STATE OP_MFX(2, 1, 0, 5) /* ALL */
330*4882a593Smuzhiyun #define OP_MFD_AVC_PICID_STATE OP_MFX(2, 1, 1, 5) /* HSW+ */
331*4882a593Smuzhiyun #define OP_MFD_AVC_DPB_STATE OP_MFX(2, 1, 1, 6) /* IVB+ */
332*4882a593Smuzhiyun #define OP_MFD_AVC_SLICEADDR OP_MFX(2, 1, 1, 7) /* IVB+ */
333*4882a593Smuzhiyun #define OP_MFD_AVC_BSD_OBJECT OP_MFX(2, 1, 1, 8) /* ALL */
334*4882a593Smuzhiyun #define OP_MFC_AVC_PAK_OBJECT OP_MFX(2, 1, 2, 9) /* ALL */
335*4882a593Smuzhiyun
336*4882a593Smuzhiyun #define OP_MFX_VC1_PRED_PIPE_STATE OP_MFX(2, 2, 0, 1) /* ALL */
337*4882a593Smuzhiyun #define OP_MFX_VC1_DIRECTMODE_STATE OP_MFX(2, 2, 0, 2) /* ALL */
338*4882a593Smuzhiyun #define OP_MFD_VC1_SHORT_PIC_STATE OP_MFX(2, 2, 1, 0) /* IVB+ */
339*4882a593Smuzhiyun #define OP_MFD_VC1_LONG_PIC_STATE OP_MFX(2, 2, 1, 1) /* IVB+ */
340*4882a593Smuzhiyun #define OP_MFD_VC1_BSD_OBJECT OP_MFX(2, 2, 1, 8) /* ALL */
341*4882a593Smuzhiyun
342*4882a593Smuzhiyun #define OP_MFX_MPEG2_PIC_STATE OP_MFX(2, 3, 0, 0) /* ALL */
343*4882a593Smuzhiyun #define OP_MFX_MPEG2_QM_STATE OP_MFX(2, 3, 0, 1) /* ALL */
344*4882a593Smuzhiyun #define OP_MFD_MPEG2_BSD_OBJECT OP_MFX(2, 3, 1, 8) /* ALL */
345*4882a593Smuzhiyun #define OP_MFC_MPEG2_SLICEGROUP_STATE OP_MFX(2, 3, 2, 3) /* ALL */
346*4882a593Smuzhiyun #define OP_MFC_MPEG2_PAK_OBJECT OP_MFX(2, 3, 2, 9) /* ALL */
347*4882a593Smuzhiyun
348*4882a593Smuzhiyun #define OP_MFX_2_6_0_0 OP_MFX(2, 6, 0, 0) /* IVB+ */
349*4882a593Smuzhiyun #define OP_MFX_2_6_0_8 OP_MFX(2, 6, 0, 8) /* IVB+ */
350*4882a593Smuzhiyun #define OP_MFX_2_6_0_9 OP_MFX(2, 6, 0, 9) /* IVB+ */
351*4882a593Smuzhiyun
352*4882a593Smuzhiyun #define OP_MFX_JPEG_PIC_STATE OP_MFX(2, 7, 0, 0)
353*4882a593Smuzhiyun #define OP_MFX_JPEG_HUFF_TABLE_STATE OP_MFX(2, 7, 0, 2)
354*4882a593Smuzhiyun #define OP_MFD_JPEG_BSD_OBJECT OP_MFX(2, 7, 1, 8)
355*4882a593Smuzhiyun
356*4882a593Smuzhiyun #define OP_VEB(pipeline, op, sub_opa, sub_opb) \
357*4882a593Smuzhiyun (3 << 13 | \
358*4882a593Smuzhiyun (pipeline) << 11 | \
359*4882a593Smuzhiyun (op) << 8 | \
360*4882a593Smuzhiyun (sub_opa) << 5 | \
361*4882a593Smuzhiyun (sub_opb))
362*4882a593Smuzhiyun
363*4882a593Smuzhiyun #define OP_VEB_SURFACE_STATE OP_VEB(2, 4, 0, 0)
364*4882a593Smuzhiyun #define OP_VEB_STATE OP_VEB(2, 4, 0, 2)
365*4882a593Smuzhiyun #define OP_VEB_DNDI_IECP_STATE OP_VEB(2, 4, 0, 3)
366*4882a593Smuzhiyun
367*4882a593Smuzhiyun struct parser_exec_state;
368*4882a593Smuzhiyun
369*4882a593Smuzhiyun typedef int (*parser_cmd_handler)(struct parser_exec_state *s);
370*4882a593Smuzhiyun
371*4882a593Smuzhiyun #define GVT_CMD_HASH_BITS 7
372*4882a593Smuzhiyun
373*4882a593Smuzhiyun /* which DWords need address fix */
374*4882a593Smuzhiyun #define ADDR_FIX_1(x1) (1 << (x1))
375*4882a593Smuzhiyun #define ADDR_FIX_2(x1, x2) (ADDR_FIX_1(x1) | ADDR_FIX_1(x2))
376*4882a593Smuzhiyun #define ADDR_FIX_3(x1, x2, x3) (ADDR_FIX_1(x1) | ADDR_FIX_2(x2, x3))
377*4882a593Smuzhiyun #define ADDR_FIX_4(x1, x2, x3, x4) (ADDR_FIX_1(x1) | ADDR_FIX_3(x2, x3, x4))
378*4882a593Smuzhiyun #define ADDR_FIX_5(x1, x2, x3, x4, x5) (ADDR_FIX_1(x1) | ADDR_FIX_4(x2, x3, x4, x5))
379*4882a593Smuzhiyun
380*4882a593Smuzhiyun #define DWORD_FIELD(dword, end, start) \
381*4882a593Smuzhiyun FIELD_GET(GENMASK(end, start), cmd_val(s, dword))
382*4882a593Smuzhiyun
383*4882a593Smuzhiyun #define OP_LENGTH_BIAS 2
384*4882a593Smuzhiyun #define CMD_LEN(value) (value + OP_LENGTH_BIAS)
385*4882a593Smuzhiyun
gvt_check_valid_cmd_length(int len,int valid_len)386*4882a593Smuzhiyun static int gvt_check_valid_cmd_length(int len, int valid_len)
387*4882a593Smuzhiyun {
388*4882a593Smuzhiyun if (valid_len != len) {
389*4882a593Smuzhiyun gvt_err("len is not valid: len=%u valid_len=%u\n",
390*4882a593Smuzhiyun len, valid_len);
391*4882a593Smuzhiyun return -EFAULT;
392*4882a593Smuzhiyun }
393*4882a593Smuzhiyun return 0;
394*4882a593Smuzhiyun }
395*4882a593Smuzhiyun
396*4882a593Smuzhiyun struct cmd_info {
397*4882a593Smuzhiyun const char *name;
398*4882a593Smuzhiyun u32 opcode;
399*4882a593Smuzhiyun
400*4882a593Smuzhiyun #define F_LEN_MASK 3U
401*4882a593Smuzhiyun #define F_LEN_CONST 1U
402*4882a593Smuzhiyun #define F_LEN_VAR 0U
403*4882a593Smuzhiyun /* value is const although LEN maybe variable */
404*4882a593Smuzhiyun #define F_LEN_VAR_FIXED (1<<1)
405*4882a593Smuzhiyun
406*4882a593Smuzhiyun /*
407*4882a593Smuzhiyun * command has its own ip advance logic
408*4882a593Smuzhiyun * e.g. MI_BATCH_START, MI_BATCH_END
409*4882a593Smuzhiyun */
410*4882a593Smuzhiyun #define F_IP_ADVANCE_CUSTOM (1<<2)
411*4882a593Smuzhiyun u32 flag;
412*4882a593Smuzhiyun
413*4882a593Smuzhiyun #define R_RCS BIT(RCS0)
414*4882a593Smuzhiyun #define R_VCS1 BIT(VCS0)
415*4882a593Smuzhiyun #define R_VCS2 BIT(VCS1)
416*4882a593Smuzhiyun #define R_VCS (R_VCS1 | R_VCS2)
417*4882a593Smuzhiyun #define R_BCS BIT(BCS0)
418*4882a593Smuzhiyun #define R_VECS BIT(VECS0)
419*4882a593Smuzhiyun #define R_ALL (R_RCS | R_VCS | R_BCS | R_VECS)
420*4882a593Smuzhiyun /* rings that support this cmd: BLT/RCS/VCS/VECS */
421*4882a593Smuzhiyun u16 rings;
422*4882a593Smuzhiyun
423*4882a593Smuzhiyun /* devices that support this cmd: SNB/IVB/HSW/... */
424*4882a593Smuzhiyun u16 devices;
425*4882a593Smuzhiyun
426*4882a593Smuzhiyun /* which DWords are address that need fix up.
427*4882a593Smuzhiyun * bit 0 means a 32-bit non address operand in command
428*4882a593Smuzhiyun * bit 1 means address operand, which could be 32-bit
429*4882a593Smuzhiyun * or 64-bit depending on different architectures.(
430*4882a593Smuzhiyun * defined by "gmadr_bytes_in_cmd" in intel_gvt.
431*4882a593Smuzhiyun * No matter the address length, each address only takes
432*4882a593Smuzhiyun * one bit in the bitmap.
433*4882a593Smuzhiyun */
434*4882a593Smuzhiyun u16 addr_bitmap;
435*4882a593Smuzhiyun
436*4882a593Smuzhiyun /* flag == F_LEN_CONST : command length
437*4882a593Smuzhiyun * flag == F_LEN_VAR : length bias bits
438*4882a593Smuzhiyun * Note: length is in DWord
439*4882a593Smuzhiyun */
440*4882a593Smuzhiyun u32 len;
441*4882a593Smuzhiyun
442*4882a593Smuzhiyun parser_cmd_handler handler;
443*4882a593Smuzhiyun
444*4882a593Smuzhiyun /* valid length in DWord */
445*4882a593Smuzhiyun u32 valid_len;
446*4882a593Smuzhiyun };
447*4882a593Smuzhiyun
448*4882a593Smuzhiyun struct cmd_entry {
449*4882a593Smuzhiyun struct hlist_node hlist;
450*4882a593Smuzhiyun const struct cmd_info *info;
451*4882a593Smuzhiyun };
452*4882a593Smuzhiyun
453*4882a593Smuzhiyun enum {
454*4882a593Smuzhiyun RING_BUFFER_INSTRUCTION,
455*4882a593Smuzhiyun BATCH_BUFFER_INSTRUCTION,
456*4882a593Smuzhiyun BATCH_BUFFER_2ND_LEVEL,
457*4882a593Smuzhiyun };
458*4882a593Smuzhiyun
459*4882a593Smuzhiyun enum {
460*4882a593Smuzhiyun GTT_BUFFER,
461*4882a593Smuzhiyun PPGTT_BUFFER
462*4882a593Smuzhiyun };
463*4882a593Smuzhiyun
464*4882a593Smuzhiyun struct parser_exec_state {
465*4882a593Smuzhiyun struct intel_vgpu *vgpu;
466*4882a593Smuzhiyun const struct intel_engine_cs *engine;
467*4882a593Smuzhiyun
468*4882a593Smuzhiyun int buf_type;
469*4882a593Smuzhiyun
470*4882a593Smuzhiyun /* batch buffer address type */
471*4882a593Smuzhiyun int buf_addr_type;
472*4882a593Smuzhiyun
473*4882a593Smuzhiyun /* graphics memory address of ring buffer start */
474*4882a593Smuzhiyun unsigned long ring_start;
475*4882a593Smuzhiyun unsigned long ring_size;
476*4882a593Smuzhiyun unsigned long ring_head;
477*4882a593Smuzhiyun unsigned long ring_tail;
478*4882a593Smuzhiyun
479*4882a593Smuzhiyun /* instruction graphics memory address */
480*4882a593Smuzhiyun unsigned long ip_gma;
481*4882a593Smuzhiyun
482*4882a593Smuzhiyun /* mapped va of the instr_gma */
483*4882a593Smuzhiyun void *ip_va;
484*4882a593Smuzhiyun void *rb_va;
485*4882a593Smuzhiyun
486*4882a593Smuzhiyun void *ret_bb_va;
487*4882a593Smuzhiyun /* next instruction when return from batch buffer to ring buffer */
488*4882a593Smuzhiyun unsigned long ret_ip_gma_ring;
489*4882a593Smuzhiyun
490*4882a593Smuzhiyun /* next instruction when return from 2nd batch buffer to batch buffer */
491*4882a593Smuzhiyun unsigned long ret_ip_gma_bb;
492*4882a593Smuzhiyun
493*4882a593Smuzhiyun /* batch buffer address type (GTT or PPGTT)
494*4882a593Smuzhiyun * used when ret from 2nd level batch buffer
495*4882a593Smuzhiyun */
496*4882a593Smuzhiyun int saved_buf_addr_type;
497*4882a593Smuzhiyun bool is_ctx_wa;
498*4882a593Smuzhiyun
499*4882a593Smuzhiyun const struct cmd_info *info;
500*4882a593Smuzhiyun
501*4882a593Smuzhiyun struct intel_vgpu_workload *workload;
502*4882a593Smuzhiyun };
503*4882a593Smuzhiyun
504*4882a593Smuzhiyun #define gmadr_dw_number(s) \
505*4882a593Smuzhiyun (s->vgpu->gvt->device_info.gmadr_bytes_in_cmd >> 2)
506*4882a593Smuzhiyun
507*4882a593Smuzhiyun static unsigned long bypass_scan_mask = 0;
508*4882a593Smuzhiyun
509*4882a593Smuzhiyun /* ring ALL, type = 0 */
510*4882a593Smuzhiyun static const struct sub_op_bits sub_op_mi[] = {
511*4882a593Smuzhiyun {31, 29},
512*4882a593Smuzhiyun {28, 23},
513*4882a593Smuzhiyun };
514*4882a593Smuzhiyun
515*4882a593Smuzhiyun static const struct decode_info decode_info_mi = {
516*4882a593Smuzhiyun "MI",
517*4882a593Smuzhiyun OP_LEN_MI,
518*4882a593Smuzhiyun ARRAY_SIZE(sub_op_mi),
519*4882a593Smuzhiyun sub_op_mi,
520*4882a593Smuzhiyun };
521*4882a593Smuzhiyun
522*4882a593Smuzhiyun /* ring RCS, command type 2 */
523*4882a593Smuzhiyun static const struct sub_op_bits sub_op_2d[] = {
524*4882a593Smuzhiyun {31, 29},
525*4882a593Smuzhiyun {28, 22},
526*4882a593Smuzhiyun };
527*4882a593Smuzhiyun
528*4882a593Smuzhiyun static const struct decode_info decode_info_2d = {
529*4882a593Smuzhiyun "2D",
530*4882a593Smuzhiyun OP_LEN_2D,
531*4882a593Smuzhiyun ARRAY_SIZE(sub_op_2d),
532*4882a593Smuzhiyun sub_op_2d,
533*4882a593Smuzhiyun };
534*4882a593Smuzhiyun
535*4882a593Smuzhiyun /* ring RCS, command type 3 */
536*4882a593Smuzhiyun static const struct sub_op_bits sub_op_3d_media[] = {
537*4882a593Smuzhiyun {31, 29},
538*4882a593Smuzhiyun {28, 27},
539*4882a593Smuzhiyun {26, 24},
540*4882a593Smuzhiyun {23, 16},
541*4882a593Smuzhiyun };
542*4882a593Smuzhiyun
543*4882a593Smuzhiyun static const struct decode_info decode_info_3d_media = {
544*4882a593Smuzhiyun "3D_Media",
545*4882a593Smuzhiyun OP_LEN_3D_MEDIA,
546*4882a593Smuzhiyun ARRAY_SIZE(sub_op_3d_media),
547*4882a593Smuzhiyun sub_op_3d_media,
548*4882a593Smuzhiyun };
549*4882a593Smuzhiyun
550*4882a593Smuzhiyun /* ring VCS, command type 3 */
551*4882a593Smuzhiyun static const struct sub_op_bits sub_op_mfx_vc[] = {
552*4882a593Smuzhiyun {31, 29},
553*4882a593Smuzhiyun {28, 27},
554*4882a593Smuzhiyun {26, 24},
555*4882a593Smuzhiyun {23, 21},
556*4882a593Smuzhiyun {20, 16},
557*4882a593Smuzhiyun };
558*4882a593Smuzhiyun
559*4882a593Smuzhiyun static const struct decode_info decode_info_mfx_vc = {
560*4882a593Smuzhiyun "MFX_VC",
561*4882a593Smuzhiyun OP_LEN_MFX_VC,
562*4882a593Smuzhiyun ARRAY_SIZE(sub_op_mfx_vc),
563*4882a593Smuzhiyun sub_op_mfx_vc,
564*4882a593Smuzhiyun };
565*4882a593Smuzhiyun
566*4882a593Smuzhiyun /* ring VECS, command type 3 */
567*4882a593Smuzhiyun static const struct sub_op_bits sub_op_vebox[] = {
568*4882a593Smuzhiyun {31, 29},
569*4882a593Smuzhiyun {28, 27},
570*4882a593Smuzhiyun {26, 24},
571*4882a593Smuzhiyun {23, 21},
572*4882a593Smuzhiyun {20, 16},
573*4882a593Smuzhiyun };
574*4882a593Smuzhiyun
575*4882a593Smuzhiyun static const struct decode_info decode_info_vebox = {
576*4882a593Smuzhiyun "VEBOX",
577*4882a593Smuzhiyun OP_LEN_VEBOX,
578*4882a593Smuzhiyun ARRAY_SIZE(sub_op_vebox),
579*4882a593Smuzhiyun sub_op_vebox,
580*4882a593Smuzhiyun };
581*4882a593Smuzhiyun
582*4882a593Smuzhiyun static const struct decode_info *ring_decode_info[I915_NUM_ENGINES][8] = {
583*4882a593Smuzhiyun [RCS0] = {
584*4882a593Smuzhiyun &decode_info_mi,
585*4882a593Smuzhiyun NULL,
586*4882a593Smuzhiyun NULL,
587*4882a593Smuzhiyun &decode_info_3d_media,
588*4882a593Smuzhiyun NULL,
589*4882a593Smuzhiyun NULL,
590*4882a593Smuzhiyun NULL,
591*4882a593Smuzhiyun NULL,
592*4882a593Smuzhiyun },
593*4882a593Smuzhiyun
594*4882a593Smuzhiyun [VCS0] = {
595*4882a593Smuzhiyun &decode_info_mi,
596*4882a593Smuzhiyun NULL,
597*4882a593Smuzhiyun NULL,
598*4882a593Smuzhiyun &decode_info_mfx_vc,
599*4882a593Smuzhiyun NULL,
600*4882a593Smuzhiyun NULL,
601*4882a593Smuzhiyun NULL,
602*4882a593Smuzhiyun NULL,
603*4882a593Smuzhiyun },
604*4882a593Smuzhiyun
605*4882a593Smuzhiyun [BCS0] = {
606*4882a593Smuzhiyun &decode_info_mi,
607*4882a593Smuzhiyun NULL,
608*4882a593Smuzhiyun &decode_info_2d,
609*4882a593Smuzhiyun NULL,
610*4882a593Smuzhiyun NULL,
611*4882a593Smuzhiyun NULL,
612*4882a593Smuzhiyun NULL,
613*4882a593Smuzhiyun NULL,
614*4882a593Smuzhiyun },
615*4882a593Smuzhiyun
616*4882a593Smuzhiyun [VECS0] = {
617*4882a593Smuzhiyun &decode_info_mi,
618*4882a593Smuzhiyun NULL,
619*4882a593Smuzhiyun NULL,
620*4882a593Smuzhiyun &decode_info_vebox,
621*4882a593Smuzhiyun NULL,
622*4882a593Smuzhiyun NULL,
623*4882a593Smuzhiyun NULL,
624*4882a593Smuzhiyun NULL,
625*4882a593Smuzhiyun },
626*4882a593Smuzhiyun
627*4882a593Smuzhiyun [VCS1] = {
628*4882a593Smuzhiyun &decode_info_mi,
629*4882a593Smuzhiyun NULL,
630*4882a593Smuzhiyun NULL,
631*4882a593Smuzhiyun &decode_info_mfx_vc,
632*4882a593Smuzhiyun NULL,
633*4882a593Smuzhiyun NULL,
634*4882a593Smuzhiyun NULL,
635*4882a593Smuzhiyun NULL,
636*4882a593Smuzhiyun },
637*4882a593Smuzhiyun };
638*4882a593Smuzhiyun
get_opcode(u32 cmd,const struct intel_engine_cs * engine)639*4882a593Smuzhiyun static inline u32 get_opcode(u32 cmd, const struct intel_engine_cs *engine)
640*4882a593Smuzhiyun {
641*4882a593Smuzhiyun const struct decode_info *d_info;
642*4882a593Smuzhiyun
643*4882a593Smuzhiyun d_info = ring_decode_info[engine->id][CMD_TYPE(cmd)];
644*4882a593Smuzhiyun if (d_info == NULL)
645*4882a593Smuzhiyun return INVALID_OP;
646*4882a593Smuzhiyun
647*4882a593Smuzhiyun return cmd >> (32 - d_info->op_len);
648*4882a593Smuzhiyun }
649*4882a593Smuzhiyun
650*4882a593Smuzhiyun static inline const struct cmd_info *
find_cmd_entry(struct intel_gvt * gvt,unsigned int opcode,const struct intel_engine_cs * engine)651*4882a593Smuzhiyun find_cmd_entry(struct intel_gvt *gvt, unsigned int opcode,
652*4882a593Smuzhiyun const struct intel_engine_cs *engine)
653*4882a593Smuzhiyun {
654*4882a593Smuzhiyun struct cmd_entry *e;
655*4882a593Smuzhiyun
656*4882a593Smuzhiyun hash_for_each_possible(gvt->cmd_table, e, hlist, opcode) {
657*4882a593Smuzhiyun if (opcode == e->info->opcode &&
658*4882a593Smuzhiyun e->info->rings & engine->mask)
659*4882a593Smuzhiyun return e->info;
660*4882a593Smuzhiyun }
661*4882a593Smuzhiyun return NULL;
662*4882a593Smuzhiyun }
663*4882a593Smuzhiyun
664*4882a593Smuzhiyun static inline const struct cmd_info *
get_cmd_info(struct intel_gvt * gvt,u32 cmd,const struct intel_engine_cs * engine)665*4882a593Smuzhiyun get_cmd_info(struct intel_gvt *gvt, u32 cmd,
666*4882a593Smuzhiyun const struct intel_engine_cs *engine)
667*4882a593Smuzhiyun {
668*4882a593Smuzhiyun u32 opcode;
669*4882a593Smuzhiyun
670*4882a593Smuzhiyun opcode = get_opcode(cmd, engine);
671*4882a593Smuzhiyun if (opcode == INVALID_OP)
672*4882a593Smuzhiyun return NULL;
673*4882a593Smuzhiyun
674*4882a593Smuzhiyun return find_cmd_entry(gvt, opcode, engine);
675*4882a593Smuzhiyun }
676*4882a593Smuzhiyun
sub_op_val(u32 cmd,u32 hi,u32 low)677*4882a593Smuzhiyun static inline u32 sub_op_val(u32 cmd, u32 hi, u32 low)
678*4882a593Smuzhiyun {
679*4882a593Smuzhiyun return (cmd >> low) & ((1U << (hi - low + 1)) - 1);
680*4882a593Smuzhiyun }
681*4882a593Smuzhiyun
print_opcode(u32 cmd,const struct intel_engine_cs * engine)682*4882a593Smuzhiyun static inline void print_opcode(u32 cmd, const struct intel_engine_cs *engine)
683*4882a593Smuzhiyun {
684*4882a593Smuzhiyun const struct decode_info *d_info;
685*4882a593Smuzhiyun int i;
686*4882a593Smuzhiyun
687*4882a593Smuzhiyun d_info = ring_decode_info[engine->id][CMD_TYPE(cmd)];
688*4882a593Smuzhiyun if (d_info == NULL)
689*4882a593Smuzhiyun return;
690*4882a593Smuzhiyun
691*4882a593Smuzhiyun gvt_dbg_cmd("opcode=0x%x %s sub_ops:",
692*4882a593Smuzhiyun cmd >> (32 - d_info->op_len), d_info->name);
693*4882a593Smuzhiyun
694*4882a593Smuzhiyun for (i = 0; i < d_info->nr_sub_op; i++)
695*4882a593Smuzhiyun pr_err("0x%x ", sub_op_val(cmd, d_info->sub_op[i].hi,
696*4882a593Smuzhiyun d_info->sub_op[i].low));
697*4882a593Smuzhiyun
698*4882a593Smuzhiyun pr_err("\n");
699*4882a593Smuzhiyun }
700*4882a593Smuzhiyun
cmd_ptr(struct parser_exec_state * s,int index)701*4882a593Smuzhiyun static inline u32 *cmd_ptr(struct parser_exec_state *s, int index)
702*4882a593Smuzhiyun {
703*4882a593Smuzhiyun return s->ip_va + (index << 2);
704*4882a593Smuzhiyun }
705*4882a593Smuzhiyun
cmd_val(struct parser_exec_state * s,int index)706*4882a593Smuzhiyun static inline u32 cmd_val(struct parser_exec_state *s, int index)
707*4882a593Smuzhiyun {
708*4882a593Smuzhiyun return *cmd_ptr(s, index);
709*4882a593Smuzhiyun }
710*4882a593Smuzhiyun
parser_exec_state_dump(struct parser_exec_state * s)711*4882a593Smuzhiyun static void parser_exec_state_dump(struct parser_exec_state *s)
712*4882a593Smuzhiyun {
713*4882a593Smuzhiyun int cnt = 0;
714*4882a593Smuzhiyun int i;
715*4882a593Smuzhiyun
716*4882a593Smuzhiyun gvt_dbg_cmd(" vgpu%d RING%s: ring_start(%08lx) ring_end(%08lx)"
717*4882a593Smuzhiyun " ring_head(%08lx) ring_tail(%08lx)\n",
718*4882a593Smuzhiyun s->vgpu->id, s->engine->name,
719*4882a593Smuzhiyun s->ring_start, s->ring_start + s->ring_size,
720*4882a593Smuzhiyun s->ring_head, s->ring_tail);
721*4882a593Smuzhiyun
722*4882a593Smuzhiyun gvt_dbg_cmd(" %s %s ip_gma(%08lx) ",
723*4882a593Smuzhiyun s->buf_type == RING_BUFFER_INSTRUCTION ?
724*4882a593Smuzhiyun "RING_BUFFER" : "BATCH_BUFFER",
725*4882a593Smuzhiyun s->buf_addr_type == GTT_BUFFER ?
726*4882a593Smuzhiyun "GTT" : "PPGTT", s->ip_gma);
727*4882a593Smuzhiyun
728*4882a593Smuzhiyun if (s->ip_va == NULL) {
729*4882a593Smuzhiyun gvt_dbg_cmd(" ip_va(NULL)");
730*4882a593Smuzhiyun return;
731*4882a593Smuzhiyun }
732*4882a593Smuzhiyun
733*4882a593Smuzhiyun gvt_dbg_cmd(" ip_va=%p: %08x %08x %08x %08x\n",
734*4882a593Smuzhiyun s->ip_va, cmd_val(s, 0), cmd_val(s, 1),
735*4882a593Smuzhiyun cmd_val(s, 2), cmd_val(s, 3));
736*4882a593Smuzhiyun
737*4882a593Smuzhiyun print_opcode(cmd_val(s, 0), s->engine);
738*4882a593Smuzhiyun
739*4882a593Smuzhiyun s->ip_va = (u32 *)((((u64)s->ip_va) >> 12) << 12);
740*4882a593Smuzhiyun
741*4882a593Smuzhiyun while (cnt < 1024) {
742*4882a593Smuzhiyun gvt_dbg_cmd("ip_va=%p: ", s->ip_va);
743*4882a593Smuzhiyun for (i = 0; i < 8; i++)
744*4882a593Smuzhiyun gvt_dbg_cmd("%08x ", cmd_val(s, i));
745*4882a593Smuzhiyun gvt_dbg_cmd("\n");
746*4882a593Smuzhiyun
747*4882a593Smuzhiyun s->ip_va += 8 * sizeof(u32);
748*4882a593Smuzhiyun cnt += 8;
749*4882a593Smuzhiyun }
750*4882a593Smuzhiyun }
751*4882a593Smuzhiyun
update_ip_va(struct parser_exec_state * s)752*4882a593Smuzhiyun static inline void update_ip_va(struct parser_exec_state *s)
753*4882a593Smuzhiyun {
754*4882a593Smuzhiyun unsigned long len = 0;
755*4882a593Smuzhiyun
756*4882a593Smuzhiyun if (WARN_ON(s->ring_head == s->ring_tail))
757*4882a593Smuzhiyun return;
758*4882a593Smuzhiyun
759*4882a593Smuzhiyun if (s->buf_type == RING_BUFFER_INSTRUCTION) {
760*4882a593Smuzhiyun unsigned long ring_top = s->ring_start + s->ring_size;
761*4882a593Smuzhiyun
762*4882a593Smuzhiyun if (s->ring_head > s->ring_tail) {
763*4882a593Smuzhiyun if (s->ip_gma >= s->ring_head && s->ip_gma < ring_top)
764*4882a593Smuzhiyun len = (s->ip_gma - s->ring_head);
765*4882a593Smuzhiyun else if (s->ip_gma >= s->ring_start &&
766*4882a593Smuzhiyun s->ip_gma <= s->ring_tail)
767*4882a593Smuzhiyun len = (ring_top - s->ring_head) +
768*4882a593Smuzhiyun (s->ip_gma - s->ring_start);
769*4882a593Smuzhiyun } else
770*4882a593Smuzhiyun len = (s->ip_gma - s->ring_head);
771*4882a593Smuzhiyun
772*4882a593Smuzhiyun s->ip_va = s->rb_va + len;
773*4882a593Smuzhiyun } else {/* shadow batch buffer */
774*4882a593Smuzhiyun s->ip_va = s->ret_bb_va;
775*4882a593Smuzhiyun }
776*4882a593Smuzhiyun }
777*4882a593Smuzhiyun
ip_gma_set(struct parser_exec_state * s,unsigned long ip_gma)778*4882a593Smuzhiyun static inline int ip_gma_set(struct parser_exec_state *s,
779*4882a593Smuzhiyun unsigned long ip_gma)
780*4882a593Smuzhiyun {
781*4882a593Smuzhiyun WARN_ON(!IS_ALIGNED(ip_gma, 4));
782*4882a593Smuzhiyun
783*4882a593Smuzhiyun s->ip_gma = ip_gma;
784*4882a593Smuzhiyun update_ip_va(s);
785*4882a593Smuzhiyun return 0;
786*4882a593Smuzhiyun }
787*4882a593Smuzhiyun
ip_gma_advance(struct parser_exec_state * s,unsigned int dw_len)788*4882a593Smuzhiyun static inline int ip_gma_advance(struct parser_exec_state *s,
789*4882a593Smuzhiyun unsigned int dw_len)
790*4882a593Smuzhiyun {
791*4882a593Smuzhiyun s->ip_gma += (dw_len << 2);
792*4882a593Smuzhiyun
793*4882a593Smuzhiyun if (s->buf_type == RING_BUFFER_INSTRUCTION) {
794*4882a593Smuzhiyun if (s->ip_gma >= s->ring_start + s->ring_size)
795*4882a593Smuzhiyun s->ip_gma -= s->ring_size;
796*4882a593Smuzhiyun update_ip_va(s);
797*4882a593Smuzhiyun } else {
798*4882a593Smuzhiyun s->ip_va += (dw_len << 2);
799*4882a593Smuzhiyun }
800*4882a593Smuzhiyun
801*4882a593Smuzhiyun return 0;
802*4882a593Smuzhiyun }
803*4882a593Smuzhiyun
get_cmd_length(const struct cmd_info * info,u32 cmd)804*4882a593Smuzhiyun static inline int get_cmd_length(const struct cmd_info *info, u32 cmd)
805*4882a593Smuzhiyun {
806*4882a593Smuzhiyun if ((info->flag & F_LEN_MASK) == F_LEN_CONST)
807*4882a593Smuzhiyun return info->len;
808*4882a593Smuzhiyun else
809*4882a593Smuzhiyun return (cmd & ((1U << info->len) - 1)) + 2;
810*4882a593Smuzhiyun return 0;
811*4882a593Smuzhiyun }
812*4882a593Smuzhiyun
cmd_length(struct parser_exec_state * s)813*4882a593Smuzhiyun static inline int cmd_length(struct parser_exec_state *s)
814*4882a593Smuzhiyun {
815*4882a593Smuzhiyun return get_cmd_length(s->info, cmd_val(s, 0));
816*4882a593Smuzhiyun }
817*4882a593Smuzhiyun
818*4882a593Smuzhiyun /* do not remove this, some platform may need clflush here */
819*4882a593Smuzhiyun #define patch_value(s, addr, val) do { \
820*4882a593Smuzhiyun *addr = val; \
821*4882a593Smuzhiyun } while (0)
822*4882a593Smuzhiyun
is_shadowed_mmio(unsigned int offset)823*4882a593Smuzhiyun static bool is_shadowed_mmio(unsigned int offset)
824*4882a593Smuzhiyun {
825*4882a593Smuzhiyun bool ret = false;
826*4882a593Smuzhiyun
827*4882a593Smuzhiyun if ((offset == 0x2168) || /*BB current head register UDW */
828*4882a593Smuzhiyun (offset == 0x2140) || /*BB current header register */
829*4882a593Smuzhiyun (offset == 0x211c) || /*second BB header register UDW */
830*4882a593Smuzhiyun (offset == 0x2114)) { /*second BB header register UDW */
831*4882a593Smuzhiyun ret = true;
832*4882a593Smuzhiyun }
833*4882a593Smuzhiyun return ret;
834*4882a593Smuzhiyun }
835*4882a593Smuzhiyun
is_force_nonpriv_mmio(unsigned int offset)836*4882a593Smuzhiyun static inline bool is_force_nonpriv_mmio(unsigned int offset)
837*4882a593Smuzhiyun {
838*4882a593Smuzhiyun return (offset >= 0x24d0 && offset < 0x2500);
839*4882a593Smuzhiyun }
840*4882a593Smuzhiyun
force_nonpriv_reg_handler(struct parser_exec_state * s,unsigned int offset,unsigned int index,char * cmd)841*4882a593Smuzhiyun static int force_nonpriv_reg_handler(struct parser_exec_state *s,
842*4882a593Smuzhiyun unsigned int offset, unsigned int index, char *cmd)
843*4882a593Smuzhiyun {
844*4882a593Smuzhiyun struct intel_gvt *gvt = s->vgpu->gvt;
845*4882a593Smuzhiyun unsigned int data;
846*4882a593Smuzhiyun u32 ring_base;
847*4882a593Smuzhiyun u32 nopid;
848*4882a593Smuzhiyun
849*4882a593Smuzhiyun if (!strcmp(cmd, "lri"))
850*4882a593Smuzhiyun data = cmd_val(s, index + 1);
851*4882a593Smuzhiyun else {
852*4882a593Smuzhiyun gvt_err("Unexpected forcenonpriv 0x%x write from cmd %s\n",
853*4882a593Smuzhiyun offset, cmd);
854*4882a593Smuzhiyun return -EINVAL;
855*4882a593Smuzhiyun }
856*4882a593Smuzhiyun
857*4882a593Smuzhiyun ring_base = s->engine->mmio_base;
858*4882a593Smuzhiyun nopid = i915_mmio_reg_offset(RING_NOPID(ring_base));
859*4882a593Smuzhiyun
860*4882a593Smuzhiyun if (!intel_gvt_in_force_nonpriv_whitelist(gvt, data) &&
861*4882a593Smuzhiyun data != nopid) {
862*4882a593Smuzhiyun gvt_err("Unexpected forcenonpriv 0x%x LRI write, value=0x%x\n",
863*4882a593Smuzhiyun offset, data);
864*4882a593Smuzhiyun patch_value(s, cmd_ptr(s, index), nopid);
865*4882a593Smuzhiyun return 0;
866*4882a593Smuzhiyun }
867*4882a593Smuzhiyun return 0;
868*4882a593Smuzhiyun }
869*4882a593Smuzhiyun
is_mocs_mmio(unsigned int offset)870*4882a593Smuzhiyun static inline bool is_mocs_mmio(unsigned int offset)
871*4882a593Smuzhiyun {
872*4882a593Smuzhiyun return ((offset >= 0xc800) && (offset <= 0xcff8)) ||
873*4882a593Smuzhiyun ((offset >= 0xb020) && (offset <= 0xb0a0));
874*4882a593Smuzhiyun }
875*4882a593Smuzhiyun
mocs_cmd_reg_handler(struct parser_exec_state * s,unsigned int offset,unsigned int index)876*4882a593Smuzhiyun static int mocs_cmd_reg_handler(struct parser_exec_state *s,
877*4882a593Smuzhiyun unsigned int offset, unsigned int index)
878*4882a593Smuzhiyun {
879*4882a593Smuzhiyun if (!is_mocs_mmio(offset))
880*4882a593Smuzhiyun return -EINVAL;
881*4882a593Smuzhiyun vgpu_vreg(s->vgpu, offset) = cmd_val(s, index + 1);
882*4882a593Smuzhiyun return 0;
883*4882a593Smuzhiyun }
884*4882a593Smuzhiyun
is_cmd_update_pdps(unsigned int offset,struct parser_exec_state * s)885*4882a593Smuzhiyun static int is_cmd_update_pdps(unsigned int offset,
886*4882a593Smuzhiyun struct parser_exec_state *s)
887*4882a593Smuzhiyun {
888*4882a593Smuzhiyun u32 base = s->workload->engine->mmio_base;
889*4882a593Smuzhiyun return i915_mmio_reg_equal(_MMIO(offset), GEN8_RING_PDP_UDW(base, 0));
890*4882a593Smuzhiyun }
891*4882a593Smuzhiyun
cmd_pdp_mmio_update_handler(struct parser_exec_state * s,unsigned int offset,unsigned int index)892*4882a593Smuzhiyun static int cmd_pdp_mmio_update_handler(struct parser_exec_state *s,
893*4882a593Smuzhiyun unsigned int offset, unsigned int index)
894*4882a593Smuzhiyun {
895*4882a593Smuzhiyun struct intel_vgpu *vgpu = s->vgpu;
896*4882a593Smuzhiyun struct intel_vgpu_mm *shadow_mm = s->workload->shadow_mm;
897*4882a593Smuzhiyun struct intel_vgpu_mm *mm;
898*4882a593Smuzhiyun u64 pdps[GEN8_3LVL_PDPES];
899*4882a593Smuzhiyun
900*4882a593Smuzhiyun if (shadow_mm->ppgtt_mm.root_entry_type ==
901*4882a593Smuzhiyun GTT_TYPE_PPGTT_ROOT_L4_ENTRY) {
902*4882a593Smuzhiyun pdps[0] = (u64)cmd_val(s, 2) << 32;
903*4882a593Smuzhiyun pdps[0] |= cmd_val(s, 4);
904*4882a593Smuzhiyun
905*4882a593Smuzhiyun mm = intel_vgpu_find_ppgtt_mm(vgpu, pdps);
906*4882a593Smuzhiyun if (!mm) {
907*4882a593Smuzhiyun gvt_vgpu_err("failed to get the 4-level shadow vm\n");
908*4882a593Smuzhiyun return -EINVAL;
909*4882a593Smuzhiyun }
910*4882a593Smuzhiyun intel_vgpu_mm_get(mm);
911*4882a593Smuzhiyun list_add_tail(&mm->ppgtt_mm.link,
912*4882a593Smuzhiyun &s->workload->lri_shadow_mm);
913*4882a593Smuzhiyun *cmd_ptr(s, 2) = upper_32_bits(mm->ppgtt_mm.shadow_pdps[0]);
914*4882a593Smuzhiyun *cmd_ptr(s, 4) = lower_32_bits(mm->ppgtt_mm.shadow_pdps[0]);
915*4882a593Smuzhiyun } else {
916*4882a593Smuzhiyun /* Currently all guests use PML4 table and now can't
917*4882a593Smuzhiyun * have a guest with 3-level table but uses LRI for
918*4882a593Smuzhiyun * PPGTT update. So this is simply un-testable. */
919*4882a593Smuzhiyun GEM_BUG_ON(1);
920*4882a593Smuzhiyun gvt_vgpu_err("invalid shared shadow vm type\n");
921*4882a593Smuzhiyun return -EINVAL;
922*4882a593Smuzhiyun }
923*4882a593Smuzhiyun return 0;
924*4882a593Smuzhiyun }
925*4882a593Smuzhiyun
cmd_reg_handler(struct parser_exec_state * s,unsigned int offset,unsigned int index,char * cmd)926*4882a593Smuzhiyun static int cmd_reg_handler(struct parser_exec_state *s,
927*4882a593Smuzhiyun unsigned int offset, unsigned int index, char *cmd)
928*4882a593Smuzhiyun {
929*4882a593Smuzhiyun struct intel_vgpu *vgpu = s->vgpu;
930*4882a593Smuzhiyun struct intel_gvt *gvt = vgpu->gvt;
931*4882a593Smuzhiyun u32 ctx_sr_ctl;
932*4882a593Smuzhiyun
933*4882a593Smuzhiyun if (offset + 4 > gvt->device_info.mmio_size) {
934*4882a593Smuzhiyun gvt_vgpu_err("%s access to (%x) outside of MMIO range\n",
935*4882a593Smuzhiyun cmd, offset);
936*4882a593Smuzhiyun return -EFAULT;
937*4882a593Smuzhiyun }
938*4882a593Smuzhiyun
939*4882a593Smuzhiyun if (!intel_gvt_mmio_is_cmd_accessible(gvt, offset)) {
940*4882a593Smuzhiyun gvt_vgpu_err("%s access to non-render register (%x)\n",
941*4882a593Smuzhiyun cmd, offset);
942*4882a593Smuzhiyun return -EBADRQC;
943*4882a593Smuzhiyun }
944*4882a593Smuzhiyun
945*4882a593Smuzhiyun if (is_shadowed_mmio(offset)) {
946*4882a593Smuzhiyun gvt_vgpu_err("found access of shadowed MMIO %x\n", offset);
947*4882a593Smuzhiyun return 0;
948*4882a593Smuzhiyun }
949*4882a593Smuzhiyun
950*4882a593Smuzhiyun if (is_mocs_mmio(offset) &&
951*4882a593Smuzhiyun mocs_cmd_reg_handler(s, offset, index))
952*4882a593Smuzhiyun return -EINVAL;
953*4882a593Smuzhiyun
954*4882a593Smuzhiyun if (is_force_nonpriv_mmio(offset) &&
955*4882a593Smuzhiyun force_nonpriv_reg_handler(s, offset, index, cmd))
956*4882a593Smuzhiyun return -EPERM;
957*4882a593Smuzhiyun
958*4882a593Smuzhiyun if (offset == i915_mmio_reg_offset(DERRMR) ||
959*4882a593Smuzhiyun offset == i915_mmio_reg_offset(FORCEWAKE_MT)) {
960*4882a593Smuzhiyun /* Writing to HW VGT_PVINFO_PAGE offset will be discarded */
961*4882a593Smuzhiyun patch_value(s, cmd_ptr(s, index), VGT_PVINFO_PAGE);
962*4882a593Smuzhiyun }
963*4882a593Smuzhiyun
964*4882a593Smuzhiyun if (is_cmd_update_pdps(offset, s) &&
965*4882a593Smuzhiyun cmd_pdp_mmio_update_handler(s, offset, index))
966*4882a593Smuzhiyun return -EINVAL;
967*4882a593Smuzhiyun
968*4882a593Smuzhiyun /* TODO
969*4882a593Smuzhiyun * In order to let workload with inhibit context to generate
970*4882a593Smuzhiyun * correct image data into memory, vregs values will be loaded to
971*4882a593Smuzhiyun * hw via LRIs in the workload with inhibit context. But as
972*4882a593Smuzhiyun * indirect context is loaded prior to LRIs in workload, we don't
973*4882a593Smuzhiyun * want reg values specified in indirect context overwritten by
974*4882a593Smuzhiyun * LRIs in workloads. So, when scanning an indirect context, we
975*4882a593Smuzhiyun * update reg values in it into vregs, so LRIs in workload with
976*4882a593Smuzhiyun * inhibit context will restore with correct values
977*4882a593Smuzhiyun */
978*4882a593Smuzhiyun if (IS_GEN(s->engine->i915, 9) &&
979*4882a593Smuzhiyun intel_gvt_mmio_is_sr_in_ctx(gvt, offset) &&
980*4882a593Smuzhiyun !strncmp(cmd, "lri", 3)) {
981*4882a593Smuzhiyun intel_gvt_hypervisor_read_gpa(s->vgpu,
982*4882a593Smuzhiyun s->workload->ring_context_gpa + 12, &ctx_sr_ctl, 4);
983*4882a593Smuzhiyun /* check inhibit context */
984*4882a593Smuzhiyun if (ctx_sr_ctl & 1) {
985*4882a593Smuzhiyun u32 data = cmd_val(s, index + 1);
986*4882a593Smuzhiyun
987*4882a593Smuzhiyun if (intel_gvt_mmio_has_mode_mask(s->vgpu->gvt, offset))
988*4882a593Smuzhiyun intel_vgpu_mask_mmio_write(vgpu,
989*4882a593Smuzhiyun offset, &data, 4);
990*4882a593Smuzhiyun else
991*4882a593Smuzhiyun vgpu_vreg(vgpu, offset) = data;
992*4882a593Smuzhiyun }
993*4882a593Smuzhiyun }
994*4882a593Smuzhiyun
995*4882a593Smuzhiyun return 0;
996*4882a593Smuzhiyun }
997*4882a593Smuzhiyun
998*4882a593Smuzhiyun #define cmd_reg(s, i) \
999*4882a593Smuzhiyun (cmd_val(s, i) & GENMASK(22, 2))
1000*4882a593Smuzhiyun
1001*4882a593Smuzhiyun #define cmd_reg_inhibit(s, i) \
1002*4882a593Smuzhiyun (cmd_val(s, i) & GENMASK(22, 18))
1003*4882a593Smuzhiyun
1004*4882a593Smuzhiyun #define cmd_gma(s, i) \
1005*4882a593Smuzhiyun (cmd_val(s, i) & GENMASK(31, 2))
1006*4882a593Smuzhiyun
1007*4882a593Smuzhiyun #define cmd_gma_hi(s, i) \
1008*4882a593Smuzhiyun (cmd_val(s, i) & GENMASK(15, 0))
1009*4882a593Smuzhiyun
cmd_handler_lri(struct parser_exec_state * s)1010*4882a593Smuzhiyun static int cmd_handler_lri(struct parser_exec_state *s)
1011*4882a593Smuzhiyun {
1012*4882a593Smuzhiyun int i, ret = 0;
1013*4882a593Smuzhiyun int cmd_len = cmd_length(s);
1014*4882a593Smuzhiyun
1015*4882a593Smuzhiyun for (i = 1; i < cmd_len; i += 2) {
1016*4882a593Smuzhiyun if (IS_BROADWELL(s->engine->i915) && s->engine->id != RCS0) {
1017*4882a593Smuzhiyun if (s->engine->id == BCS0 &&
1018*4882a593Smuzhiyun cmd_reg(s, i) == i915_mmio_reg_offset(DERRMR))
1019*4882a593Smuzhiyun ret |= 0;
1020*4882a593Smuzhiyun else
1021*4882a593Smuzhiyun ret |= cmd_reg_inhibit(s, i) ? -EBADRQC : 0;
1022*4882a593Smuzhiyun }
1023*4882a593Smuzhiyun if (ret)
1024*4882a593Smuzhiyun break;
1025*4882a593Smuzhiyun ret |= cmd_reg_handler(s, cmd_reg(s, i), i, "lri");
1026*4882a593Smuzhiyun if (ret)
1027*4882a593Smuzhiyun break;
1028*4882a593Smuzhiyun }
1029*4882a593Smuzhiyun return ret;
1030*4882a593Smuzhiyun }
1031*4882a593Smuzhiyun
cmd_handler_lrr(struct parser_exec_state * s)1032*4882a593Smuzhiyun static int cmd_handler_lrr(struct parser_exec_state *s)
1033*4882a593Smuzhiyun {
1034*4882a593Smuzhiyun int i, ret = 0;
1035*4882a593Smuzhiyun int cmd_len = cmd_length(s);
1036*4882a593Smuzhiyun
1037*4882a593Smuzhiyun for (i = 1; i < cmd_len; i += 2) {
1038*4882a593Smuzhiyun if (IS_BROADWELL(s->engine->i915))
1039*4882a593Smuzhiyun ret |= ((cmd_reg_inhibit(s, i) ||
1040*4882a593Smuzhiyun (cmd_reg_inhibit(s, i + 1)))) ?
1041*4882a593Smuzhiyun -EBADRQC : 0;
1042*4882a593Smuzhiyun if (ret)
1043*4882a593Smuzhiyun break;
1044*4882a593Smuzhiyun ret |= cmd_reg_handler(s, cmd_reg(s, i), i, "lrr-src");
1045*4882a593Smuzhiyun if (ret)
1046*4882a593Smuzhiyun break;
1047*4882a593Smuzhiyun ret |= cmd_reg_handler(s, cmd_reg(s, i + 1), i, "lrr-dst");
1048*4882a593Smuzhiyun if (ret)
1049*4882a593Smuzhiyun break;
1050*4882a593Smuzhiyun }
1051*4882a593Smuzhiyun return ret;
1052*4882a593Smuzhiyun }
1053*4882a593Smuzhiyun
1054*4882a593Smuzhiyun static inline int cmd_address_audit(struct parser_exec_state *s,
1055*4882a593Smuzhiyun unsigned long guest_gma, int op_size, bool index_mode);
1056*4882a593Smuzhiyun
cmd_handler_lrm(struct parser_exec_state * s)1057*4882a593Smuzhiyun static int cmd_handler_lrm(struct parser_exec_state *s)
1058*4882a593Smuzhiyun {
1059*4882a593Smuzhiyun struct intel_gvt *gvt = s->vgpu->gvt;
1060*4882a593Smuzhiyun int gmadr_bytes = gvt->device_info.gmadr_bytes_in_cmd;
1061*4882a593Smuzhiyun unsigned long gma;
1062*4882a593Smuzhiyun int i, ret = 0;
1063*4882a593Smuzhiyun int cmd_len = cmd_length(s);
1064*4882a593Smuzhiyun
1065*4882a593Smuzhiyun for (i = 1; i < cmd_len;) {
1066*4882a593Smuzhiyun if (IS_BROADWELL(s->engine->i915))
1067*4882a593Smuzhiyun ret |= (cmd_reg_inhibit(s, i)) ? -EBADRQC : 0;
1068*4882a593Smuzhiyun if (ret)
1069*4882a593Smuzhiyun break;
1070*4882a593Smuzhiyun ret |= cmd_reg_handler(s, cmd_reg(s, i), i, "lrm");
1071*4882a593Smuzhiyun if (ret)
1072*4882a593Smuzhiyun break;
1073*4882a593Smuzhiyun if (cmd_val(s, 0) & (1 << 22)) {
1074*4882a593Smuzhiyun gma = cmd_gma(s, i + 1);
1075*4882a593Smuzhiyun if (gmadr_bytes == 8)
1076*4882a593Smuzhiyun gma |= (cmd_gma_hi(s, i + 2)) << 32;
1077*4882a593Smuzhiyun ret |= cmd_address_audit(s, gma, sizeof(u32), false);
1078*4882a593Smuzhiyun if (ret)
1079*4882a593Smuzhiyun break;
1080*4882a593Smuzhiyun }
1081*4882a593Smuzhiyun i += gmadr_dw_number(s) + 1;
1082*4882a593Smuzhiyun }
1083*4882a593Smuzhiyun return ret;
1084*4882a593Smuzhiyun }
1085*4882a593Smuzhiyun
cmd_handler_srm(struct parser_exec_state * s)1086*4882a593Smuzhiyun static int cmd_handler_srm(struct parser_exec_state *s)
1087*4882a593Smuzhiyun {
1088*4882a593Smuzhiyun int gmadr_bytes = s->vgpu->gvt->device_info.gmadr_bytes_in_cmd;
1089*4882a593Smuzhiyun unsigned long gma;
1090*4882a593Smuzhiyun int i, ret = 0;
1091*4882a593Smuzhiyun int cmd_len = cmd_length(s);
1092*4882a593Smuzhiyun
1093*4882a593Smuzhiyun for (i = 1; i < cmd_len;) {
1094*4882a593Smuzhiyun ret |= cmd_reg_handler(s, cmd_reg(s, i), i, "srm");
1095*4882a593Smuzhiyun if (ret)
1096*4882a593Smuzhiyun break;
1097*4882a593Smuzhiyun if (cmd_val(s, 0) & (1 << 22)) {
1098*4882a593Smuzhiyun gma = cmd_gma(s, i + 1);
1099*4882a593Smuzhiyun if (gmadr_bytes == 8)
1100*4882a593Smuzhiyun gma |= (cmd_gma_hi(s, i + 2)) << 32;
1101*4882a593Smuzhiyun ret |= cmd_address_audit(s, gma, sizeof(u32), false);
1102*4882a593Smuzhiyun if (ret)
1103*4882a593Smuzhiyun break;
1104*4882a593Smuzhiyun }
1105*4882a593Smuzhiyun i += gmadr_dw_number(s) + 1;
1106*4882a593Smuzhiyun }
1107*4882a593Smuzhiyun return ret;
1108*4882a593Smuzhiyun }
1109*4882a593Smuzhiyun
1110*4882a593Smuzhiyun struct cmd_interrupt_event {
1111*4882a593Smuzhiyun int pipe_control_notify;
1112*4882a593Smuzhiyun int mi_flush_dw;
1113*4882a593Smuzhiyun int mi_user_interrupt;
1114*4882a593Smuzhiyun };
1115*4882a593Smuzhiyun
1116*4882a593Smuzhiyun static struct cmd_interrupt_event cmd_interrupt_events[] = {
1117*4882a593Smuzhiyun [RCS0] = {
1118*4882a593Smuzhiyun .pipe_control_notify = RCS_PIPE_CONTROL,
1119*4882a593Smuzhiyun .mi_flush_dw = INTEL_GVT_EVENT_RESERVED,
1120*4882a593Smuzhiyun .mi_user_interrupt = RCS_MI_USER_INTERRUPT,
1121*4882a593Smuzhiyun },
1122*4882a593Smuzhiyun [BCS0] = {
1123*4882a593Smuzhiyun .pipe_control_notify = INTEL_GVT_EVENT_RESERVED,
1124*4882a593Smuzhiyun .mi_flush_dw = BCS_MI_FLUSH_DW,
1125*4882a593Smuzhiyun .mi_user_interrupt = BCS_MI_USER_INTERRUPT,
1126*4882a593Smuzhiyun },
1127*4882a593Smuzhiyun [VCS0] = {
1128*4882a593Smuzhiyun .pipe_control_notify = INTEL_GVT_EVENT_RESERVED,
1129*4882a593Smuzhiyun .mi_flush_dw = VCS_MI_FLUSH_DW,
1130*4882a593Smuzhiyun .mi_user_interrupt = VCS_MI_USER_INTERRUPT,
1131*4882a593Smuzhiyun },
1132*4882a593Smuzhiyun [VCS1] = {
1133*4882a593Smuzhiyun .pipe_control_notify = INTEL_GVT_EVENT_RESERVED,
1134*4882a593Smuzhiyun .mi_flush_dw = VCS2_MI_FLUSH_DW,
1135*4882a593Smuzhiyun .mi_user_interrupt = VCS2_MI_USER_INTERRUPT,
1136*4882a593Smuzhiyun },
1137*4882a593Smuzhiyun [VECS0] = {
1138*4882a593Smuzhiyun .pipe_control_notify = INTEL_GVT_EVENT_RESERVED,
1139*4882a593Smuzhiyun .mi_flush_dw = VECS_MI_FLUSH_DW,
1140*4882a593Smuzhiyun .mi_user_interrupt = VECS_MI_USER_INTERRUPT,
1141*4882a593Smuzhiyun },
1142*4882a593Smuzhiyun };
1143*4882a593Smuzhiyun
cmd_handler_pipe_control(struct parser_exec_state * s)1144*4882a593Smuzhiyun static int cmd_handler_pipe_control(struct parser_exec_state *s)
1145*4882a593Smuzhiyun {
1146*4882a593Smuzhiyun int gmadr_bytes = s->vgpu->gvt->device_info.gmadr_bytes_in_cmd;
1147*4882a593Smuzhiyun unsigned long gma;
1148*4882a593Smuzhiyun bool index_mode = false;
1149*4882a593Smuzhiyun unsigned int post_sync;
1150*4882a593Smuzhiyun int ret = 0;
1151*4882a593Smuzhiyun u32 hws_pga, val;
1152*4882a593Smuzhiyun
1153*4882a593Smuzhiyun post_sync = (cmd_val(s, 1) & PIPE_CONTROL_POST_SYNC_OP_MASK) >> 14;
1154*4882a593Smuzhiyun
1155*4882a593Smuzhiyun /* LRI post sync */
1156*4882a593Smuzhiyun if (cmd_val(s, 1) & PIPE_CONTROL_MMIO_WRITE)
1157*4882a593Smuzhiyun ret = cmd_reg_handler(s, cmd_reg(s, 2), 1, "pipe_ctrl");
1158*4882a593Smuzhiyun /* post sync */
1159*4882a593Smuzhiyun else if (post_sync) {
1160*4882a593Smuzhiyun if (post_sync == 2)
1161*4882a593Smuzhiyun ret = cmd_reg_handler(s, 0x2350, 1, "pipe_ctrl");
1162*4882a593Smuzhiyun else if (post_sync == 3)
1163*4882a593Smuzhiyun ret = cmd_reg_handler(s, 0x2358, 1, "pipe_ctrl");
1164*4882a593Smuzhiyun else if (post_sync == 1) {
1165*4882a593Smuzhiyun /* check ggtt*/
1166*4882a593Smuzhiyun if ((cmd_val(s, 1) & PIPE_CONTROL_GLOBAL_GTT_IVB)) {
1167*4882a593Smuzhiyun gma = cmd_val(s, 2) & GENMASK(31, 3);
1168*4882a593Smuzhiyun if (gmadr_bytes == 8)
1169*4882a593Smuzhiyun gma |= (cmd_gma_hi(s, 3)) << 32;
1170*4882a593Smuzhiyun /* Store Data Index */
1171*4882a593Smuzhiyun if (cmd_val(s, 1) & (1 << 21))
1172*4882a593Smuzhiyun index_mode = true;
1173*4882a593Smuzhiyun ret |= cmd_address_audit(s, gma, sizeof(u64),
1174*4882a593Smuzhiyun index_mode);
1175*4882a593Smuzhiyun if (ret)
1176*4882a593Smuzhiyun return ret;
1177*4882a593Smuzhiyun if (index_mode) {
1178*4882a593Smuzhiyun hws_pga = s->vgpu->hws_pga[s->engine->id];
1179*4882a593Smuzhiyun gma = hws_pga + gma;
1180*4882a593Smuzhiyun patch_value(s, cmd_ptr(s, 2), gma);
1181*4882a593Smuzhiyun val = cmd_val(s, 1) & (~(1 << 21));
1182*4882a593Smuzhiyun patch_value(s, cmd_ptr(s, 1), val);
1183*4882a593Smuzhiyun }
1184*4882a593Smuzhiyun }
1185*4882a593Smuzhiyun }
1186*4882a593Smuzhiyun }
1187*4882a593Smuzhiyun
1188*4882a593Smuzhiyun if (ret)
1189*4882a593Smuzhiyun return ret;
1190*4882a593Smuzhiyun
1191*4882a593Smuzhiyun if (cmd_val(s, 1) & PIPE_CONTROL_NOTIFY)
1192*4882a593Smuzhiyun set_bit(cmd_interrupt_events[s->engine->id].pipe_control_notify,
1193*4882a593Smuzhiyun s->workload->pending_events);
1194*4882a593Smuzhiyun return 0;
1195*4882a593Smuzhiyun }
1196*4882a593Smuzhiyun
cmd_handler_mi_user_interrupt(struct parser_exec_state * s)1197*4882a593Smuzhiyun static int cmd_handler_mi_user_interrupt(struct parser_exec_state *s)
1198*4882a593Smuzhiyun {
1199*4882a593Smuzhiyun set_bit(cmd_interrupt_events[s->engine->id].mi_user_interrupt,
1200*4882a593Smuzhiyun s->workload->pending_events);
1201*4882a593Smuzhiyun patch_value(s, cmd_ptr(s, 0), MI_NOOP);
1202*4882a593Smuzhiyun return 0;
1203*4882a593Smuzhiyun }
1204*4882a593Smuzhiyun
cmd_advance_default(struct parser_exec_state * s)1205*4882a593Smuzhiyun static int cmd_advance_default(struct parser_exec_state *s)
1206*4882a593Smuzhiyun {
1207*4882a593Smuzhiyun return ip_gma_advance(s, cmd_length(s));
1208*4882a593Smuzhiyun }
1209*4882a593Smuzhiyun
cmd_handler_mi_batch_buffer_end(struct parser_exec_state * s)1210*4882a593Smuzhiyun static int cmd_handler_mi_batch_buffer_end(struct parser_exec_state *s)
1211*4882a593Smuzhiyun {
1212*4882a593Smuzhiyun int ret;
1213*4882a593Smuzhiyun
1214*4882a593Smuzhiyun if (s->buf_type == BATCH_BUFFER_2ND_LEVEL) {
1215*4882a593Smuzhiyun s->buf_type = BATCH_BUFFER_INSTRUCTION;
1216*4882a593Smuzhiyun ret = ip_gma_set(s, s->ret_ip_gma_bb);
1217*4882a593Smuzhiyun s->buf_addr_type = s->saved_buf_addr_type;
1218*4882a593Smuzhiyun } else {
1219*4882a593Smuzhiyun s->buf_type = RING_BUFFER_INSTRUCTION;
1220*4882a593Smuzhiyun s->buf_addr_type = GTT_BUFFER;
1221*4882a593Smuzhiyun if (s->ret_ip_gma_ring >= s->ring_start + s->ring_size)
1222*4882a593Smuzhiyun s->ret_ip_gma_ring -= s->ring_size;
1223*4882a593Smuzhiyun ret = ip_gma_set(s, s->ret_ip_gma_ring);
1224*4882a593Smuzhiyun }
1225*4882a593Smuzhiyun return ret;
1226*4882a593Smuzhiyun }
1227*4882a593Smuzhiyun
1228*4882a593Smuzhiyun struct mi_display_flip_command_info {
1229*4882a593Smuzhiyun int pipe;
1230*4882a593Smuzhiyun int plane;
1231*4882a593Smuzhiyun int event;
1232*4882a593Smuzhiyun i915_reg_t stride_reg;
1233*4882a593Smuzhiyun i915_reg_t ctrl_reg;
1234*4882a593Smuzhiyun i915_reg_t surf_reg;
1235*4882a593Smuzhiyun u64 stride_val;
1236*4882a593Smuzhiyun u64 tile_val;
1237*4882a593Smuzhiyun u64 surf_val;
1238*4882a593Smuzhiyun bool async_flip;
1239*4882a593Smuzhiyun };
1240*4882a593Smuzhiyun
1241*4882a593Smuzhiyun struct plane_code_mapping {
1242*4882a593Smuzhiyun int pipe;
1243*4882a593Smuzhiyun int plane;
1244*4882a593Smuzhiyun int event;
1245*4882a593Smuzhiyun };
1246*4882a593Smuzhiyun
gen8_decode_mi_display_flip(struct parser_exec_state * s,struct mi_display_flip_command_info * info)1247*4882a593Smuzhiyun static int gen8_decode_mi_display_flip(struct parser_exec_state *s,
1248*4882a593Smuzhiyun struct mi_display_flip_command_info *info)
1249*4882a593Smuzhiyun {
1250*4882a593Smuzhiyun struct drm_i915_private *dev_priv = s->engine->i915;
1251*4882a593Smuzhiyun struct plane_code_mapping gen8_plane_code[] = {
1252*4882a593Smuzhiyun [0] = {PIPE_A, PLANE_A, PRIMARY_A_FLIP_DONE},
1253*4882a593Smuzhiyun [1] = {PIPE_B, PLANE_A, PRIMARY_B_FLIP_DONE},
1254*4882a593Smuzhiyun [2] = {PIPE_A, PLANE_B, SPRITE_A_FLIP_DONE},
1255*4882a593Smuzhiyun [3] = {PIPE_B, PLANE_B, SPRITE_B_FLIP_DONE},
1256*4882a593Smuzhiyun [4] = {PIPE_C, PLANE_A, PRIMARY_C_FLIP_DONE},
1257*4882a593Smuzhiyun [5] = {PIPE_C, PLANE_B, SPRITE_C_FLIP_DONE},
1258*4882a593Smuzhiyun };
1259*4882a593Smuzhiyun u32 dword0, dword1, dword2;
1260*4882a593Smuzhiyun u32 v;
1261*4882a593Smuzhiyun
1262*4882a593Smuzhiyun dword0 = cmd_val(s, 0);
1263*4882a593Smuzhiyun dword1 = cmd_val(s, 1);
1264*4882a593Smuzhiyun dword2 = cmd_val(s, 2);
1265*4882a593Smuzhiyun
1266*4882a593Smuzhiyun v = (dword0 & GENMASK(21, 19)) >> 19;
1267*4882a593Smuzhiyun if (drm_WARN_ON(&dev_priv->drm, v >= ARRAY_SIZE(gen8_plane_code)))
1268*4882a593Smuzhiyun return -EBADRQC;
1269*4882a593Smuzhiyun
1270*4882a593Smuzhiyun info->pipe = gen8_plane_code[v].pipe;
1271*4882a593Smuzhiyun info->plane = gen8_plane_code[v].plane;
1272*4882a593Smuzhiyun info->event = gen8_plane_code[v].event;
1273*4882a593Smuzhiyun info->stride_val = (dword1 & GENMASK(15, 6)) >> 6;
1274*4882a593Smuzhiyun info->tile_val = (dword1 & 0x1);
1275*4882a593Smuzhiyun info->surf_val = (dword2 & GENMASK(31, 12)) >> 12;
1276*4882a593Smuzhiyun info->async_flip = ((dword2 & GENMASK(1, 0)) == 0x1);
1277*4882a593Smuzhiyun
1278*4882a593Smuzhiyun if (info->plane == PLANE_A) {
1279*4882a593Smuzhiyun info->ctrl_reg = DSPCNTR(info->pipe);
1280*4882a593Smuzhiyun info->stride_reg = DSPSTRIDE(info->pipe);
1281*4882a593Smuzhiyun info->surf_reg = DSPSURF(info->pipe);
1282*4882a593Smuzhiyun } else if (info->plane == PLANE_B) {
1283*4882a593Smuzhiyun info->ctrl_reg = SPRCTL(info->pipe);
1284*4882a593Smuzhiyun info->stride_reg = SPRSTRIDE(info->pipe);
1285*4882a593Smuzhiyun info->surf_reg = SPRSURF(info->pipe);
1286*4882a593Smuzhiyun } else {
1287*4882a593Smuzhiyun drm_WARN_ON(&dev_priv->drm, 1);
1288*4882a593Smuzhiyun return -EBADRQC;
1289*4882a593Smuzhiyun }
1290*4882a593Smuzhiyun return 0;
1291*4882a593Smuzhiyun }
1292*4882a593Smuzhiyun
skl_decode_mi_display_flip(struct parser_exec_state * s,struct mi_display_flip_command_info * info)1293*4882a593Smuzhiyun static int skl_decode_mi_display_flip(struct parser_exec_state *s,
1294*4882a593Smuzhiyun struct mi_display_flip_command_info *info)
1295*4882a593Smuzhiyun {
1296*4882a593Smuzhiyun struct drm_i915_private *dev_priv = s->engine->i915;
1297*4882a593Smuzhiyun struct intel_vgpu *vgpu = s->vgpu;
1298*4882a593Smuzhiyun u32 dword0 = cmd_val(s, 0);
1299*4882a593Smuzhiyun u32 dword1 = cmd_val(s, 1);
1300*4882a593Smuzhiyun u32 dword2 = cmd_val(s, 2);
1301*4882a593Smuzhiyun u32 plane = (dword0 & GENMASK(12, 8)) >> 8;
1302*4882a593Smuzhiyun
1303*4882a593Smuzhiyun info->plane = PRIMARY_PLANE;
1304*4882a593Smuzhiyun
1305*4882a593Smuzhiyun switch (plane) {
1306*4882a593Smuzhiyun case MI_DISPLAY_FLIP_SKL_PLANE_1_A:
1307*4882a593Smuzhiyun info->pipe = PIPE_A;
1308*4882a593Smuzhiyun info->event = PRIMARY_A_FLIP_DONE;
1309*4882a593Smuzhiyun break;
1310*4882a593Smuzhiyun case MI_DISPLAY_FLIP_SKL_PLANE_1_B:
1311*4882a593Smuzhiyun info->pipe = PIPE_B;
1312*4882a593Smuzhiyun info->event = PRIMARY_B_FLIP_DONE;
1313*4882a593Smuzhiyun break;
1314*4882a593Smuzhiyun case MI_DISPLAY_FLIP_SKL_PLANE_1_C:
1315*4882a593Smuzhiyun info->pipe = PIPE_C;
1316*4882a593Smuzhiyun info->event = PRIMARY_C_FLIP_DONE;
1317*4882a593Smuzhiyun break;
1318*4882a593Smuzhiyun
1319*4882a593Smuzhiyun case MI_DISPLAY_FLIP_SKL_PLANE_2_A:
1320*4882a593Smuzhiyun info->pipe = PIPE_A;
1321*4882a593Smuzhiyun info->event = SPRITE_A_FLIP_DONE;
1322*4882a593Smuzhiyun info->plane = SPRITE_PLANE;
1323*4882a593Smuzhiyun break;
1324*4882a593Smuzhiyun case MI_DISPLAY_FLIP_SKL_PLANE_2_B:
1325*4882a593Smuzhiyun info->pipe = PIPE_B;
1326*4882a593Smuzhiyun info->event = SPRITE_B_FLIP_DONE;
1327*4882a593Smuzhiyun info->plane = SPRITE_PLANE;
1328*4882a593Smuzhiyun break;
1329*4882a593Smuzhiyun case MI_DISPLAY_FLIP_SKL_PLANE_2_C:
1330*4882a593Smuzhiyun info->pipe = PIPE_C;
1331*4882a593Smuzhiyun info->event = SPRITE_C_FLIP_DONE;
1332*4882a593Smuzhiyun info->plane = SPRITE_PLANE;
1333*4882a593Smuzhiyun break;
1334*4882a593Smuzhiyun
1335*4882a593Smuzhiyun default:
1336*4882a593Smuzhiyun gvt_vgpu_err("unknown plane code %d\n", plane);
1337*4882a593Smuzhiyun return -EBADRQC;
1338*4882a593Smuzhiyun }
1339*4882a593Smuzhiyun
1340*4882a593Smuzhiyun info->stride_val = (dword1 & GENMASK(15, 6)) >> 6;
1341*4882a593Smuzhiyun info->tile_val = (dword1 & GENMASK(2, 0));
1342*4882a593Smuzhiyun info->surf_val = (dword2 & GENMASK(31, 12)) >> 12;
1343*4882a593Smuzhiyun info->async_flip = ((dword2 & GENMASK(1, 0)) == 0x1);
1344*4882a593Smuzhiyun
1345*4882a593Smuzhiyun info->ctrl_reg = DSPCNTR(info->pipe);
1346*4882a593Smuzhiyun info->stride_reg = DSPSTRIDE(info->pipe);
1347*4882a593Smuzhiyun info->surf_reg = DSPSURF(info->pipe);
1348*4882a593Smuzhiyun
1349*4882a593Smuzhiyun return 0;
1350*4882a593Smuzhiyun }
1351*4882a593Smuzhiyun
gen8_check_mi_display_flip(struct parser_exec_state * s,struct mi_display_flip_command_info * info)1352*4882a593Smuzhiyun static int gen8_check_mi_display_flip(struct parser_exec_state *s,
1353*4882a593Smuzhiyun struct mi_display_flip_command_info *info)
1354*4882a593Smuzhiyun {
1355*4882a593Smuzhiyun u32 stride, tile;
1356*4882a593Smuzhiyun
1357*4882a593Smuzhiyun if (!info->async_flip)
1358*4882a593Smuzhiyun return 0;
1359*4882a593Smuzhiyun
1360*4882a593Smuzhiyun if (INTEL_GEN(s->engine->i915) >= 9) {
1361*4882a593Smuzhiyun stride = vgpu_vreg_t(s->vgpu, info->stride_reg) & GENMASK(9, 0);
1362*4882a593Smuzhiyun tile = (vgpu_vreg_t(s->vgpu, info->ctrl_reg) &
1363*4882a593Smuzhiyun GENMASK(12, 10)) >> 10;
1364*4882a593Smuzhiyun } else {
1365*4882a593Smuzhiyun stride = (vgpu_vreg_t(s->vgpu, info->stride_reg) &
1366*4882a593Smuzhiyun GENMASK(15, 6)) >> 6;
1367*4882a593Smuzhiyun tile = (vgpu_vreg_t(s->vgpu, info->ctrl_reg) & (1 << 10)) >> 10;
1368*4882a593Smuzhiyun }
1369*4882a593Smuzhiyun
1370*4882a593Smuzhiyun if (stride != info->stride_val)
1371*4882a593Smuzhiyun gvt_dbg_cmd("cannot change stride during async flip\n");
1372*4882a593Smuzhiyun
1373*4882a593Smuzhiyun if (tile != info->tile_val)
1374*4882a593Smuzhiyun gvt_dbg_cmd("cannot change tile during async flip\n");
1375*4882a593Smuzhiyun
1376*4882a593Smuzhiyun return 0;
1377*4882a593Smuzhiyun }
1378*4882a593Smuzhiyun
gen8_update_plane_mmio_from_mi_display_flip(struct parser_exec_state * s,struct mi_display_flip_command_info * info)1379*4882a593Smuzhiyun static int gen8_update_plane_mmio_from_mi_display_flip(
1380*4882a593Smuzhiyun struct parser_exec_state *s,
1381*4882a593Smuzhiyun struct mi_display_flip_command_info *info)
1382*4882a593Smuzhiyun {
1383*4882a593Smuzhiyun struct drm_i915_private *dev_priv = s->engine->i915;
1384*4882a593Smuzhiyun struct intel_vgpu *vgpu = s->vgpu;
1385*4882a593Smuzhiyun
1386*4882a593Smuzhiyun set_mask_bits(&vgpu_vreg_t(vgpu, info->surf_reg), GENMASK(31, 12),
1387*4882a593Smuzhiyun info->surf_val << 12);
1388*4882a593Smuzhiyun if (INTEL_GEN(dev_priv) >= 9) {
1389*4882a593Smuzhiyun set_mask_bits(&vgpu_vreg_t(vgpu, info->stride_reg), GENMASK(9, 0),
1390*4882a593Smuzhiyun info->stride_val);
1391*4882a593Smuzhiyun set_mask_bits(&vgpu_vreg_t(vgpu, info->ctrl_reg), GENMASK(12, 10),
1392*4882a593Smuzhiyun info->tile_val << 10);
1393*4882a593Smuzhiyun } else {
1394*4882a593Smuzhiyun set_mask_bits(&vgpu_vreg_t(vgpu, info->stride_reg), GENMASK(15, 6),
1395*4882a593Smuzhiyun info->stride_val << 6);
1396*4882a593Smuzhiyun set_mask_bits(&vgpu_vreg_t(vgpu, info->ctrl_reg), GENMASK(10, 10),
1397*4882a593Smuzhiyun info->tile_val << 10);
1398*4882a593Smuzhiyun }
1399*4882a593Smuzhiyun
1400*4882a593Smuzhiyun if (info->plane == PLANE_PRIMARY)
1401*4882a593Smuzhiyun vgpu_vreg_t(vgpu, PIPE_FLIPCOUNT_G4X(info->pipe))++;
1402*4882a593Smuzhiyun
1403*4882a593Smuzhiyun if (info->async_flip)
1404*4882a593Smuzhiyun intel_vgpu_trigger_virtual_event(vgpu, info->event);
1405*4882a593Smuzhiyun else
1406*4882a593Smuzhiyun set_bit(info->event, vgpu->irq.flip_done_event[info->pipe]);
1407*4882a593Smuzhiyun
1408*4882a593Smuzhiyun return 0;
1409*4882a593Smuzhiyun }
1410*4882a593Smuzhiyun
decode_mi_display_flip(struct parser_exec_state * s,struct mi_display_flip_command_info * info)1411*4882a593Smuzhiyun static int decode_mi_display_flip(struct parser_exec_state *s,
1412*4882a593Smuzhiyun struct mi_display_flip_command_info *info)
1413*4882a593Smuzhiyun {
1414*4882a593Smuzhiyun if (IS_BROADWELL(s->engine->i915))
1415*4882a593Smuzhiyun return gen8_decode_mi_display_flip(s, info);
1416*4882a593Smuzhiyun if (INTEL_GEN(s->engine->i915) >= 9)
1417*4882a593Smuzhiyun return skl_decode_mi_display_flip(s, info);
1418*4882a593Smuzhiyun
1419*4882a593Smuzhiyun return -ENODEV;
1420*4882a593Smuzhiyun }
1421*4882a593Smuzhiyun
check_mi_display_flip(struct parser_exec_state * s,struct mi_display_flip_command_info * info)1422*4882a593Smuzhiyun static int check_mi_display_flip(struct parser_exec_state *s,
1423*4882a593Smuzhiyun struct mi_display_flip_command_info *info)
1424*4882a593Smuzhiyun {
1425*4882a593Smuzhiyun return gen8_check_mi_display_flip(s, info);
1426*4882a593Smuzhiyun }
1427*4882a593Smuzhiyun
update_plane_mmio_from_mi_display_flip(struct parser_exec_state * s,struct mi_display_flip_command_info * info)1428*4882a593Smuzhiyun static int update_plane_mmio_from_mi_display_flip(
1429*4882a593Smuzhiyun struct parser_exec_state *s,
1430*4882a593Smuzhiyun struct mi_display_flip_command_info *info)
1431*4882a593Smuzhiyun {
1432*4882a593Smuzhiyun return gen8_update_plane_mmio_from_mi_display_flip(s, info);
1433*4882a593Smuzhiyun }
1434*4882a593Smuzhiyun
cmd_handler_mi_display_flip(struct parser_exec_state * s)1435*4882a593Smuzhiyun static int cmd_handler_mi_display_flip(struct parser_exec_state *s)
1436*4882a593Smuzhiyun {
1437*4882a593Smuzhiyun struct mi_display_flip_command_info info;
1438*4882a593Smuzhiyun struct intel_vgpu *vgpu = s->vgpu;
1439*4882a593Smuzhiyun int ret;
1440*4882a593Smuzhiyun int i;
1441*4882a593Smuzhiyun int len = cmd_length(s);
1442*4882a593Smuzhiyun u32 valid_len = CMD_LEN(1);
1443*4882a593Smuzhiyun
1444*4882a593Smuzhiyun /* Flip Type == Stereo 3D Flip */
1445*4882a593Smuzhiyun if (DWORD_FIELD(2, 1, 0) == 2)
1446*4882a593Smuzhiyun valid_len++;
1447*4882a593Smuzhiyun ret = gvt_check_valid_cmd_length(cmd_length(s),
1448*4882a593Smuzhiyun valid_len);
1449*4882a593Smuzhiyun if (ret)
1450*4882a593Smuzhiyun return ret;
1451*4882a593Smuzhiyun
1452*4882a593Smuzhiyun ret = decode_mi_display_flip(s, &info);
1453*4882a593Smuzhiyun if (ret) {
1454*4882a593Smuzhiyun gvt_vgpu_err("fail to decode MI display flip command\n");
1455*4882a593Smuzhiyun return ret;
1456*4882a593Smuzhiyun }
1457*4882a593Smuzhiyun
1458*4882a593Smuzhiyun ret = check_mi_display_flip(s, &info);
1459*4882a593Smuzhiyun if (ret) {
1460*4882a593Smuzhiyun gvt_vgpu_err("invalid MI display flip command\n");
1461*4882a593Smuzhiyun return ret;
1462*4882a593Smuzhiyun }
1463*4882a593Smuzhiyun
1464*4882a593Smuzhiyun ret = update_plane_mmio_from_mi_display_flip(s, &info);
1465*4882a593Smuzhiyun if (ret) {
1466*4882a593Smuzhiyun gvt_vgpu_err("fail to update plane mmio\n");
1467*4882a593Smuzhiyun return ret;
1468*4882a593Smuzhiyun }
1469*4882a593Smuzhiyun
1470*4882a593Smuzhiyun for (i = 0; i < len; i++)
1471*4882a593Smuzhiyun patch_value(s, cmd_ptr(s, i), MI_NOOP);
1472*4882a593Smuzhiyun return 0;
1473*4882a593Smuzhiyun }
1474*4882a593Smuzhiyun
is_wait_for_flip_pending(u32 cmd)1475*4882a593Smuzhiyun static bool is_wait_for_flip_pending(u32 cmd)
1476*4882a593Smuzhiyun {
1477*4882a593Smuzhiyun return cmd & (MI_WAIT_FOR_PLANE_A_FLIP_PENDING |
1478*4882a593Smuzhiyun MI_WAIT_FOR_PLANE_B_FLIP_PENDING |
1479*4882a593Smuzhiyun MI_WAIT_FOR_PLANE_C_FLIP_PENDING |
1480*4882a593Smuzhiyun MI_WAIT_FOR_SPRITE_A_FLIP_PENDING |
1481*4882a593Smuzhiyun MI_WAIT_FOR_SPRITE_B_FLIP_PENDING |
1482*4882a593Smuzhiyun MI_WAIT_FOR_SPRITE_C_FLIP_PENDING);
1483*4882a593Smuzhiyun }
1484*4882a593Smuzhiyun
cmd_handler_mi_wait_for_event(struct parser_exec_state * s)1485*4882a593Smuzhiyun static int cmd_handler_mi_wait_for_event(struct parser_exec_state *s)
1486*4882a593Smuzhiyun {
1487*4882a593Smuzhiyun u32 cmd = cmd_val(s, 0);
1488*4882a593Smuzhiyun
1489*4882a593Smuzhiyun if (!is_wait_for_flip_pending(cmd))
1490*4882a593Smuzhiyun return 0;
1491*4882a593Smuzhiyun
1492*4882a593Smuzhiyun patch_value(s, cmd_ptr(s, 0), MI_NOOP);
1493*4882a593Smuzhiyun return 0;
1494*4882a593Smuzhiyun }
1495*4882a593Smuzhiyun
get_gma_bb_from_cmd(struct parser_exec_state * s,int index)1496*4882a593Smuzhiyun static unsigned long get_gma_bb_from_cmd(struct parser_exec_state *s, int index)
1497*4882a593Smuzhiyun {
1498*4882a593Smuzhiyun unsigned long addr;
1499*4882a593Smuzhiyun unsigned long gma_high, gma_low;
1500*4882a593Smuzhiyun struct intel_vgpu *vgpu = s->vgpu;
1501*4882a593Smuzhiyun int gmadr_bytes = vgpu->gvt->device_info.gmadr_bytes_in_cmd;
1502*4882a593Smuzhiyun
1503*4882a593Smuzhiyun if (WARN_ON(gmadr_bytes != 4 && gmadr_bytes != 8)) {
1504*4882a593Smuzhiyun gvt_vgpu_err("invalid gma bytes %d\n", gmadr_bytes);
1505*4882a593Smuzhiyun return INTEL_GVT_INVALID_ADDR;
1506*4882a593Smuzhiyun }
1507*4882a593Smuzhiyun
1508*4882a593Smuzhiyun gma_low = cmd_val(s, index) & BATCH_BUFFER_ADDR_MASK;
1509*4882a593Smuzhiyun if (gmadr_bytes == 4) {
1510*4882a593Smuzhiyun addr = gma_low;
1511*4882a593Smuzhiyun } else {
1512*4882a593Smuzhiyun gma_high = cmd_val(s, index + 1) & BATCH_BUFFER_ADDR_HIGH_MASK;
1513*4882a593Smuzhiyun addr = (((unsigned long)gma_high) << 32) | gma_low;
1514*4882a593Smuzhiyun }
1515*4882a593Smuzhiyun return addr;
1516*4882a593Smuzhiyun }
1517*4882a593Smuzhiyun
cmd_address_audit(struct parser_exec_state * s,unsigned long guest_gma,int op_size,bool index_mode)1518*4882a593Smuzhiyun static inline int cmd_address_audit(struct parser_exec_state *s,
1519*4882a593Smuzhiyun unsigned long guest_gma, int op_size, bool index_mode)
1520*4882a593Smuzhiyun {
1521*4882a593Smuzhiyun struct intel_vgpu *vgpu = s->vgpu;
1522*4882a593Smuzhiyun u32 max_surface_size = vgpu->gvt->device_info.max_surface_size;
1523*4882a593Smuzhiyun int i;
1524*4882a593Smuzhiyun int ret;
1525*4882a593Smuzhiyun
1526*4882a593Smuzhiyun if (op_size > max_surface_size) {
1527*4882a593Smuzhiyun gvt_vgpu_err("command address audit fail name %s\n",
1528*4882a593Smuzhiyun s->info->name);
1529*4882a593Smuzhiyun return -EFAULT;
1530*4882a593Smuzhiyun }
1531*4882a593Smuzhiyun
1532*4882a593Smuzhiyun if (index_mode) {
1533*4882a593Smuzhiyun if (guest_gma >= I915_GTT_PAGE_SIZE) {
1534*4882a593Smuzhiyun ret = -EFAULT;
1535*4882a593Smuzhiyun goto err;
1536*4882a593Smuzhiyun }
1537*4882a593Smuzhiyun } else if (!intel_gvt_ggtt_validate_range(vgpu, guest_gma, op_size)) {
1538*4882a593Smuzhiyun ret = -EFAULT;
1539*4882a593Smuzhiyun goto err;
1540*4882a593Smuzhiyun }
1541*4882a593Smuzhiyun
1542*4882a593Smuzhiyun return 0;
1543*4882a593Smuzhiyun
1544*4882a593Smuzhiyun err:
1545*4882a593Smuzhiyun gvt_vgpu_err("cmd_parser: Malicious %s detected, addr=0x%lx, len=%d!\n",
1546*4882a593Smuzhiyun s->info->name, guest_gma, op_size);
1547*4882a593Smuzhiyun
1548*4882a593Smuzhiyun pr_err("cmd dump: ");
1549*4882a593Smuzhiyun for (i = 0; i < cmd_length(s); i++) {
1550*4882a593Smuzhiyun if (!(i % 4))
1551*4882a593Smuzhiyun pr_err("\n%08x ", cmd_val(s, i));
1552*4882a593Smuzhiyun else
1553*4882a593Smuzhiyun pr_err("%08x ", cmd_val(s, i));
1554*4882a593Smuzhiyun }
1555*4882a593Smuzhiyun pr_err("\nvgpu%d: aperture 0x%llx - 0x%llx, hidden 0x%llx - 0x%llx\n",
1556*4882a593Smuzhiyun vgpu->id,
1557*4882a593Smuzhiyun vgpu_aperture_gmadr_base(vgpu),
1558*4882a593Smuzhiyun vgpu_aperture_gmadr_end(vgpu),
1559*4882a593Smuzhiyun vgpu_hidden_gmadr_base(vgpu),
1560*4882a593Smuzhiyun vgpu_hidden_gmadr_end(vgpu));
1561*4882a593Smuzhiyun return ret;
1562*4882a593Smuzhiyun }
1563*4882a593Smuzhiyun
cmd_handler_mi_store_data_imm(struct parser_exec_state * s)1564*4882a593Smuzhiyun static int cmd_handler_mi_store_data_imm(struct parser_exec_state *s)
1565*4882a593Smuzhiyun {
1566*4882a593Smuzhiyun int gmadr_bytes = s->vgpu->gvt->device_info.gmadr_bytes_in_cmd;
1567*4882a593Smuzhiyun int op_size = (cmd_length(s) - 3) * sizeof(u32);
1568*4882a593Smuzhiyun int core_id = (cmd_val(s, 2) & (1 << 0)) ? 1 : 0;
1569*4882a593Smuzhiyun unsigned long gma, gma_low, gma_high;
1570*4882a593Smuzhiyun u32 valid_len = CMD_LEN(2);
1571*4882a593Smuzhiyun int ret = 0;
1572*4882a593Smuzhiyun
1573*4882a593Smuzhiyun /* check ppggt */
1574*4882a593Smuzhiyun if (!(cmd_val(s, 0) & (1 << 22)))
1575*4882a593Smuzhiyun return 0;
1576*4882a593Smuzhiyun
1577*4882a593Smuzhiyun /* check if QWORD */
1578*4882a593Smuzhiyun if (DWORD_FIELD(0, 21, 21))
1579*4882a593Smuzhiyun valid_len++;
1580*4882a593Smuzhiyun ret = gvt_check_valid_cmd_length(cmd_length(s),
1581*4882a593Smuzhiyun valid_len);
1582*4882a593Smuzhiyun if (ret)
1583*4882a593Smuzhiyun return ret;
1584*4882a593Smuzhiyun
1585*4882a593Smuzhiyun gma = cmd_val(s, 2) & GENMASK(31, 2);
1586*4882a593Smuzhiyun
1587*4882a593Smuzhiyun if (gmadr_bytes == 8) {
1588*4882a593Smuzhiyun gma_low = cmd_val(s, 1) & GENMASK(31, 2);
1589*4882a593Smuzhiyun gma_high = cmd_val(s, 2) & GENMASK(15, 0);
1590*4882a593Smuzhiyun gma = (gma_high << 32) | gma_low;
1591*4882a593Smuzhiyun core_id = (cmd_val(s, 1) & (1 << 0)) ? 1 : 0;
1592*4882a593Smuzhiyun }
1593*4882a593Smuzhiyun ret = cmd_address_audit(s, gma + op_size * core_id, op_size, false);
1594*4882a593Smuzhiyun return ret;
1595*4882a593Smuzhiyun }
1596*4882a593Smuzhiyun
unexpected_cmd(struct parser_exec_state * s)1597*4882a593Smuzhiyun static inline int unexpected_cmd(struct parser_exec_state *s)
1598*4882a593Smuzhiyun {
1599*4882a593Smuzhiyun struct intel_vgpu *vgpu = s->vgpu;
1600*4882a593Smuzhiyun
1601*4882a593Smuzhiyun gvt_vgpu_err("Unexpected %s in command buffer!\n", s->info->name);
1602*4882a593Smuzhiyun
1603*4882a593Smuzhiyun return -EBADRQC;
1604*4882a593Smuzhiyun }
1605*4882a593Smuzhiyun
cmd_handler_mi_semaphore_wait(struct parser_exec_state * s)1606*4882a593Smuzhiyun static int cmd_handler_mi_semaphore_wait(struct parser_exec_state *s)
1607*4882a593Smuzhiyun {
1608*4882a593Smuzhiyun return unexpected_cmd(s);
1609*4882a593Smuzhiyun }
1610*4882a593Smuzhiyun
cmd_handler_mi_report_perf_count(struct parser_exec_state * s)1611*4882a593Smuzhiyun static int cmd_handler_mi_report_perf_count(struct parser_exec_state *s)
1612*4882a593Smuzhiyun {
1613*4882a593Smuzhiyun return unexpected_cmd(s);
1614*4882a593Smuzhiyun }
1615*4882a593Smuzhiyun
cmd_handler_mi_op_2e(struct parser_exec_state * s)1616*4882a593Smuzhiyun static int cmd_handler_mi_op_2e(struct parser_exec_state *s)
1617*4882a593Smuzhiyun {
1618*4882a593Smuzhiyun return unexpected_cmd(s);
1619*4882a593Smuzhiyun }
1620*4882a593Smuzhiyun
cmd_handler_mi_op_2f(struct parser_exec_state * s)1621*4882a593Smuzhiyun static int cmd_handler_mi_op_2f(struct parser_exec_state *s)
1622*4882a593Smuzhiyun {
1623*4882a593Smuzhiyun int gmadr_bytes = s->vgpu->gvt->device_info.gmadr_bytes_in_cmd;
1624*4882a593Smuzhiyun int op_size = (1 << ((cmd_val(s, 0) & GENMASK(20, 19)) >> 19)) *
1625*4882a593Smuzhiyun sizeof(u32);
1626*4882a593Smuzhiyun unsigned long gma, gma_high;
1627*4882a593Smuzhiyun u32 valid_len = CMD_LEN(1);
1628*4882a593Smuzhiyun int ret = 0;
1629*4882a593Smuzhiyun
1630*4882a593Smuzhiyun if (!(cmd_val(s, 0) & (1 << 22)))
1631*4882a593Smuzhiyun return ret;
1632*4882a593Smuzhiyun
1633*4882a593Smuzhiyun /* check inline data */
1634*4882a593Smuzhiyun if (cmd_val(s, 0) & BIT(18))
1635*4882a593Smuzhiyun valid_len = CMD_LEN(9);
1636*4882a593Smuzhiyun ret = gvt_check_valid_cmd_length(cmd_length(s),
1637*4882a593Smuzhiyun valid_len);
1638*4882a593Smuzhiyun if (ret)
1639*4882a593Smuzhiyun return ret;
1640*4882a593Smuzhiyun
1641*4882a593Smuzhiyun gma = cmd_val(s, 1) & GENMASK(31, 2);
1642*4882a593Smuzhiyun if (gmadr_bytes == 8) {
1643*4882a593Smuzhiyun gma_high = cmd_val(s, 2) & GENMASK(15, 0);
1644*4882a593Smuzhiyun gma = (gma_high << 32) | gma;
1645*4882a593Smuzhiyun }
1646*4882a593Smuzhiyun ret = cmd_address_audit(s, gma, op_size, false);
1647*4882a593Smuzhiyun return ret;
1648*4882a593Smuzhiyun }
1649*4882a593Smuzhiyun
cmd_handler_mi_store_data_index(struct parser_exec_state * s)1650*4882a593Smuzhiyun static int cmd_handler_mi_store_data_index(struct parser_exec_state *s)
1651*4882a593Smuzhiyun {
1652*4882a593Smuzhiyun return unexpected_cmd(s);
1653*4882a593Smuzhiyun }
1654*4882a593Smuzhiyun
cmd_handler_mi_clflush(struct parser_exec_state * s)1655*4882a593Smuzhiyun static int cmd_handler_mi_clflush(struct parser_exec_state *s)
1656*4882a593Smuzhiyun {
1657*4882a593Smuzhiyun return unexpected_cmd(s);
1658*4882a593Smuzhiyun }
1659*4882a593Smuzhiyun
cmd_handler_mi_conditional_batch_buffer_end(struct parser_exec_state * s)1660*4882a593Smuzhiyun static int cmd_handler_mi_conditional_batch_buffer_end(
1661*4882a593Smuzhiyun struct parser_exec_state *s)
1662*4882a593Smuzhiyun {
1663*4882a593Smuzhiyun return unexpected_cmd(s);
1664*4882a593Smuzhiyun }
1665*4882a593Smuzhiyun
cmd_handler_mi_update_gtt(struct parser_exec_state * s)1666*4882a593Smuzhiyun static int cmd_handler_mi_update_gtt(struct parser_exec_state *s)
1667*4882a593Smuzhiyun {
1668*4882a593Smuzhiyun return unexpected_cmd(s);
1669*4882a593Smuzhiyun }
1670*4882a593Smuzhiyun
cmd_handler_mi_flush_dw(struct parser_exec_state * s)1671*4882a593Smuzhiyun static int cmd_handler_mi_flush_dw(struct parser_exec_state *s)
1672*4882a593Smuzhiyun {
1673*4882a593Smuzhiyun int gmadr_bytes = s->vgpu->gvt->device_info.gmadr_bytes_in_cmd;
1674*4882a593Smuzhiyun unsigned long gma;
1675*4882a593Smuzhiyun bool index_mode = false;
1676*4882a593Smuzhiyun int ret = 0;
1677*4882a593Smuzhiyun u32 hws_pga, val;
1678*4882a593Smuzhiyun u32 valid_len = CMD_LEN(2);
1679*4882a593Smuzhiyun
1680*4882a593Smuzhiyun ret = gvt_check_valid_cmd_length(cmd_length(s),
1681*4882a593Smuzhiyun valid_len);
1682*4882a593Smuzhiyun if (ret) {
1683*4882a593Smuzhiyun /* Check again for Qword */
1684*4882a593Smuzhiyun ret = gvt_check_valid_cmd_length(cmd_length(s),
1685*4882a593Smuzhiyun ++valid_len);
1686*4882a593Smuzhiyun return ret;
1687*4882a593Smuzhiyun }
1688*4882a593Smuzhiyun
1689*4882a593Smuzhiyun /* Check post-sync and ppgtt bit */
1690*4882a593Smuzhiyun if (((cmd_val(s, 0) >> 14) & 0x3) && (cmd_val(s, 1) & (1 << 2))) {
1691*4882a593Smuzhiyun gma = cmd_val(s, 1) & GENMASK(31, 3);
1692*4882a593Smuzhiyun if (gmadr_bytes == 8)
1693*4882a593Smuzhiyun gma |= (cmd_val(s, 2) & GENMASK(15, 0)) << 32;
1694*4882a593Smuzhiyun /* Store Data Index */
1695*4882a593Smuzhiyun if (cmd_val(s, 0) & (1 << 21))
1696*4882a593Smuzhiyun index_mode = true;
1697*4882a593Smuzhiyun ret = cmd_address_audit(s, gma, sizeof(u64), index_mode);
1698*4882a593Smuzhiyun if (ret)
1699*4882a593Smuzhiyun return ret;
1700*4882a593Smuzhiyun if (index_mode) {
1701*4882a593Smuzhiyun hws_pga = s->vgpu->hws_pga[s->engine->id];
1702*4882a593Smuzhiyun gma = hws_pga + gma;
1703*4882a593Smuzhiyun patch_value(s, cmd_ptr(s, 1), gma);
1704*4882a593Smuzhiyun val = cmd_val(s, 0) & (~(1 << 21));
1705*4882a593Smuzhiyun patch_value(s, cmd_ptr(s, 0), val);
1706*4882a593Smuzhiyun }
1707*4882a593Smuzhiyun }
1708*4882a593Smuzhiyun /* Check notify bit */
1709*4882a593Smuzhiyun if ((cmd_val(s, 0) & (1 << 8)))
1710*4882a593Smuzhiyun set_bit(cmd_interrupt_events[s->engine->id].mi_flush_dw,
1711*4882a593Smuzhiyun s->workload->pending_events);
1712*4882a593Smuzhiyun return ret;
1713*4882a593Smuzhiyun }
1714*4882a593Smuzhiyun
addr_type_update_snb(struct parser_exec_state * s)1715*4882a593Smuzhiyun static void addr_type_update_snb(struct parser_exec_state *s)
1716*4882a593Smuzhiyun {
1717*4882a593Smuzhiyun if ((s->buf_type == RING_BUFFER_INSTRUCTION) &&
1718*4882a593Smuzhiyun (BATCH_BUFFER_ADR_SPACE_BIT(cmd_val(s, 0)) == 1)) {
1719*4882a593Smuzhiyun s->buf_addr_type = PPGTT_BUFFER;
1720*4882a593Smuzhiyun }
1721*4882a593Smuzhiyun }
1722*4882a593Smuzhiyun
1723*4882a593Smuzhiyun
copy_gma_to_hva(struct intel_vgpu * vgpu,struct intel_vgpu_mm * mm,unsigned long gma,unsigned long end_gma,void * va)1724*4882a593Smuzhiyun static int copy_gma_to_hva(struct intel_vgpu *vgpu, struct intel_vgpu_mm *mm,
1725*4882a593Smuzhiyun unsigned long gma, unsigned long end_gma, void *va)
1726*4882a593Smuzhiyun {
1727*4882a593Smuzhiyun unsigned long copy_len, offset;
1728*4882a593Smuzhiyun unsigned long len = 0;
1729*4882a593Smuzhiyun unsigned long gpa;
1730*4882a593Smuzhiyun
1731*4882a593Smuzhiyun while (gma != end_gma) {
1732*4882a593Smuzhiyun gpa = intel_vgpu_gma_to_gpa(mm, gma);
1733*4882a593Smuzhiyun if (gpa == INTEL_GVT_INVALID_ADDR) {
1734*4882a593Smuzhiyun gvt_vgpu_err("invalid gma address: %lx\n", gma);
1735*4882a593Smuzhiyun return -EFAULT;
1736*4882a593Smuzhiyun }
1737*4882a593Smuzhiyun
1738*4882a593Smuzhiyun offset = gma & (I915_GTT_PAGE_SIZE - 1);
1739*4882a593Smuzhiyun
1740*4882a593Smuzhiyun copy_len = (end_gma - gma) >= (I915_GTT_PAGE_SIZE - offset) ?
1741*4882a593Smuzhiyun I915_GTT_PAGE_SIZE - offset : end_gma - gma;
1742*4882a593Smuzhiyun
1743*4882a593Smuzhiyun intel_gvt_hypervisor_read_gpa(vgpu, gpa, va + len, copy_len);
1744*4882a593Smuzhiyun
1745*4882a593Smuzhiyun len += copy_len;
1746*4882a593Smuzhiyun gma += copy_len;
1747*4882a593Smuzhiyun }
1748*4882a593Smuzhiyun return len;
1749*4882a593Smuzhiyun }
1750*4882a593Smuzhiyun
1751*4882a593Smuzhiyun
1752*4882a593Smuzhiyun /*
1753*4882a593Smuzhiyun * Check whether a batch buffer needs to be scanned. Currently
1754*4882a593Smuzhiyun * the only criteria is based on privilege.
1755*4882a593Smuzhiyun */
batch_buffer_needs_scan(struct parser_exec_state * s)1756*4882a593Smuzhiyun static int batch_buffer_needs_scan(struct parser_exec_state *s)
1757*4882a593Smuzhiyun {
1758*4882a593Smuzhiyun /* Decide privilege based on address space */
1759*4882a593Smuzhiyun if (cmd_val(s, 0) & BIT(8) &&
1760*4882a593Smuzhiyun !(s->vgpu->scan_nonprivbb & s->engine->mask))
1761*4882a593Smuzhiyun return 0;
1762*4882a593Smuzhiyun
1763*4882a593Smuzhiyun return 1;
1764*4882a593Smuzhiyun }
1765*4882a593Smuzhiyun
repr_addr_type(unsigned int type)1766*4882a593Smuzhiyun static const char *repr_addr_type(unsigned int type)
1767*4882a593Smuzhiyun {
1768*4882a593Smuzhiyun return type == PPGTT_BUFFER ? "ppgtt" : "ggtt";
1769*4882a593Smuzhiyun }
1770*4882a593Smuzhiyun
find_bb_size(struct parser_exec_state * s,unsigned long * bb_size,unsigned long * bb_end_cmd_offset)1771*4882a593Smuzhiyun static int find_bb_size(struct parser_exec_state *s,
1772*4882a593Smuzhiyun unsigned long *bb_size,
1773*4882a593Smuzhiyun unsigned long *bb_end_cmd_offset)
1774*4882a593Smuzhiyun {
1775*4882a593Smuzhiyun unsigned long gma = 0;
1776*4882a593Smuzhiyun const struct cmd_info *info;
1777*4882a593Smuzhiyun u32 cmd_len = 0;
1778*4882a593Smuzhiyun bool bb_end = false;
1779*4882a593Smuzhiyun struct intel_vgpu *vgpu = s->vgpu;
1780*4882a593Smuzhiyun u32 cmd;
1781*4882a593Smuzhiyun struct intel_vgpu_mm *mm = (s->buf_addr_type == GTT_BUFFER) ?
1782*4882a593Smuzhiyun s->vgpu->gtt.ggtt_mm : s->workload->shadow_mm;
1783*4882a593Smuzhiyun
1784*4882a593Smuzhiyun *bb_size = 0;
1785*4882a593Smuzhiyun *bb_end_cmd_offset = 0;
1786*4882a593Smuzhiyun
1787*4882a593Smuzhiyun /* get the start gm address of the batch buffer */
1788*4882a593Smuzhiyun gma = get_gma_bb_from_cmd(s, 1);
1789*4882a593Smuzhiyun if (gma == INTEL_GVT_INVALID_ADDR)
1790*4882a593Smuzhiyun return -EFAULT;
1791*4882a593Smuzhiyun
1792*4882a593Smuzhiyun cmd = cmd_val(s, 0);
1793*4882a593Smuzhiyun info = get_cmd_info(s->vgpu->gvt, cmd, s->engine);
1794*4882a593Smuzhiyun if (info == NULL) {
1795*4882a593Smuzhiyun gvt_vgpu_err("unknown cmd 0x%x, opcode=0x%x, addr_type=%s, ring %s, workload=%p\n",
1796*4882a593Smuzhiyun cmd, get_opcode(cmd, s->engine),
1797*4882a593Smuzhiyun repr_addr_type(s->buf_addr_type),
1798*4882a593Smuzhiyun s->engine->name, s->workload);
1799*4882a593Smuzhiyun return -EBADRQC;
1800*4882a593Smuzhiyun }
1801*4882a593Smuzhiyun do {
1802*4882a593Smuzhiyun if (copy_gma_to_hva(s->vgpu, mm,
1803*4882a593Smuzhiyun gma, gma + 4, &cmd) < 0)
1804*4882a593Smuzhiyun return -EFAULT;
1805*4882a593Smuzhiyun info = get_cmd_info(s->vgpu->gvt, cmd, s->engine);
1806*4882a593Smuzhiyun if (info == NULL) {
1807*4882a593Smuzhiyun gvt_vgpu_err("unknown cmd 0x%x, opcode=0x%x, addr_type=%s, ring %s, workload=%p\n",
1808*4882a593Smuzhiyun cmd, get_opcode(cmd, s->engine),
1809*4882a593Smuzhiyun repr_addr_type(s->buf_addr_type),
1810*4882a593Smuzhiyun s->engine->name, s->workload);
1811*4882a593Smuzhiyun return -EBADRQC;
1812*4882a593Smuzhiyun }
1813*4882a593Smuzhiyun
1814*4882a593Smuzhiyun if (info->opcode == OP_MI_BATCH_BUFFER_END) {
1815*4882a593Smuzhiyun bb_end = true;
1816*4882a593Smuzhiyun } else if (info->opcode == OP_MI_BATCH_BUFFER_START) {
1817*4882a593Smuzhiyun if (BATCH_BUFFER_2ND_LEVEL_BIT(cmd) == 0)
1818*4882a593Smuzhiyun /* chained batch buffer */
1819*4882a593Smuzhiyun bb_end = true;
1820*4882a593Smuzhiyun }
1821*4882a593Smuzhiyun
1822*4882a593Smuzhiyun if (bb_end)
1823*4882a593Smuzhiyun *bb_end_cmd_offset = *bb_size;
1824*4882a593Smuzhiyun
1825*4882a593Smuzhiyun cmd_len = get_cmd_length(info, cmd) << 2;
1826*4882a593Smuzhiyun *bb_size += cmd_len;
1827*4882a593Smuzhiyun gma += cmd_len;
1828*4882a593Smuzhiyun } while (!bb_end);
1829*4882a593Smuzhiyun
1830*4882a593Smuzhiyun return 0;
1831*4882a593Smuzhiyun }
1832*4882a593Smuzhiyun
audit_bb_end(struct parser_exec_state * s,void * va)1833*4882a593Smuzhiyun static int audit_bb_end(struct parser_exec_state *s, void *va)
1834*4882a593Smuzhiyun {
1835*4882a593Smuzhiyun struct intel_vgpu *vgpu = s->vgpu;
1836*4882a593Smuzhiyun u32 cmd = *(u32 *)va;
1837*4882a593Smuzhiyun const struct cmd_info *info;
1838*4882a593Smuzhiyun
1839*4882a593Smuzhiyun info = get_cmd_info(s->vgpu->gvt, cmd, s->engine);
1840*4882a593Smuzhiyun if (info == NULL) {
1841*4882a593Smuzhiyun gvt_vgpu_err("unknown cmd 0x%x, opcode=0x%x, addr_type=%s, ring %s, workload=%p\n",
1842*4882a593Smuzhiyun cmd, get_opcode(cmd, s->engine),
1843*4882a593Smuzhiyun repr_addr_type(s->buf_addr_type),
1844*4882a593Smuzhiyun s->engine->name, s->workload);
1845*4882a593Smuzhiyun return -EBADRQC;
1846*4882a593Smuzhiyun }
1847*4882a593Smuzhiyun
1848*4882a593Smuzhiyun if ((info->opcode == OP_MI_BATCH_BUFFER_END) ||
1849*4882a593Smuzhiyun ((info->opcode == OP_MI_BATCH_BUFFER_START) &&
1850*4882a593Smuzhiyun (BATCH_BUFFER_2ND_LEVEL_BIT(cmd) == 0)))
1851*4882a593Smuzhiyun return 0;
1852*4882a593Smuzhiyun
1853*4882a593Smuzhiyun return -EBADRQC;
1854*4882a593Smuzhiyun }
1855*4882a593Smuzhiyun
perform_bb_shadow(struct parser_exec_state * s)1856*4882a593Smuzhiyun static int perform_bb_shadow(struct parser_exec_state *s)
1857*4882a593Smuzhiyun {
1858*4882a593Smuzhiyun struct intel_vgpu *vgpu = s->vgpu;
1859*4882a593Smuzhiyun struct intel_vgpu_shadow_bb *bb;
1860*4882a593Smuzhiyun unsigned long gma = 0;
1861*4882a593Smuzhiyun unsigned long bb_size;
1862*4882a593Smuzhiyun unsigned long bb_end_cmd_offset;
1863*4882a593Smuzhiyun int ret = 0;
1864*4882a593Smuzhiyun struct intel_vgpu_mm *mm = (s->buf_addr_type == GTT_BUFFER) ?
1865*4882a593Smuzhiyun s->vgpu->gtt.ggtt_mm : s->workload->shadow_mm;
1866*4882a593Smuzhiyun unsigned long start_offset = 0;
1867*4882a593Smuzhiyun
1868*4882a593Smuzhiyun /* get the start gm address of the batch buffer */
1869*4882a593Smuzhiyun gma = get_gma_bb_from_cmd(s, 1);
1870*4882a593Smuzhiyun if (gma == INTEL_GVT_INVALID_ADDR)
1871*4882a593Smuzhiyun return -EFAULT;
1872*4882a593Smuzhiyun
1873*4882a593Smuzhiyun ret = find_bb_size(s, &bb_size, &bb_end_cmd_offset);
1874*4882a593Smuzhiyun if (ret)
1875*4882a593Smuzhiyun return ret;
1876*4882a593Smuzhiyun
1877*4882a593Smuzhiyun bb = kzalloc(sizeof(*bb), GFP_KERNEL);
1878*4882a593Smuzhiyun if (!bb)
1879*4882a593Smuzhiyun return -ENOMEM;
1880*4882a593Smuzhiyun
1881*4882a593Smuzhiyun bb->ppgtt = (s->buf_addr_type == GTT_BUFFER) ? false : true;
1882*4882a593Smuzhiyun
1883*4882a593Smuzhiyun /* the start_offset stores the batch buffer's start gma's
1884*4882a593Smuzhiyun * offset relative to page boundary. so for non-privileged batch
1885*4882a593Smuzhiyun * buffer, the shadowed gem object holds exactly the same page
1886*4882a593Smuzhiyun * layout as original gem object. This is for the convience of
1887*4882a593Smuzhiyun * replacing the whole non-privilged batch buffer page to this
1888*4882a593Smuzhiyun * shadowed one in PPGTT at the same gma address. (this replacing
1889*4882a593Smuzhiyun * action is not implemented yet now, but may be necessary in
1890*4882a593Smuzhiyun * future).
1891*4882a593Smuzhiyun * for prileged batch buffer, we just change start gma address to
1892*4882a593Smuzhiyun * that of shadowed page.
1893*4882a593Smuzhiyun */
1894*4882a593Smuzhiyun if (bb->ppgtt)
1895*4882a593Smuzhiyun start_offset = gma & ~I915_GTT_PAGE_MASK;
1896*4882a593Smuzhiyun
1897*4882a593Smuzhiyun bb->obj = i915_gem_object_create_shmem(s->engine->i915,
1898*4882a593Smuzhiyun round_up(bb_size + start_offset,
1899*4882a593Smuzhiyun PAGE_SIZE));
1900*4882a593Smuzhiyun if (IS_ERR(bb->obj)) {
1901*4882a593Smuzhiyun ret = PTR_ERR(bb->obj);
1902*4882a593Smuzhiyun goto err_free_bb;
1903*4882a593Smuzhiyun }
1904*4882a593Smuzhiyun
1905*4882a593Smuzhiyun bb->va = i915_gem_object_pin_map(bb->obj, I915_MAP_WB);
1906*4882a593Smuzhiyun if (IS_ERR(bb->va)) {
1907*4882a593Smuzhiyun ret = PTR_ERR(bb->va);
1908*4882a593Smuzhiyun goto err_free_obj;
1909*4882a593Smuzhiyun }
1910*4882a593Smuzhiyun
1911*4882a593Smuzhiyun ret = copy_gma_to_hva(s->vgpu, mm,
1912*4882a593Smuzhiyun gma, gma + bb_size,
1913*4882a593Smuzhiyun bb->va + start_offset);
1914*4882a593Smuzhiyun if (ret < 0) {
1915*4882a593Smuzhiyun gvt_vgpu_err("fail to copy guest ring buffer\n");
1916*4882a593Smuzhiyun ret = -EFAULT;
1917*4882a593Smuzhiyun goto err_unmap;
1918*4882a593Smuzhiyun }
1919*4882a593Smuzhiyun
1920*4882a593Smuzhiyun ret = audit_bb_end(s, bb->va + start_offset + bb_end_cmd_offset);
1921*4882a593Smuzhiyun if (ret)
1922*4882a593Smuzhiyun goto err_unmap;
1923*4882a593Smuzhiyun
1924*4882a593Smuzhiyun i915_gem_object_unlock(bb->obj);
1925*4882a593Smuzhiyun INIT_LIST_HEAD(&bb->list);
1926*4882a593Smuzhiyun list_add(&bb->list, &s->workload->shadow_bb);
1927*4882a593Smuzhiyun
1928*4882a593Smuzhiyun bb->bb_start_cmd_va = s->ip_va;
1929*4882a593Smuzhiyun
1930*4882a593Smuzhiyun if ((s->buf_type == BATCH_BUFFER_INSTRUCTION) && (!s->is_ctx_wa))
1931*4882a593Smuzhiyun bb->bb_offset = s->ip_va - s->rb_va;
1932*4882a593Smuzhiyun else
1933*4882a593Smuzhiyun bb->bb_offset = 0;
1934*4882a593Smuzhiyun
1935*4882a593Smuzhiyun /*
1936*4882a593Smuzhiyun * ip_va saves the virtual address of the shadow batch buffer, while
1937*4882a593Smuzhiyun * ip_gma saves the graphics address of the original batch buffer.
1938*4882a593Smuzhiyun * As the shadow batch buffer is just a copy from the originial one,
1939*4882a593Smuzhiyun * it should be right to use shadow batch buffer'va and original batch
1940*4882a593Smuzhiyun * buffer's gma in pair. After all, we don't want to pin the shadow
1941*4882a593Smuzhiyun * buffer here (too early).
1942*4882a593Smuzhiyun */
1943*4882a593Smuzhiyun s->ip_va = bb->va + start_offset;
1944*4882a593Smuzhiyun s->ip_gma = gma;
1945*4882a593Smuzhiyun return 0;
1946*4882a593Smuzhiyun err_unmap:
1947*4882a593Smuzhiyun i915_gem_object_unpin_map(bb->obj);
1948*4882a593Smuzhiyun err_free_obj:
1949*4882a593Smuzhiyun i915_gem_object_put(bb->obj);
1950*4882a593Smuzhiyun err_free_bb:
1951*4882a593Smuzhiyun kfree(bb);
1952*4882a593Smuzhiyun return ret;
1953*4882a593Smuzhiyun }
1954*4882a593Smuzhiyun
cmd_handler_mi_batch_buffer_start(struct parser_exec_state * s)1955*4882a593Smuzhiyun static int cmd_handler_mi_batch_buffer_start(struct parser_exec_state *s)
1956*4882a593Smuzhiyun {
1957*4882a593Smuzhiyun bool second_level;
1958*4882a593Smuzhiyun int ret = 0;
1959*4882a593Smuzhiyun struct intel_vgpu *vgpu = s->vgpu;
1960*4882a593Smuzhiyun
1961*4882a593Smuzhiyun if (s->buf_type == BATCH_BUFFER_2ND_LEVEL) {
1962*4882a593Smuzhiyun gvt_vgpu_err("Found MI_BATCH_BUFFER_START in 2nd level BB\n");
1963*4882a593Smuzhiyun return -EFAULT;
1964*4882a593Smuzhiyun }
1965*4882a593Smuzhiyun
1966*4882a593Smuzhiyun second_level = BATCH_BUFFER_2ND_LEVEL_BIT(cmd_val(s, 0)) == 1;
1967*4882a593Smuzhiyun if (second_level && (s->buf_type != BATCH_BUFFER_INSTRUCTION)) {
1968*4882a593Smuzhiyun gvt_vgpu_err("Jumping to 2nd level BB from RB is not allowed\n");
1969*4882a593Smuzhiyun return -EFAULT;
1970*4882a593Smuzhiyun }
1971*4882a593Smuzhiyun
1972*4882a593Smuzhiyun s->saved_buf_addr_type = s->buf_addr_type;
1973*4882a593Smuzhiyun addr_type_update_snb(s);
1974*4882a593Smuzhiyun if (s->buf_type == RING_BUFFER_INSTRUCTION) {
1975*4882a593Smuzhiyun s->ret_ip_gma_ring = s->ip_gma + cmd_length(s) * sizeof(u32);
1976*4882a593Smuzhiyun s->buf_type = BATCH_BUFFER_INSTRUCTION;
1977*4882a593Smuzhiyun } else if (second_level) {
1978*4882a593Smuzhiyun s->buf_type = BATCH_BUFFER_2ND_LEVEL;
1979*4882a593Smuzhiyun s->ret_ip_gma_bb = s->ip_gma + cmd_length(s) * sizeof(u32);
1980*4882a593Smuzhiyun s->ret_bb_va = s->ip_va + cmd_length(s) * sizeof(u32);
1981*4882a593Smuzhiyun }
1982*4882a593Smuzhiyun
1983*4882a593Smuzhiyun if (batch_buffer_needs_scan(s)) {
1984*4882a593Smuzhiyun ret = perform_bb_shadow(s);
1985*4882a593Smuzhiyun if (ret < 0)
1986*4882a593Smuzhiyun gvt_vgpu_err("invalid shadow batch buffer\n");
1987*4882a593Smuzhiyun } else {
1988*4882a593Smuzhiyun /* emulate a batch buffer end to do return right */
1989*4882a593Smuzhiyun ret = cmd_handler_mi_batch_buffer_end(s);
1990*4882a593Smuzhiyun if (ret < 0)
1991*4882a593Smuzhiyun return ret;
1992*4882a593Smuzhiyun }
1993*4882a593Smuzhiyun return ret;
1994*4882a593Smuzhiyun }
1995*4882a593Smuzhiyun
1996*4882a593Smuzhiyun static int mi_noop_index;
1997*4882a593Smuzhiyun
1998*4882a593Smuzhiyun static const struct cmd_info cmd_info[] = {
1999*4882a593Smuzhiyun {"MI_NOOP", OP_MI_NOOP, F_LEN_CONST, R_ALL, D_ALL, 0, 1, NULL},
2000*4882a593Smuzhiyun
2001*4882a593Smuzhiyun {"MI_SET_PREDICATE", OP_MI_SET_PREDICATE, F_LEN_CONST, R_ALL, D_ALL,
2002*4882a593Smuzhiyun 0, 1, NULL},
2003*4882a593Smuzhiyun
2004*4882a593Smuzhiyun {"MI_USER_INTERRUPT", OP_MI_USER_INTERRUPT, F_LEN_CONST, R_ALL, D_ALL,
2005*4882a593Smuzhiyun 0, 1, cmd_handler_mi_user_interrupt},
2006*4882a593Smuzhiyun
2007*4882a593Smuzhiyun {"MI_WAIT_FOR_EVENT", OP_MI_WAIT_FOR_EVENT, F_LEN_CONST, R_RCS | R_BCS,
2008*4882a593Smuzhiyun D_ALL, 0, 1, cmd_handler_mi_wait_for_event},
2009*4882a593Smuzhiyun
2010*4882a593Smuzhiyun {"MI_FLUSH", OP_MI_FLUSH, F_LEN_CONST, R_ALL, D_ALL, 0, 1, NULL},
2011*4882a593Smuzhiyun
2012*4882a593Smuzhiyun {"MI_ARB_CHECK", OP_MI_ARB_CHECK, F_LEN_CONST, R_ALL, D_ALL, 0, 1,
2013*4882a593Smuzhiyun NULL},
2014*4882a593Smuzhiyun
2015*4882a593Smuzhiyun {"MI_RS_CONTROL", OP_MI_RS_CONTROL, F_LEN_CONST, R_RCS, D_ALL, 0, 1,
2016*4882a593Smuzhiyun NULL},
2017*4882a593Smuzhiyun
2018*4882a593Smuzhiyun {"MI_REPORT_HEAD", OP_MI_REPORT_HEAD, F_LEN_CONST, R_ALL, D_ALL, 0, 1,
2019*4882a593Smuzhiyun NULL},
2020*4882a593Smuzhiyun
2021*4882a593Smuzhiyun {"MI_ARB_ON_OFF", OP_MI_ARB_ON_OFF, F_LEN_CONST, R_ALL, D_ALL, 0, 1,
2022*4882a593Smuzhiyun NULL},
2023*4882a593Smuzhiyun
2024*4882a593Smuzhiyun {"MI_URB_ATOMIC_ALLOC", OP_MI_URB_ATOMIC_ALLOC, F_LEN_CONST, R_RCS,
2025*4882a593Smuzhiyun D_ALL, 0, 1, NULL},
2026*4882a593Smuzhiyun
2027*4882a593Smuzhiyun {"MI_BATCH_BUFFER_END", OP_MI_BATCH_BUFFER_END,
2028*4882a593Smuzhiyun F_IP_ADVANCE_CUSTOM | F_LEN_CONST, R_ALL, D_ALL, 0, 1,
2029*4882a593Smuzhiyun cmd_handler_mi_batch_buffer_end},
2030*4882a593Smuzhiyun
2031*4882a593Smuzhiyun {"MI_SUSPEND_FLUSH", OP_MI_SUSPEND_FLUSH, F_LEN_CONST, R_ALL, D_ALL,
2032*4882a593Smuzhiyun 0, 1, NULL},
2033*4882a593Smuzhiyun
2034*4882a593Smuzhiyun {"MI_PREDICATE", OP_MI_PREDICATE, F_LEN_CONST, R_RCS, D_ALL, 0, 1,
2035*4882a593Smuzhiyun NULL},
2036*4882a593Smuzhiyun
2037*4882a593Smuzhiyun {"MI_TOPOLOGY_FILTER", OP_MI_TOPOLOGY_FILTER, F_LEN_CONST, R_ALL,
2038*4882a593Smuzhiyun D_ALL, 0, 1, NULL},
2039*4882a593Smuzhiyun
2040*4882a593Smuzhiyun {"MI_SET_APPID", OP_MI_SET_APPID, F_LEN_CONST, R_ALL, D_ALL, 0, 1,
2041*4882a593Smuzhiyun NULL},
2042*4882a593Smuzhiyun
2043*4882a593Smuzhiyun {"MI_RS_CONTEXT", OP_MI_RS_CONTEXT, F_LEN_CONST, R_RCS, D_ALL, 0, 1,
2044*4882a593Smuzhiyun NULL},
2045*4882a593Smuzhiyun
2046*4882a593Smuzhiyun {"MI_DISPLAY_FLIP", OP_MI_DISPLAY_FLIP, F_LEN_VAR,
2047*4882a593Smuzhiyun R_RCS | R_BCS, D_ALL, 0, 8, cmd_handler_mi_display_flip},
2048*4882a593Smuzhiyun
2049*4882a593Smuzhiyun {"MI_SEMAPHORE_MBOX", OP_MI_SEMAPHORE_MBOX, F_LEN_VAR | F_LEN_VAR_FIXED,
2050*4882a593Smuzhiyun R_ALL, D_ALL, 0, 8, NULL, CMD_LEN(1)},
2051*4882a593Smuzhiyun
2052*4882a593Smuzhiyun {"MI_MATH", OP_MI_MATH, F_LEN_VAR, R_ALL, D_ALL, 0, 8, NULL},
2053*4882a593Smuzhiyun
2054*4882a593Smuzhiyun {"MI_URB_CLEAR", OP_MI_URB_CLEAR, F_LEN_VAR | F_LEN_VAR_FIXED, R_RCS,
2055*4882a593Smuzhiyun D_ALL, 0, 8, NULL, CMD_LEN(0)},
2056*4882a593Smuzhiyun
2057*4882a593Smuzhiyun {"MI_SEMAPHORE_SIGNAL", OP_MI_SEMAPHORE_SIGNAL,
2058*4882a593Smuzhiyun F_LEN_VAR | F_LEN_VAR_FIXED, R_ALL, D_BDW_PLUS, 0, 8,
2059*4882a593Smuzhiyun NULL, CMD_LEN(0)},
2060*4882a593Smuzhiyun
2061*4882a593Smuzhiyun {"MI_SEMAPHORE_WAIT", OP_MI_SEMAPHORE_WAIT,
2062*4882a593Smuzhiyun F_LEN_VAR | F_LEN_VAR_FIXED, R_ALL, D_BDW_PLUS, ADDR_FIX_1(2),
2063*4882a593Smuzhiyun 8, cmd_handler_mi_semaphore_wait, CMD_LEN(2)},
2064*4882a593Smuzhiyun
2065*4882a593Smuzhiyun {"MI_STORE_DATA_IMM", OP_MI_STORE_DATA_IMM, F_LEN_VAR, R_ALL, D_BDW_PLUS,
2066*4882a593Smuzhiyun ADDR_FIX_1(1), 10, cmd_handler_mi_store_data_imm},
2067*4882a593Smuzhiyun
2068*4882a593Smuzhiyun {"MI_STORE_DATA_INDEX", OP_MI_STORE_DATA_INDEX, F_LEN_VAR, R_ALL, D_ALL,
2069*4882a593Smuzhiyun 0, 8, cmd_handler_mi_store_data_index},
2070*4882a593Smuzhiyun
2071*4882a593Smuzhiyun {"MI_LOAD_REGISTER_IMM", OP_MI_LOAD_REGISTER_IMM, F_LEN_VAR, R_ALL,
2072*4882a593Smuzhiyun D_ALL, 0, 8, cmd_handler_lri},
2073*4882a593Smuzhiyun
2074*4882a593Smuzhiyun {"MI_UPDATE_GTT", OP_MI_UPDATE_GTT, F_LEN_VAR, R_ALL, D_BDW_PLUS, 0, 10,
2075*4882a593Smuzhiyun cmd_handler_mi_update_gtt},
2076*4882a593Smuzhiyun
2077*4882a593Smuzhiyun {"MI_STORE_REGISTER_MEM", OP_MI_STORE_REGISTER_MEM,
2078*4882a593Smuzhiyun F_LEN_VAR | F_LEN_VAR_FIXED, R_ALL, D_ALL, ADDR_FIX_1(2), 8,
2079*4882a593Smuzhiyun cmd_handler_srm, CMD_LEN(2)},
2080*4882a593Smuzhiyun
2081*4882a593Smuzhiyun {"MI_FLUSH_DW", OP_MI_FLUSH_DW, F_LEN_VAR, R_ALL, D_ALL, 0, 6,
2082*4882a593Smuzhiyun cmd_handler_mi_flush_dw},
2083*4882a593Smuzhiyun
2084*4882a593Smuzhiyun {"MI_CLFLUSH", OP_MI_CLFLUSH, F_LEN_VAR, R_ALL, D_ALL, ADDR_FIX_1(1),
2085*4882a593Smuzhiyun 10, cmd_handler_mi_clflush},
2086*4882a593Smuzhiyun
2087*4882a593Smuzhiyun {"MI_REPORT_PERF_COUNT", OP_MI_REPORT_PERF_COUNT,
2088*4882a593Smuzhiyun F_LEN_VAR | F_LEN_VAR_FIXED, R_ALL, D_ALL, ADDR_FIX_1(1), 6,
2089*4882a593Smuzhiyun cmd_handler_mi_report_perf_count, CMD_LEN(2)},
2090*4882a593Smuzhiyun
2091*4882a593Smuzhiyun {"MI_LOAD_REGISTER_MEM", OP_MI_LOAD_REGISTER_MEM,
2092*4882a593Smuzhiyun F_LEN_VAR | F_LEN_VAR_FIXED, R_ALL, D_ALL, ADDR_FIX_1(2), 8,
2093*4882a593Smuzhiyun cmd_handler_lrm, CMD_LEN(2)},
2094*4882a593Smuzhiyun
2095*4882a593Smuzhiyun {"MI_LOAD_REGISTER_REG", OP_MI_LOAD_REGISTER_REG,
2096*4882a593Smuzhiyun F_LEN_VAR | F_LEN_VAR_FIXED, R_ALL, D_ALL, 0, 8,
2097*4882a593Smuzhiyun cmd_handler_lrr, CMD_LEN(1)},
2098*4882a593Smuzhiyun
2099*4882a593Smuzhiyun {"MI_RS_STORE_DATA_IMM", OP_MI_RS_STORE_DATA_IMM,
2100*4882a593Smuzhiyun F_LEN_VAR | F_LEN_VAR_FIXED, R_RCS, D_ALL, 0,
2101*4882a593Smuzhiyun 8, NULL, CMD_LEN(2)},
2102*4882a593Smuzhiyun
2103*4882a593Smuzhiyun {"MI_LOAD_URB_MEM", OP_MI_LOAD_URB_MEM, F_LEN_VAR | F_LEN_VAR_FIXED,
2104*4882a593Smuzhiyun R_RCS, D_ALL, ADDR_FIX_1(2), 8, NULL, CMD_LEN(2)},
2105*4882a593Smuzhiyun
2106*4882a593Smuzhiyun {"MI_STORE_URM_MEM", OP_MI_STORE_URM_MEM, F_LEN_VAR, R_RCS, D_ALL,
2107*4882a593Smuzhiyun ADDR_FIX_1(2), 8, NULL},
2108*4882a593Smuzhiyun
2109*4882a593Smuzhiyun {"MI_OP_2E", OP_MI_2E, F_LEN_VAR | F_LEN_VAR_FIXED, R_ALL, D_BDW_PLUS,
2110*4882a593Smuzhiyun ADDR_FIX_2(1, 2), 8, cmd_handler_mi_op_2e, CMD_LEN(3)},
2111*4882a593Smuzhiyun
2112*4882a593Smuzhiyun {"MI_OP_2F", OP_MI_2F, F_LEN_VAR, R_ALL, D_BDW_PLUS, ADDR_FIX_1(1),
2113*4882a593Smuzhiyun 8, cmd_handler_mi_op_2f},
2114*4882a593Smuzhiyun
2115*4882a593Smuzhiyun {"MI_BATCH_BUFFER_START", OP_MI_BATCH_BUFFER_START,
2116*4882a593Smuzhiyun F_IP_ADVANCE_CUSTOM, R_ALL, D_ALL, 0, 8,
2117*4882a593Smuzhiyun cmd_handler_mi_batch_buffer_start},
2118*4882a593Smuzhiyun
2119*4882a593Smuzhiyun {"MI_CONDITIONAL_BATCH_BUFFER_END", OP_MI_CONDITIONAL_BATCH_BUFFER_END,
2120*4882a593Smuzhiyun F_LEN_VAR | F_LEN_VAR_FIXED, R_ALL, D_ALL, ADDR_FIX_1(2), 8,
2121*4882a593Smuzhiyun cmd_handler_mi_conditional_batch_buffer_end, CMD_LEN(2)},
2122*4882a593Smuzhiyun
2123*4882a593Smuzhiyun {"MI_LOAD_SCAN_LINES_INCL", OP_MI_LOAD_SCAN_LINES_INCL, F_LEN_CONST,
2124*4882a593Smuzhiyun R_RCS | R_BCS, D_ALL, 0, 2, NULL},
2125*4882a593Smuzhiyun
2126*4882a593Smuzhiyun {"XY_SETUP_BLT", OP_XY_SETUP_BLT, F_LEN_VAR, R_BCS, D_ALL,
2127*4882a593Smuzhiyun ADDR_FIX_2(4, 7), 8, NULL},
2128*4882a593Smuzhiyun
2129*4882a593Smuzhiyun {"XY_SETUP_CLIP_BLT", OP_XY_SETUP_CLIP_BLT, F_LEN_VAR, R_BCS, D_ALL,
2130*4882a593Smuzhiyun 0, 8, NULL},
2131*4882a593Smuzhiyun
2132*4882a593Smuzhiyun {"XY_SETUP_MONO_PATTERN_SL_BLT", OP_XY_SETUP_MONO_PATTERN_SL_BLT,
2133*4882a593Smuzhiyun F_LEN_VAR, R_BCS, D_ALL, ADDR_FIX_1(4), 8, NULL},
2134*4882a593Smuzhiyun
2135*4882a593Smuzhiyun {"XY_PIXEL_BLT", OP_XY_PIXEL_BLT, F_LEN_VAR, R_BCS, D_ALL, 0, 8, NULL},
2136*4882a593Smuzhiyun
2137*4882a593Smuzhiyun {"XY_SCANLINES_BLT", OP_XY_SCANLINES_BLT, F_LEN_VAR, R_BCS, D_ALL,
2138*4882a593Smuzhiyun 0, 8, NULL},
2139*4882a593Smuzhiyun
2140*4882a593Smuzhiyun {"XY_TEXT_BLT", OP_XY_TEXT_BLT, F_LEN_VAR, R_BCS, D_ALL,
2141*4882a593Smuzhiyun ADDR_FIX_1(3), 8, NULL},
2142*4882a593Smuzhiyun
2143*4882a593Smuzhiyun {"XY_TEXT_IMMEDIATE_BLT", OP_XY_TEXT_IMMEDIATE_BLT, F_LEN_VAR, R_BCS,
2144*4882a593Smuzhiyun D_ALL, 0, 8, NULL},
2145*4882a593Smuzhiyun
2146*4882a593Smuzhiyun {"XY_COLOR_BLT", OP_XY_COLOR_BLT, F_LEN_VAR, R_BCS, D_ALL,
2147*4882a593Smuzhiyun ADDR_FIX_1(4), 8, NULL},
2148*4882a593Smuzhiyun
2149*4882a593Smuzhiyun {"XY_PAT_BLT", OP_XY_PAT_BLT, F_LEN_VAR, R_BCS, D_ALL,
2150*4882a593Smuzhiyun ADDR_FIX_2(4, 5), 8, NULL},
2151*4882a593Smuzhiyun
2152*4882a593Smuzhiyun {"XY_MONO_PAT_BLT", OP_XY_MONO_PAT_BLT, F_LEN_VAR, R_BCS, D_ALL,
2153*4882a593Smuzhiyun ADDR_FIX_1(4), 8, NULL},
2154*4882a593Smuzhiyun
2155*4882a593Smuzhiyun {"XY_SRC_COPY_BLT", OP_XY_SRC_COPY_BLT, F_LEN_VAR, R_BCS, D_ALL,
2156*4882a593Smuzhiyun ADDR_FIX_2(4, 7), 8, NULL},
2157*4882a593Smuzhiyun
2158*4882a593Smuzhiyun {"XY_MONO_SRC_COPY_BLT", OP_XY_MONO_SRC_COPY_BLT, F_LEN_VAR, R_BCS,
2159*4882a593Smuzhiyun D_ALL, ADDR_FIX_2(4, 5), 8, NULL},
2160*4882a593Smuzhiyun
2161*4882a593Smuzhiyun {"XY_FULL_BLT", OP_XY_FULL_BLT, F_LEN_VAR, R_BCS, D_ALL, 0, 8, NULL},
2162*4882a593Smuzhiyun
2163*4882a593Smuzhiyun {"XY_FULL_MONO_SRC_BLT", OP_XY_FULL_MONO_SRC_BLT, F_LEN_VAR, R_BCS,
2164*4882a593Smuzhiyun D_ALL, ADDR_FIX_3(4, 5, 8), 8, NULL},
2165*4882a593Smuzhiyun
2166*4882a593Smuzhiyun {"XY_FULL_MONO_PATTERN_BLT", OP_XY_FULL_MONO_PATTERN_BLT, F_LEN_VAR,
2167*4882a593Smuzhiyun R_BCS, D_ALL, ADDR_FIX_2(4, 7), 8, NULL},
2168*4882a593Smuzhiyun
2169*4882a593Smuzhiyun {"XY_FULL_MONO_PATTERN_MONO_SRC_BLT",
2170*4882a593Smuzhiyun OP_XY_FULL_MONO_PATTERN_MONO_SRC_BLT,
2171*4882a593Smuzhiyun F_LEN_VAR, R_BCS, D_ALL, ADDR_FIX_2(4, 5), 8, NULL},
2172*4882a593Smuzhiyun
2173*4882a593Smuzhiyun {"XY_MONO_PAT_FIXED_BLT", OP_XY_MONO_PAT_FIXED_BLT, F_LEN_VAR, R_BCS,
2174*4882a593Smuzhiyun D_ALL, ADDR_FIX_1(4), 8, NULL},
2175*4882a593Smuzhiyun
2176*4882a593Smuzhiyun {"XY_MONO_SRC_COPY_IMMEDIATE_BLT", OP_XY_MONO_SRC_COPY_IMMEDIATE_BLT,
2177*4882a593Smuzhiyun F_LEN_VAR, R_BCS, D_ALL, ADDR_FIX_1(4), 8, NULL},
2178*4882a593Smuzhiyun
2179*4882a593Smuzhiyun {"XY_PAT_BLT_IMMEDIATE", OP_XY_PAT_BLT_IMMEDIATE, F_LEN_VAR, R_BCS,
2180*4882a593Smuzhiyun D_ALL, ADDR_FIX_1(4), 8, NULL},
2181*4882a593Smuzhiyun
2182*4882a593Smuzhiyun {"XY_SRC_COPY_CHROMA_BLT", OP_XY_SRC_COPY_CHROMA_BLT, F_LEN_VAR, R_BCS,
2183*4882a593Smuzhiyun D_ALL, ADDR_FIX_2(4, 7), 8, NULL},
2184*4882a593Smuzhiyun
2185*4882a593Smuzhiyun {"XY_FULL_IMMEDIATE_PATTERN_BLT", OP_XY_FULL_IMMEDIATE_PATTERN_BLT,
2186*4882a593Smuzhiyun F_LEN_VAR, R_BCS, D_ALL, ADDR_FIX_2(4, 7), 8, NULL},
2187*4882a593Smuzhiyun
2188*4882a593Smuzhiyun {"XY_FULL_MONO_SRC_IMMEDIATE_PATTERN_BLT",
2189*4882a593Smuzhiyun OP_XY_FULL_MONO_SRC_IMMEDIATE_PATTERN_BLT,
2190*4882a593Smuzhiyun F_LEN_VAR, R_BCS, D_ALL, ADDR_FIX_2(4, 5), 8, NULL},
2191*4882a593Smuzhiyun
2192*4882a593Smuzhiyun {"XY_PAT_CHROMA_BLT", OP_XY_PAT_CHROMA_BLT, F_LEN_VAR, R_BCS, D_ALL,
2193*4882a593Smuzhiyun ADDR_FIX_2(4, 5), 8, NULL},
2194*4882a593Smuzhiyun
2195*4882a593Smuzhiyun {"XY_PAT_CHROMA_BLT_IMMEDIATE", OP_XY_PAT_CHROMA_BLT_IMMEDIATE,
2196*4882a593Smuzhiyun F_LEN_VAR, R_BCS, D_ALL, ADDR_FIX_1(4), 8, NULL},
2197*4882a593Smuzhiyun
2198*4882a593Smuzhiyun {"3DSTATE_VIEWPORT_STATE_POINTERS_SF_CLIP",
2199*4882a593Smuzhiyun OP_3DSTATE_VIEWPORT_STATE_POINTERS_SF_CLIP,
2200*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2201*4882a593Smuzhiyun
2202*4882a593Smuzhiyun {"3DSTATE_VIEWPORT_STATE_POINTERS_CC",
2203*4882a593Smuzhiyun OP_3DSTATE_VIEWPORT_STATE_POINTERS_CC,
2204*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2205*4882a593Smuzhiyun
2206*4882a593Smuzhiyun {"3DSTATE_BLEND_STATE_POINTERS",
2207*4882a593Smuzhiyun OP_3DSTATE_BLEND_STATE_POINTERS,
2208*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2209*4882a593Smuzhiyun
2210*4882a593Smuzhiyun {"3DSTATE_DEPTH_STENCIL_STATE_POINTERS",
2211*4882a593Smuzhiyun OP_3DSTATE_DEPTH_STENCIL_STATE_POINTERS,
2212*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2213*4882a593Smuzhiyun
2214*4882a593Smuzhiyun {"3DSTATE_BINDING_TABLE_POINTERS_VS",
2215*4882a593Smuzhiyun OP_3DSTATE_BINDING_TABLE_POINTERS_VS,
2216*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2217*4882a593Smuzhiyun
2218*4882a593Smuzhiyun {"3DSTATE_BINDING_TABLE_POINTERS_HS",
2219*4882a593Smuzhiyun OP_3DSTATE_BINDING_TABLE_POINTERS_HS,
2220*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2221*4882a593Smuzhiyun
2222*4882a593Smuzhiyun {"3DSTATE_BINDING_TABLE_POINTERS_DS",
2223*4882a593Smuzhiyun OP_3DSTATE_BINDING_TABLE_POINTERS_DS,
2224*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2225*4882a593Smuzhiyun
2226*4882a593Smuzhiyun {"3DSTATE_BINDING_TABLE_POINTERS_GS",
2227*4882a593Smuzhiyun OP_3DSTATE_BINDING_TABLE_POINTERS_GS,
2228*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2229*4882a593Smuzhiyun
2230*4882a593Smuzhiyun {"3DSTATE_BINDING_TABLE_POINTERS_PS",
2231*4882a593Smuzhiyun OP_3DSTATE_BINDING_TABLE_POINTERS_PS,
2232*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2233*4882a593Smuzhiyun
2234*4882a593Smuzhiyun {"3DSTATE_SAMPLER_STATE_POINTERS_VS",
2235*4882a593Smuzhiyun OP_3DSTATE_SAMPLER_STATE_POINTERS_VS,
2236*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2237*4882a593Smuzhiyun
2238*4882a593Smuzhiyun {"3DSTATE_SAMPLER_STATE_POINTERS_HS",
2239*4882a593Smuzhiyun OP_3DSTATE_SAMPLER_STATE_POINTERS_HS,
2240*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2241*4882a593Smuzhiyun
2242*4882a593Smuzhiyun {"3DSTATE_SAMPLER_STATE_POINTERS_DS",
2243*4882a593Smuzhiyun OP_3DSTATE_SAMPLER_STATE_POINTERS_DS,
2244*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2245*4882a593Smuzhiyun
2246*4882a593Smuzhiyun {"3DSTATE_SAMPLER_STATE_POINTERS_GS",
2247*4882a593Smuzhiyun OP_3DSTATE_SAMPLER_STATE_POINTERS_GS,
2248*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2249*4882a593Smuzhiyun
2250*4882a593Smuzhiyun {"3DSTATE_SAMPLER_STATE_POINTERS_PS",
2251*4882a593Smuzhiyun OP_3DSTATE_SAMPLER_STATE_POINTERS_PS,
2252*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2253*4882a593Smuzhiyun
2254*4882a593Smuzhiyun {"3DSTATE_URB_VS", OP_3DSTATE_URB_VS, F_LEN_VAR, R_RCS, D_ALL,
2255*4882a593Smuzhiyun 0, 8, NULL},
2256*4882a593Smuzhiyun
2257*4882a593Smuzhiyun {"3DSTATE_URB_HS", OP_3DSTATE_URB_HS, F_LEN_VAR, R_RCS, D_ALL,
2258*4882a593Smuzhiyun 0, 8, NULL},
2259*4882a593Smuzhiyun
2260*4882a593Smuzhiyun {"3DSTATE_URB_DS", OP_3DSTATE_URB_DS, F_LEN_VAR, R_RCS, D_ALL,
2261*4882a593Smuzhiyun 0, 8, NULL},
2262*4882a593Smuzhiyun
2263*4882a593Smuzhiyun {"3DSTATE_URB_GS", OP_3DSTATE_URB_GS, F_LEN_VAR, R_RCS, D_ALL,
2264*4882a593Smuzhiyun 0, 8, NULL},
2265*4882a593Smuzhiyun
2266*4882a593Smuzhiyun {"3DSTATE_GATHER_CONSTANT_VS", OP_3DSTATE_GATHER_CONSTANT_VS,
2267*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2268*4882a593Smuzhiyun
2269*4882a593Smuzhiyun {"3DSTATE_GATHER_CONSTANT_GS", OP_3DSTATE_GATHER_CONSTANT_GS,
2270*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2271*4882a593Smuzhiyun
2272*4882a593Smuzhiyun {"3DSTATE_GATHER_CONSTANT_HS", OP_3DSTATE_GATHER_CONSTANT_HS,
2273*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2274*4882a593Smuzhiyun
2275*4882a593Smuzhiyun {"3DSTATE_GATHER_CONSTANT_DS", OP_3DSTATE_GATHER_CONSTANT_DS,
2276*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2277*4882a593Smuzhiyun
2278*4882a593Smuzhiyun {"3DSTATE_GATHER_CONSTANT_PS", OP_3DSTATE_GATHER_CONSTANT_PS,
2279*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2280*4882a593Smuzhiyun
2281*4882a593Smuzhiyun {"3DSTATE_DX9_CONSTANTF_VS", OP_3DSTATE_DX9_CONSTANTF_VS,
2282*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 11, NULL},
2283*4882a593Smuzhiyun
2284*4882a593Smuzhiyun {"3DSTATE_DX9_CONSTANTF_PS", OP_3DSTATE_DX9_CONSTANTF_PS,
2285*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 11, NULL},
2286*4882a593Smuzhiyun
2287*4882a593Smuzhiyun {"3DSTATE_DX9_CONSTANTI_VS", OP_3DSTATE_DX9_CONSTANTI_VS,
2288*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2289*4882a593Smuzhiyun
2290*4882a593Smuzhiyun {"3DSTATE_DX9_CONSTANTI_PS", OP_3DSTATE_DX9_CONSTANTI_PS,
2291*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2292*4882a593Smuzhiyun
2293*4882a593Smuzhiyun {"3DSTATE_DX9_CONSTANTB_VS", OP_3DSTATE_DX9_CONSTANTB_VS,
2294*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2295*4882a593Smuzhiyun
2296*4882a593Smuzhiyun {"3DSTATE_DX9_CONSTANTB_PS", OP_3DSTATE_DX9_CONSTANTB_PS,
2297*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2298*4882a593Smuzhiyun
2299*4882a593Smuzhiyun {"3DSTATE_DX9_LOCAL_VALID_VS", OP_3DSTATE_DX9_LOCAL_VALID_VS,
2300*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2301*4882a593Smuzhiyun
2302*4882a593Smuzhiyun {"3DSTATE_DX9_LOCAL_VALID_PS", OP_3DSTATE_DX9_LOCAL_VALID_PS,
2303*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2304*4882a593Smuzhiyun
2305*4882a593Smuzhiyun {"3DSTATE_DX9_GENERATE_ACTIVE_VS", OP_3DSTATE_DX9_GENERATE_ACTIVE_VS,
2306*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2307*4882a593Smuzhiyun
2308*4882a593Smuzhiyun {"3DSTATE_DX9_GENERATE_ACTIVE_PS", OP_3DSTATE_DX9_GENERATE_ACTIVE_PS,
2309*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2310*4882a593Smuzhiyun
2311*4882a593Smuzhiyun {"3DSTATE_BINDING_TABLE_EDIT_VS", OP_3DSTATE_BINDING_TABLE_EDIT_VS,
2312*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 9, NULL},
2313*4882a593Smuzhiyun
2314*4882a593Smuzhiyun {"3DSTATE_BINDING_TABLE_EDIT_GS", OP_3DSTATE_BINDING_TABLE_EDIT_GS,
2315*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 9, NULL},
2316*4882a593Smuzhiyun
2317*4882a593Smuzhiyun {"3DSTATE_BINDING_TABLE_EDIT_HS", OP_3DSTATE_BINDING_TABLE_EDIT_HS,
2318*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 9, NULL},
2319*4882a593Smuzhiyun
2320*4882a593Smuzhiyun {"3DSTATE_BINDING_TABLE_EDIT_DS", OP_3DSTATE_BINDING_TABLE_EDIT_DS,
2321*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 9, NULL},
2322*4882a593Smuzhiyun
2323*4882a593Smuzhiyun {"3DSTATE_BINDING_TABLE_EDIT_PS", OP_3DSTATE_BINDING_TABLE_EDIT_PS,
2324*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 9, NULL},
2325*4882a593Smuzhiyun
2326*4882a593Smuzhiyun {"3DSTATE_VF_INSTANCING", OP_3DSTATE_VF_INSTANCING, F_LEN_VAR, R_RCS,
2327*4882a593Smuzhiyun D_BDW_PLUS, 0, 8, NULL},
2328*4882a593Smuzhiyun
2329*4882a593Smuzhiyun {"3DSTATE_VF_SGVS", OP_3DSTATE_VF_SGVS, F_LEN_VAR, R_RCS, D_BDW_PLUS, 0, 8,
2330*4882a593Smuzhiyun NULL},
2331*4882a593Smuzhiyun
2332*4882a593Smuzhiyun {"3DSTATE_VF_TOPOLOGY", OP_3DSTATE_VF_TOPOLOGY, F_LEN_VAR, R_RCS,
2333*4882a593Smuzhiyun D_BDW_PLUS, 0, 8, NULL},
2334*4882a593Smuzhiyun
2335*4882a593Smuzhiyun {"3DSTATE_WM_CHROMAKEY", OP_3DSTATE_WM_CHROMAKEY, F_LEN_VAR, R_RCS,
2336*4882a593Smuzhiyun D_BDW_PLUS, 0, 8, NULL},
2337*4882a593Smuzhiyun
2338*4882a593Smuzhiyun {"3DSTATE_PS_BLEND", OP_3DSTATE_PS_BLEND, F_LEN_VAR, R_RCS, D_BDW_PLUS, 0,
2339*4882a593Smuzhiyun 8, NULL},
2340*4882a593Smuzhiyun
2341*4882a593Smuzhiyun {"3DSTATE_WM_DEPTH_STENCIL", OP_3DSTATE_WM_DEPTH_STENCIL, F_LEN_VAR,
2342*4882a593Smuzhiyun R_RCS, D_BDW_PLUS, 0, 8, NULL},
2343*4882a593Smuzhiyun
2344*4882a593Smuzhiyun {"3DSTATE_PS_EXTRA", OP_3DSTATE_PS_EXTRA, F_LEN_VAR, R_RCS, D_BDW_PLUS, 0,
2345*4882a593Smuzhiyun 8, NULL},
2346*4882a593Smuzhiyun
2347*4882a593Smuzhiyun {"3DSTATE_RASTER", OP_3DSTATE_RASTER, F_LEN_VAR, R_RCS, D_BDW_PLUS, 0, 8,
2348*4882a593Smuzhiyun NULL},
2349*4882a593Smuzhiyun
2350*4882a593Smuzhiyun {"3DSTATE_SBE_SWIZ", OP_3DSTATE_SBE_SWIZ, F_LEN_VAR, R_RCS, D_BDW_PLUS, 0, 8,
2351*4882a593Smuzhiyun NULL},
2352*4882a593Smuzhiyun
2353*4882a593Smuzhiyun {"3DSTATE_WM_HZ_OP", OP_3DSTATE_WM_HZ_OP, F_LEN_VAR, R_RCS, D_BDW_PLUS, 0, 8,
2354*4882a593Smuzhiyun NULL},
2355*4882a593Smuzhiyun
2356*4882a593Smuzhiyun {"3DSTATE_VERTEX_BUFFERS", OP_3DSTATE_VERTEX_BUFFERS, F_LEN_VAR, R_RCS,
2357*4882a593Smuzhiyun D_BDW_PLUS, 0, 8, NULL},
2358*4882a593Smuzhiyun
2359*4882a593Smuzhiyun {"3DSTATE_VERTEX_ELEMENTS", OP_3DSTATE_VERTEX_ELEMENTS, F_LEN_VAR,
2360*4882a593Smuzhiyun R_RCS, D_ALL, 0, 8, NULL},
2361*4882a593Smuzhiyun
2362*4882a593Smuzhiyun {"3DSTATE_INDEX_BUFFER", OP_3DSTATE_INDEX_BUFFER, F_LEN_VAR, R_RCS,
2363*4882a593Smuzhiyun D_BDW_PLUS, ADDR_FIX_1(2), 8, NULL},
2364*4882a593Smuzhiyun
2365*4882a593Smuzhiyun {"3DSTATE_VF_STATISTICS", OP_3DSTATE_VF_STATISTICS, F_LEN_CONST,
2366*4882a593Smuzhiyun R_RCS, D_ALL, 0, 1, NULL},
2367*4882a593Smuzhiyun
2368*4882a593Smuzhiyun {"3DSTATE_VF", OP_3DSTATE_VF, F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2369*4882a593Smuzhiyun
2370*4882a593Smuzhiyun {"3DSTATE_CC_STATE_POINTERS", OP_3DSTATE_CC_STATE_POINTERS, F_LEN_VAR,
2371*4882a593Smuzhiyun R_RCS, D_ALL, 0, 8, NULL},
2372*4882a593Smuzhiyun
2373*4882a593Smuzhiyun {"3DSTATE_SCISSOR_STATE_POINTERS", OP_3DSTATE_SCISSOR_STATE_POINTERS,
2374*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2375*4882a593Smuzhiyun
2376*4882a593Smuzhiyun {"3DSTATE_GS", OP_3DSTATE_GS, F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2377*4882a593Smuzhiyun
2378*4882a593Smuzhiyun {"3DSTATE_CLIP", OP_3DSTATE_CLIP, F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2379*4882a593Smuzhiyun
2380*4882a593Smuzhiyun {"3DSTATE_WM", OP_3DSTATE_WM, F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2381*4882a593Smuzhiyun
2382*4882a593Smuzhiyun {"3DSTATE_CONSTANT_GS", OP_3DSTATE_CONSTANT_GS, F_LEN_VAR, R_RCS,
2383*4882a593Smuzhiyun D_BDW_PLUS, 0, 8, NULL},
2384*4882a593Smuzhiyun
2385*4882a593Smuzhiyun {"3DSTATE_CONSTANT_PS", OP_3DSTATE_CONSTANT_PS, F_LEN_VAR, R_RCS,
2386*4882a593Smuzhiyun D_BDW_PLUS, 0, 8, NULL},
2387*4882a593Smuzhiyun
2388*4882a593Smuzhiyun {"3DSTATE_SAMPLE_MASK", OP_3DSTATE_SAMPLE_MASK, F_LEN_VAR, R_RCS,
2389*4882a593Smuzhiyun D_ALL, 0, 8, NULL},
2390*4882a593Smuzhiyun
2391*4882a593Smuzhiyun {"3DSTATE_CONSTANT_HS", OP_3DSTATE_CONSTANT_HS, F_LEN_VAR, R_RCS,
2392*4882a593Smuzhiyun D_BDW_PLUS, 0, 8, NULL},
2393*4882a593Smuzhiyun
2394*4882a593Smuzhiyun {"3DSTATE_CONSTANT_DS", OP_3DSTATE_CONSTANT_DS, F_LEN_VAR, R_RCS,
2395*4882a593Smuzhiyun D_BDW_PLUS, 0, 8, NULL},
2396*4882a593Smuzhiyun
2397*4882a593Smuzhiyun {"3DSTATE_HS", OP_3DSTATE_HS, F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2398*4882a593Smuzhiyun
2399*4882a593Smuzhiyun {"3DSTATE_TE", OP_3DSTATE_TE, F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2400*4882a593Smuzhiyun
2401*4882a593Smuzhiyun {"3DSTATE_DS", OP_3DSTATE_DS, F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2402*4882a593Smuzhiyun
2403*4882a593Smuzhiyun {"3DSTATE_STREAMOUT", OP_3DSTATE_STREAMOUT, F_LEN_VAR, R_RCS,
2404*4882a593Smuzhiyun D_ALL, 0, 8, NULL},
2405*4882a593Smuzhiyun
2406*4882a593Smuzhiyun {"3DSTATE_SBE", OP_3DSTATE_SBE, F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2407*4882a593Smuzhiyun
2408*4882a593Smuzhiyun {"3DSTATE_PS", OP_3DSTATE_PS, F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2409*4882a593Smuzhiyun
2410*4882a593Smuzhiyun {"3DSTATE_DRAWING_RECTANGLE", OP_3DSTATE_DRAWING_RECTANGLE, F_LEN_VAR,
2411*4882a593Smuzhiyun R_RCS, D_ALL, 0, 8, NULL},
2412*4882a593Smuzhiyun
2413*4882a593Smuzhiyun {"3DSTATE_SAMPLER_PALETTE_LOAD0", OP_3DSTATE_SAMPLER_PALETTE_LOAD0,
2414*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2415*4882a593Smuzhiyun
2416*4882a593Smuzhiyun {"3DSTATE_CHROMA_KEY", OP_3DSTATE_CHROMA_KEY, F_LEN_VAR, R_RCS, D_ALL,
2417*4882a593Smuzhiyun 0, 8, NULL},
2418*4882a593Smuzhiyun
2419*4882a593Smuzhiyun {"3DSTATE_DEPTH_BUFFER", OP_3DSTATE_DEPTH_BUFFER, F_LEN_VAR, R_RCS,
2420*4882a593Smuzhiyun D_ALL, ADDR_FIX_1(2), 8, NULL},
2421*4882a593Smuzhiyun
2422*4882a593Smuzhiyun {"3DSTATE_POLY_STIPPLE_OFFSET", OP_3DSTATE_POLY_STIPPLE_OFFSET,
2423*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2424*4882a593Smuzhiyun
2425*4882a593Smuzhiyun {"3DSTATE_POLY_STIPPLE_PATTERN", OP_3DSTATE_POLY_STIPPLE_PATTERN,
2426*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2427*4882a593Smuzhiyun
2428*4882a593Smuzhiyun {"3DSTATE_LINE_STIPPLE", OP_3DSTATE_LINE_STIPPLE, F_LEN_VAR, R_RCS,
2429*4882a593Smuzhiyun D_ALL, 0, 8, NULL},
2430*4882a593Smuzhiyun
2431*4882a593Smuzhiyun {"3DSTATE_AA_LINE_PARAMS", OP_3DSTATE_AA_LINE_PARAMS, F_LEN_VAR, R_RCS,
2432*4882a593Smuzhiyun D_ALL, 0, 8, NULL},
2433*4882a593Smuzhiyun
2434*4882a593Smuzhiyun {"3DSTATE_GS_SVB_INDEX", OP_3DSTATE_GS_SVB_INDEX, F_LEN_VAR, R_RCS,
2435*4882a593Smuzhiyun D_ALL, 0, 8, NULL},
2436*4882a593Smuzhiyun
2437*4882a593Smuzhiyun {"3DSTATE_SAMPLER_PALETTE_LOAD1", OP_3DSTATE_SAMPLER_PALETTE_LOAD1,
2438*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2439*4882a593Smuzhiyun
2440*4882a593Smuzhiyun {"3DSTATE_MULTISAMPLE", OP_3DSTATE_MULTISAMPLE_BDW, F_LEN_VAR, R_RCS,
2441*4882a593Smuzhiyun D_BDW_PLUS, 0, 8, NULL},
2442*4882a593Smuzhiyun
2443*4882a593Smuzhiyun {"3DSTATE_STENCIL_BUFFER", OP_3DSTATE_STENCIL_BUFFER, F_LEN_VAR, R_RCS,
2444*4882a593Smuzhiyun D_ALL, ADDR_FIX_1(2), 8, NULL},
2445*4882a593Smuzhiyun
2446*4882a593Smuzhiyun {"3DSTATE_HIER_DEPTH_BUFFER", OP_3DSTATE_HIER_DEPTH_BUFFER, F_LEN_VAR,
2447*4882a593Smuzhiyun R_RCS, D_ALL, ADDR_FIX_1(2), 8, NULL},
2448*4882a593Smuzhiyun
2449*4882a593Smuzhiyun {"3DSTATE_CLEAR_PARAMS", OP_3DSTATE_CLEAR_PARAMS, F_LEN_VAR,
2450*4882a593Smuzhiyun R_RCS, D_ALL, 0, 8, NULL},
2451*4882a593Smuzhiyun
2452*4882a593Smuzhiyun {"3DSTATE_PUSH_CONSTANT_ALLOC_VS", OP_3DSTATE_PUSH_CONSTANT_ALLOC_VS,
2453*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2454*4882a593Smuzhiyun
2455*4882a593Smuzhiyun {"3DSTATE_PUSH_CONSTANT_ALLOC_HS", OP_3DSTATE_PUSH_CONSTANT_ALLOC_HS,
2456*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2457*4882a593Smuzhiyun
2458*4882a593Smuzhiyun {"3DSTATE_PUSH_CONSTANT_ALLOC_DS", OP_3DSTATE_PUSH_CONSTANT_ALLOC_DS,
2459*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2460*4882a593Smuzhiyun
2461*4882a593Smuzhiyun {"3DSTATE_PUSH_CONSTANT_ALLOC_GS", OP_3DSTATE_PUSH_CONSTANT_ALLOC_GS,
2462*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2463*4882a593Smuzhiyun
2464*4882a593Smuzhiyun {"3DSTATE_PUSH_CONSTANT_ALLOC_PS", OP_3DSTATE_PUSH_CONSTANT_ALLOC_PS,
2465*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2466*4882a593Smuzhiyun
2467*4882a593Smuzhiyun {"3DSTATE_MONOFILTER_SIZE", OP_3DSTATE_MONOFILTER_SIZE, F_LEN_VAR,
2468*4882a593Smuzhiyun R_RCS, D_ALL, 0, 8, NULL},
2469*4882a593Smuzhiyun
2470*4882a593Smuzhiyun {"3DSTATE_SO_DECL_LIST", OP_3DSTATE_SO_DECL_LIST, F_LEN_VAR, R_RCS,
2471*4882a593Smuzhiyun D_ALL, 0, 9, NULL},
2472*4882a593Smuzhiyun
2473*4882a593Smuzhiyun {"3DSTATE_SO_BUFFER", OP_3DSTATE_SO_BUFFER, F_LEN_VAR, R_RCS, D_BDW_PLUS,
2474*4882a593Smuzhiyun ADDR_FIX_2(2, 4), 8, NULL},
2475*4882a593Smuzhiyun
2476*4882a593Smuzhiyun {"3DSTATE_BINDING_TABLE_POOL_ALLOC",
2477*4882a593Smuzhiyun OP_3DSTATE_BINDING_TABLE_POOL_ALLOC,
2478*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_BDW_PLUS, ADDR_FIX_1(1), 8, NULL},
2479*4882a593Smuzhiyun
2480*4882a593Smuzhiyun {"3DSTATE_GATHER_POOL_ALLOC", OP_3DSTATE_GATHER_POOL_ALLOC,
2481*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_BDW_PLUS, ADDR_FIX_1(1), 8, NULL},
2482*4882a593Smuzhiyun
2483*4882a593Smuzhiyun {"3DSTATE_DX9_CONSTANT_BUFFER_POOL_ALLOC",
2484*4882a593Smuzhiyun OP_3DSTATE_DX9_CONSTANT_BUFFER_POOL_ALLOC,
2485*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_BDW_PLUS, ADDR_FIX_1(1), 8, NULL},
2486*4882a593Smuzhiyun
2487*4882a593Smuzhiyun {"3DSTATE_SAMPLE_PATTERN", OP_3DSTATE_SAMPLE_PATTERN, F_LEN_VAR, R_RCS,
2488*4882a593Smuzhiyun D_BDW_PLUS, 0, 8, NULL},
2489*4882a593Smuzhiyun
2490*4882a593Smuzhiyun {"PIPE_CONTROL", OP_PIPE_CONTROL, F_LEN_VAR, R_RCS, D_ALL,
2491*4882a593Smuzhiyun ADDR_FIX_1(2), 8, cmd_handler_pipe_control},
2492*4882a593Smuzhiyun
2493*4882a593Smuzhiyun {"3DPRIMITIVE", OP_3DPRIMITIVE, F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2494*4882a593Smuzhiyun
2495*4882a593Smuzhiyun {"PIPELINE_SELECT", OP_PIPELINE_SELECT, F_LEN_CONST, R_RCS, D_ALL, 0,
2496*4882a593Smuzhiyun 1, NULL},
2497*4882a593Smuzhiyun
2498*4882a593Smuzhiyun {"STATE_PREFETCH", OP_STATE_PREFETCH, F_LEN_VAR, R_RCS, D_ALL,
2499*4882a593Smuzhiyun ADDR_FIX_1(1), 8, NULL},
2500*4882a593Smuzhiyun
2501*4882a593Smuzhiyun {"STATE_SIP", OP_STATE_SIP, F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2502*4882a593Smuzhiyun
2503*4882a593Smuzhiyun {"STATE_BASE_ADDRESS", OP_STATE_BASE_ADDRESS, F_LEN_VAR, R_RCS, D_BDW_PLUS,
2504*4882a593Smuzhiyun ADDR_FIX_5(1, 3, 4, 5, 6), 8, NULL},
2505*4882a593Smuzhiyun
2506*4882a593Smuzhiyun {"OP_3D_MEDIA_0_1_4", OP_3D_MEDIA_0_1_4, F_LEN_VAR, R_RCS, D_ALL,
2507*4882a593Smuzhiyun ADDR_FIX_1(1), 8, NULL},
2508*4882a593Smuzhiyun
2509*4882a593Smuzhiyun {"OP_SWTESS_BASE_ADDRESS", OP_SWTESS_BASE_ADDRESS,
2510*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, ADDR_FIX_2(1, 2), 3, NULL},
2511*4882a593Smuzhiyun
2512*4882a593Smuzhiyun {"3DSTATE_VS", OP_3DSTATE_VS, F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2513*4882a593Smuzhiyun
2514*4882a593Smuzhiyun {"3DSTATE_SF", OP_3DSTATE_SF, F_LEN_VAR, R_RCS, D_ALL, 0, 8, NULL},
2515*4882a593Smuzhiyun
2516*4882a593Smuzhiyun {"3DSTATE_CONSTANT_VS", OP_3DSTATE_CONSTANT_VS, F_LEN_VAR, R_RCS, D_BDW_PLUS,
2517*4882a593Smuzhiyun 0, 8, NULL},
2518*4882a593Smuzhiyun
2519*4882a593Smuzhiyun {"3DSTATE_COMPONENT_PACKING", OP_3DSTATE_COMPONENT_PACKING, F_LEN_VAR, R_RCS,
2520*4882a593Smuzhiyun D_SKL_PLUS, 0, 8, NULL},
2521*4882a593Smuzhiyun
2522*4882a593Smuzhiyun {"MEDIA_INTERFACE_DESCRIPTOR_LOAD", OP_MEDIA_INTERFACE_DESCRIPTOR_LOAD,
2523*4882a593Smuzhiyun F_LEN_VAR, R_RCS, D_ALL, 0, 16, NULL},
2524*4882a593Smuzhiyun
2525*4882a593Smuzhiyun {"MEDIA_GATEWAY_STATE", OP_MEDIA_GATEWAY_STATE, F_LEN_VAR, R_RCS, D_ALL,
2526*4882a593Smuzhiyun 0, 16, NULL},
2527*4882a593Smuzhiyun
2528*4882a593Smuzhiyun {"MEDIA_STATE_FLUSH", OP_MEDIA_STATE_FLUSH, F_LEN_VAR, R_RCS, D_ALL,
2529*4882a593Smuzhiyun 0, 16, NULL},
2530*4882a593Smuzhiyun
2531*4882a593Smuzhiyun {"MEDIA_POOL_STATE", OP_MEDIA_POOL_STATE, F_LEN_VAR, R_RCS, D_ALL,
2532*4882a593Smuzhiyun 0, 16, NULL},
2533*4882a593Smuzhiyun
2534*4882a593Smuzhiyun {"MEDIA_OBJECT", OP_MEDIA_OBJECT, F_LEN_VAR, R_RCS, D_ALL, 0, 16, NULL},
2535*4882a593Smuzhiyun
2536*4882a593Smuzhiyun {"MEDIA_CURBE_LOAD", OP_MEDIA_CURBE_LOAD, F_LEN_VAR, R_RCS, D_ALL,
2537*4882a593Smuzhiyun 0, 16, NULL},
2538*4882a593Smuzhiyun
2539*4882a593Smuzhiyun {"MEDIA_OBJECT_PRT", OP_MEDIA_OBJECT_PRT, F_LEN_VAR, R_RCS, D_ALL,
2540*4882a593Smuzhiyun 0, 16, NULL},
2541*4882a593Smuzhiyun
2542*4882a593Smuzhiyun {"MEDIA_OBJECT_WALKER", OP_MEDIA_OBJECT_WALKER, F_LEN_VAR, R_RCS, D_ALL,
2543*4882a593Smuzhiyun 0, 16, NULL},
2544*4882a593Smuzhiyun
2545*4882a593Smuzhiyun {"GPGPU_WALKER", OP_GPGPU_WALKER, F_LEN_VAR, R_RCS, D_ALL,
2546*4882a593Smuzhiyun 0, 8, NULL},
2547*4882a593Smuzhiyun
2548*4882a593Smuzhiyun {"MEDIA_VFE_STATE", OP_MEDIA_VFE_STATE, F_LEN_VAR, R_RCS, D_ALL, 0, 16,
2549*4882a593Smuzhiyun NULL},
2550*4882a593Smuzhiyun
2551*4882a593Smuzhiyun {"3DSTATE_VF_STATISTICS_GM45", OP_3DSTATE_VF_STATISTICS_GM45,
2552*4882a593Smuzhiyun F_LEN_CONST, R_ALL, D_ALL, 0, 1, NULL},
2553*4882a593Smuzhiyun
2554*4882a593Smuzhiyun {"MFX_PIPE_MODE_SELECT", OP_MFX_PIPE_MODE_SELECT, F_LEN_VAR,
2555*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2556*4882a593Smuzhiyun
2557*4882a593Smuzhiyun {"MFX_SURFACE_STATE", OP_MFX_SURFACE_STATE, F_LEN_VAR,
2558*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2559*4882a593Smuzhiyun
2560*4882a593Smuzhiyun {"MFX_PIPE_BUF_ADDR_STATE", OP_MFX_PIPE_BUF_ADDR_STATE, F_LEN_VAR,
2561*4882a593Smuzhiyun R_VCS, D_BDW_PLUS, 0, 12, NULL},
2562*4882a593Smuzhiyun
2563*4882a593Smuzhiyun {"MFX_IND_OBJ_BASE_ADDR_STATE", OP_MFX_IND_OBJ_BASE_ADDR_STATE,
2564*4882a593Smuzhiyun F_LEN_VAR, R_VCS, D_BDW_PLUS, 0, 12, NULL},
2565*4882a593Smuzhiyun
2566*4882a593Smuzhiyun {"MFX_BSP_BUF_BASE_ADDR_STATE", OP_MFX_BSP_BUF_BASE_ADDR_STATE,
2567*4882a593Smuzhiyun F_LEN_VAR, R_VCS, D_BDW_PLUS, ADDR_FIX_3(1, 3, 5), 12, NULL},
2568*4882a593Smuzhiyun
2569*4882a593Smuzhiyun {"OP_2_0_0_5", OP_2_0_0_5, F_LEN_VAR, R_VCS, D_BDW_PLUS, 0, 12, NULL},
2570*4882a593Smuzhiyun
2571*4882a593Smuzhiyun {"MFX_STATE_POINTER", OP_MFX_STATE_POINTER, F_LEN_VAR,
2572*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2573*4882a593Smuzhiyun
2574*4882a593Smuzhiyun {"MFX_QM_STATE", OP_MFX_QM_STATE, F_LEN_VAR,
2575*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2576*4882a593Smuzhiyun
2577*4882a593Smuzhiyun {"MFX_FQM_STATE", OP_MFX_FQM_STATE, F_LEN_VAR,
2578*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2579*4882a593Smuzhiyun
2580*4882a593Smuzhiyun {"MFX_PAK_INSERT_OBJECT", OP_MFX_PAK_INSERT_OBJECT, F_LEN_VAR,
2581*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2582*4882a593Smuzhiyun
2583*4882a593Smuzhiyun {"MFX_STITCH_OBJECT", OP_MFX_STITCH_OBJECT, F_LEN_VAR,
2584*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2585*4882a593Smuzhiyun
2586*4882a593Smuzhiyun {"MFD_IT_OBJECT", OP_MFD_IT_OBJECT, F_LEN_VAR,
2587*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2588*4882a593Smuzhiyun
2589*4882a593Smuzhiyun {"MFX_WAIT", OP_MFX_WAIT, F_LEN_VAR,
2590*4882a593Smuzhiyun R_VCS, D_ALL, 0, 6, NULL},
2591*4882a593Smuzhiyun
2592*4882a593Smuzhiyun {"MFX_AVC_IMG_STATE", OP_MFX_AVC_IMG_STATE, F_LEN_VAR,
2593*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2594*4882a593Smuzhiyun
2595*4882a593Smuzhiyun {"MFX_AVC_QM_STATE", OP_MFX_AVC_QM_STATE, F_LEN_VAR,
2596*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2597*4882a593Smuzhiyun
2598*4882a593Smuzhiyun {"MFX_AVC_DIRECTMODE_STATE", OP_MFX_AVC_DIRECTMODE_STATE, F_LEN_VAR,
2599*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2600*4882a593Smuzhiyun
2601*4882a593Smuzhiyun {"MFX_AVC_SLICE_STATE", OP_MFX_AVC_SLICE_STATE, F_LEN_VAR,
2602*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2603*4882a593Smuzhiyun
2604*4882a593Smuzhiyun {"MFX_AVC_REF_IDX_STATE", OP_MFX_AVC_REF_IDX_STATE, F_LEN_VAR,
2605*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2606*4882a593Smuzhiyun
2607*4882a593Smuzhiyun {"MFX_AVC_WEIGHTOFFSET_STATE", OP_MFX_AVC_WEIGHTOFFSET_STATE, F_LEN_VAR,
2608*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2609*4882a593Smuzhiyun
2610*4882a593Smuzhiyun {"MFD_AVC_PICID_STATE", OP_MFD_AVC_PICID_STATE, F_LEN_VAR,
2611*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2612*4882a593Smuzhiyun {"MFD_AVC_DPB_STATE", OP_MFD_AVC_DPB_STATE, F_LEN_VAR,
2613*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2614*4882a593Smuzhiyun
2615*4882a593Smuzhiyun {"MFD_AVC_BSD_OBJECT", OP_MFD_AVC_BSD_OBJECT, F_LEN_VAR,
2616*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2617*4882a593Smuzhiyun
2618*4882a593Smuzhiyun {"MFD_AVC_SLICEADDR", OP_MFD_AVC_SLICEADDR, F_LEN_VAR,
2619*4882a593Smuzhiyun R_VCS, D_ALL, ADDR_FIX_1(2), 12, NULL},
2620*4882a593Smuzhiyun
2621*4882a593Smuzhiyun {"MFC_AVC_PAK_OBJECT", OP_MFC_AVC_PAK_OBJECT, F_LEN_VAR,
2622*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2623*4882a593Smuzhiyun
2624*4882a593Smuzhiyun {"MFX_VC1_PRED_PIPE_STATE", OP_MFX_VC1_PRED_PIPE_STATE, F_LEN_VAR,
2625*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2626*4882a593Smuzhiyun
2627*4882a593Smuzhiyun {"MFX_VC1_DIRECTMODE_STATE", OP_MFX_VC1_DIRECTMODE_STATE, F_LEN_VAR,
2628*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2629*4882a593Smuzhiyun
2630*4882a593Smuzhiyun {"MFD_VC1_SHORT_PIC_STATE", OP_MFD_VC1_SHORT_PIC_STATE, F_LEN_VAR,
2631*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2632*4882a593Smuzhiyun
2633*4882a593Smuzhiyun {"MFD_VC1_LONG_PIC_STATE", OP_MFD_VC1_LONG_PIC_STATE, F_LEN_VAR,
2634*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2635*4882a593Smuzhiyun
2636*4882a593Smuzhiyun {"MFD_VC1_BSD_OBJECT", OP_MFD_VC1_BSD_OBJECT, F_LEN_VAR,
2637*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2638*4882a593Smuzhiyun
2639*4882a593Smuzhiyun {"MFC_MPEG2_SLICEGROUP_STATE", OP_MFC_MPEG2_SLICEGROUP_STATE, F_LEN_VAR,
2640*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2641*4882a593Smuzhiyun
2642*4882a593Smuzhiyun {"MFC_MPEG2_PAK_OBJECT", OP_MFC_MPEG2_PAK_OBJECT, F_LEN_VAR,
2643*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2644*4882a593Smuzhiyun
2645*4882a593Smuzhiyun {"MFX_MPEG2_PIC_STATE", OP_MFX_MPEG2_PIC_STATE, F_LEN_VAR,
2646*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2647*4882a593Smuzhiyun
2648*4882a593Smuzhiyun {"MFX_MPEG2_QM_STATE", OP_MFX_MPEG2_QM_STATE, F_LEN_VAR,
2649*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2650*4882a593Smuzhiyun
2651*4882a593Smuzhiyun {"MFD_MPEG2_BSD_OBJECT", OP_MFD_MPEG2_BSD_OBJECT, F_LEN_VAR,
2652*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2653*4882a593Smuzhiyun
2654*4882a593Smuzhiyun {"MFX_2_6_0_0", OP_MFX_2_6_0_0, F_LEN_VAR, R_VCS, D_ALL,
2655*4882a593Smuzhiyun 0, 16, NULL},
2656*4882a593Smuzhiyun
2657*4882a593Smuzhiyun {"MFX_2_6_0_9", OP_MFX_2_6_0_9, F_LEN_VAR, R_VCS, D_ALL, 0, 16, NULL},
2658*4882a593Smuzhiyun
2659*4882a593Smuzhiyun {"MFX_2_6_0_8", OP_MFX_2_6_0_8, F_LEN_VAR, R_VCS, D_ALL, 0, 16, NULL},
2660*4882a593Smuzhiyun
2661*4882a593Smuzhiyun {"MFX_JPEG_PIC_STATE", OP_MFX_JPEG_PIC_STATE, F_LEN_VAR,
2662*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2663*4882a593Smuzhiyun
2664*4882a593Smuzhiyun {"MFX_JPEG_HUFF_TABLE_STATE", OP_MFX_JPEG_HUFF_TABLE_STATE, F_LEN_VAR,
2665*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2666*4882a593Smuzhiyun
2667*4882a593Smuzhiyun {"MFD_JPEG_BSD_OBJECT", OP_MFD_JPEG_BSD_OBJECT, F_LEN_VAR,
2668*4882a593Smuzhiyun R_VCS, D_ALL, 0, 12, NULL},
2669*4882a593Smuzhiyun
2670*4882a593Smuzhiyun {"VEBOX_STATE", OP_VEB_STATE, F_LEN_VAR, R_VECS, D_ALL, 0, 12, NULL},
2671*4882a593Smuzhiyun
2672*4882a593Smuzhiyun {"VEBOX_SURFACE_STATE", OP_VEB_SURFACE_STATE, F_LEN_VAR, R_VECS, D_ALL,
2673*4882a593Smuzhiyun 0, 12, NULL},
2674*4882a593Smuzhiyun
2675*4882a593Smuzhiyun {"VEB_DI_IECP", OP_VEB_DNDI_IECP_STATE, F_LEN_VAR, R_VECS, D_BDW_PLUS,
2676*4882a593Smuzhiyun 0, 12, NULL},
2677*4882a593Smuzhiyun };
2678*4882a593Smuzhiyun
add_cmd_entry(struct intel_gvt * gvt,struct cmd_entry * e)2679*4882a593Smuzhiyun static void add_cmd_entry(struct intel_gvt *gvt, struct cmd_entry *e)
2680*4882a593Smuzhiyun {
2681*4882a593Smuzhiyun hash_add(gvt->cmd_table, &e->hlist, e->info->opcode);
2682*4882a593Smuzhiyun }
2683*4882a593Smuzhiyun
2684*4882a593Smuzhiyun /* call the cmd handler, and advance ip */
cmd_parser_exec(struct parser_exec_state * s)2685*4882a593Smuzhiyun static int cmd_parser_exec(struct parser_exec_state *s)
2686*4882a593Smuzhiyun {
2687*4882a593Smuzhiyun struct intel_vgpu *vgpu = s->vgpu;
2688*4882a593Smuzhiyun const struct cmd_info *info;
2689*4882a593Smuzhiyun u32 cmd;
2690*4882a593Smuzhiyun int ret = 0;
2691*4882a593Smuzhiyun
2692*4882a593Smuzhiyun cmd = cmd_val(s, 0);
2693*4882a593Smuzhiyun
2694*4882a593Smuzhiyun /* fastpath for MI_NOOP */
2695*4882a593Smuzhiyun if (cmd == MI_NOOP)
2696*4882a593Smuzhiyun info = &cmd_info[mi_noop_index];
2697*4882a593Smuzhiyun else
2698*4882a593Smuzhiyun info = get_cmd_info(s->vgpu->gvt, cmd, s->engine);
2699*4882a593Smuzhiyun
2700*4882a593Smuzhiyun if (info == NULL) {
2701*4882a593Smuzhiyun gvt_vgpu_err("unknown cmd 0x%x, opcode=0x%x, addr_type=%s, ring %s, workload=%p\n",
2702*4882a593Smuzhiyun cmd, get_opcode(cmd, s->engine),
2703*4882a593Smuzhiyun repr_addr_type(s->buf_addr_type),
2704*4882a593Smuzhiyun s->engine->name, s->workload);
2705*4882a593Smuzhiyun return -EBADRQC;
2706*4882a593Smuzhiyun }
2707*4882a593Smuzhiyun
2708*4882a593Smuzhiyun s->info = info;
2709*4882a593Smuzhiyun
2710*4882a593Smuzhiyun trace_gvt_command(vgpu->id, s->engine->id, s->ip_gma, s->ip_va,
2711*4882a593Smuzhiyun cmd_length(s), s->buf_type, s->buf_addr_type,
2712*4882a593Smuzhiyun s->workload, info->name);
2713*4882a593Smuzhiyun
2714*4882a593Smuzhiyun if ((info->flag & F_LEN_MASK) == F_LEN_VAR_FIXED) {
2715*4882a593Smuzhiyun ret = gvt_check_valid_cmd_length(cmd_length(s),
2716*4882a593Smuzhiyun info->valid_len);
2717*4882a593Smuzhiyun if (ret)
2718*4882a593Smuzhiyun return ret;
2719*4882a593Smuzhiyun }
2720*4882a593Smuzhiyun
2721*4882a593Smuzhiyun if (info->handler) {
2722*4882a593Smuzhiyun ret = info->handler(s);
2723*4882a593Smuzhiyun if (ret < 0) {
2724*4882a593Smuzhiyun gvt_vgpu_err("%s handler error\n", info->name);
2725*4882a593Smuzhiyun return ret;
2726*4882a593Smuzhiyun }
2727*4882a593Smuzhiyun }
2728*4882a593Smuzhiyun
2729*4882a593Smuzhiyun if (!(info->flag & F_IP_ADVANCE_CUSTOM)) {
2730*4882a593Smuzhiyun ret = cmd_advance_default(s);
2731*4882a593Smuzhiyun if (ret) {
2732*4882a593Smuzhiyun gvt_vgpu_err("%s IP advance error\n", info->name);
2733*4882a593Smuzhiyun return ret;
2734*4882a593Smuzhiyun }
2735*4882a593Smuzhiyun }
2736*4882a593Smuzhiyun return 0;
2737*4882a593Smuzhiyun }
2738*4882a593Smuzhiyun
gma_out_of_range(unsigned long gma,unsigned long gma_head,unsigned int gma_tail)2739*4882a593Smuzhiyun static inline bool gma_out_of_range(unsigned long gma,
2740*4882a593Smuzhiyun unsigned long gma_head, unsigned int gma_tail)
2741*4882a593Smuzhiyun {
2742*4882a593Smuzhiyun if (gma_tail >= gma_head)
2743*4882a593Smuzhiyun return (gma < gma_head) || (gma > gma_tail);
2744*4882a593Smuzhiyun else
2745*4882a593Smuzhiyun return (gma > gma_tail) && (gma < gma_head);
2746*4882a593Smuzhiyun }
2747*4882a593Smuzhiyun
2748*4882a593Smuzhiyun /* Keep the consistent return type, e.g EBADRQC for unknown
2749*4882a593Smuzhiyun * cmd, EFAULT for invalid address, EPERM for nonpriv. later
2750*4882a593Smuzhiyun * works as the input of VM healthy status.
2751*4882a593Smuzhiyun */
command_scan(struct parser_exec_state * s,unsigned long rb_head,unsigned long rb_tail,unsigned long rb_start,unsigned long rb_len)2752*4882a593Smuzhiyun static int command_scan(struct parser_exec_state *s,
2753*4882a593Smuzhiyun unsigned long rb_head, unsigned long rb_tail,
2754*4882a593Smuzhiyun unsigned long rb_start, unsigned long rb_len)
2755*4882a593Smuzhiyun {
2756*4882a593Smuzhiyun
2757*4882a593Smuzhiyun unsigned long gma_head, gma_tail, gma_bottom;
2758*4882a593Smuzhiyun int ret = 0;
2759*4882a593Smuzhiyun struct intel_vgpu *vgpu = s->vgpu;
2760*4882a593Smuzhiyun
2761*4882a593Smuzhiyun gma_head = rb_start + rb_head;
2762*4882a593Smuzhiyun gma_tail = rb_start + rb_tail;
2763*4882a593Smuzhiyun gma_bottom = rb_start + rb_len;
2764*4882a593Smuzhiyun
2765*4882a593Smuzhiyun while (s->ip_gma != gma_tail) {
2766*4882a593Smuzhiyun if (s->buf_type == RING_BUFFER_INSTRUCTION) {
2767*4882a593Smuzhiyun if (!(s->ip_gma >= rb_start) ||
2768*4882a593Smuzhiyun !(s->ip_gma < gma_bottom)) {
2769*4882a593Smuzhiyun gvt_vgpu_err("ip_gma %lx out of ring scope."
2770*4882a593Smuzhiyun "(base:0x%lx, bottom: 0x%lx)\n",
2771*4882a593Smuzhiyun s->ip_gma, rb_start,
2772*4882a593Smuzhiyun gma_bottom);
2773*4882a593Smuzhiyun parser_exec_state_dump(s);
2774*4882a593Smuzhiyun return -EFAULT;
2775*4882a593Smuzhiyun }
2776*4882a593Smuzhiyun if (gma_out_of_range(s->ip_gma, gma_head, gma_tail)) {
2777*4882a593Smuzhiyun gvt_vgpu_err("ip_gma %lx out of range."
2778*4882a593Smuzhiyun "base 0x%lx head 0x%lx tail 0x%lx\n",
2779*4882a593Smuzhiyun s->ip_gma, rb_start,
2780*4882a593Smuzhiyun rb_head, rb_tail);
2781*4882a593Smuzhiyun parser_exec_state_dump(s);
2782*4882a593Smuzhiyun break;
2783*4882a593Smuzhiyun }
2784*4882a593Smuzhiyun }
2785*4882a593Smuzhiyun ret = cmd_parser_exec(s);
2786*4882a593Smuzhiyun if (ret) {
2787*4882a593Smuzhiyun gvt_vgpu_err("cmd parser error\n");
2788*4882a593Smuzhiyun parser_exec_state_dump(s);
2789*4882a593Smuzhiyun break;
2790*4882a593Smuzhiyun }
2791*4882a593Smuzhiyun }
2792*4882a593Smuzhiyun
2793*4882a593Smuzhiyun return ret;
2794*4882a593Smuzhiyun }
2795*4882a593Smuzhiyun
scan_workload(struct intel_vgpu_workload * workload)2796*4882a593Smuzhiyun static int scan_workload(struct intel_vgpu_workload *workload)
2797*4882a593Smuzhiyun {
2798*4882a593Smuzhiyun unsigned long gma_head, gma_tail, gma_bottom;
2799*4882a593Smuzhiyun struct parser_exec_state s;
2800*4882a593Smuzhiyun int ret = 0;
2801*4882a593Smuzhiyun
2802*4882a593Smuzhiyun /* ring base is page aligned */
2803*4882a593Smuzhiyun if (WARN_ON(!IS_ALIGNED(workload->rb_start, I915_GTT_PAGE_SIZE)))
2804*4882a593Smuzhiyun return -EINVAL;
2805*4882a593Smuzhiyun
2806*4882a593Smuzhiyun gma_head = workload->rb_start + workload->rb_head;
2807*4882a593Smuzhiyun gma_tail = workload->rb_start + workload->rb_tail;
2808*4882a593Smuzhiyun gma_bottom = workload->rb_start + _RING_CTL_BUF_SIZE(workload->rb_ctl);
2809*4882a593Smuzhiyun
2810*4882a593Smuzhiyun s.buf_type = RING_BUFFER_INSTRUCTION;
2811*4882a593Smuzhiyun s.buf_addr_type = GTT_BUFFER;
2812*4882a593Smuzhiyun s.vgpu = workload->vgpu;
2813*4882a593Smuzhiyun s.engine = workload->engine;
2814*4882a593Smuzhiyun s.ring_start = workload->rb_start;
2815*4882a593Smuzhiyun s.ring_size = _RING_CTL_BUF_SIZE(workload->rb_ctl);
2816*4882a593Smuzhiyun s.ring_head = gma_head;
2817*4882a593Smuzhiyun s.ring_tail = gma_tail;
2818*4882a593Smuzhiyun s.rb_va = workload->shadow_ring_buffer_va;
2819*4882a593Smuzhiyun s.workload = workload;
2820*4882a593Smuzhiyun s.is_ctx_wa = false;
2821*4882a593Smuzhiyun
2822*4882a593Smuzhiyun if (bypass_scan_mask & workload->engine->mask || gma_head == gma_tail)
2823*4882a593Smuzhiyun return 0;
2824*4882a593Smuzhiyun
2825*4882a593Smuzhiyun ret = ip_gma_set(&s, gma_head);
2826*4882a593Smuzhiyun if (ret)
2827*4882a593Smuzhiyun goto out;
2828*4882a593Smuzhiyun
2829*4882a593Smuzhiyun ret = command_scan(&s, workload->rb_head, workload->rb_tail,
2830*4882a593Smuzhiyun workload->rb_start, _RING_CTL_BUF_SIZE(workload->rb_ctl));
2831*4882a593Smuzhiyun
2832*4882a593Smuzhiyun out:
2833*4882a593Smuzhiyun return ret;
2834*4882a593Smuzhiyun }
2835*4882a593Smuzhiyun
scan_wa_ctx(struct intel_shadow_wa_ctx * wa_ctx)2836*4882a593Smuzhiyun static int scan_wa_ctx(struct intel_shadow_wa_ctx *wa_ctx)
2837*4882a593Smuzhiyun {
2838*4882a593Smuzhiyun
2839*4882a593Smuzhiyun unsigned long gma_head, gma_tail, gma_bottom, ring_size, ring_tail;
2840*4882a593Smuzhiyun struct parser_exec_state s;
2841*4882a593Smuzhiyun int ret = 0;
2842*4882a593Smuzhiyun struct intel_vgpu_workload *workload = container_of(wa_ctx,
2843*4882a593Smuzhiyun struct intel_vgpu_workload,
2844*4882a593Smuzhiyun wa_ctx);
2845*4882a593Smuzhiyun
2846*4882a593Smuzhiyun /* ring base is page aligned */
2847*4882a593Smuzhiyun if (WARN_ON(!IS_ALIGNED(wa_ctx->indirect_ctx.guest_gma,
2848*4882a593Smuzhiyun I915_GTT_PAGE_SIZE)))
2849*4882a593Smuzhiyun return -EINVAL;
2850*4882a593Smuzhiyun
2851*4882a593Smuzhiyun ring_tail = wa_ctx->indirect_ctx.size + 3 * sizeof(u32);
2852*4882a593Smuzhiyun ring_size = round_up(wa_ctx->indirect_ctx.size + CACHELINE_BYTES,
2853*4882a593Smuzhiyun PAGE_SIZE);
2854*4882a593Smuzhiyun gma_head = wa_ctx->indirect_ctx.guest_gma;
2855*4882a593Smuzhiyun gma_tail = wa_ctx->indirect_ctx.guest_gma + ring_tail;
2856*4882a593Smuzhiyun gma_bottom = wa_ctx->indirect_ctx.guest_gma + ring_size;
2857*4882a593Smuzhiyun
2858*4882a593Smuzhiyun s.buf_type = RING_BUFFER_INSTRUCTION;
2859*4882a593Smuzhiyun s.buf_addr_type = GTT_BUFFER;
2860*4882a593Smuzhiyun s.vgpu = workload->vgpu;
2861*4882a593Smuzhiyun s.engine = workload->engine;
2862*4882a593Smuzhiyun s.ring_start = wa_ctx->indirect_ctx.guest_gma;
2863*4882a593Smuzhiyun s.ring_size = ring_size;
2864*4882a593Smuzhiyun s.ring_head = gma_head;
2865*4882a593Smuzhiyun s.ring_tail = gma_tail;
2866*4882a593Smuzhiyun s.rb_va = wa_ctx->indirect_ctx.shadow_va;
2867*4882a593Smuzhiyun s.workload = workload;
2868*4882a593Smuzhiyun s.is_ctx_wa = true;
2869*4882a593Smuzhiyun
2870*4882a593Smuzhiyun ret = ip_gma_set(&s, gma_head);
2871*4882a593Smuzhiyun if (ret)
2872*4882a593Smuzhiyun goto out;
2873*4882a593Smuzhiyun
2874*4882a593Smuzhiyun ret = command_scan(&s, 0, ring_tail,
2875*4882a593Smuzhiyun wa_ctx->indirect_ctx.guest_gma, ring_size);
2876*4882a593Smuzhiyun out:
2877*4882a593Smuzhiyun return ret;
2878*4882a593Smuzhiyun }
2879*4882a593Smuzhiyun
shadow_workload_ring_buffer(struct intel_vgpu_workload * workload)2880*4882a593Smuzhiyun static int shadow_workload_ring_buffer(struct intel_vgpu_workload *workload)
2881*4882a593Smuzhiyun {
2882*4882a593Smuzhiyun struct intel_vgpu *vgpu = workload->vgpu;
2883*4882a593Smuzhiyun struct intel_vgpu_submission *s = &vgpu->submission;
2884*4882a593Smuzhiyun unsigned long gma_head, gma_tail, gma_top, guest_rb_size;
2885*4882a593Smuzhiyun void *shadow_ring_buffer_va;
2886*4882a593Smuzhiyun int ret;
2887*4882a593Smuzhiyun
2888*4882a593Smuzhiyun guest_rb_size = _RING_CTL_BUF_SIZE(workload->rb_ctl);
2889*4882a593Smuzhiyun
2890*4882a593Smuzhiyun /* calculate workload ring buffer size */
2891*4882a593Smuzhiyun workload->rb_len = (workload->rb_tail + guest_rb_size -
2892*4882a593Smuzhiyun workload->rb_head) % guest_rb_size;
2893*4882a593Smuzhiyun
2894*4882a593Smuzhiyun gma_head = workload->rb_start + workload->rb_head;
2895*4882a593Smuzhiyun gma_tail = workload->rb_start + workload->rb_tail;
2896*4882a593Smuzhiyun gma_top = workload->rb_start + guest_rb_size;
2897*4882a593Smuzhiyun
2898*4882a593Smuzhiyun if (workload->rb_len > s->ring_scan_buffer_size[workload->engine->id]) {
2899*4882a593Smuzhiyun void *p;
2900*4882a593Smuzhiyun
2901*4882a593Smuzhiyun /* realloc the new ring buffer if needed */
2902*4882a593Smuzhiyun p = krealloc(s->ring_scan_buffer[workload->engine->id],
2903*4882a593Smuzhiyun workload->rb_len, GFP_KERNEL);
2904*4882a593Smuzhiyun if (!p) {
2905*4882a593Smuzhiyun gvt_vgpu_err("fail to re-alloc ring scan buffer\n");
2906*4882a593Smuzhiyun return -ENOMEM;
2907*4882a593Smuzhiyun }
2908*4882a593Smuzhiyun s->ring_scan_buffer[workload->engine->id] = p;
2909*4882a593Smuzhiyun s->ring_scan_buffer_size[workload->engine->id] = workload->rb_len;
2910*4882a593Smuzhiyun }
2911*4882a593Smuzhiyun
2912*4882a593Smuzhiyun shadow_ring_buffer_va = s->ring_scan_buffer[workload->engine->id];
2913*4882a593Smuzhiyun
2914*4882a593Smuzhiyun /* get shadow ring buffer va */
2915*4882a593Smuzhiyun workload->shadow_ring_buffer_va = shadow_ring_buffer_va;
2916*4882a593Smuzhiyun
2917*4882a593Smuzhiyun /* head > tail --> copy head <-> top */
2918*4882a593Smuzhiyun if (gma_head > gma_tail) {
2919*4882a593Smuzhiyun ret = copy_gma_to_hva(vgpu, vgpu->gtt.ggtt_mm,
2920*4882a593Smuzhiyun gma_head, gma_top, shadow_ring_buffer_va);
2921*4882a593Smuzhiyun if (ret < 0) {
2922*4882a593Smuzhiyun gvt_vgpu_err("fail to copy guest ring buffer\n");
2923*4882a593Smuzhiyun return ret;
2924*4882a593Smuzhiyun }
2925*4882a593Smuzhiyun shadow_ring_buffer_va += ret;
2926*4882a593Smuzhiyun gma_head = workload->rb_start;
2927*4882a593Smuzhiyun }
2928*4882a593Smuzhiyun
2929*4882a593Smuzhiyun /* copy head or start <-> tail */
2930*4882a593Smuzhiyun ret = copy_gma_to_hva(vgpu, vgpu->gtt.ggtt_mm, gma_head, gma_tail,
2931*4882a593Smuzhiyun shadow_ring_buffer_va);
2932*4882a593Smuzhiyun if (ret < 0) {
2933*4882a593Smuzhiyun gvt_vgpu_err("fail to copy guest ring buffer\n");
2934*4882a593Smuzhiyun return ret;
2935*4882a593Smuzhiyun }
2936*4882a593Smuzhiyun return 0;
2937*4882a593Smuzhiyun }
2938*4882a593Smuzhiyun
intel_gvt_scan_and_shadow_ringbuffer(struct intel_vgpu_workload * workload)2939*4882a593Smuzhiyun int intel_gvt_scan_and_shadow_ringbuffer(struct intel_vgpu_workload *workload)
2940*4882a593Smuzhiyun {
2941*4882a593Smuzhiyun int ret;
2942*4882a593Smuzhiyun struct intel_vgpu *vgpu = workload->vgpu;
2943*4882a593Smuzhiyun
2944*4882a593Smuzhiyun ret = shadow_workload_ring_buffer(workload);
2945*4882a593Smuzhiyun if (ret) {
2946*4882a593Smuzhiyun gvt_vgpu_err("fail to shadow workload ring_buffer\n");
2947*4882a593Smuzhiyun return ret;
2948*4882a593Smuzhiyun }
2949*4882a593Smuzhiyun
2950*4882a593Smuzhiyun ret = scan_workload(workload);
2951*4882a593Smuzhiyun if (ret) {
2952*4882a593Smuzhiyun gvt_vgpu_err("scan workload error\n");
2953*4882a593Smuzhiyun return ret;
2954*4882a593Smuzhiyun }
2955*4882a593Smuzhiyun return 0;
2956*4882a593Smuzhiyun }
2957*4882a593Smuzhiyun
shadow_indirect_ctx(struct intel_shadow_wa_ctx * wa_ctx)2958*4882a593Smuzhiyun static int shadow_indirect_ctx(struct intel_shadow_wa_ctx *wa_ctx)
2959*4882a593Smuzhiyun {
2960*4882a593Smuzhiyun int ctx_size = wa_ctx->indirect_ctx.size;
2961*4882a593Smuzhiyun unsigned long guest_gma = wa_ctx->indirect_ctx.guest_gma;
2962*4882a593Smuzhiyun struct intel_vgpu_workload *workload = container_of(wa_ctx,
2963*4882a593Smuzhiyun struct intel_vgpu_workload,
2964*4882a593Smuzhiyun wa_ctx);
2965*4882a593Smuzhiyun struct intel_vgpu *vgpu = workload->vgpu;
2966*4882a593Smuzhiyun struct drm_i915_gem_object *obj;
2967*4882a593Smuzhiyun int ret = 0;
2968*4882a593Smuzhiyun void *map;
2969*4882a593Smuzhiyun
2970*4882a593Smuzhiyun obj = i915_gem_object_create_shmem(workload->engine->i915,
2971*4882a593Smuzhiyun roundup(ctx_size + CACHELINE_BYTES,
2972*4882a593Smuzhiyun PAGE_SIZE));
2973*4882a593Smuzhiyun if (IS_ERR(obj))
2974*4882a593Smuzhiyun return PTR_ERR(obj);
2975*4882a593Smuzhiyun
2976*4882a593Smuzhiyun /* get the va of the shadow batch buffer */
2977*4882a593Smuzhiyun map = i915_gem_object_pin_map(obj, I915_MAP_WB);
2978*4882a593Smuzhiyun if (IS_ERR(map)) {
2979*4882a593Smuzhiyun gvt_vgpu_err("failed to vmap shadow indirect ctx\n");
2980*4882a593Smuzhiyun ret = PTR_ERR(map);
2981*4882a593Smuzhiyun goto put_obj;
2982*4882a593Smuzhiyun }
2983*4882a593Smuzhiyun
2984*4882a593Smuzhiyun i915_gem_object_lock(obj, NULL);
2985*4882a593Smuzhiyun ret = i915_gem_object_set_to_cpu_domain(obj, false);
2986*4882a593Smuzhiyun i915_gem_object_unlock(obj);
2987*4882a593Smuzhiyun if (ret) {
2988*4882a593Smuzhiyun gvt_vgpu_err("failed to set shadow indirect ctx to CPU\n");
2989*4882a593Smuzhiyun goto unmap_src;
2990*4882a593Smuzhiyun }
2991*4882a593Smuzhiyun
2992*4882a593Smuzhiyun ret = copy_gma_to_hva(workload->vgpu,
2993*4882a593Smuzhiyun workload->vgpu->gtt.ggtt_mm,
2994*4882a593Smuzhiyun guest_gma, guest_gma + ctx_size,
2995*4882a593Smuzhiyun map);
2996*4882a593Smuzhiyun if (ret < 0) {
2997*4882a593Smuzhiyun gvt_vgpu_err("fail to copy guest indirect ctx\n");
2998*4882a593Smuzhiyun goto unmap_src;
2999*4882a593Smuzhiyun }
3000*4882a593Smuzhiyun
3001*4882a593Smuzhiyun wa_ctx->indirect_ctx.obj = obj;
3002*4882a593Smuzhiyun wa_ctx->indirect_ctx.shadow_va = map;
3003*4882a593Smuzhiyun return 0;
3004*4882a593Smuzhiyun
3005*4882a593Smuzhiyun unmap_src:
3006*4882a593Smuzhiyun i915_gem_object_unpin_map(obj);
3007*4882a593Smuzhiyun put_obj:
3008*4882a593Smuzhiyun i915_gem_object_put(obj);
3009*4882a593Smuzhiyun return ret;
3010*4882a593Smuzhiyun }
3011*4882a593Smuzhiyun
combine_wa_ctx(struct intel_shadow_wa_ctx * wa_ctx)3012*4882a593Smuzhiyun static int combine_wa_ctx(struct intel_shadow_wa_ctx *wa_ctx)
3013*4882a593Smuzhiyun {
3014*4882a593Smuzhiyun u32 per_ctx_start[CACHELINE_DWORDS] = {0};
3015*4882a593Smuzhiyun unsigned char *bb_start_sva;
3016*4882a593Smuzhiyun
3017*4882a593Smuzhiyun if (!wa_ctx->per_ctx.valid)
3018*4882a593Smuzhiyun return 0;
3019*4882a593Smuzhiyun
3020*4882a593Smuzhiyun per_ctx_start[0] = 0x18800001;
3021*4882a593Smuzhiyun per_ctx_start[1] = wa_ctx->per_ctx.guest_gma;
3022*4882a593Smuzhiyun
3023*4882a593Smuzhiyun bb_start_sva = (unsigned char *)wa_ctx->indirect_ctx.shadow_va +
3024*4882a593Smuzhiyun wa_ctx->indirect_ctx.size;
3025*4882a593Smuzhiyun
3026*4882a593Smuzhiyun memcpy(bb_start_sva, per_ctx_start, CACHELINE_BYTES);
3027*4882a593Smuzhiyun
3028*4882a593Smuzhiyun return 0;
3029*4882a593Smuzhiyun }
3030*4882a593Smuzhiyun
intel_gvt_scan_and_shadow_wa_ctx(struct intel_shadow_wa_ctx * wa_ctx)3031*4882a593Smuzhiyun int intel_gvt_scan_and_shadow_wa_ctx(struct intel_shadow_wa_ctx *wa_ctx)
3032*4882a593Smuzhiyun {
3033*4882a593Smuzhiyun int ret;
3034*4882a593Smuzhiyun struct intel_vgpu_workload *workload = container_of(wa_ctx,
3035*4882a593Smuzhiyun struct intel_vgpu_workload,
3036*4882a593Smuzhiyun wa_ctx);
3037*4882a593Smuzhiyun struct intel_vgpu *vgpu = workload->vgpu;
3038*4882a593Smuzhiyun
3039*4882a593Smuzhiyun if (wa_ctx->indirect_ctx.size == 0)
3040*4882a593Smuzhiyun return 0;
3041*4882a593Smuzhiyun
3042*4882a593Smuzhiyun ret = shadow_indirect_ctx(wa_ctx);
3043*4882a593Smuzhiyun if (ret) {
3044*4882a593Smuzhiyun gvt_vgpu_err("fail to shadow indirect ctx\n");
3045*4882a593Smuzhiyun return ret;
3046*4882a593Smuzhiyun }
3047*4882a593Smuzhiyun
3048*4882a593Smuzhiyun combine_wa_ctx(wa_ctx);
3049*4882a593Smuzhiyun
3050*4882a593Smuzhiyun ret = scan_wa_ctx(wa_ctx);
3051*4882a593Smuzhiyun if (ret) {
3052*4882a593Smuzhiyun gvt_vgpu_err("scan wa ctx error\n");
3053*4882a593Smuzhiyun return ret;
3054*4882a593Smuzhiyun }
3055*4882a593Smuzhiyun
3056*4882a593Smuzhiyun return 0;
3057*4882a593Smuzhiyun }
3058*4882a593Smuzhiyun
init_cmd_table(struct intel_gvt * gvt)3059*4882a593Smuzhiyun static int init_cmd_table(struct intel_gvt *gvt)
3060*4882a593Smuzhiyun {
3061*4882a593Smuzhiyun unsigned int gen_type = intel_gvt_get_device_type(gvt);
3062*4882a593Smuzhiyun int i;
3063*4882a593Smuzhiyun
3064*4882a593Smuzhiyun for (i = 0; i < ARRAY_SIZE(cmd_info); i++) {
3065*4882a593Smuzhiyun struct cmd_entry *e;
3066*4882a593Smuzhiyun
3067*4882a593Smuzhiyun if (!(cmd_info[i].devices & gen_type))
3068*4882a593Smuzhiyun continue;
3069*4882a593Smuzhiyun
3070*4882a593Smuzhiyun e = kzalloc(sizeof(*e), GFP_KERNEL);
3071*4882a593Smuzhiyun if (!e)
3072*4882a593Smuzhiyun return -ENOMEM;
3073*4882a593Smuzhiyun
3074*4882a593Smuzhiyun e->info = &cmd_info[i];
3075*4882a593Smuzhiyun if (cmd_info[i].opcode == OP_MI_NOOP)
3076*4882a593Smuzhiyun mi_noop_index = i;
3077*4882a593Smuzhiyun
3078*4882a593Smuzhiyun INIT_HLIST_NODE(&e->hlist);
3079*4882a593Smuzhiyun add_cmd_entry(gvt, e);
3080*4882a593Smuzhiyun gvt_dbg_cmd("add %-30s op %04x flag %x devs %02x rings %02x\n",
3081*4882a593Smuzhiyun e->info->name, e->info->opcode, e->info->flag,
3082*4882a593Smuzhiyun e->info->devices, e->info->rings);
3083*4882a593Smuzhiyun }
3084*4882a593Smuzhiyun
3085*4882a593Smuzhiyun return 0;
3086*4882a593Smuzhiyun }
3087*4882a593Smuzhiyun
clean_cmd_table(struct intel_gvt * gvt)3088*4882a593Smuzhiyun static void clean_cmd_table(struct intel_gvt *gvt)
3089*4882a593Smuzhiyun {
3090*4882a593Smuzhiyun struct hlist_node *tmp;
3091*4882a593Smuzhiyun struct cmd_entry *e;
3092*4882a593Smuzhiyun int i;
3093*4882a593Smuzhiyun
3094*4882a593Smuzhiyun hash_for_each_safe(gvt->cmd_table, i, tmp, e, hlist)
3095*4882a593Smuzhiyun kfree(e);
3096*4882a593Smuzhiyun
3097*4882a593Smuzhiyun hash_init(gvt->cmd_table);
3098*4882a593Smuzhiyun }
3099*4882a593Smuzhiyun
intel_gvt_clean_cmd_parser(struct intel_gvt * gvt)3100*4882a593Smuzhiyun void intel_gvt_clean_cmd_parser(struct intel_gvt *gvt)
3101*4882a593Smuzhiyun {
3102*4882a593Smuzhiyun clean_cmd_table(gvt);
3103*4882a593Smuzhiyun }
3104*4882a593Smuzhiyun
intel_gvt_init_cmd_parser(struct intel_gvt * gvt)3105*4882a593Smuzhiyun int intel_gvt_init_cmd_parser(struct intel_gvt *gvt)
3106*4882a593Smuzhiyun {
3107*4882a593Smuzhiyun int ret;
3108*4882a593Smuzhiyun
3109*4882a593Smuzhiyun ret = init_cmd_table(gvt);
3110*4882a593Smuzhiyun if (ret) {
3111*4882a593Smuzhiyun intel_gvt_clean_cmd_parser(gvt);
3112*4882a593Smuzhiyun return ret;
3113*4882a593Smuzhiyun }
3114*4882a593Smuzhiyun return 0;
3115*4882a593Smuzhiyun }
3116