xref: /OK3568_Linux_fs/kernel/drivers/gpu/drm/amd/amdgpu/navi10_ih.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun /*
2*4882a593Smuzhiyun  * Copyright 2019 Advanced Micro Devices, Inc.
3*4882a593Smuzhiyun  *
4*4882a593Smuzhiyun  * Permission is hereby granted, free of charge, to any person obtaining a
5*4882a593Smuzhiyun  * copy of this software and associated documentation files (the "Software"),
6*4882a593Smuzhiyun  * to deal in the Software without restriction, including without limitation
7*4882a593Smuzhiyun  * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8*4882a593Smuzhiyun  * and/or sell copies of the Software, and to permit persons to whom the
9*4882a593Smuzhiyun  * Software is furnished to do so, subject to the following conditions:
10*4882a593Smuzhiyun  *
11*4882a593Smuzhiyun  * The above copyright notice and this permission notice shall be included in
12*4882a593Smuzhiyun  * all copies or substantial portions of the Software.
13*4882a593Smuzhiyun  *
14*4882a593Smuzhiyun  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15*4882a593Smuzhiyun  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16*4882a593Smuzhiyun  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT.  IN NO EVENT SHALL
17*4882a593Smuzhiyun  * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18*4882a593Smuzhiyun  * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19*4882a593Smuzhiyun  * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20*4882a593Smuzhiyun  * OTHER DEALINGS IN THE SOFTWARE.
21*4882a593Smuzhiyun  *
22*4882a593Smuzhiyun  */
23*4882a593Smuzhiyun 
24*4882a593Smuzhiyun #include <linux/pci.h>
25*4882a593Smuzhiyun 
26*4882a593Smuzhiyun #include "amdgpu.h"
27*4882a593Smuzhiyun #include "amdgpu_ih.h"
28*4882a593Smuzhiyun 
29*4882a593Smuzhiyun #include "oss/osssys_5_0_0_offset.h"
30*4882a593Smuzhiyun #include "oss/osssys_5_0_0_sh_mask.h"
31*4882a593Smuzhiyun 
32*4882a593Smuzhiyun #include "soc15_common.h"
33*4882a593Smuzhiyun #include "navi10_ih.h"
34*4882a593Smuzhiyun 
35*4882a593Smuzhiyun #define MAX_REARM_RETRY 10
36*4882a593Smuzhiyun 
37*4882a593Smuzhiyun #define mmIH_CHICKEN_Sienna_Cichlid                 0x018d
38*4882a593Smuzhiyun #define mmIH_CHICKEN_Sienna_Cichlid_BASE_IDX        0
39*4882a593Smuzhiyun 
40*4882a593Smuzhiyun static void navi10_ih_set_interrupt_funcs(struct amdgpu_device *adev);
41*4882a593Smuzhiyun 
42*4882a593Smuzhiyun /**
43*4882a593Smuzhiyun  * force_update_wptr_for_self_int - Force update the wptr for self interrupt
44*4882a593Smuzhiyun  *
45*4882a593Smuzhiyun  * @adev: amdgpu_device pointer
46*4882a593Smuzhiyun  * @threshold: threshold to trigger the wptr reporting
47*4882a593Smuzhiyun  * @timeout: timeout to trigger the wptr reporting
48*4882a593Smuzhiyun  * @enabled: Enable/disable timeout flush mechanism
49*4882a593Smuzhiyun  *
50*4882a593Smuzhiyun  * threshold input range: 0 ~ 15, default 0,
51*4882a593Smuzhiyun  * real_threshold = 2^threshold
52*4882a593Smuzhiyun  * timeout input range: 0 ~ 20, default 8,
53*4882a593Smuzhiyun  * real_timeout = (2^timeout) * 1024 / (socclk_freq)
54*4882a593Smuzhiyun  *
55*4882a593Smuzhiyun  * Force update wptr for self interrupt ( >= SIENNA_CICHLID).
56*4882a593Smuzhiyun  */
57*4882a593Smuzhiyun static void
force_update_wptr_for_self_int(struct amdgpu_device * adev,u32 threshold,u32 timeout,bool enabled)58*4882a593Smuzhiyun force_update_wptr_for_self_int(struct amdgpu_device *adev,
59*4882a593Smuzhiyun 			       u32 threshold, u32 timeout, bool enabled)
60*4882a593Smuzhiyun {
61*4882a593Smuzhiyun 	u32 ih_cntl, ih_rb_cntl;
62*4882a593Smuzhiyun 
63*4882a593Smuzhiyun 	if (adev->asic_type < CHIP_SIENNA_CICHLID)
64*4882a593Smuzhiyun 		return;
65*4882a593Smuzhiyun 
66*4882a593Smuzhiyun 	ih_cntl = RREG32_SOC15(OSSSYS, 0, mmIH_CNTL2);
67*4882a593Smuzhiyun 	ih_rb_cntl = RREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL_RING1);
68*4882a593Smuzhiyun 
69*4882a593Smuzhiyun 	ih_cntl = REG_SET_FIELD(ih_cntl, IH_CNTL2,
70*4882a593Smuzhiyun 				SELF_IV_FORCE_WPTR_UPDATE_TIMEOUT, timeout);
71*4882a593Smuzhiyun 	ih_cntl = REG_SET_FIELD(ih_cntl, IH_CNTL2,
72*4882a593Smuzhiyun 				SELF_IV_FORCE_WPTR_UPDATE_ENABLE, enabled);
73*4882a593Smuzhiyun 	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL_RING1,
74*4882a593Smuzhiyun 				   RB_USED_INT_THRESHOLD, threshold);
75*4882a593Smuzhiyun 
76*4882a593Smuzhiyun 	WREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL_RING1, ih_rb_cntl);
77*4882a593Smuzhiyun 	ih_rb_cntl = RREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL_RING2);
78*4882a593Smuzhiyun 	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL_RING2,
79*4882a593Smuzhiyun 				   RB_USED_INT_THRESHOLD, threshold);
80*4882a593Smuzhiyun 	WREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL_RING2, ih_rb_cntl);
81*4882a593Smuzhiyun 	WREG32_SOC15(OSSSYS, 0, mmIH_CNTL2, ih_cntl);
82*4882a593Smuzhiyun }
83*4882a593Smuzhiyun 
84*4882a593Smuzhiyun /**
85*4882a593Smuzhiyun  * navi10_ih_enable_interrupts - Enable the interrupt ring buffer
86*4882a593Smuzhiyun  *
87*4882a593Smuzhiyun  * @adev: amdgpu_device pointer
88*4882a593Smuzhiyun  *
89*4882a593Smuzhiyun  * Enable the interrupt ring buffer (NAVI10).
90*4882a593Smuzhiyun  */
navi10_ih_enable_interrupts(struct amdgpu_device * adev)91*4882a593Smuzhiyun static void navi10_ih_enable_interrupts(struct amdgpu_device *adev)
92*4882a593Smuzhiyun {
93*4882a593Smuzhiyun 	u32 ih_rb_cntl = RREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL);
94*4882a593Smuzhiyun 
95*4882a593Smuzhiyun 	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, RB_ENABLE, 1);
96*4882a593Smuzhiyun 	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, ENABLE_INTR, 1);
97*4882a593Smuzhiyun 	if (amdgpu_sriov_vf(adev) && adev->asic_type < CHIP_NAVI10) {
98*4882a593Smuzhiyun 		if (psp_reg_program(&adev->psp, PSP_REG_IH_RB_CNTL, ih_rb_cntl)) {
99*4882a593Smuzhiyun 			DRM_ERROR("PSP program IH_RB_CNTL failed!\n");
100*4882a593Smuzhiyun 			return;
101*4882a593Smuzhiyun 		}
102*4882a593Smuzhiyun 	} else {
103*4882a593Smuzhiyun 		WREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL, ih_rb_cntl);
104*4882a593Smuzhiyun 	}
105*4882a593Smuzhiyun 
106*4882a593Smuzhiyun 	adev->irq.ih.enabled = true;
107*4882a593Smuzhiyun 
108*4882a593Smuzhiyun 	if (adev->irq.ih1.ring_size) {
109*4882a593Smuzhiyun 		ih_rb_cntl = RREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL_RING1);
110*4882a593Smuzhiyun 		ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL_RING1,
111*4882a593Smuzhiyun 					   RB_ENABLE, 1);
112*4882a593Smuzhiyun 		if (amdgpu_sriov_vf(adev) && adev->asic_type < CHIP_NAVI10) {
113*4882a593Smuzhiyun 			if (psp_reg_program(&adev->psp, PSP_REG_IH_RB_CNTL_RING1,
114*4882a593Smuzhiyun 						ih_rb_cntl)) {
115*4882a593Smuzhiyun 				DRM_ERROR("program IH_RB_CNTL_RING1 failed!\n");
116*4882a593Smuzhiyun 				return;
117*4882a593Smuzhiyun 			}
118*4882a593Smuzhiyun 		} else {
119*4882a593Smuzhiyun 			WREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL_RING1, ih_rb_cntl);
120*4882a593Smuzhiyun 		}
121*4882a593Smuzhiyun 		adev->irq.ih1.enabled = true;
122*4882a593Smuzhiyun 	}
123*4882a593Smuzhiyun 
124*4882a593Smuzhiyun 	if (adev->irq.ih2.ring_size) {
125*4882a593Smuzhiyun 		ih_rb_cntl = RREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL_RING2);
126*4882a593Smuzhiyun 		ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL_RING2,
127*4882a593Smuzhiyun 					   RB_ENABLE, 1);
128*4882a593Smuzhiyun 		if (amdgpu_sriov_vf(adev) && adev->asic_type < CHIP_NAVI10) {
129*4882a593Smuzhiyun 			if (psp_reg_program(&adev->psp, PSP_REG_IH_RB_CNTL_RING2,
130*4882a593Smuzhiyun 						ih_rb_cntl)) {
131*4882a593Smuzhiyun 				DRM_ERROR("program IH_RB_CNTL_RING2 failed!\n");
132*4882a593Smuzhiyun 				return;
133*4882a593Smuzhiyun 			}
134*4882a593Smuzhiyun 		} else {
135*4882a593Smuzhiyun 			WREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL_RING2, ih_rb_cntl);
136*4882a593Smuzhiyun 		}
137*4882a593Smuzhiyun 		adev->irq.ih2.enabled = true;
138*4882a593Smuzhiyun 	}
139*4882a593Smuzhiyun }
140*4882a593Smuzhiyun 
141*4882a593Smuzhiyun /**
142*4882a593Smuzhiyun  * navi10_ih_disable_interrupts - Disable the interrupt ring buffer
143*4882a593Smuzhiyun  *
144*4882a593Smuzhiyun  * @adev: amdgpu_device pointer
145*4882a593Smuzhiyun  *
146*4882a593Smuzhiyun  * Disable the interrupt ring buffer (NAVI10).
147*4882a593Smuzhiyun  */
navi10_ih_disable_interrupts(struct amdgpu_device * adev)148*4882a593Smuzhiyun static void navi10_ih_disable_interrupts(struct amdgpu_device *adev)
149*4882a593Smuzhiyun {
150*4882a593Smuzhiyun 	u32 ih_rb_cntl = RREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL);
151*4882a593Smuzhiyun 
152*4882a593Smuzhiyun 	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, RB_ENABLE, 0);
153*4882a593Smuzhiyun 	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, ENABLE_INTR, 0);
154*4882a593Smuzhiyun 	if (amdgpu_sriov_vf(adev) && adev->asic_type < CHIP_NAVI10) {
155*4882a593Smuzhiyun 		if (psp_reg_program(&adev->psp, PSP_REG_IH_RB_CNTL, ih_rb_cntl)) {
156*4882a593Smuzhiyun 			DRM_ERROR("PSP program IH_RB_CNTL failed!\n");
157*4882a593Smuzhiyun 			return;
158*4882a593Smuzhiyun 		}
159*4882a593Smuzhiyun 	} else {
160*4882a593Smuzhiyun 		WREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL, ih_rb_cntl);
161*4882a593Smuzhiyun 	}
162*4882a593Smuzhiyun 
163*4882a593Smuzhiyun 	/* set rptr, wptr to 0 */
164*4882a593Smuzhiyun 	WREG32_SOC15(OSSSYS, 0, mmIH_RB_RPTR, 0);
165*4882a593Smuzhiyun 	WREG32_SOC15(OSSSYS, 0, mmIH_RB_WPTR, 0);
166*4882a593Smuzhiyun 	adev->irq.ih.enabled = false;
167*4882a593Smuzhiyun 	adev->irq.ih.rptr = 0;
168*4882a593Smuzhiyun 
169*4882a593Smuzhiyun 	if (adev->irq.ih1.ring_size) {
170*4882a593Smuzhiyun 		ih_rb_cntl = RREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL_RING1);
171*4882a593Smuzhiyun 		ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL_RING1,
172*4882a593Smuzhiyun 					   RB_ENABLE, 0);
173*4882a593Smuzhiyun 		if (amdgpu_sriov_vf(adev) && adev->asic_type < CHIP_NAVI10) {
174*4882a593Smuzhiyun 			if (psp_reg_program(&adev->psp, PSP_REG_IH_RB_CNTL_RING1,
175*4882a593Smuzhiyun 						ih_rb_cntl)) {
176*4882a593Smuzhiyun 				DRM_ERROR("program IH_RB_CNTL_RING1 failed!\n");
177*4882a593Smuzhiyun 				return;
178*4882a593Smuzhiyun 			}
179*4882a593Smuzhiyun 		} else {
180*4882a593Smuzhiyun 			WREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL_RING1, ih_rb_cntl);
181*4882a593Smuzhiyun 		}
182*4882a593Smuzhiyun 		/* set rptr, wptr to 0 */
183*4882a593Smuzhiyun 		WREG32_SOC15(OSSSYS, 0, mmIH_RB_RPTR_RING1, 0);
184*4882a593Smuzhiyun 		WREG32_SOC15(OSSSYS, 0, mmIH_RB_WPTR_RING1, 0);
185*4882a593Smuzhiyun 		adev->irq.ih1.enabled = false;
186*4882a593Smuzhiyun 		adev->irq.ih1.rptr = 0;
187*4882a593Smuzhiyun 	}
188*4882a593Smuzhiyun 
189*4882a593Smuzhiyun 	if (adev->irq.ih2.ring_size) {
190*4882a593Smuzhiyun 		ih_rb_cntl = RREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL_RING2);
191*4882a593Smuzhiyun 		ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL_RING2,
192*4882a593Smuzhiyun 					   RB_ENABLE, 0);
193*4882a593Smuzhiyun 		if (amdgpu_sriov_vf(adev) && adev->asic_type < CHIP_NAVI10) {
194*4882a593Smuzhiyun 			if (psp_reg_program(&adev->psp, PSP_REG_IH_RB_CNTL_RING2,
195*4882a593Smuzhiyun 						ih_rb_cntl)) {
196*4882a593Smuzhiyun 				DRM_ERROR("program IH_RB_CNTL_RING2 failed!\n");
197*4882a593Smuzhiyun 				return;
198*4882a593Smuzhiyun 			}
199*4882a593Smuzhiyun 		} else {
200*4882a593Smuzhiyun 			WREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL_RING2, ih_rb_cntl);
201*4882a593Smuzhiyun 		}
202*4882a593Smuzhiyun 		/* set rptr, wptr to 0 */
203*4882a593Smuzhiyun 		WREG32_SOC15(OSSSYS, 0, mmIH_RB_RPTR_RING2, 0);
204*4882a593Smuzhiyun 		WREG32_SOC15(OSSSYS, 0, mmIH_RB_WPTR_RING2, 0);
205*4882a593Smuzhiyun 		adev->irq.ih2.enabled = false;
206*4882a593Smuzhiyun 		adev->irq.ih2.rptr = 0;
207*4882a593Smuzhiyun 	}
208*4882a593Smuzhiyun 
209*4882a593Smuzhiyun }
210*4882a593Smuzhiyun 
navi10_ih_rb_cntl(struct amdgpu_ih_ring * ih,uint32_t ih_rb_cntl)211*4882a593Smuzhiyun static uint32_t navi10_ih_rb_cntl(struct amdgpu_ih_ring *ih, uint32_t ih_rb_cntl)
212*4882a593Smuzhiyun {
213*4882a593Smuzhiyun 	int rb_bufsz = order_base_2(ih->ring_size / 4);
214*4882a593Smuzhiyun 
215*4882a593Smuzhiyun 	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL,
216*4882a593Smuzhiyun 				   MC_SPACE, ih->use_bus_addr ? 1 : 4);
217*4882a593Smuzhiyun 	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL,
218*4882a593Smuzhiyun 				   WPTR_OVERFLOW_CLEAR, 1);
219*4882a593Smuzhiyun 	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL,
220*4882a593Smuzhiyun 				   WPTR_OVERFLOW_ENABLE, 1);
221*4882a593Smuzhiyun 	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, RB_SIZE, rb_bufsz);
222*4882a593Smuzhiyun 	/* Ring Buffer write pointer writeback. If enabled, IH_RB_WPTR register
223*4882a593Smuzhiyun 	 * value is written to memory
224*4882a593Smuzhiyun 	 */
225*4882a593Smuzhiyun 	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL,
226*4882a593Smuzhiyun 				   WPTR_WRITEBACK_ENABLE, 1);
227*4882a593Smuzhiyun 	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, MC_SNOOP, 1);
228*4882a593Smuzhiyun 	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, MC_RO, 0);
229*4882a593Smuzhiyun 	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, MC_VMID, 0);
230*4882a593Smuzhiyun 
231*4882a593Smuzhiyun 	return ih_rb_cntl;
232*4882a593Smuzhiyun }
233*4882a593Smuzhiyun 
navi10_ih_doorbell_rptr(struct amdgpu_ih_ring * ih)234*4882a593Smuzhiyun static uint32_t navi10_ih_doorbell_rptr(struct amdgpu_ih_ring *ih)
235*4882a593Smuzhiyun {
236*4882a593Smuzhiyun 	u32 ih_doorbell_rtpr = 0;
237*4882a593Smuzhiyun 
238*4882a593Smuzhiyun 	if (ih->use_doorbell) {
239*4882a593Smuzhiyun 		ih_doorbell_rtpr = REG_SET_FIELD(ih_doorbell_rtpr,
240*4882a593Smuzhiyun 						 IH_DOORBELL_RPTR, OFFSET,
241*4882a593Smuzhiyun 						 ih->doorbell_index);
242*4882a593Smuzhiyun 		ih_doorbell_rtpr = REG_SET_FIELD(ih_doorbell_rtpr,
243*4882a593Smuzhiyun 						 IH_DOORBELL_RPTR,
244*4882a593Smuzhiyun 						 ENABLE, 1);
245*4882a593Smuzhiyun 	} else {
246*4882a593Smuzhiyun 		ih_doorbell_rtpr = REG_SET_FIELD(ih_doorbell_rtpr,
247*4882a593Smuzhiyun 						 IH_DOORBELL_RPTR,
248*4882a593Smuzhiyun 						 ENABLE, 0);
249*4882a593Smuzhiyun 	}
250*4882a593Smuzhiyun 	return ih_doorbell_rtpr;
251*4882a593Smuzhiyun }
252*4882a593Smuzhiyun 
navi10_ih_reroute_ih(struct amdgpu_device * adev)253*4882a593Smuzhiyun static void navi10_ih_reroute_ih(struct amdgpu_device *adev)
254*4882a593Smuzhiyun {
255*4882a593Smuzhiyun 	uint32_t tmp;
256*4882a593Smuzhiyun 
257*4882a593Smuzhiyun 	/* Reroute to IH ring 1 for VMC */
258*4882a593Smuzhiyun 	WREG32_SOC15(OSSSYS, 0, mmIH_CLIENT_CFG_INDEX, 0x12);
259*4882a593Smuzhiyun 	tmp = RREG32_SOC15(OSSSYS, 0, mmIH_CLIENT_CFG_DATA);
260*4882a593Smuzhiyun 	tmp = REG_SET_FIELD(tmp, IH_CLIENT_CFG_DATA, CLIENT_TYPE, 1);
261*4882a593Smuzhiyun 	tmp = REG_SET_FIELD(tmp, IH_CLIENT_CFG_DATA, RING_ID, 1);
262*4882a593Smuzhiyun 	WREG32_SOC15(OSSSYS, 0, mmIH_CLIENT_CFG_DATA, tmp);
263*4882a593Smuzhiyun 
264*4882a593Smuzhiyun 	/* Reroute IH ring 1 for UMC */
265*4882a593Smuzhiyun 	WREG32_SOC15(OSSSYS, 0, mmIH_CLIENT_CFG_INDEX, 0x1B);
266*4882a593Smuzhiyun 	tmp = RREG32_SOC15(OSSSYS, 0, mmIH_CLIENT_CFG_DATA);
267*4882a593Smuzhiyun 	tmp = REG_SET_FIELD(tmp, IH_CLIENT_CFG_DATA, RING_ID, 1);
268*4882a593Smuzhiyun 	WREG32_SOC15(OSSSYS, 0, mmIH_CLIENT_CFG_DATA, tmp);
269*4882a593Smuzhiyun }
270*4882a593Smuzhiyun 
271*4882a593Smuzhiyun /**
272*4882a593Smuzhiyun  * navi10_ih_irq_init - init and enable the interrupt ring
273*4882a593Smuzhiyun  *
274*4882a593Smuzhiyun  * @adev: amdgpu_device pointer
275*4882a593Smuzhiyun  *
276*4882a593Smuzhiyun  * Allocate a ring buffer for the interrupt controller,
277*4882a593Smuzhiyun  * enable the RLC, disable interrupts, enable the IH
278*4882a593Smuzhiyun  * ring buffer and enable it (NAVI).
279*4882a593Smuzhiyun  * Called at device load and reume.
280*4882a593Smuzhiyun  * Returns 0 for success, errors for failure.
281*4882a593Smuzhiyun  */
navi10_ih_irq_init(struct amdgpu_device * adev)282*4882a593Smuzhiyun static int navi10_ih_irq_init(struct amdgpu_device *adev)
283*4882a593Smuzhiyun {
284*4882a593Smuzhiyun 	struct amdgpu_ih_ring *ih = &adev->irq.ih;
285*4882a593Smuzhiyun 	u32 ih_rb_cntl, ih_chicken;
286*4882a593Smuzhiyun 	u32 tmp;
287*4882a593Smuzhiyun 
288*4882a593Smuzhiyun 	/* disable irqs */
289*4882a593Smuzhiyun 	navi10_ih_disable_interrupts(adev);
290*4882a593Smuzhiyun 
291*4882a593Smuzhiyun 	adev->nbio.funcs->ih_control(adev);
292*4882a593Smuzhiyun 
293*4882a593Smuzhiyun 	/* Ring Buffer base. [39:8] of 40-bit address of the beginning of the ring buffer*/
294*4882a593Smuzhiyun 	WREG32_SOC15(OSSSYS, 0, mmIH_RB_BASE, ih->gpu_addr >> 8);
295*4882a593Smuzhiyun 	WREG32_SOC15(OSSSYS, 0, mmIH_RB_BASE_HI, (ih->gpu_addr >> 40) & 0xff);
296*4882a593Smuzhiyun 
297*4882a593Smuzhiyun 	ih_rb_cntl = RREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL);
298*4882a593Smuzhiyun 	ih_rb_cntl = navi10_ih_rb_cntl(ih, ih_rb_cntl);
299*4882a593Smuzhiyun 	ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL, RPTR_REARM,
300*4882a593Smuzhiyun 				   !!adev->irq.msi_enabled);
301*4882a593Smuzhiyun 	if (amdgpu_sriov_vf(adev) && adev->asic_type < CHIP_NAVI10) {
302*4882a593Smuzhiyun 		if (psp_reg_program(&adev->psp, PSP_REG_IH_RB_CNTL, ih_rb_cntl)) {
303*4882a593Smuzhiyun 			DRM_ERROR("PSP program IH_RB_CNTL failed!\n");
304*4882a593Smuzhiyun 			return -ETIMEDOUT;
305*4882a593Smuzhiyun 		}
306*4882a593Smuzhiyun 	} else {
307*4882a593Smuzhiyun 		WREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL, ih_rb_cntl);
308*4882a593Smuzhiyun 	}
309*4882a593Smuzhiyun 	if (adev->irq.ih1.ring_size)
310*4882a593Smuzhiyun 		navi10_ih_reroute_ih(adev);
311*4882a593Smuzhiyun 
312*4882a593Smuzhiyun 	if (unlikely(adev->firmware.load_type == AMDGPU_FW_LOAD_DIRECT)) {
313*4882a593Smuzhiyun 		if (ih->use_bus_addr) {
314*4882a593Smuzhiyun 			switch (adev->asic_type) {
315*4882a593Smuzhiyun 			case CHIP_SIENNA_CICHLID:
316*4882a593Smuzhiyun 			case CHIP_NAVY_FLOUNDER:
317*4882a593Smuzhiyun 				ih_chicken = RREG32_SOC15(OSSSYS, 0, mmIH_CHICKEN_Sienna_Cichlid);
318*4882a593Smuzhiyun 				ih_chicken = REG_SET_FIELD(ih_chicken,
319*4882a593Smuzhiyun 						IH_CHICKEN, MC_SPACE_GPA_ENABLE, 1);
320*4882a593Smuzhiyun 				WREG32_SOC15(OSSSYS, 0, mmIH_CHICKEN_Sienna_Cichlid, ih_chicken);
321*4882a593Smuzhiyun 				break;
322*4882a593Smuzhiyun 			default:
323*4882a593Smuzhiyun 				ih_chicken = RREG32_SOC15(OSSSYS, 0, mmIH_CHICKEN);
324*4882a593Smuzhiyun 				ih_chicken = REG_SET_FIELD(ih_chicken,
325*4882a593Smuzhiyun 						IH_CHICKEN, MC_SPACE_GPA_ENABLE, 1);
326*4882a593Smuzhiyun 				WREG32_SOC15(OSSSYS, 0, mmIH_CHICKEN, ih_chicken);
327*4882a593Smuzhiyun 				break;
328*4882a593Smuzhiyun 			}
329*4882a593Smuzhiyun 		}
330*4882a593Smuzhiyun 	}
331*4882a593Smuzhiyun 
332*4882a593Smuzhiyun 	/* set the writeback address whether it's enabled or not */
333*4882a593Smuzhiyun 	WREG32_SOC15(OSSSYS, 0, mmIH_RB_WPTR_ADDR_LO,
334*4882a593Smuzhiyun 		     lower_32_bits(ih->wptr_addr));
335*4882a593Smuzhiyun 	WREG32_SOC15(OSSSYS, 0, mmIH_RB_WPTR_ADDR_HI,
336*4882a593Smuzhiyun 		     upper_32_bits(ih->wptr_addr) & 0xFFFF);
337*4882a593Smuzhiyun 
338*4882a593Smuzhiyun 	/* set rptr, wptr to 0 */
339*4882a593Smuzhiyun 	WREG32_SOC15(OSSSYS, 0, mmIH_RB_RPTR, 0);
340*4882a593Smuzhiyun 	WREG32_SOC15(OSSSYS, 0, mmIH_RB_WPTR, 0);
341*4882a593Smuzhiyun 
342*4882a593Smuzhiyun 	WREG32_SOC15(OSSSYS, 0, mmIH_DOORBELL_RPTR,
343*4882a593Smuzhiyun 			navi10_ih_doorbell_rptr(ih));
344*4882a593Smuzhiyun 
345*4882a593Smuzhiyun 	adev->nbio.funcs->ih_doorbell_range(adev, ih->use_doorbell,
346*4882a593Smuzhiyun 					    ih->doorbell_index);
347*4882a593Smuzhiyun 
348*4882a593Smuzhiyun 	ih = &adev->irq.ih1;
349*4882a593Smuzhiyun 	if (ih->ring_size) {
350*4882a593Smuzhiyun 		WREG32_SOC15(OSSSYS, 0, mmIH_RB_BASE_RING1, ih->gpu_addr >> 8);
351*4882a593Smuzhiyun 		WREG32_SOC15(OSSSYS, 0, mmIH_RB_BASE_HI_RING1,
352*4882a593Smuzhiyun 			     (ih->gpu_addr >> 40) & 0xff);
353*4882a593Smuzhiyun 
354*4882a593Smuzhiyun 		ih_rb_cntl = RREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL_RING1);
355*4882a593Smuzhiyun 		ih_rb_cntl = navi10_ih_rb_cntl(ih, ih_rb_cntl);
356*4882a593Smuzhiyun 		ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL,
357*4882a593Smuzhiyun 					   WPTR_OVERFLOW_ENABLE, 0);
358*4882a593Smuzhiyun 		ih_rb_cntl = REG_SET_FIELD(ih_rb_cntl, IH_RB_CNTL,
359*4882a593Smuzhiyun 					   RB_FULL_DRAIN_ENABLE, 1);
360*4882a593Smuzhiyun 		if (amdgpu_sriov_vf(adev) && adev->asic_type < CHIP_NAVI10) {
361*4882a593Smuzhiyun 			if (psp_reg_program(&adev->psp, PSP_REG_IH_RB_CNTL_RING1,
362*4882a593Smuzhiyun 						ih_rb_cntl)) {
363*4882a593Smuzhiyun 				DRM_ERROR("program IH_RB_CNTL_RING1 failed!\n");
364*4882a593Smuzhiyun 				return -ETIMEDOUT;
365*4882a593Smuzhiyun 			}
366*4882a593Smuzhiyun 		} else {
367*4882a593Smuzhiyun 			WREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL_RING1, ih_rb_cntl);
368*4882a593Smuzhiyun 		}
369*4882a593Smuzhiyun 		/* set rptr, wptr to 0 */
370*4882a593Smuzhiyun 		WREG32_SOC15(OSSSYS, 0, mmIH_RB_WPTR_RING1, 0);
371*4882a593Smuzhiyun 		WREG32_SOC15(OSSSYS, 0, mmIH_RB_RPTR_RING1, 0);
372*4882a593Smuzhiyun 
373*4882a593Smuzhiyun 		WREG32_SOC15(OSSSYS, 0, mmIH_DOORBELL_RPTR_RING1,
374*4882a593Smuzhiyun 				navi10_ih_doorbell_rptr(ih));
375*4882a593Smuzhiyun 	}
376*4882a593Smuzhiyun 
377*4882a593Smuzhiyun 	ih = &adev->irq.ih2;
378*4882a593Smuzhiyun 	if (ih->ring_size) {
379*4882a593Smuzhiyun 		WREG32_SOC15(OSSSYS, 0, mmIH_RB_BASE_RING2, ih->gpu_addr >> 8);
380*4882a593Smuzhiyun 		WREG32_SOC15(OSSSYS, 0, mmIH_RB_BASE_HI_RING2,
381*4882a593Smuzhiyun 			     (ih->gpu_addr >> 40) & 0xff);
382*4882a593Smuzhiyun 
383*4882a593Smuzhiyun 		ih_rb_cntl = RREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL_RING2);
384*4882a593Smuzhiyun 		ih_rb_cntl = navi10_ih_rb_cntl(ih, ih_rb_cntl);
385*4882a593Smuzhiyun 
386*4882a593Smuzhiyun 		if (amdgpu_sriov_vf(adev) && adev->asic_type < CHIP_NAVI10) {
387*4882a593Smuzhiyun 			if (psp_reg_program(&adev->psp, PSP_REG_IH_RB_CNTL_RING2,
388*4882a593Smuzhiyun 						ih_rb_cntl)) {
389*4882a593Smuzhiyun 				DRM_ERROR("program IH_RB_CNTL_RING2 failed!\n");
390*4882a593Smuzhiyun 				return -ETIMEDOUT;
391*4882a593Smuzhiyun 			}
392*4882a593Smuzhiyun 		} else {
393*4882a593Smuzhiyun 			WREG32_SOC15(OSSSYS, 0, mmIH_RB_CNTL_RING2, ih_rb_cntl);
394*4882a593Smuzhiyun 		}
395*4882a593Smuzhiyun 		/* set rptr, wptr to 0 */
396*4882a593Smuzhiyun 		WREG32_SOC15(OSSSYS, 0, mmIH_RB_WPTR_RING2, 0);
397*4882a593Smuzhiyun 		WREG32_SOC15(OSSSYS, 0, mmIH_RB_RPTR_RING2, 0);
398*4882a593Smuzhiyun 
399*4882a593Smuzhiyun 		WREG32_SOC15(OSSSYS, 0, mmIH_DOORBELL_RPTR_RING2,
400*4882a593Smuzhiyun 			     navi10_ih_doorbell_rptr(ih));
401*4882a593Smuzhiyun 	}
402*4882a593Smuzhiyun 
403*4882a593Smuzhiyun 
404*4882a593Smuzhiyun 	tmp = RREG32_SOC15(OSSSYS, 0, mmIH_STORM_CLIENT_LIST_CNTL);
405*4882a593Smuzhiyun 	tmp = REG_SET_FIELD(tmp, IH_STORM_CLIENT_LIST_CNTL,
406*4882a593Smuzhiyun 			    CLIENT18_IS_STORM_CLIENT, 1);
407*4882a593Smuzhiyun 	WREG32_SOC15(OSSSYS, 0, mmIH_STORM_CLIENT_LIST_CNTL, tmp);
408*4882a593Smuzhiyun 
409*4882a593Smuzhiyun 	tmp = RREG32_SOC15(OSSSYS, 0, mmIH_INT_FLOOD_CNTL);
410*4882a593Smuzhiyun 	tmp = REG_SET_FIELD(tmp, IH_INT_FLOOD_CNTL, FLOOD_CNTL_ENABLE, 1);
411*4882a593Smuzhiyun 	WREG32_SOC15(OSSSYS, 0, mmIH_INT_FLOOD_CNTL, tmp);
412*4882a593Smuzhiyun 
413*4882a593Smuzhiyun 	pci_set_master(adev->pdev);
414*4882a593Smuzhiyun 
415*4882a593Smuzhiyun 	/* enable interrupts */
416*4882a593Smuzhiyun 	navi10_ih_enable_interrupts(adev);
417*4882a593Smuzhiyun 	/* enable wptr force update for self int */
418*4882a593Smuzhiyun 	force_update_wptr_for_self_int(adev, 0, 8, true);
419*4882a593Smuzhiyun 
420*4882a593Smuzhiyun 	return 0;
421*4882a593Smuzhiyun }
422*4882a593Smuzhiyun 
423*4882a593Smuzhiyun /**
424*4882a593Smuzhiyun  * navi10_ih_irq_disable - disable interrupts
425*4882a593Smuzhiyun  *
426*4882a593Smuzhiyun  * @adev: amdgpu_device pointer
427*4882a593Smuzhiyun  *
428*4882a593Smuzhiyun  * Disable interrupts on the hw (NAVI10).
429*4882a593Smuzhiyun  */
navi10_ih_irq_disable(struct amdgpu_device * adev)430*4882a593Smuzhiyun static void navi10_ih_irq_disable(struct amdgpu_device *adev)
431*4882a593Smuzhiyun {
432*4882a593Smuzhiyun 	force_update_wptr_for_self_int(adev, 0, 8, false);
433*4882a593Smuzhiyun 	navi10_ih_disable_interrupts(adev);
434*4882a593Smuzhiyun 
435*4882a593Smuzhiyun 	/* Wait and acknowledge irq */
436*4882a593Smuzhiyun 	mdelay(1);
437*4882a593Smuzhiyun }
438*4882a593Smuzhiyun 
439*4882a593Smuzhiyun /**
440*4882a593Smuzhiyun  * navi10_ih_get_wptr - get the IH ring buffer wptr
441*4882a593Smuzhiyun  *
442*4882a593Smuzhiyun  * @adev: amdgpu_device pointer
443*4882a593Smuzhiyun  *
444*4882a593Smuzhiyun  * Get the IH ring buffer wptr from either the register
445*4882a593Smuzhiyun  * or the writeback memory buffer (NAVI10).  Also check for
446*4882a593Smuzhiyun  * ring buffer overflow and deal with it.
447*4882a593Smuzhiyun  * Returns the value of the wptr.
448*4882a593Smuzhiyun  */
navi10_ih_get_wptr(struct amdgpu_device * adev,struct amdgpu_ih_ring * ih)449*4882a593Smuzhiyun static u32 navi10_ih_get_wptr(struct amdgpu_device *adev,
450*4882a593Smuzhiyun 			      struct amdgpu_ih_ring *ih)
451*4882a593Smuzhiyun {
452*4882a593Smuzhiyun 	u32 wptr, reg, tmp;
453*4882a593Smuzhiyun 
454*4882a593Smuzhiyun 	wptr = le32_to_cpu(*ih->wptr_cpu);
455*4882a593Smuzhiyun 
456*4882a593Smuzhiyun 	if (!REG_GET_FIELD(wptr, IH_RB_WPTR, RB_OVERFLOW))
457*4882a593Smuzhiyun 		goto out;
458*4882a593Smuzhiyun 
459*4882a593Smuzhiyun 	if (ih == &adev->irq.ih)
460*4882a593Smuzhiyun 		reg = SOC15_REG_OFFSET(OSSSYS, 0, mmIH_RB_WPTR);
461*4882a593Smuzhiyun 	else if (ih == &adev->irq.ih1)
462*4882a593Smuzhiyun 		reg = SOC15_REG_OFFSET(OSSSYS, 0, mmIH_RB_WPTR_RING1);
463*4882a593Smuzhiyun 	else if (ih == &adev->irq.ih2)
464*4882a593Smuzhiyun 		reg = SOC15_REG_OFFSET(OSSSYS, 0, mmIH_RB_WPTR_RING2);
465*4882a593Smuzhiyun 	else
466*4882a593Smuzhiyun 		BUG();
467*4882a593Smuzhiyun 
468*4882a593Smuzhiyun 	wptr = RREG32_NO_KIQ(reg);
469*4882a593Smuzhiyun 	if (!REG_GET_FIELD(wptr, IH_RB_WPTR, RB_OVERFLOW))
470*4882a593Smuzhiyun 		goto out;
471*4882a593Smuzhiyun 	wptr = REG_SET_FIELD(wptr, IH_RB_WPTR, RB_OVERFLOW, 0);
472*4882a593Smuzhiyun 
473*4882a593Smuzhiyun 	/* When a ring buffer overflow happen start parsing interrupt
474*4882a593Smuzhiyun 	 * from the last not overwritten vector (wptr + 32). Hopefully
475*4882a593Smuzhiyun 	 * this should allow us to catch up.
476*4882a593Smuzhiyun 	 */
477*4882a593Smuzhiyun 	tmp = (wptr + 32) & ih->ptr_mask;
478*4882a593Smuzhiyun 	dev_warn(adev->dev, "IH ring buffer overflow "
479*4882a593Smuzhiyun 		 "(0x%08X, 0x%08X, 0x%08X)\n",
480*4882a593Smuzhiyun 		 wptr, ih->rptr, tmp);
481*4882a593Smuzhiyun 	ih->rptr = tmp;
482*4882a593Smuzhiyun 
483*4882a593Smuzhiyun 	if (ih == &adev->irq.ih)
484*4882a593Smuzhiyun 		reg = SOC15_REG_OFFSET(OSSSYS, 0, mmIH_RB_CNTL);
485*4882a593Smuzhiyun 	else if (ih == &adev->irq.ih1)
486*4882a593Smuzhiyun 		reg = SOC15_REG_OFFSET(OSSSYS, 0, mmIH_RB_CNTL_RING1);
487*4882a593Smuzhiyun 	else if (ih == &adev->irq.ih2)
488*4882a593Smuzhiyun 		reg = SOC15_REG_OFFSET(OSSSYS, 0, mmIH_RB_CNTL_RING2);
489*4882a593Smuzhiyun 	else
490*4882a593Smuzhiyun 		BUG();
491*4882a593Smuzhiyun 
492*4882a593Smuzhiyun 	tmp = RREG32_NO_KIQ(reg);
493*4882a593Smuzhiyun 	tmp = REG_SET_FIELD(tmp, IH_RB_CNTL, WPTR_OVERFLOW_CLEAR, 1);
494*4882a593Smuzhiyun 	WREG32_NO_KIQ(reg, tmp);
495*4882a593Smuzhiyun out:
496*4882a593Smuzhiyun 	return (wptr & ih->ptr_mask);
497*4882a593Smuzhiyun }
498*4882a593Smuzhiyun 
499*4882a593Smuzhiyun /**
500*4882a593Smuzhiyun  * navi10_ih_decode_iv - decode an interrupt vector
501*4882a593Smuzhiyun  *
502*4882a593Smuzhiyun  * @adev: amdgpu_device pointer
503*4882a593Smuzhiyun  *
504*4882a593Smuzhiyun  * Decodes the interrupt vector at the current rptr
505*4882a593Smuzhiyun  * position and also advance the position.
506*4882a593Smuzhiyun  */
navi10_ih_decode_iv(struct amdgpu_device * adev,struct amdgpu_ih_ring * ih,struct amdgpu_iv_entry * entry)507*4882a593Smuzhiyun static void navi10_ih_decode_iv(struct amdgpu_device *adev,
508*4882a593Smuzhiyun 				struct amdgpu_ih_ring *ih,
509*4882a593Smuzhiyun 				struct amdgpu_iv_entry *entry)
510*4882a593Smuzhiyun {
511*4882a593Smuzhiyun 	/* wptr/rptr are in bytes! */
512*4882a593Smuzhiyun 	u32 ring_index = ih->rptr >> 2;
513*4882a593Smuzhiyun 	uint32_t dw[8];
514*4882a593Smuzhiyun 
515*4882a593Smuzhiyun 	dw[0] = le32_to_cpu(ih->ring[ring_index + 0]);
516*4882a593Smuzhiyun 	dw[1] = le32_to_cpu(ih->ring[ring_index + 1]);
517*4882a593Smuzhiyun 	dw[2] = le32_to_cpu(ih->ring[ring_index + 2]);
518*4882a593Smuzhiyun 	dw[3] = le32_to_cpu(ih->ring[ring_index + 3]);
519*4882a593Smuzhiyun 	dw[4] = le32_to_cpu(ih->ring[ring_index + 4]);
520*4882a593Smuzhiyun 	dw[5] = le32_to_cpu(ih->ring[ring_index + 5]);
521*4882a593Smuzhiyun 	dw[6] = le32_to_cpu(ih->ring[ring_index + 6]);
522*4882a593Smuzhiyun 	dw[7] = le32_to_cpu(ih->ring[ring_index + 7]);
523*4882a593Smuzhiyun 
524*4882a593Smuzhiyun 	entry->client_id = dw[0] & 0xff;
525*4882a593Smuzhiyun 	entry->src_id = (dw[0] >> 8) & 0xff;
526*4882a593Smuzhiyun 	entry->ring_id = (dw[0] >> 16) & 0xff;
527*4882a593Smuzhiyun 	entry->vmid = (dw[0] >> 24) & 0xf;
528*4882a593Smuzhiyun 	entry->vmid_src = (dw[0] >> 31);
529*4882a593Smuzhiyun 	entry->timestamp = dw[1] | ((u64)(dw[2] & 0xffff) << 32);
530*4882a593Smuzhiyun 	entry->timestamp_src = dw[2] >> 31;
531*4882a593Smuzhiyun 	entry->pasid = dw[3] & 0xffff;
532*4882a593Smuzhiyun 	entry->pasid_src = dw[3] >> 31;
533*4882a593Smuzhiyun 	entry->src_data[0] = dw[4];
534*4882a593Smuzhiyun 	entry->src_data[1] = dw[5];
535*4882a593Smuzhiyun 	entry->src_data[2] = dw[6];
536*4882a593Smuzhiyun 	entry->src_data[3] = dw[7];
537*4882a593Smuzhiyun 
538*4882a593Smuzhiyun 	/* wptr/rptr are in bytes! */
539*4882a593Smuzhiyun 	ih->rptr += 32;
540*4882a593Smuzhiyun }
541*4882a593Smuzhiyun 
542*4882a593Smuzhiyun /**
543*4882a593Smuzhiyun  * navi10_ih_irq_rearm - rearm IRQ if lost
544*4882a593Smuzhiyun  *
545*4882a593Smuzhiyun  * @adev: amdgpu_device pointer
546*4882a593Smuzhiyun  *
547*4882a593Smuzhiyun  */
navi10_ih_irq_rearm(struct amdgpu_device * adev,struct amdgpu_ih_ring * ih)548*4882a593Smuzhiyun static void navi10_ih_irq_rearm(struct amdgpu_device *adev,
549*4882a593Smuzhiyun 			       struct amdgpu_ih_ring *ih)
550*4882a593Smuzhiyun {
551*4882a593Smuzhiyun 	uint32_t reg_rptr = 0;
552*4882a593Smuzhiyun 	uint32_t v = 0;
553*4882a593Smuzhiyun 	uint32_t i = 0;
554*4882a593Smuzhiyun 
555*4882a593Smuzhiyun 	if (ih == &adev->irq.ih)
556*4882a593Smuzhiyun 		reg_rptr = SOC15_REG_OFFSET(OSSSYS, 0, mmIH_RB_RPTR);
557*4882a593Smuzhiyun 	else if (ih == &adev->irq.ih1)
558*4882a593Smuzhiyun 		reg_rptr = SOC15_REG_OFFSET(OSSSYS, 0, mmIH_RB_RPTR_RING1);
559*4882a593Smuzhiyun 	else if (ih == &adev->irq.ih2)
560*4882a593Smuzhiyun 		reg_rptr = SOC15_REG_OFFSET(OSSSYS, 0, mmIH_RB_RPTR_RING2);
561*4882a593Smuzhiyun 	else
562*4882a593Smuzhiyun 		return;
563*4882a593Smuzhiyun 
564*4882a593Smuzhiyun 	/* Rearm IRQ / re-write doorbell if doorbell write is lost */
565*4882a593Smuzhiyun 	for (i = 0; i < MAX_REARM_RETRY; i++) {
566*4882a593Smuzhiyun 		v = RREG32_NO_KIQ(reg_rptr);
567*4882a593Smuzhiyun 		if ((v < ih->ring_size) && (v != ih->rptr))
568*4882a593Smuzhiyun 			WDOORBELL32(ih->doorbell_index, ih->rptr);
569*4882a593Smuzhiyun 		else
570*4882a593Smuzhiyun 			break;
571*4882a593Smuzhiyun 	}
572*4882a593Smuzhiyun }
573*4882a593Smuzhiyun 
574*4882a593Smuzhiyun /**
575*4882a593Smuzhiyun  * navi10_ih_set_rptr - set the IH ring buffer rptr
576*4882a593Smuzhiyun  *
577*4882a593Smuzhiyun  * @adev: amdgpu_device pointer
578*4882a593Smuzhiyun  *
579*4882a593Smuzhiyun  * Set the IH ring buffer rptr.
580*4882a593Smuzhiyun  */
navi10_ih_set_rptr(struct amdgpu_device * adev,struct amdgpu_ih_ring * ih)581*4882a593Smuzhiyun static void navi10_ih_set_rptr(struct amdgpu_device *adev,
582*4882a593Smuzhiyun 			       struct amdgpu_ih_ring *ih)
583*4882a593Smuzhiyun {
584*4882a593Smuzhiyun 	if (ih->use_doorbell) {
585*4882a593Smuzhiyun 		/* XXX check if swapping is necessary on BE */
586*4882a593Smuzhiyun 		*ih->rptr_cpu = ih->rptr;
587*4882a593Smuzhiyun 		WDOORBELL32(ih->doorbell_index, ih->rptr);
588*4882a593Smuzhiyun 
589*4882a593Smuzhiyun 		if (amdgpu_sriov_vf(adev))
590*4882a593Smuzhiyun 			navi10_ih_irq_rearm(adev, ih);
591*4882a593Smuzhiyun 	} else if (ih == &adev->irq.ih) {
592*4882a593Smuzhiyun 		WREG32_SOC15(OSSSYS, 0, mmIH_RB_RPTR, ih->rptr);
593*4882a593Smuzhiyun 	} else if (ih == &adev->irq.ih1) {
594*4882a593Smuzhiyun 		WREG32_SOC15(OSSSYS, 0, mmIH_RB_RPTR_RING1, ih->rptr);
595*4882a593Smuzhiyun 	} else if (ih == &adev->irq.ih2) {
596*4882a593Smuzhiyun 		WREG32_SOC15(OSSSYS, 0, mmIH_RB_RPTR_RING2, ih->rptr);
597*4882a593Smuzhiyun 	}
598*4882a593Smuzhiyun }
599*4882a593Smuzhiyun 
600*4882a593Smuzhiyun /**
601*4882a593Smuzhiyun  * navi10_ih_self_irq - dispatch work for ring 1 and 2
602*4882a593Smuzhiyun  *
603*4882a593Smuzhiyun  * @adev: amdgpu_device pointer
604*4882a593Smuzhiyun  * @source: irq source
605*4882a593Smuzhiyun  * @entry: IV with WPTR update
606*4882a593Smuzhiyun  *
607*4882a593Smuzhiyun  * Update the WPTR from the IV and schedule work to handle the entries.
608*4882a593Smuzhiyun  */
navi10_ih_self_irq(struct amdgpu_device * adev,struct amdgpu_irq_src * source,struct amdgpu_iv_entry * entry)609*4882a593Smuzhiyun static int navi10_ih_self_irq(struct amdgpu_device *adev,
610*4882a593Smuzhiyun 			      struct amdgpu_irq_src *source,
611*4882a593Smuzhiyun 			      struct amdgpu_iv_entry *entry)
612*4882a593Smuzhiyun {
613*4882a593Smuzhiyun 	uint32_t wptr = cpu_to_le32(entry->src_data[0]);
614*4882a593Smuzhiyun 
615*4882a593Smuzhiyun 	switch (entry->ring_id) {
616*4882a593Smuzhiyun 	case 1:
617*4882a593Smuzhiyun 		*adev->irq.ih1.wptr_cpu = wptr;
618*4882a593Smuzhiyun 		schedule_work(&adev->irq.ih1_work);
619*4882a593Smuzhiyun 		break;
620*4882a593Smuzhiyun 	case 2:
621*4882a593Smuzhiyun 		*adev->irq.ih2.wptr_cpu = wptr;
622*4882a593Smuzhiyun 		schedule_work(&adev->irq.ih2_work);
623*4882a593Smuzhiyun 		break;
624*4882a593Smuzhiyun 	default: break;
625*4882a593Smuzhiyun 	}
626*4882a593Smuzhiyun 	return 0;
627*4882a593Smuzhiyun }
628*4882a593Smuzhiyun 
629*4882a593Smuzhiyun static const struct amdgpu_irq_src_funcs navi10_ih_self_irq_funcs = {
630*4882a593Smuzhiyun 	.process = navi10_ih_self_irq,
631*4882a593Smuzhiyun };
632*4882a593Smuzhiyun 
navi10_ih_set_self_irq_funcs(struct amdgpu_device * adev)633*4882a593Smuzhiyun static void navi10_ih_set_self_irq_funcs(struct amdgpu_device *adev)
634*4882a593Smuzhiyun {
635*4882a593Smuzhiyun 	adev->irq.self_irq.num_types = 0;
636*4882a593Smuzhiyun 	adev->irq.self_irq.funcs = &navi10_ih_self_irq_funcs;
637*4882a593Smuzhiyun }
638*4882a593Smuzhiyun 
navi10_ih_early_init(void * handle)639*4882a593Smuzhiyun static int navi10_ih_early_init(void *handle)
640*4882a593Smuzhiyun {
641*4882a593Smuzhiyun 	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
642*4882a593Smuzhiyun 
643*4882a593Smuzhiyun 	navi10_ih_set_interrupt_funcs(adev);
644*4882a593Smuzhiyun 	navi10_ih_set_self_irq_funcs(adev);
645*4882a593Smuzhiyun 	return 0;
646*4882a593Smuzhiyun }
647*4882a593Smuzhiyun 
navi10_ih_sw_init(void * handle)648*4882a593Smuzhiyun static int navi10_ih_sw_init(void *handle)
649*4882a593Smuzhiyun {
650*4882a593Smuzhiyun 	int r;
651*4882a593Smuzhiyun 	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
652*4882a593Smuzhiyun 	bool use_bus_addr;
653*4882a593Smuzhiyun 
654*4882a593Smuzhiyun 	r = amdgpu_irq_add_id(adev, SOC15_IH_CLIENTID_IH, 0,
655*4882a593Smuzhiyun 				&adev->irq.self_irq);
656*4882a593Smuzhiyun 
657*4882a593Smuzhiyun 	if (r)
658*4882a593Smuzhiyun 		return r;
659*4882a593Smuzhiyun 
660*4882a593Smuzhiyun 	/* use gpu virtual address for ih ring
661*4882a593Smuzhiyun 	 * until ih_checken is programmed to allow
662*4882a593Smuzhiyun 	 * use bus address for ih ring by psp bl */
663*4882a593Smuzhiyun 	use_bus_addr =
664*4882a593Smuzhiyun 		(adev->firmware.load_type == AMDGPU_FW_LOAD_PSP) ? false : true;
665*4882a593Smuzhiyun 	r = amdgpu_ih_ring_init(adev, &adev->irq.ih, 256 * 1024, use_bus_addr);
666*4882a593Smuzhiyun 	if (r)
667*4882a593Smuzhiyun 		return r;
668*4882a593Smuzhiyun 
669*4882a593Smuzhiyun 	adev->irq.ih.use_doorbell = true;
670*4882a593Smuzhiyun 	adev->irq.ih.doorbell_index = adev->doorbell_index.ih << 1;
671*4882a593Smuzhiyun 
672*4882a593Smuzhiyun 	adev->irq.ih1.ring_size = 0;
673*4882a593Smuzhiyun 	adev->irq.ih2.ring_size = 0;
674*4882a593Smuzhiyun 
675*4882a593Smuzhiyun 	if (adev->asic_type < CHIP_NAVI10) {
676*4882a593Smuzhiyun 		r = amdgpu_ih_ring_init(adev, &adev->irq.ih1, PAGE_SIZE, true);
677*4882a593Smuzhiyun 		if (r)
678*4882a593Smuzhiyun 			return r;
679*4882a593Smuzhiyun 
680*4882a593Smuzhiyun 		adev->irq.ih1.use_doorbell = true;
681*4882a593Smuzhiyun 		adev->irq.ih1.doorbell_index =
682*4882a593Smuzhiyun 					(adev->doorbell_index.ih + 1) << 1;
683*4882a593Smuzhiyun 
684*4882a593Smuzhiyun 		r = amdgpu_ih_ring_init(adev, &adev->irq.ih2, PAGE_SIZE, true);
685*4882a593Smuzhiyun 		if (r)
686*4882a593Smuzhiyun 			return r;
687*4882a593Smuzhiyun 
688*4882a593Smuzhiyun 		adev->irq.ih2.use_doorbell = true;
689*4882a593Smuzhiyun 		adev->irq.ih2.doorbell_index =
690*4882a593Smuzhiyun 					(adev->doorbell_index.ih + 2) << 1;
691*4882a593Smuzhiyun 	}
692*4882a593Smuzhiyun 
693*4882a593Smuzhiyun 	r = amdgpu_irq_init(adev);
694*4882a593Smuzhiyun 
695*4882a593Smuzhiyun 	return r;
696*4882a593Smuzhiyun }
697*4882a593Smuzhiyun 
navi10_ih_sw_fini(void * handle)698*4882a593Smuzhiyun static int navi10_ih_sw_fini(void *handle)
699*4882a593Smuzhiyun {
700*4882a593Smuzhiyun 	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
701*4882a593Smuzhiyun 
702*4882a593Smuzhiyun 	amdgpu_irq_fini(adev);
703*4882a593Smuzhiyun 	amdgpu_ih_ring_fini(adev, &adev->irq.ih2);
704*4882a593Smuzhiyun 	amdgpu_ih_ring_fini(adev, &adev->irq.ih1);
705*4882a593Smuzhiyun 	amdgpu_ih_ring_fini(adev, &adev->irq.ih);
706*4882a593Smuzhiyun 
707*4882a593Smuzhiyun 	return 0;
708*4882a593Smuzhiyun }
709*4882a593Smuzhiyun 
navi10_ih_hw_init(void * handle)710*4882a593Smuzhiyun static int navi10_ih_hw_init(void *handle)
711*4882a593Smuzhiyun {
712*4882a593Smuzhiyun 	int r;
713*4882a593Smuzhiyun 	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
714*4882a593Smuzhiyun 
715*4882a593Smuzhiyun 	r = navi10_ih_irq_init(adev);
716*4882a593Smuzhiyun 	if (r)
717*4882a593Smuzhiyun 		return r;
718*4882a593Smuzhiyun 
719*4882a593Smuzhiyun 	return 0;
720*4882a593Smuzhiyun }
721*4882a593Smuzhiyun 
navi10_ih_hw_fini(void * handle)722*4882a593Smuzhiyun static int navi10_ih_hw_fini(void *handle)
723*4882a593Smuzhiyun {
724*4882a593Smuzhiyun 	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
725*4882a593Smuzhiyun 
726*4882a593Smuzhiyun 	navi10_ih_irq_disable(adev);
727*4882a593Smuzhiyun 
728*4882a593Smuzhiyun 	return 0;
729*4882a593Smuzhiyun }
730*4882a593Smuzhiyun 
navi10_ih_suspend(void * handle)731*4882a593Smuzhiyun static int navi10_ih_suspend(void *handle)
732*4882a593Smuzhiyun {
733*4882a593Smuzhiyun 	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
734*4882a593Smuzhiyun 
735*4882a593Smuzhiyun 	return navi10_ih_hw_fini(adev);
736*4882a593Smuzhiyun }
737*4882a593Smuzhiyun 
navi10_ih_resume(void * handle)738*4882a593Smuzhiyun static int navi10_ih_resume(void *handle)
739*4882a593Smuzhiyun {
740*4882a593Smuzhiyun 	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
741*4882a593Smuzhiyun 
742*4882a593Smuzhiyun 	return navi10_ih_hw_init(adev);
743*4882a593Smuzhiyun }
744*4882a593Smuzhiyun 
navi10_ih_is_idle(void * handle)745*4882a593Smuzhiyun static bool navi10_ih_is_idle(void *handle)
746*4882a593Smuzhiyun {
747*4882a593Smuzhiyun 	/* todo */
748*4882a593Smuzhiyun 	return true;
749*4882a593Smuzhiyun }
750*4882a593Smuzhiyun 
navi10_ih_wait_for_idle(void * handle)751*4882a593Smuzhiyun static int navi10_ih_wait_for_idle(void *handle)
752*4882a593Smuzhiyun {
753*4882a593Smuzhiyun 	/* todo */
754*4882a593Smuzhiyun 	return -ETIMEDOUT;
755*4882a593Smuzhiyun }
756*4882a593Smuzhiyun 
navi10_ih_soft_reset(void * handle)757*4882a593Smuzhiyun static int navi10_ih_soft_reset(void *handle)
758*4882a593Smuzhiyun {
759*4882a593Smuzhiyun 	/* todo */
760*4882a593Smuzhiyun 	return 0;
761*4882a593Smuzhiyun }
762*4882a593Smuzhiyun 
navi10_ih_update_clockgating_state(struct amdgpu_device * adev,bool enable)763*4882a593Smuzhiyun static void navi10_ih_update_clockgating_state(struct amdgpu_device *adev,
764*4882a593Smuzhiyun 					       bool enable)
765*4882a593Smuzhiyun {
766*4882a593Smuzhiyun 	uint32_t data, def, field_val;
767*4882a593Smuzhiyun 
768*4882a593Smuzhiyun 	if (adev->cg_flags & AMD_CG_SUPPORT_IH_CG) {
769*4882a593Smuzhiyun 		def = data = RREG32_SOC15(OSSSYS, 0, mmIH_CLK_CTRL);
770*4882a593Smuzhiyun 		field_val = enable ? 0 : 1;
771*4882a593Smuzhiyun 		data = REG_SET_FIELD(data, IH_CLK_CTRL,
772*4882a593Smuzhiyun 				     DBUS_MUX_CLK_SOFT_OVERRIDE, field_val);
773*4882a593Smuzhiyun 		data = REG_SET_FIELD(data, IH_CLK_CTRL,
774*4882a593Smuzhiyun 				     OSSSYS_SHARE_CLK_SOFT_OVERRIDE, field_val);
775*4882a593Smuzhiyun 		data = REG_SET_FIELD(data, IH_CLK_CTRL,
776*4882a593Smuzhiyun 				     LIMIT_SMN_CLK_SOFT_OVERRIDE, field_val);
777*4882a593Smuzhiyun 		data = REG_SET_FIELD(data, IH_CLK_CTRL,
778*4882a593Smuzhiyun 				     DYN_CLK_SOFT_OVERRIDE, field_val);
779*4882a593Smuzhiyun 		data = REG_SET_FIELD(data, IH_CLK_CTRL,
780*4882a593Smuzhiyun 				     REG_CLK_SOFT_OVERRIDE, field_val);
781*4882a593Smuzhiyun 		if (def != data)
782*4882a593Smuzhiyun 			WREG32_SOC15(OSSSYS, 0, mmIH_CLK_CTRL, data);
783*4882a593Smuzhiyun 	}
784*4882a593Smuzhiyun 
785*4882a593Smuzhiyun 	return;
786*4882a593Smuzhiyun }
787*4882a593Smuzhiyun 
navi10_ih_set_clockgating_state(void * handle,enum amd_clockgating_state state)788*4882a593Smuzhiyun static int navi10_ih_set_clockgating_state(void *handle,
789*4882a593Smuzhiyun 					   enum amd_clockgating_state state)
790*4882a593Smuzhiyun {
791*4882a593Smuzhiyun 	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
792*4882a593Smuzhiyun 
793*4882a593Smuzhiyun 	navi10_ih_update_clockgating_state(adev,
794*4882a593Smuzhiyun 				state == AMD_CG_STATE_GATE);
795*4882a593Smuzhiyun 	return 0;
796*4882a593Smuzhiyun }
797*4882a593Smuzhiyun 
navi10_ih_set_powergating_state(void * handle,enum amd_powergating_state state)798*4882a593Smuzhiyun static int navi10_ih_set_powergating_state(void *handle,
799*4882a593Smuzhiyun 					   enum amd_powergating_state state)
800*4882a593Smuzhiyun {
801*4882a593Smuzhiyun 	return 0;
802*4882a593Smuzhiyun }
803*4882a593Smuzhiyun 
navi10_ih_get_clockgating_state(void * handle,u32 * flags)804*4882a593Smuzhiyun static void navi10_ih_get_clockgating_state(void *handle, u32 *flags)
805*4882a593Smuzhiyun {
806*4882a593Smuzhiyun 	struct amdgpu_device *adev = (struct amdgpu_device *)handle;
807*4882a593Smuzhiyun 
808*4882a593Smuzhiyun 	if (!RREG32_SOC15(OSSSYS, 0, mmIH_CLK_CTRL))
809*4882a593Smuzhiyun 		*flags |= AMD_CG_SUPPORT_IH_CG;
810*4882a593Smuzhiyun 
811*4882a593Smuzhiyun 	return;
812*4882a593Smuzhiyun }
813*4882a593Smuzhiyun 
814*4882a593Smuzhiyun static const struct amd_ip_funcs navi10_ih_ip_funcs = {
815*4882a593Smuzhiyun 	.name = "navi10_ih",
816*4882a593Smuzhiyun 	.early_init = navi10_ih_early_init,
817*4882a593Smuzhiyun 	.late_init = NULL,
818*4882a593Smuzhiyun 	.sw_init = navi10_ih_sw_init,
819*4882a593Smuzhiyun 	.sw_fini = navi10_ih_sw_fini,
820*4882a593Smuzhiyun 	.hw_init = navi10_ih_hw_init,
821*4882a593Smuzhiyun 	.hw_fini = navi10_ih_hw_fini,
822*4882a593Smuzhiyun 	.suspend = navi10_ih_suspend,
823*4882a593Smuzhiyun 	.resume = navi10_ih_resume,
824*4882a593Smuzhiyun 	.is_idle = navi10_ih_is_idle,
825*4882a593Smuzhiyun 	.wait_for_idle = navi10_ih_wait_for_idle,
826*4882a593Smuzhiyun 	.soft_reset = navi10_ih_soft_reset,
827*4882a593Smuzhiyun 	.set_clockgating_state = navi10_ih_set_clockgating_state,
828*4882a593Smuzhiyun 	.set_powergating_state = navi10_ih_set_powergating_state,
829*4882a593Smuzhiyun 	.get_clockgating_state = navi10_ih_get_clockgating_state,
830*4882a593Smuzhiyun };
831*4882a593Smuzhiyun 
832*4882a593Smuzhiyun static const struct amdgpu_ih_funcs navi10_ih_funcs = {
833*4882a593Smuzhiyun 	.get_wptr = navi10_ih_get_wptr,
834*4882a593Smuzhiyun 	.decode_iv = navi10_ih_decode_iv,
835*4882a593Smuzhiyun 	.set_rptr = navi10_ih_set_rptr
836*4882a593Smuzhiyun };
837*4882a593Smuzhiyun 
navi10_ih_set_interrupt_funcs(struct amdgpu_device * adev)838*4882a593Smuzhiyun static void navi10_ih_set_interrupt_funcs(struct amdgpu_device *adev)
839*4882a593Smuzhiyun {
840*4882a593Smuzhiyun 	if (adev->irq.ih_funcs == NULL)
841*4882a593Smuzhiyun 		adev->irq.ih_funcs = &navi10_ih_funcs;
842*4882a593Smuzhiyun }
843*4882a593Smuzhiyun 
844*4882a593Smuzhiyun const struct amdgpu_ip_block_version navi10_ih_ip_block =
845*4882a593Smuzhiyun {
846*4882a593Smuzhiyun 	.type = AMD_IP_BLOCK_TYPE_IH,
847*4882a593Smuzhiyun 	.major = 5,
848*4882a593Smuzhiyun 	.minor = 0,
849*4882a593Smuzhiyun 	.rev = 0,
850*4882a593Smuzhiyun 	.funcs = &navi10_ih_ip_funcs,
851*4882a593Smuzhiyun };
852