1*4882a593Smuzhiyun /*
2*4882a593Smuzhiyun * Copyright 2015 Advanced Micro Devices, Inc.
3*4882a593Smuzhiyun *
4*4882a593Smuzhiyun * Permission is hereby granted, free of charge, to any person obtaining a
5*4882a593Smuzhiyun * copy of this software and associated documentation files (the "Software"),
6*4882a593Smuzhiyun * to deal in the Software without restriction, including without limitation
7*4882a593Smuzhiyun * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8*4882a593Smuzhiyun * and/or sell copies of the Software, and to permit persons to whom the
9*4882a593Smuzhiyun * Software is furnished to do so, subject to the following conditions:
10*4882a593Smuzhiyun *
11*4882a593Smuzhiyun * The above copyright notice and this permission notice shall be included in
12*4882a593Smuzhiyun * all copies or substantial portions of the Software.
13*4882a593Smuzhiyun *
14*4882a593Smuzhiyun * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
15*4882a593Smuzhiyun * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
16*4882a593Smuzhiyun * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
17*4882a593Smuzhiyun * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR
18*4882a593Smuzhiyun * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
19*4882a593Smuzhiyun * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
20*4882a593Smuzhiyun * OTHER DEALINGS IN THE SOFTWARE.
21*4882a593Smuzhiyun *
22*4882a593Smuzhiyun */
23*4882a593Smuzhiyun
24*4882a593Smuzhiyun #include <linux/pci.h>
25*4882a593Smuzhiyun
26*4882a593Smuzhiyun #include "amdgpu.h"
27*4882a593Smuzhiyun #include "amdgpu_ih.h"
28*4882a593Smuzhiyun #include "sid.h"
29*4882a593Smuzhiyun #include "si_ih.h"
30*4882a593Smuzhiyun #include "oss/oss_1_0_d.h"
31*4882a593Smuzhiyun #include "oss/oss_1_0_sh_mask.h"
32*4882a593Smuzhiyun
33*4882a593Smuzhiyun static void si_ih_set_interrupt_funcs(struct amdgpu_device *adev);
34*4882a593Smuzhiyun
si_ih_enable_interrupts(struct amdgpu_device * adev)35*4882a593Smuzhiyun static void si_ih_enable_interrupts(struct amdgpu_device *adev)
36*4882a593Smuzhiyun {
37*4882a593Smuzhiyun u32 ih_cntl = RREG32(IH_CNTL);
38*4882a593Smuzhiyun u32 ih_rb_cntl = RREG32(IH_RB_CNTL);
39*4882a593Smuzhiyun
40*4882a593Smuzhiyun ih_cntl |= ENABLE_INTR;
41*4882a593Smuzhiyun ih_rb_cntl |= IH_RB_ENABLE;
42*4882a593Smuzhiyun WREG32(IH_CNTL, ih_cntl);
43*4882a593Smuzhiyun WREG32(IH_RB_CNTL, ih_rb_cntl);
44*4882a593Smuzhiyun adev->irq.ih.enabled = true;
45*4882a593Smuzhiyun }
46*4882a593Smuzhiyun
si_ih_disable_interrupts(struct amdgpu_device * adev)47*4882a593Smuzhiyun static void si_ih_disable_interrupts(struct amdgpu_device *adev)
48*4882a593Smuzhiyun {
49*4882a593Smuzhiyun u32 ih_rb_cntl = RREG32(IH_RB_CNTL);
50*4882a593Smuzhiyun u32 ih_cntl = RREG32(IH_CNTL);
51*4882a593Smuzhiyun
52*4882a593Smuzhiyun ih_rb_cntl &= ~IH_RB_ENABLE;
53*4882a593Smuzhiyun ih_cntl &= ~ENABLE_INTR;
54*4882a593Smuzhiyun WREG32(IH_RB_CNTL, ih_rb_cntl);
55*4882a593Smuzhiyun WREG32(IH_CNTL, ih_cntl);
56*4882a593Smuzhiyun WREG32(IH_RB_RPTR, 0);
57*4882a593Smuzhiyun WREG32(IH_RB_WPTR, 0);
58*4882a593Smuzhiyun adev->irq.ih.enabled = false;
59*4882a593Smuzhiyun adev->irq.ih.rptr = 0;
60*4882a593Smuzhiyun }
61*4882a593Smuzhiyun
si_ih_irq_init(struct amdgpu_device * adev)62*4882a593Smuzhiyun static int si_ih_irq_init(struct amdgpu_device *adev)
63*4882a593Smuzhiyun {
64*4882a593Smuzhiyun struct amdgpu_ih_ring *ih = &adev->irq.ih;
65*4882a593Smuzhiyun int rb_bufsz;
66*4882a593Smuzhiyun u32 interrupt_cntl, ih_cntl, ih_rb_cntl;
67*4882a593Smuzhiyun
68*4882a593Smuzhiyun si_ih_disable_interrupts(adev);
69*4882a593Smuzhiyun /* set dummy read address to dummy page address */
70*4882a593Smuzhiyun WREG32(INTERRUPT_CNTL2, adev->dummy_page_addr >> 8);
71*4882a593Smuzhiyun interrupt_cntl = RREG32(INTERRUPT_CNTL);
72*4882a593Smuzhiyun interrupt_cntl &= ~IH_DUMMY_RD_OVERRIDE;
73*4882a593Smuzhiyun interrupt_cntl &= ~IH_REQ_NONSNOOP_EN;
74*4882a593Smuzhiyun WREG32(INTERRUPT_CNTL, interrupt_cntl);
75*4882a593Smuzhiyun
76*4882a593Smuzhiyun WREG32(IH_RB_BASE, adev->irq.ih.gpu_addr >> 8);
77*4882a593Smuzhiyun rb_bufsz = order_base_2(adev->irq.ih.ring_size / 4);
78*4882a593Smuzhiyun
79*4882a593Smuzhiyun ih_rb_cntl = IH_WPTR_OVERFLOW_ENABLE |
80*4882a593Smuzhiyun IH_WPTR_OVERFLOW_CLEAR |
81*4882a593Smuzhiyun (rb_bufsz << 1) |
82*4882a593Smuzhiyun IH_WPTR_WRITEBACK_ENABLE;
83*4882a593Smuzhiyun
84*4882a593Smuzhiyun WREG32(IH_RB_WPTR_ADDR_LO, lower_32_bits(ih->wptr_addr));
85*4882a593Smuzhiyun WREG32(IH_RB_WPTR_ADDR_HI, upper_32_bits(ih->wptr_addr) & 0xFF);
86*4882a593Smuzhiyun WREG32(IH_RB_CNTL, ih_rb_cntl);
87*4882a593Smuzhiyun WREG32(IH_RB_RPTR, 0);
88*4882a593Smuzhiyun WREG32(IH_RB_WPTR, 0);
89*4882a593Smuzhiyun
90*4882a593Smuzhiyun ih_cntl = MC_WRREQ_CREDIT(0x10) | MC_WR_CLEAN_CNT(0x10) | MC_VMID(0);
91*4882a593Smuzhiyun if (adev->irq.msi_enabled)
92*4882a593Smuzhiyun ih_cntl |= RPTR_REARM;
93*4882a593Smuzhiyun WREG32(IH_CNTL, ih_cntl);
94*4882a593Smuzhiyun
95*4882a593Smuzhiyun pci_set_master(adev->pdev);
96*4882a593Smuzhiyun si_ih_enable_interrupts(adev);
97*4882a593Smuzhiyun
98*4882a593Smuzhiyun return 0;
99*4882a593Smuzhiyun }
100*4882a593Smuzhiyun
si_ih_irq_disable(struct amdgpu_device * adev)101*4882a593Smuzhiyun static void si_ih_irq_disable(struct amdgpu_device *adev)
102*4882a593Smuzhiyun {
103*4882a593Smuzhiyun si_ih_disable_interrupts(adev);
104*4882a593Smuzhiyun mdelay(1);
105*4882a593Smuzhiyun }
106*4882a593Smuzhiyun
si_ih_get_wptr(struct amdgpu_device * adev,struct amdgpu_ih_ring * ih)107*4882a593Smuzhiyun static u32 si_ih_get_wptr(struct amdgpu_device *adev,
108*4882a593Smuzhiyun struct amdgpu_ih_ring *ih)
109*4882a593Smuzhiyun {
110*4882a593Smuzhiyun u32 wptr, tmp;
111*4882a593Smuzhiyun
112*4882a593Smuzhiyun wptr = le32_to_cpu(*ih->wptr_cpu);
113*4882a593Smuzhiyun
114*4882a593Smuzhiyun if (wptr & IH_RB_WPTR__RB_OVERFLOW_MASK) {
115*4882a593Smuzhiyun wptr &= ~IH_RB_WPTR__RB_OVERFLOW_MASK;
116*4882a593Smuzhiyun dev_warn(adev->dev, "IH ring buffer overflow (0x%08X, 0x%08X, 0x%08X)\n",
117*4882a593Smuzhiyun wptr, ih->rptr, (wptr + 16) & ih->ptr_mask);
118*4882a593Smuzhiyun ih->rptr = (wptr + 16) & ih->ptr_mask;
119*4882a593Smuzhiyun tmp = RREG32(IH_RB_CNTL);
120*4882a593Smuzhiyun tmp |= IH_RB_CNTL__WPTR_OVERFLOW_CLEAR_MASK;
121*4882a593Smuzhiyun WREG32(IH_RB_CNTL, tmp);
122*4882a593Smuzhiyun }
123*4882a593Smuzhiyun return (wptr & ih->ptr_mask);
124*4882a593Smuzhiyun }
125*4882a593Smuzhiyun
si_ih_decode_iv(struct amdgpu_device * adev,struct amdgpu_ih_ring * ih,struct amdgpu_iv_entry * entry)126*4882a593Smuzhiyun static void si_ih_decode_iv(struct amdgpu_device *adev,
127*4882a593Smuzhiyun struct amdgpu_ih_ring *ih,
128*4882a593Smuzhiyun struct amdgpu_iv_entry *entry)
129*4882a593Smuzhiyun {
130*4882a593Smuzhiyun u32 ring_index = ih->rptr >> 2;
131*4882a593Smuzhiyun uint32_t dw[4];
132*4882a593Smuzhiyun
133*4882a593Smuzhiyun dw[0] = le32_to_cpu(ih->ring[ring_index + 0]);
134*4882a593Smuzhiyun dw[1] = le32_to_cpu(ih->ring[ring_index + 1]);
135*4882a593Smuzhiyun dw[2] = le32_to_cpu(ih->ring[ring_index + 2]);
136*4882a593Smuzhiyun dw[3] = le32_to_cpu(ih->ring[ring_index + 3]);
137*4882a593Smuzhiyun
138*4882a593Smuzhiyun entry->client_id = AMDGPU_IRQ_CLIENTID_LEGACY;
139*4882a593Smuzhiyun entry->src_id = dw[0] & 0xff;
140*4882a593Smuzhiyun entry->src_data[0] = dw[1] & 0xfffffff;
141*4882a593Smuzhiyun entry->ring_id = dw[2] & 0xff;
142*4882a593Smuzhiyun entry->vmid = (dw[2] >> 8) & 0xff;
143*4882a593Smuzhiyun
144*4882a593Smuzhiyun ih->rptr += 16;
145*4882a593Smuzhiyun }
146*4882a593Smuzhiyun
si_ih_set_rptr(struct amdgpu_device * adev,struct amdgpu_ih_ring * ih)147*4882a593Smuzhiyun static void si_ih_set_rptr(struct amdgpu_device *adev,
148*4882a593Smuzhiyun struct amdgpu_ih_ring *ih)
149*4882a593Smuzhiyun {
150*4882a593Smuzhiyun WREG32(IH_RB_RPTR, ih->rptr);
151*4882a593Smuzhiyun }
152*4882a593Smuzhiyun
si_ih_early_init(void * handle)153*4882a593Smuzhiyun static int si_ih_early_init(void *handle)
154*4882a593Smuzhiyun {
155*4882a593Smuzhiyun struct amdgpu_device *adev = (struct amdgpu_device *)handle;
156*4882a593Smuzhiyun
157*4882a593Smuzhiyun si_ih_set_interrupt_funcs(adev);
158*4882a593Smuzhiyun
159*4882a593Smuzhiyun return 0;
160*4882a593Smuzhiyun }
161*4882a593Smuzhiyun
si_ih_sw_init(void * handle)162*4882a593Smuzhiyun static int si_ih_sw_init(void *handle)
163*4882a593Smuzhiyun {
164*4882a593Smuzhiyun int r;
165*4882a593Smuzhiyun struct amdgpu_device *adev = (struct amdgpu_device *)handle;
166*4882a593Smuzhiyun
167*4882a593Smuzhiyun r = amdgpu_ih_ring_init(adev, &adev->irq.ih, 64 * 1024, false);
168*4882a593Smuzhiyun if (r)
169*4882a593Smuzhiyun return r;
170*4882a593Smuzhiyun
171*4882a593Smuzhiyun return amdgpu_irq_init(adev);
172*4882a593Smuzhiyun }
173*4882a593Smuzhiyun
si_ih_sw_fini(void * handle)174*4882a593Smuzhiyun static int si_ih_sw_fini(void *handle)
175*4882a593Smuzhiyun {
176*4882a593Smuzhiyun struct amdgpu_device *adev = (struct amdgpu_device *)handle;
177*4882a593Smuzhiyun
178*4882a593Smuzhiyun amdgpu_irq_fini(adev);
179*4882a593Smuzhiyun amdgpu_ih_ring_fini(adev, &adev->irq.ih);
180*4882a593Smuzhiyun
181*4882a593Smuzhiyun return 0;
182*4882a593Smuzhiyun }
183*4882a593Smuzhiyun
si_ih_hw_init(void * handle)184*4882a593Smuzhiyun static int si_ih_hw_init(void *handle)
185*4882a593Smuzhiyun {
186*4882a593Smuzhiyun struct amdgpu_device *adev = (struct amdgpu_device *)handle;
187*4882a593Smuzhiyun
188*4882a593Smuzhiyun return si_ih_irq_init(adev);
189*4882a593Smuzhiyun }
190*4882a593Smuzhiyun
si_ih_hw_fini(void * handle)191*4882a593Smuzhiyun static int si_ih_hw_fini(void *handle)
192*4882a593Smuzhiyun {
193*4882a593Smuzhiyun struct amdgpu_device *adev = (struct amdgpu_device *)handle;
194*4882a593Smuzhiyun
195*4882a593Smuzhiyun si_ih_irq_disable(adev);
196*4882a593Smuzhiyun
197*4882a593Smuzhiyun return 0;
198*4882a593Smuzhiyun }
199*4882a593Smuzhiyun
si_ih_suspend(void * handle)200*4882a593Smuzhiyun static int si_ih_suspend(void *handle)
201*4882a593Smuzhiyun {
202*4882a593Smuzhiyun struct amdgpu_device *adev = (struct amdgpu_device *)handle;
203*4882a593Smuzhiyun
204*4882a593Smuzhiyun return si_ih_hw_fini(adev);
205*4882a593Smuzhiyun }
206*4882a593Smuzhiyun
si_ih_resume(void * handle)207*4882a593Smuzhiyun static int si_ih_resume(void *handle)
208*4882a593Smuzhiyun {
209*4882a593Smuzhiyun struct amdgpu_device *adev = (struct amdgpu_device *)handle;
210*4882a593Smuzhiyun
211*4882a593Smuzhiyun return si_ih_hw_init(adev);
212*4882a593Smuzhiyun }
213*4882a593Smuzhiyun
si_ih_is_idle(void * handle)214*4882a593Smuzhiyun static bool si_ih_is_idle(void *handle)
215*4882a593Smuzhiyun {
216*4882a593Smuzhiyun struct amdgpu_device *adev = (struct amdgpu_device *)handle;
217*4882a593Smuzhiyun u32 tmp = RREG32(SRBM_STATUS);
218*4882a593Smuzhiyun
219*4882a593Smuzhiyun if (tmp & SRBM_STATUS__IH_BUSY_MASK)
220*4882a593Smuzhiyun return false;
221*4882a593Smuzhiyun
222*4882a593Smuzhiyun return true;
223*4882a593Smuzhiyun }
224*4882a593Smuzhiyun
si_ih_wait_for_idle(void * handle)225*4882a593Smuzhiyun static int si_ih_wait_for_idle(void *handle)
226*4882a593Smuzhiyun {
227*4882a593Smuzhiyun unsigned i;
228*4882a593Smuzhiyun struct amdgpu_device *adev = (struct amdgpu_device *)handle;
229*4882a593Smuzhiyun
230*4882a593Smuzhiyun for (i = 0; i < adev->usec_timeout; i++) {
231*4882a593Smuzhiyun if (si_ih_is_idle(handle))
232*4882a593Smuzhiyun return 0;
233*4882a593Smuzhiyun udelay(1);
234*4882a593Smuzhiyun }
235*4882a593Smuzhiyun return -ETIMEDOUT;
236*4882a593Smuzhiyun }
237*4882a593Smuzhiyun
si_ih_soft_reset(void * handle)238*4882a593Smuzhiyun static int si_ih_soft_reset(void *handle)
239*4882a593Smuzhiyun {
240*4882a593Smuzhiyun struct amdgpu_device *adev = (struct amdgpu_device *)handle;
241*4882a593Smuzhiyun
242*4882a593Smuzhiyun u32 srbm_soft_reset = 0;
243*4882a593Smuzhiyun u32 tmp = RREG32(SRBM_STATUS);
244*4882a593Smuzhiyun
245*4882a593Smuzhiyun if (tmp & SRBM_STATUS__IH_BUSY_MASK)
246*4882a593Smuzhiyun srbm_soft_reset |= SRBM_SOFT_RESET__SOFT_RESET_IH_MASK;
247*4882a593Smuzhiyun
248*4882a593Smuzhiyun if (srbm_soft_reset) {
249*4882a593Smuzhiyun tmp = RREG32(SRBM_SOFT_RESET);
250*4882a593Smuzhiyun tmp |= srbm_soft_reset;
251*4882a593Smuzhiyun dev_info(adev->dev, "SRBM_SOFT_RESET=0x%08X\n", tmp);
252*4882a593Smuzhiyun WREG32(SRBM_SOFT_RESET, tmp);
253*4882a593Smuzhiyun tmp = RREG32(SRBM_SOFT_RESET);
254*4882a593Smuzhiyun
255*4882a593Smuzhiyun udelay(50);
256*4882a593Smuzhiyun
257*4882a593Smuzhiyun tmp &= ~srbm_soft_reset;
258*4882a593Smuzhiyun WREG32(SRBM_SOFT_RESET, tmp);
259*4882a593Smuzhiyun tmp = RREG32(SRBM_SOFT_RESET);
260*4882a593Smuzhiyun
261*4882a593Smuzhiyun udelay(50);
262*4882a593Smuzhiyun }
263*4882a593Smuzhiyun
264*4882a593Smuzhiyun return 0;
265*4882a593Smuzhiyun }
266*4882a593Smuzhiyun
si_ih_set_clockgating_state(void * handle,enum amd_clockgating_state state)267*4882a593Smuzhiyun static int si_ih_set_clockgating_state(void *handle,
268*4882a593Smuzhiyun enum amd_clockgating_state state)
269*4882a593Smuzhiyun {
270*4882a593Smuzhiyun return 0;
271*4882a593Smuzhiyun }
272*4882a593Smuzhiyun
si_ih_set_powergating_state(void * handle,enum amd_powergating_state state)273*4882a593Smuzhiyun static int si_ih_set_powergating_state(void *handle,
274*4882a593Smuzhiyun enum amd_powergating_state state)
275*4882a593Smuzhiyun {
276*4882a593Smuzhiyun return 0;
277*4882a593Smuzhiyun }
278*4882a593Smuzhiyun
279*4882a593Smuzhiyun static const struct amd_ip_funcs si_ih_ip_funcs = {
280*4882a593Smuzhiyun .name = "si_ih",
281*4882a593Smuzhiyun .early_init = si_ih_early_init,
282*4882a593Smuzhiyun .late_init = NULL,
283*4882a593Smuzhiyun .sw_init = si_ih_sw_init,
284*4882a593Smuzhiyun .sw_fini = si_ih_sw_fini,
285*4882a593Smuzhiyun .hw_init = si_ih_hw_init,
286*4882a593Smuzhiyun .hw_fini = si_ih_hw_fini,
287*4882a593Smuzhiyun .suspend = si_ih_suspend,
288*4882a593Smuzhiyun .resume = si_ih_resume,
289*4882a593Smuzhiyun .is_idle = si_ih_is_idle,
290*4882a593Smuzhiyun .wait_for_idle = si_ih_wait_for_idle,
291*4882a593Smuzhiyun .soft_reset = si_ih_soft_reset,
292*4882a593Smuzhiyun .set_clockgating_state = si_ih_set_clockgating_state,
293*4882a593Smuzhiyun .set_powergating_state = si_ih_set_powergating_state,
294*4882a593Smuzhiyun };
295*4882a593Smuzhiyun
296*4882a593Smuzhiyun static const struct amdgpu_ih_funcs si_ih_funcs = {
297*4882a593Smuzhiyun .get_wptr = si_ih_get_wptr,
298*4882a593Smuzhiyun .decode_iv = si_ih_decode_iv,
299*4882a593Smuzhiyun .set_rptr = si_ih_set_rptr
300*4882a593Smuzhiyun };
301*4882a593Smuzhiyun
si_ih_set_interrupt_funcs(struct amdgpu_device * adev)302*4882a593Smuzhiyun static void si_ih_set_interrupt_funcs(struct amdgpu_device *adev)
303*4882a593Smuzhiyun {
304*4882a593Smuzhiyun adev->irq.ih_funcs = &si_ih_funcs;
305*4882a593Smuzhiyun }
306*4882a593Smuzhiyun
307*4882a593Smuzhiyun const struct amdgpu_ip_block_version si_ih_ip_block =
308*4882a593Smuzhiyun {
309*4882a593Smuzhiyun .type = AMD_IP_BLOCK_TYPE_IH,
310*4882a593Smuzhiyun .major = 1,
311*4882a593Smuzhiyun .minor = 0,
312*4882a593Smuzhiyun .rev = 0,
313*4882a593Smuzhiyun .funcs = &si_ih_ip_funcs,
314*4882a593Smuzhiyun };
315