1*4882a593Smuzhiyun /*
2*4882a593Smuzhiyun * This file is provided under a dual BSD/GPLv2 license. When using or
3*4882a593Smuzhiyun * redistributing this file, you may do so under either license.
4*4882a593Smuzhiyun *
5*4882a593Smuzhiyun * GPL LICENSE SUMMARY
6*4882a593Smuzhiyun *
7*4882a593Smuzhiyun * Copyright (C) 2016 Advanced Micro Devices, Inc. All Rights Reserved.
8*4882a593Smuzhiyun * Copyright (C) 2016 T-Platforms. All Rights Reserved.
9*4882a593Smuzhiyun *
10*4882a593Smuzhiyun * This program is free software; you can redistribute it and/or modify
11*4882a593Smuzhiyun * it under the terms of version 2 of the GNU General Public License as
12*4882a593Smuzhiyun * published by the Free Software Foundation.
13*4882a593Smuzhiyun *
14*4882a593Smuzhiyun * BSD LICENSE
15*4882a593Smuzhiyun *
16*4882a593Smuzhiyun * Copyright (C) 2016 Advanced Micro Devices, Inc. All Rights Reserved.
17*4882a593Smuzhiyun * Copyright (C) 2016 T-Platforms. All Rights Reserved.
18*4882a593Smuzhiyun *
19*4882a593Smuzhiyun * Redistribution and use in source and binary forms, with or without
20*4882a593Smuzhiyun * modification, are permitted provided that the following conditions
21*4882a593Smuzhiyun * are met:
22*4882a593Smuzhiyun *
23*4882a593Smuzhiyun * * Redistributions of source code must retain the above copyright
24*4882a593Smuzhiyun * notice, this list of conditions and the following disclaimer.
25*4882a593Smuzhiyun * * Redistributions in binary form must reproduce the above copy
26*4882a593Smuzhiyun * notice, this list of conditions and the following disclaimer in
27*4882a593Smuzhiyun * the documentation and/or other materials provided with the
28*4882a593Smuzhiyun * distribution.
29*4882a593Smuzhiyun * * Neither the name of AMD Corporation nor the names of its
30*4882a593Smuzhiyun * contributors may be used to endorse or promote products derived
31*4882a593Smuzhiyun * from this software without specific prior written permission.
32*4882a593Smuzhiyun *
33*4882a593Smuzhiyun * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
34*4882a593Smuzhiyun * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
35*4882a593Smuzhiyun * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
36*4882a593Smuzhiyun * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
37*4882a593Smuzhiyun * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
38*4882a593Smuzhiyun * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
39*4882a593Smuzhiyun * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
40*4882a593Smuzhiyun * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
41*4882a593Smuzhiyun * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
42*4882a593Smuzhiyun * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
43*4882a593Smuzhiyun * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
44*4882a593Smuzhiyun *
45*4882a593Smuzhiyun * AMD PCIe NTB Linux driver
46*4882a593Smuzhiyun *
47*4882a593Smuzhiyun * Contact Information:
48*4882a593Smuzhiyun * Xiangliang Yu <Xiangliang.Yu@amd.com>
49*4882a593Smuzhiyun */
50*4882a593Smuzhiyun
51*4882a593Smuzhiyun #include <linux/debugfs.h>
52*4882a593Smuzhiyun #include <linux/delay.h>
53*4882a593Smuzhiyun #include <linux/init.h>
54*4882a593Smuzhiyun #include <linux/interrupt.h>
55*4882a593Smuzhiyun #include <linux/module.h>
56*4882a593Smuzhiyun #include <linux/acpi.h>
57*4882a593Smuzhiyun #include <linux/pci.h>
58*4882a593Smuzhiyun #include <linux/random.h>
59*4882a593Smuzhiyun #include <linux/slab.h>
60*4882a593Smuzhiyun #include <linux/ntb.h>
61*4882a593Smuzhiyun
62*4882a593Smuzhiyun #include "ntb_hw_amd.h"
63*4882a593Smuzhiyun
64*4882a593Smuzhiyun #define NTB_NAME "ntb_hw_amd"
65*4882a593Smuzhiyun #define NTB_DESC "AMD(R) PCI-E Non-Transparent Bridge Driver"
66*4882a593Smuzhiyun #define NTB_VER "1.0"
67*4882a593Smuzhiyun
68*4882a593Smuzhiyun MODULE_DESCRIPTION(NTB_DESC);
69*4882a593Smuzhiyun MODULE_VERSION(NTB_VER);
70*4882a593Smuzhiyun MODULE_LICENSE("Dual BSD/GPL");
71*4882a593Smuzhiyun MODULE_AUTHOR("AMD Inc.");
72*4882a593Smuzhiyun
73*4882a593Smuzhiyun static const struct file_operations amd_ntb_debugfs_info;
74*4882a593Smuzhiyun static struct dentry *debugfs_dir;
75*4882a593Smuzhiyun
ndev_mw_to_bar(struct amd_ntb_dev * ndev,int idx)76*4882a593Smuzhiyun static int ndev_mw_to_bar(struct amd_ntb_dev *ndev, int idx)
77*4882a593Smuzhiyun {
78*4882a593Smuzhiyun if (idx < 0 || idx > ndev->mw_count)
79*4882a593Smuzhiyun return -EINVAL;
80*4882a593Smuzhiyun
81*4882a593Smuzhiyun return ndev->dev_data->mw_idx << idx;
82*4882a593Smuzhiyun }
83*4882a593Smuzhiyun
amd_ntb_mw_count(struct ntb_dev * ntb,int pidx)84*4882a593Smuzhiyun static int amd_ntb_mw_count(struct ntb_dev *ntb, int pidx)
85*4882a593Smuzhiyun {
86*4882a593Smuzhiyun if (pidx != NTB_DEF_PEER_IDX)
87*4882a593Smuzhiyun return -EINVAL;
88*4882a593Smuzhiyun
89*4882a593Smuzhiyun return ntb_ndev(ntb)->mw_count;
90*4882a593Smuzhiyun }
91*4882a593Smuzhiyun
amd_ntb_mw_get_align(struct ntb_dev * ntb,int pidx,int idx,resource_size_t * addr_align,resource_size_t * size_align,resource_size_t * size_max)92*4882a593Smuzhiyun static int amd_ntb_mw_get_align(struct ntb_dev *ntb, int pidx, int idx,
93*4882a593Smuzhiyun resource_size_t *addr_align,
94*4882a593Smuzhiyun resource_size_t *size_align,
95*4882a593Smuzhiyun resource_size_t *size_max)
96*4882a593Smuzhiyun {
97*4882a593Smuzhiyun struct amd_ntb_dev *ndev = ntb_ndev(ntb);
98*4882a593Smuzhiyun int bar;
99*4882a593Smuzhiyun
100*4882a593Smuzhiyun if (pidx != NTB_DEF_PEER_IDX)
101*4882a593Smuzhiyun return -EINVAL;
102*4882a593Smuzhiyun
103*4882a593Smuzhiyun bar = ndev_mw_to_bar(ndev, idx);
104*4882a593Smuzhiyun if (bar < 0)
105*4882a593Smuzhiyun return bar;
106*4882a593Smuzhiyun
107*4882a593Smuzhiyun if (addr_align)
108*4882a593Smuzhiyun *addr_align = SZ_4K;
109*4882a593Smuzhiyun
110*4882a593Smuzhiyun if (size_align)
111*4882a593Smuzhiyun *size_align = 1;
112*4882a593Smuzhiyun
113*4882a593Smuzhiyun if (size_max)
114*4882a593Smuzhiyun *size_max = pci_resource_len(ndev->ntb.pdev, bar);
115*4882a593Smuzhiyun
116*4882a593Smuzhiyun return 0;
117*4882a593Smuzhiyun }
118*4882a593Smuzhiyun
amd_ntb_mw_set_trans(struct ntb_dev * ntb,int pidx,int idx,dma_addr_t addr,resource_size_t size)119*4882a593Smuzhiyun static int amd_ntb_mw_set_trans(struct ntb_dev *ntb, int pidx, int idx,
120*4882a593Smuzhiyun dma_addr_t addr, resource_size_t size)
121*4882a593Smuzhiyun {
122*4882a593Smuzhiyun struct amd_ntb_dev *ndev = ntb_ndev(ntb);
123*4882a593Smuzhiyun unsigned long xlat_reg, limit_reg = 0;
124*4882a593Smuzhiyun resource_size_t mw_size;
125*4882a593Smuzhiyun void __iomem *mmio, *peer_mmio;
126*4882a593Smuzhiyun u64 base_addr, limit, reg_val;
127*4882a593Smuzhiyun int bar;
128*4882a593Smuzhiyun
129*4882a593Smuzhiyun if (pidx != NTB_DEF_PEER_IDX)
130*4882a593Smuzhiyun return -EINVAL;
131*4882a593Smuzhiyun
132*4882a593Smuzhiyun bar = ndev_mw_to_bar(ndev, idx);
133*4882a593Smuzhiyun if (bar < 0)
134*4882a593Smuzhiyun return bar;
135*4882a593Smuzhiyun
136*4882a593Smuzhiyun mw_size = pci_resource_len(ntb->pdev, bar);
137*4882a593Smuzhiyun
138*4882a593Smuzhiyun /* make sure the range fits in the usable mw size */
139*4882a593Smuzhiyun if (size > mw_size)
140*4882a593Smuzhiyun return -EINVAL;
141*4882a593Smuzhiyun
142*4882a593Smuzhiyun mmio = ndev->self_mmio;
143*4882a593Smuzhiyun peer_mmio = ndev->peer_mmio;
144*4882a593Smuzhiyun
145*4882a593Smuzhiyun base_addr = pci_resource_start(ntb->pdev, bar);
146*4882a593Smuzhiyun
147*4882a593Smuzhiyun if (bar != 1) {
148*4882a593Smuzhiyun xlat_reg = AMD_BAR23XLAT_OFFSET + ((bar - 2) << 2);
149*4882a593Smuzhiyun limit_reg = AMD_BAR23LMT_OFFSET + ((bar - 2) << 2);
150*4882a593Smuzhiyun
151*4882a593Smuzhiyun /* Set the limit if supported */
152*4882a593Smuzhiyun limit = size;
153*4882a593Smuzhiyun
154*4882a593Smuzhiyun /* set and verify setting the translation address */
155*4882a593Smuzhiyun write64(addr, peer_mmio + xlat_reg);
156*4882a593Smuzhiyun reg_val = read64(peer_mmio + xlat_reg);
157*4882a593Smuzhiyun if (reg_val != addr) {
158*4882a593Smuzhiyun write64(0, peer_mmio + xlat_reg);
159*4882a593Smuzhiyun return -EIO;
160*4882a593Smuzhiyun }
161*4882a593Smuzhiyun
162*4882a593Smuzhiyun /* set and verify setting the limit */
163*4882a593Smuzhiyun write64(limit, peer_mmio + limit_reg);
164*4882a593Smuzhiyun reg_val = read64(peer_mmio + limit_reg);
165*4882a593Smuzhiyun if (reg_val != limit) {
166*4882a593Smuzhiyun write64(base_addr, mmio + limit_reg);
167*4882a593Smuzhiyun write64(0, peer_mmio + xlat_reg);
168*4882a593Smuzhiyun return -EIO;
169*4882a593Smuzhiyun }
170*4882a593Smuzhiyun } else {
171*4882a593Smuzhiyun xlat_reg = AMD_BAR1XLAT_OFFSET;
172*4882a593Smuzhiyun limit_reg = AMD_BAR1LMT_OFFSET;
173*4882a593Smuzhiyun
174*4882a593Smuzhiyun /* Set the limit if supported */
175*4882a593Smuzhiyun limit = size;
176*4882a593Smuzhiyun
177*4882a593Smuzhiyun /* set and verify setting the translation address */
178*4882a593Smuzhiyun write64(addr, peer_mmio + xlat_reg);
179*4882a593Smuzhiyun reg_val = read64(peer_mmio + xlat_reg);
180*4882a593Smuzhiyun if (reg_val != addr) {
181*4882a593Smuzhiyun write64(0, peer_mmio + xlat_reg);
182*4882a593Smuzhiyun return -EIO;
183*4882a593Smuzhiyun }
184*4882a593Smuzhiyun
185*4882a593Smuzhiyun /* set and verify setting the limit */
186*4882a593Smuzhiyun writel(limit, peer_mmio + limit_reg);
187*4882a593Smuzhiyun reg_val = readl(peer_mmio + limit_reg);
188*4882a593Smuzhiyun if (reg_val != limit) {
189*4882a593Smuzhiyun writel(base_addr, mmio + limit_reg);
190*4882a593Smuzhiyun writel(0, peer_mmio + xlat_reg);
191*4882a593Smuzhiyun return -EIO;
192*4882a593Smuzhiyun }
193*4882a593Smuzhiyun }
194*4882a593Smuzhiyun
195*4882a593Smuzhiyun return 0;
196*4882a593Smuzhiyun }
197*4882a593Smuzhiyun
amd_ntb_get_link_status(struct amd_ntb_dev * ndev)198*4882a593Smuzhiyun static int amd_ntb_get_link_status(struct amd_ntb_dev *ndev)
199*4882a593Smuzhiyun {
200*4882a593Smuzhiyun struct pci_dev *pdev = NULL;
201*4882a593Smuzhiyun struct pci_dev *pci_swds = NULL;
202*4882a593Smuzhiyun struct pci_dev *pci_swus = NULL;
203*4882a593Smuzhiyun u32 stat;
204*4882a593Smuzhiyun int rc;
205*4882a593Smuzhiyun
206*4882a593Smuzhiyun if (ndev->ntb.topo == NTB_TOPO_SEC) {
207*4882a593Smuzhiyun /* Locate the pointer to Downstream Switch for this device */
208*4882a593Smuzhiyun pci_swds = pci_upstream_bridge(ndev->ntb.pdev);
209*4882a593Smuzhiyun if (pci_swds) {
210*4882a593Smuzhiyun /*
211*4882a593Smuzhiyun * Locate the pointer to Upstream Switch for
212*4882a593Smuzhiyun * the Downstream Switch.
213*4882a593Smuzhiyun */
214*4882a593Smuzhiyun pci_swus = pci_upstream_bridge(pci_swds);
215*4882a593Smuzhiyun if (pci_swus) {
216*4882a593Smuzhiyun rc = pcie_capability_read_dword(pci_swus,
217*4882a593Smuzhiyun PCI_EXP_LNKCTL,
218*4882a593Smuzhiyun &stat);
219*4882a593Smuzhiyun if (rc)
220*4882a593Smuzhiyun return 0;
221*4882a593Smuzhiyun } else {
222*4882a593Smuzhiyun return 0;
223*4882a593Smuzhiyun }
224*4882a593Smuzhiyun } else {
225*4882a593Smuzhiyun return 0;
226*4882a593Smuzhiyun }
227*4882a593Smuzhiyun } else if (ndev->ntb.topo == NTB_TOPO_PRI) {
228*4882a593Smuzhiyun /*
229*4882a593Smuzhiyun * For NTB primary, we simply read the Link Status and control
230*4882a593Smuzhiyun * register of the NTB device itself.
231*4882a593Smuzhiyun */
232*4882a593Smuzhiyun pdev = ndev->ntb.pdev;
233*4882a593Smuzhiyun rc = pcie_capability_read_dword(pdev, PCI_EXP_LNKCTL, &stat);
234*4882a593Smuzhiyun if (rc)
235*4882a593Smuzhiyun return 0;
236*4882a593Smuzhiyun } else {
237*4882a593Smuzhiyun /* Catch all for everything else */
238*4882a593Smuzhiyun return 0;
239*4882a593Smuzhiyun }
240*4882a593Smuzhiyun
241*4882a593Smuzhiyun ndev->lnk_sta = stat;
242*4882a593Smuzhiyun
243*4882a593Smuzhiyun return 1;
244*4882a593Smuzhiyun }
245*4882a593Smuzhiyun
amd_link_is_up(struct amd_ntb_dev * ndev)246*4882a593Smuzhiyun static int amd_link_is_up(struct amd_ntb_dev *ndev)
247*4882a593Smuzhiyun {
248*4882a593Smuzhiyun int ret;
249*4882a593Smuzhiyun
250*4882a593Smuzhiyun /*
251*4882a593Smuzhiyun * We consider the link to be up under two conditions:
252*4882a593Smuzhiyun *
253*4882a593Smuzhiyun * - When a link-up event is received. This is indicated by
254*4882a593Smuzhiyun * AMD_LINK_UP_EVENT set in peer_sta.
255*4882a593Smuzhiyun * - When driver on both sides of the link have been loaded.
256*4882a593Smuzhiyun * This is indicated by bit 1 being set in the peer
257*4882a593Smuzhiyun * SIDEINFO register.
258*4882a593Smuzhiyun *
259*4882a593Smuzhiyun * This function should return 1 when the latter of the above
260*4882a593Smuzhiyun * two conditions is true.
261*4882a593Smuzhiyun *
262*4882a593Smuzhiyun * Now consider the sequence of events - Link-Up event occurs,
263*4882a593Smuzhiyun * then the peer side driver loads. In this case, we would have
264*4882a593Smuzhiyun * received LINK_UP event and bit 1 of peer SIDEINFO is also
265*4882a593Smuzhiyun * set. What happens now if the link goes down? Bit 1 of
266*4882a593Smuzhiyun * peer SIDEINFO remains set, but LINK_DOWN bit is set in
267*4882a593Smuzhiyun * peer_sta. So we should return 0 from this function. Not only
268*4882a593Smuzhiyun * that, we clear bit 1 of peer SIDEINFO to 0, since the peer
269*4882a593Smuzhiyun * side driver did not even get a chance to clear it before
270*4882a593Smuzhiyun * the link went down. This can be the case of surprise link
271*4882a593Smuzhiyun * removal.
272*4882a593Smuzhiyun *
273*4882a593Smuzhiyun * LINK_UP event will always occur before the peer side driver
274*4882a593Smuzhiyun * gets loaded the very first time. So there can be a case when
275*4882a593Smuzhiyun * the LINK_UP event has occurred, but the peer side driver hasn't
276*4882a593Smuzhiyun * yet loaded. We return 0 in that case.
277*4882a593Smuzhiyun *
278*4882a593Smuzhiyun * There is also a special case when the primary side driver is
279*4882a593Smuzhiyun * unloaded and then loaded again. Since there is no change in
280*4882a593Smuzhiyun * the status of NTB secondary in this case, there is no Link-Up
281*4882a593Smuzhiyun * or Link-Down notification received. We recognize this condition
282*4882a593Smuzhiyun * with peer_sta being set to 0.
283*4882a593Smuzhiyun *
284*4882a593Smuzhiyun * If bit 1 of peer SIDEINFO register is not set, then we
285*4882a593Smuzhiyun * simply return 0 irrespective of the link up or down status
286*4882a593Smuzhiyun * set in peer_sta.
287*4882a593Smuzhiyun */
288*4882a593Smuzhiyun ret = amd_poll_link(ndev);
289*4882a593Smuzhiyun if (ret) {
290*4882a593Smuzhiyun /*
291*4882a593Smuzhiyun * We need to check the below only for NTB primary. For NTB
292*4882a593Smuzhiyun * secondary, simply checking the result of PSIDE_INFO
293*4882a593Smuzhiyun * register will suffice.
294*4882a593Smuzhiyun */
295*4882a593Smuzhiyun if (ndev->ntb.topo == NTB_TOPO_PRI) {
296*4882a593Smuzhiyun if ((ndev->peer_sta & AMD_LINK_UP_EVENT) ||
297*4882a593Smuzhiyun (ndev->peer_sta == 0))
298*4882a593Smuzhiyun return ret;
299*4882a593Smuzhiyun else if (ndev->peer_sta & AMD_LINK_DOWN_EVENT) {
300*4882a593Smuzhiyun /* Clear peer sideinfo register */
301*4882a593Smuzhiyun amd_clear_side_info_reg(ndev, true);
302*4882a593Smuzhiyun
303*4882a593Smuzhiyun return 0;
304*4882a593Smuzhiyun }
305*4882a593Smuzhiyun } else { /* NTB_TOPO_SEC */
306*4882a593Smuzhiyun return ret;
307*4882a593Smuzhiyun }
308*4882a593Smuzhiyun }
309*4882a593Smuzhiyun
310*4882a593Smuzhiyun return 0;
311*4882a593Smuzhiyun }
312*4882a593Smuzhiyun
amd_ntb_link_is_up(struct ntb_dev * ntb,enum ntb_speed * speed,enum ntb_width * width)313*4882a593Smuzhiyun static u64 amd_ntb_link_is_up(struct ntb_dev *ntb,
314*4882a593Smuzhiyun enum ntb_speed *speed,
315*4882a593Smuzhiyun enum ntb_width *width)
316*4882a593Smuzhiyun {
317*4882a593Smuzhiyun struct amd_ntb_dev *ndev = ntb_ndev(ntb);
318*4882a593Smuzhiyun int ret = 0;
319*4882a593Smuzhiyun
320*4882a593Smuzhiyun if (amd_link_is_up(ndev)) {
321*4882a593Smuzhiyun if (speed)
322*4882a593Smuzhiyun *speed = NTB_LNK_STA_SPEED(ndev->lnk_sta);
323*4882a593Smuzhiyun if (width)
324*4882a593Smuzhiyun *width = NTB_LNK_STA_WIDTH(ndev->lnk_sta);
325*4882a593Smuzhiyun
326*4882a593Smuzhiyun dev_dbg(&ntb->pdev->dev, "link is up.\n");
327*4882a593Smuzhiyun
328*4882a593Smuzhiyun ret = 1;
329*4882a593Smuzhiyun } else {
330*4882a593Smuzhiyun if (speed)
331*4882a593Smuzhiyun *speed = NTB_SPEED_NONE;
332*4882a593Smuzhiyun if (width)
333*4882a593Smuzhiyun *width = NTB_WIDTH_NONE;
334*4882a593Smuzhiyun
335*4882a593Smuzhiyun dev_dbg(&ntb->pdev->dev, "link is down.\n");
336*4882a593Smuzhiyun }
337*4882a593Smuzhiyun
338*4882a593Smuzhiyun return ret;
339*4882a593Smuzhiyun }
340*4882a593Smuzhiyun
amd_ntb_link_enable(struct ntb_dev * ntb,enum ntb_speed max_speed,enum ntb_width max_width)341*4882a593Smuzhiyun static int amd_ntb_link_enable(struct ntb_dev *ntb,
342*4882a593Smuzhiyun enum ntb_speed max_speed,
343*4882a593Smuzhiyun enum ntb_width max_width)
344*4882a593Smuzhiyun {
345*4882a593Smuzhiyun struct amd_ntb_dev *ndev = ntb_ndev(ntb);
346*4882a593Smuzhiyun void __iomem *mmio = ndev->self_mmio;
347*4882a593Smuzhiyun
348*4882a593Smuzhiyun /* Enable event interrupt */
349*4882a593Smuzhiyun ndev->int_mask &= ~AMD_EVENT_INTMASK;
350*4882a593Smuzhiyun writel(ndev->int_mask, mmio + AMD_INTMASK_OFFSET);
351*4882a593Smuzhiyun
352*4882a593Smuzhiyun if (ndev->ntb.topo == NTB_TOPO_SEC)
353*4882a593Smuzhiyun return -EINVAL;
354*4882a593Smuzhiyun dev_dbg(&ntb->pdev->dev, "Enabling Link.\n");
355*4882a593Smuzhiyun
356*4882a593Smuzhiyun return 0;
357*4882a593Smuzhiyun }
358*4882a593Smuzhiyun
amd_ntb_link_disable(struct ntb_dev * ntb)359*4882a593Smuzhiyun static int amd_ntb_link_disable(struct ntb_dev *ntb)
360*4882a593Smuzhiyun {
361*4882a593Smuzhiyun struct amd_ntb_dev *ndev = ntb_ndev(ntb);
362*4882a593Smuzhiyun void __iomem *mmio = ndev->self_mmio;
363*4882a593Smuzhiyun
364*4882a593Smuzhiyun /* Disable event interrupt */
365*4882a593Smuzhiyun ndev->int_mask |= AMD_EVENT_INTMASK;
366*4882a593Smuzhiyun writel(ndev->int_mask, mmio + AMD_INTMASK_OFFSET);
367*4882a593Smuzhiyun
368*4882a593Smuzhiyun if (ndev->ntb.topo == NTB_TOPO_SEC)
369*4882a593Smuzhiyun return -EINVAL;
370*4882a593Smuzhiyun dev_dbg(&ntb->pdev->dev, "Enabling Link.\n");
371*4882a593Smuzhiyun
372*4882a593Smuzhiyun return 0;
373*4882a593Smuzhiyun }
374*4882a593Smuzhiyun
amd_ntb_peer_mw_count(struct ntb_dev * ntb)375*4882a593Smuzhiyun static int amd_ntb_peer_mw_count(struct ntb_dev *ntb)
376*4882a593Smuzhiyun {
377*4882a593Smuzhiyun /* The same as for inbound MWs */
378*4882a593Smuzhiyun return ntb_ndev(ntb)->mw_count;
379*4882a593Smuzhiyun }
380*4882a593Smuzhiyun
amd_ntb_peer_mw_get_addr(struct ntb_dev * ntb,int idx,phys_addr_t * base,resource_size_t * size)381*4882a593Smuzhiyun static int amd_ntb_peer_mw_get_addr(struct ntb_dev *ntb, int idx,
382*4882a593Smuzhiyun phys_addr_t *base, resource_size_t *size)
383*4882a593Smuzhiyun {
384*4882a593Smuzhiyun struct amd_ntb_dev *ndev = ntb_ndev(ntb);
385*4882a593Smuzhiyun int bar;
386*4882a593Smuzhiyun
387*4882a593Smuzhiyun bar = ndev_mw_to_bar(ndev, idx);
388*4882a593Smuzhiyun if (bar < 0)
389*4882a593Smuzhiyun return bar;
390*4882a593Smuzhiyun
391*4882a593Smuzhiyun if (base)
392*4882a593Smuzhiyun *base = pci_resource_start(ndev->ntb.pdev, bar);
393*4882a593Smuzhiyun
394*4882a593Smuzhiyun if (size)
395*4882a593Smuzhiyun *size = pci_resource_len(ndev->ntb.pdev, bar);
396*4882a593Smuzhiyun
397*4882a593Smuzhiyun return 0;
398*4882a593Smuzhiyun }
399*4882a593Smuzhiyun
amd_ntb_db_valid_mask(struct ntb_dev * ntb)400*4882a593Smuzhiyun static u64 amd_ntb_db_valid_mask(struct ntb_dev *ntb)
401*4882a593Smuzhiyun {
402*4882a593Smuzhiyun return ntb_ndev(ntb)->db_valid_mask;
403*4882a593Smuzhiyun }
404*4882a593Smuzhiyun
amd_ntb_db_vector_count(struct ntb_dev * ntb)405*4882a593Smuzhiyun static int amd_ntb_db_vector_count(struct ntb_dev *ntb)
406*4882a593Smuzhiyun {
407*4882a593Smuzhiyun return ntb_ndev(ntb)->db_count;
408*4882a593Smuzhiyun }
409*4882a593Smuzhiyun
amd_ntb_db_vector_mask(struct ntb_dev * ntb,int db_vector)410*4882a593Smuzhiyun static u64 amd_ntb_db_vector_mask(struct ntb_dev *ntb, int db_vector)
411*4882a593Smuzhiyun {
412*4882a593Smuzhiyun struct amd_ntb_dev *ndev = ntb_ndev(ntb);
413*4882a593Smuzhiyun
414*4882a593Smuzhiyun if (db_vector < 0 || db_vector > ndev->db_count)
415*4882a593Smuzhiyun return 0;
416*4882a593Smuzhiyun
417*4882a593Smuzhiyun return ntb_ndev(ntb)->db_valid_mask & (1ULL << db_vector);
418*4882a593Smuzhiyun }
419*4882a593Smuzhiyun
amd_ntb_db_read(struct ntb_dev * ntb)420*4882a593Smuzhiyun static u64 amd_ntb_db_read(struct ntb_dev *ntb)
421*4882a593Smuzhiyun {
422*4882a593Smuzhiyun struct amd_ntb_dev *ndev = ntb_ndev(ntb);
423*4882a593Smuzhiyun void __iomem *mmio = ndev->self_mmio;
424*4882a593Smuzhiyun
425*4882a593Smuzhiyun return (u64)readw(mmio + AMD_DBSTAT_OFFSET);
426*4882a593Smuzhiyun }
427*4882a593Smuzhiyun
amd_ntb_db_clear(struct ntb_dev * ntb,u64 db_bits)428*4882a593Smuzhiyun static int amd_ntb_db_clear(struct ntb_dev *ntb, u64 db_bits)
429*4882a593Smuzhiyun {
430*4882a593Smuzhiyun struct amd_ntb_dev *ndev = ntb_ndev(ntb);
431*4882a593Smuzhiyun void __iomem *mmio = ndev->self_mmio;
432*4882a593Smuzhiyun
433*4882a593Smuzhiyun writew((u16)db_bits, mmio + AMD_DBSTAT_OFFSET);
434*4882a593Smuzhiyun
435*4882a593Smuzhiyun return 0;
436*4882a593Smuzhiyun }
437*4882a593Smuzhiyun
amd_ntb_db_set_mask(struct ntb_dev * ntb,u64 db_bits)438*4882a593Smuzhiyun static int amd_ntb_db_set_mask(struct ntb_dev *ntb, u64 db_bits)
439*4882a593Smuzhiyun {
440*4882a593Smuzhiyun struct amd_ntb_dev *ndev = ntb_ndev(ntb);
441*4882a593Smuzhiyun void __iomem *mmio = ndev->self_mmio;
442*4882a593Smuzhiyun unsigned long flags;
443*4882a593Smuzhiyun
444*4882a593Smuzhiyun if (db_bits & ~ndev->db_valid_mask)
445*4882a593Smuzhiyun return -EINVAL;
446*4882a593Smuzhiyun
447*4882a593Smuzhiyun spin_lock_irqsave(&ndev->db_mask_lock, flags);
448*4882a593Smuzhiyun ndev->db_mask |= db_bits;
449*4882a593Smuzhiyun writew((u16)ndev->db_mask, mmio + AMD_DBMASK_OFFSET);
450*4882a593Smuzhiyun spin_unlock_irqrestore(&ndev->db_mask_lock, flags);
451*4882a593Smuzhiyun
452*4882a593Smuzhiyun return 0;
453*4882a593Smuzhiyun }
454*4882a593Smuzhiyun
amd_ntb_db_clear_mask(struct ntb_dev * ntb,u64 db_bits)455*4882a593Smuzhiyun static int amd_ntb_db_clear_mask(struct ntb_dev *ntb, u64 db_bits)
456*4882a593Smuzhiyun {
457*4882a593Smuzhiyun struct amd_ntb_dev *ndev = ntb_ndev(ntb);
458*4882a593Smuzhiyun void __iomem *mmio = ndev->self_mmio;
459*4882a593Smuzhiyun unsigned long flags;
460*4882a593Smuzhiyun
461*4882a593Smuzhiyun if (db_bits & ~ndev->db_valid_mask)
462*4882a593Smuzhiyun return -EINVAL;
463*4882a593Smuzhiyun
464*4882a593Smuzhiyun spin_lock_irqsave(&ndev->db_mask_lock, flags);
465*4882a593Smuzhiyun ndev->db_mask &= ~db_bits;
466*4882a593Smuzhiyun writew((u16)ndev->db_mask, mmio + AMD_DBMASK_OFFSET);
467*4882a593Smuzhiyun spin_unlock_irqrestore(&ndev->db_mask_lock, flags);
468*4882a593Smuzhiyun
469*4882a593Smuzhiyun return 0;
470*4882a593Smuzhiyun }
471*4882a593Smuzhiyun
amd_ntb_peer_db_set(struct ntb_dev * ntb,u64 db_bits)472*4882a593Smuzhiyun static int amd_ntb_peer_db_set(struct ntb_dev *ntb, u64 db_bits)
473*4882a593Smuzhiyun {
474*4882a593Smuzhiyun struct amd_ntb_dev *ndev = ntb_ndev(ntb);
475*4882a593Smuzhiyun void __iomem *mmio = ndev->self_mmio;
476*4882a593Smuzhiyun
477*4882a593Smuzhiyun writew((u16)db_bits, mmio + AMD_DBREQ_OFFSET);
478*4882a593Smuzhiyun
479*4882a593Smuzhiyun return 0;
480*4882a593Smuzhiyun }
481*4882a593Smuzhiyun
amd_ntb_spad_count(struct ntb_dev * ntb)482*4882a593Smuzhiyun static int amd_ntb_spad_count(struct ntb_dev *ntb)
483*4882a593Smuzhiyun {
484*4882a593Smuzhiyun return ntb_ndev(ntb)->spad_count;
485*4882a593Smuzhiyun }
486*4882a593Smuzhiyun
amd_ntb_spad_read(struct ntb_dev * ntb,int idx)487*4882a593Smuzhiyun static u32 amd_ntb_spad_read(struct ntb_dev *ntb, int idx)
488*4882a593Smuzhiyun {
489*4882a593Smuzhiyun struct amd_ntb_dev *ndev = ntb_ndev(ntb);
490*4882a593Smuzhiyun void __iomem *mmio = ndev->self_mmio;
491*4882a593Smuzhiyun u32 offset;
492*4882a593Smuzhiyun
493*4882a593Smuzhiyun if (idx < 0 || idx >= ndev->spad_count)
494*4882a593Smuzhiyun return 0;
495*4882a593Smuzhiyun
496*4882a593Smuzhiyun offset = ndev->self_spad + (idx << 2);
497*4882a593Smuzhiyun return readl(mmio + AMD_SPAD_OFFSET + offset);
498*4882a593Smuzhiyun }
499*4882a593Smuzhiyun
amd_ntb_spad_write(struct ntb_dev * ntb,int idx,u32 val)500*4882a593Smuzhiyun static int amd_ntb_spad_write(struct ntb_dev *ntb,
501*4882a593Smuzhiyun int idx, u32 val)
502*4882a593Smuzhiyun {
503*4882a593Smuzhiyun struct amd_ntb_dev *ndev = ntb_ndev(ntb);
504*4882a593Smuzhiyun void __iomem *mmio = ndev->self_mmio;
505*4882a593Smuzhiyun u32 offset;
506*4882a593Smuzhiyun
507*4882a593Smuzhiyun if (idx < 0 || idx >= ndev->spad_count)
508*4882a593Smuzhiyun return -EINVAL;
509*4882a593Smuzhiyun
510*4882a593Smuzhiyun offset = ndev->self_spad + (idx << 2);
511*4882a593Smuzhiyun writel(val, mmio + AMD_SPAD_OFFSET + offset);
512*4882a593Smuzhiyun
513*4882a593Smuzhiyun return 0;
514*4882a593Smuzhiyun }
515*4882a593Smuzhiyun
amd_ntb_peer_spad_read(struct ntb_dev * ntb,int pidx,int sidx)516*4882a593Smuzhiyun static u32 amd_ntb_peer_spad_read(struct ntb_dev *ntb, int pidx, int sidx)
517*4882a593Smuzhiyun {
518*4882a593Smuzhiyun struct amd_ntb_dev *ndev = ntb_ndev(ntb);
519*4882a593Smuzhiyun void __iomem *mmio = ndev->self_mmio;
520*4882a593Smuzhiyun u32 offset;
521*4882a593Smuzhiyun
522*4882a593Smuzhiyun if (sidx < 0 || sidx >= ndev->spad_count)
523*4882a593Smuzhiyun return -EINVAL;
524*4882a593Smuzhiyun
525*4882a593Smuzhiyun offset = ndev->peer_spad + (sidx << 2);
526*4882a593Smuzhiyun return readl(mmio + AMD_SPAD_OFFSET + offset);
527*4882a593Smuzhiyun }
528*4882a593Smuzhiyun
amd_ntb_peer_spad_write(struct ntb_dev * ntb,int pidx,int sidx,u32 val)529*4882a593Smuzhiyun static int amd_ntb_peer_spad_write(struct ntb_dev *ntb, int pidx,
530*4882a593Smuzhiyun int sidx, u32 val)
531*4882a593Smuzhiyun {
532*4882a593Smuzhiyun struct amd_ntb_dev *ndev = ntb_ndev(ntb);
533*4882a593Smuzhiyun void __iomem *mmio = ndev->self_mmio;
534*4882a593Smuzhiyun u32 offset;
535*4882a593Smuzhiyun
536*4882a593Smuzhiyun if (sidx < 0 || sidx >= ndev->spad_count)
537*4882a593Smuzhiyun return -EINVAL;
538*4882a593Smuzhiyun
539*4882a593Smuzhiyun offset = ndev->peer_spad + (sidx << 2);
540*4882a593Smuzhiyun writel(val, mmio + AMD_SPAD_OFFSET + offset);
541*4882a593Smuzhiyun
542*4882a593Smuzhiyun return 0;
543*4882a593Smuzhiyun }
544*4882a593Smuzhiyun
545*4882a593Smuzhiyun static const struct ntb_dev_ops amd_ntb_ops = {
546*4882a593Smuzhiyun .mw_count = amd_ntb_mw_count,
547*4882a593Smuzhiyun .mw_get_align = amd_ntb_mw_get_align,
548*4882a593Smuzhiyun .mw_set_trans = amd_ntb_mw_set_trans,
549*4882a593Smuzhiyun .peer_mw_count = amd_ntb_peer_mw_count,
550*4882a593Smuzhiyun .peer_mw_get_addr = amd_ntb_peer_mw_get_addr,
551*4882a593Smuzhiyun .link_is_up = amd_ntb_link_is_up,
552*4882a593Smuzhiyun .link_enable = amd_ntb_link_enable,
553*4882a593Smuzhiyun .link_disable = amd_ntb_link_disable,
554*4882a593Smuzhiyun .db_valid_mask = amd_ntb_db_valid_mask,
555*4882a593Smuzhiyun .db_vector_count = amd_ntb_db_vector_count,
556*4882a593Smuzhiyun .db_vector_mask = amd_ntb_db_vector_mask,
557*4882a593Smuzhiyun .db_read = amd_ntb_db_read,
558*4882a593Smuzhiyun .db_clear = amd_ntb_db_clear,
559*4882a593Smuzhiyun .db_set_mask = amd_ntb_db_set_mask,
560*4882a593Smuzhiyun .db_clear_mask = amd_ntb_db_clear_mask,
561*4882a593Smuzhiyun .peer_db_set = amd_ntb_peer_db_set,
562*4882a593Smuzhiyun .spad_count = amd_ntb_spad_count,
563*4882a593Smuzhiyun .spad_read = amd_ntb_spad_read,
564*4882a593Smuzhiyun .spad_write = amd_ntb_spad_write,
565*4882a593Smuzhiyun .peer_spad_read = amd_ntb_peer_spad_read,
566*4882a593Smuzhiyun .peer_spad_write = amd_ntb_peer_spad_write,
567*4882a593Smuzhiyun };
568*4882a593Smuzhiyun
amd_ack_smu(struct amd_ntb_dev * ndev,u32 bit)569*4882a593Smuzhiyun static void amd_ack_smu(struct amd_ntb_dev *ndev, u32 bit)
570*4882a593Smuzhiyun {
571*4882a593Smuzhiyun void __iomem *mmio = ndev->self_mmio;
572*4882a593Smuzhiyun int reg;
573*4882a593Smuzhiyun
574*4882a593Smuzhiyun reg = readl(mmio + AMD_SMUACK_OFFSET);
575*4882a593Smuzhiyun reg |= bit;
576*4882a593Smuzhiyun writel(reg, mmio + AMD_SMUACK_OFFSET);
577*4882a593Smuzhiyun }
578*4882a593Smuzhiyun
amd_handle_event(struct amd_ntb_dev * ndev,int vec)579*4882a593Smuzhiyun static void amd_handle_event(struct amd_ntb_dev *ndev, int vec)
580*4882a593Smuzhiyun {
581*4882a593Smuzhiyun void __iomem *mmio = ndev->self_mmio;
582*4882a593Smuzhiyun struct device *dev = &ndev->ntb.pdev->dev;
583*4882a593Smuzhiyun u32 status;
584*4882a593Smuzhiyun
585*4882a593Smuzhiyun status = readl(mmio + AMD_INTSTAT_OFFSET);
586*4882a593Smuzhiyun if (!(status & AMD_EVENT_INTMASK))
587*4882a593Smuzhiyun return;
588*4882a593Smuzhiyun
589*4882a593Smuzhiyun dev_dbg(dev, "status = 0x%x and vec = %d\n", status, vec);
590*4882a593Smuzhiyun
591*4882a593Smuzhiyun status &= AMD_EVENT_INTMASK;
592*4882a593Smuzhiyun switch (status) {
593*4882a593Smuzhiyun case AMD_PEER_FLUSH_EVENT:
594*4882a593Smuzhiyun ndev->peer_sta |= AMD_PEER_FLUSH_EVENT;
595*4882a593Smuzhiyun dev_info(dev, "Flush is done.\n");
596*4882a593Smuzhiyun break;
597*4882a593Smuzhiyun case AMD_PEER_RESET_EVENT:
598*4882a593Smuzhiyun case AMD_LINK_DOWN_EVENT:
599*4882a593Smuzhiyun ndev->peer_sta |= status;
600*4882a593Smuzhiyun if (status == AMD_LINK_DOWN_EVENT)
601*4882a593Smuzhiyun ndev->peer_sta &= ~AMD_LINK_UP_EVENT;
602*4882a593Smuzhiyun
603*4882a593Smuzhiyun amd_ack_smu(ndev, status);
604*4882a593Smuzhiyun
605*4882a593Smuzhiyun /* link down first */
606*4882a593Smuzhiyun ntb_link_event(&ndev->ntb);
607*4882a593Smuzhiyun /* polling peer status */
608*4882a593Smuzhiyun schedule_delayed_work(&ndev->hb_timer, AMD_LINK_HB_TIMEOUT);
609*4882a593Smuzhiyun
610*4882a593Smuzhiyun break;
611*4882a593Smuzhiyun case AMD_PEER_D3_EVENT:
612*4882a593Smuzhiyun case AMD_PEER_PMETO_EVENT:
613*4882a593Smuzhiyun case AMD_LINK_UP_EVENT:
614*4882a593Smuzhiyun ndev->peer_sta |= status;
615*4882a593Smuzhiyun if (status == AMD_LINK_UP_EVENT)
616*4882a593Smuzhiyun ndev->peer_sta &= ~AMD_LINK_DOWN_EVENT;
617*4882a593Smuzhiyun else if (status == AMD_PEER_D3_EVENT)
618*4882a593Smuzhiyun ndev->peer_sta &= ~AMD_PEER_D0_EVENT;
619*4882a593Smuzhiyun
620*4882a593Smuzhiyun amd_ack_smu(ndev, status);
621*4882a593Smuzhiyun
622*4882a593Smuzhiyun /* link down */
623*4882a593Smuzhiyun ntb_link_event(&ndev->ntb);
624*4882a593Smuzhiyun
625*4882a593Smuzhiyun break;
626*4882a593Smuzhiyun case AMD_PEER_D0_EVENT:
627*4882a593Smuzhiyun mmio = ndev->peer_mmio;
628*4882a593Smuzhiyun status = readl(mmio + AMD_PMESTAT_OFFSET);
629*4882a593Smuzhiyun /* check if this is WAKEUP event */
630*4882a593Smuzhiyun if (status & 0x1)
631*4882a593Smuzhiyun dev_info(dev, "Wakeup is done.\n");
632*4882a593Smuzhiyun
633*4882a593Smuzhiyun ndev->peer_sta |= AMD_PEER_D0_EVENT;
634*4882a593Smuzhiyun ndev->peer_sta &= ~AMD_PEER_D3_EVENT;
635*4882a593Smuzhiyun amd_ack_smu(ndev, AMD_PEER_D0_EVENT);
636*4882a593Smuzhiyun
637*4882a593Smuzhiyun /* start a timer to poll link status */
638*4882a593Smuzhiyun schedule_delayed_work(&ndev->hb_timer,
639*4882a593Smuzhiyun AMD_LINK_HB_TIMEOUT);
640*4882a593Smuzhiyun break;
641*4882a593Smuzhiyun default:
642*4882a593Smuzhiyun dev_info(dev, "event status = 0x%x.\n", status);
643*4882a593Smuzhiyun break;
644*4882a593Smuzhiyun }
645*4882a593Smuzhiyun
646*4882a593Smuzhiyun /* Clear the interrupt status */
647*4882a593Smuzhiyun writel(status, mmio + AMD_INTSTAT_OFFSET);
648*4882a593Smuzhiyun }
649*4882a593Smuzhiyun
amd_handle_db_event(struct amd_ntb_dev * ndev,int vec)650*4882a593Smuzhiyun static void amd_handle_db_event(struct amd_ntb_dev *ndev, int vec)
651*4882a593Smuzhiyun {
652*4882a593Smuzhiyun struct device *dev = &ndev->ntb.pdev->dev;
653*4882a593Smuzhiyun u64 status;
654*4882a593Smuzhiyun
655*4882a593Smuzhiyun status = amd_ntb_db_read(&ndev->ntb);
656*4882a593Smuzhiyun
657*4882a593Smuzhiyun dev_dbg(dev, "status = 0x%llx and vec = %d\n", status, vec);
658*4882a593Smuzhiyun
659*4882a593Smuzhiyun /*
660*4882a593Smuzhiyun * Since we had reserved highest order bit of DB for signaling peer of
661*4882a593Smuzhiyun * a special event, this is the only status bit we should be concerned
662*4882a593Smuzhiyun * here now.
663*4882a593Smuzhiyun */
664*4882a593Smuzhiyun if (status & BIT(ndev->db_last_bit)) {
665*4882a593Smuzhiyun ntb_db_clear(&ndev->ntb, BIT(ndev->db_last_bit));
666*4882a593Smuzhiyun /* send link down event notification */
667*4882a593Smuzhiyun ntb_link_event(&ndev->ntb);
668*4882a593Smuzhiyun
669*4882a593Smuzhiyun /*
670*4882a593Smuzhiyun * If we are here, that means the peer has signalled a special
671*4882a593Smuzhiyun * event which notifies that the peer driver has been
672*4882a593Smuzhiyun * un-loaded for some reason. Since there is a chance that the
673*4882a593Smuzhiyun * peer will load its driver again sometime, we schedule link
674*4882a593Smuzhiyun * polling routine.
675*4882a593Smuzhiyun */
676*4882a593Smuzhiyun schedule_delayed_work(&ndev->hb_timer, AMD_LINK_HB_TIMEOUT);
677*4882a593Smuzhiyun }
678*4882a593Smuzhiyun }
679*4882a593Smuzhiyun
ndev_interrupt(struct amd_ntb_dev * ndev,int vec)680*4882a593Smuzhiyun static irqreturn_t ndev_interrupt(struct amd_ntb_dev *ndev, int vec)
681*4882a593Smuzhiyun {
682*4882a593Smuzhiyun dev_dbg(&ndev->ntb.pdev->dev, "vec %d\n", vec);
683*4882a593Smuzhiyun
684*4882a593Smuzhiyun if (vec > (AMD_DB_CNT - 1) || (ndev->msix_vec_count == 1))
685*4882a593Smuzhiyun amd_handle_event(ndev, vec);
686*4882a593Smuzhiyun
687*4882a593Smuzhiyun if (vec < AMD_DB_CNT) {
688*4882a593Smuzhiyun amd_handle_db_event(ndev, vec);
689*4882a593Smuzhiyun ntb_db_event(&ndev->ntb, vec);
690*4882a593Smuzhiyun }
691*4882a593Smuzhiyun
692*4882a593Smuzhiyun return IRQ_HANDLED;
693*4882a593Smuzhiyun }
694*4882a593Smuzhiyun
ndev_vec_isr(int irq,void * dev)695*4882a593Smuzhiyun static irqreturn_t ndev_vec_isr(int irq, void *dev)
696*4882a593Smuzhiyun {
697*4882a593Smuzhiyun struct amd_ntb_vec *nvec = dev;
698*4882a593Smuzhiyun
699*4882a593Smuzhiyun return ndev_interrupt(nvec->ndev, nvec->num);
700*4882a593Smuzhiyun }
701*4882a593Smuzhiyun
ndev_irq_isr(int irq,void * dev)702*4882a593Smuzhiyun static irqreturn_t ndev_irq_isr(int irq, void *dev)
703*4882a593Smuzhiyun {
704*4882a593Smuzhiyun struct amd_ntb_dev *ndev = dev;
705*4882a593Smuzhiyun
706*4882a593Smuzhiyun return ndev_interrupt(ndev, irq - ndev->ntb.pdev->irq);
707*4882a593Smuzhiyun }
708*4882a593Smuzhiyun
ndev_init_isr(struct amd_ntb_dev * ndev,int msix_min,int msix_max)709*4882a593Smuzhiyun static int ndev_init_isr(struct amd_ntb_dev *ndev,
710*4882a593Smuzhiyun int msix_min, int msix_max)
711*4882a593Smuzhiyun {
712*4882a593Smuzhiyun struct pci_dev *pdev;
713*4882a593Smuzhiyun int rc, i, msix_count, node;
714*4882a593Smuzhiyun
715*4882a593Smuzhiyun pdev = ndev->ntb.pdev;
716*4882a593Smuzhiyun
717*4882a593Smuzhiyun node = dev_to_node(&pdev->dev);
718*4882a593Smuzhiyun
719*4882a593Smuzhiyun ndev->db_mask = ndev->db_valid_mask;
720*4882a593Smuzhiyun
721*4882a593Smuzhiyun /* Try to set up msix irq */
722*4882a593Smuzhiyun ndev->vec = kcalloc_node(msix_max, sizeof(*ndev->vec),
723*4882a593Smuzhiyun GFP_KERNEL, node);
724*4882a593Smuzhiyun if (!ndev->vec)
725*4882a593Smuzhiyun goto err_msix_vec_alloc;
726*4882a593Smuzhiyun
727*4882a593Smuzhiyun ndev->msix = kcalloc_node(msix_max, sizeof(*ndev->msix),
728*4882a593Smuzhiyun GFP_KERNEL, node);
729*4882a593Smuzhiyun if (!ndev->msix)
730*4882a593Smuzhiyun goto err_msix_alloc;
731*4882a593Smuzhiyun
732*4882a593Smuzhiyun for (i = 0; i < msix_max; ++i)
733*4882a593Smuzhiyun ndev->msix[i].entry = i;
734*4882a593Smuzhiyun
735*4882a593Smuzhiyun msix_count = pci_enable_msix_range(pdev, ndev->msix,
736*4882a593Smuzhiyun msix_min, msix_max);
737*4882a593Smuzhiyun if (msix_count < 0)
738*4882a593Smuzhiyun goto err_msix_enable;
739*4882a593Smuzhiyun
740*4882a593Smuzhiyun /* NOTE: Disable MSIX if msix count is less than 16 because of
741*4882a593Smuzhiyun * hardware limitation.
742*4882a593Smuzhiyun */
743*4882a593Smuzhiyun if (msix_count < msix_min) {
744*4882a593Smuzhiyun pci_disable_msix(pdev);
745*4882a593Smuzhiyun goto err_msix_enable;
746*4882a593Smuzhiyun }
747*4882a593Smuzhiyun
748*4882a593Smuzhiyun for (i = 0; i < msix_count; ++i) {
749*4882a593Smuzhiyun ndev->vec[i].ndev = ndev;
750*4882a593Smuzhiyun ndev->vec[i].num = i;
751*4882a593Smuzhiyun rc = request_irq(ndev->msix[i].vector, ndev_vec_isr, 0,
752*4882a593Smuzhiyun "ndev_vec_isr", &ndev->vec[i]);
753*4882a593Smuzhiyun if (rc)
754*4882a593Smuzhiyun goto err_msix_request;
755*4882a593Smuzhiyun }
756*4882a593Smuzhiyun
757*4882a593Smuzhiyun dev_dbg(&pdev->dev, "Using msix interrupts\n");
758*4882a593Smuzhiyun ndev->db_count = msix_min;
759*4882a593Smuzhiyun ndev->msix_vec_count = msix_max;
760*4882a593Smuzhiyun return 0;
761*4882a593Smuzhiyun
762*4882a593Smuzhiyun err_msix_request:
763*4882a593Smuzhiyun while (i-- > 0)
764*4882a593Smuzhiyun free_irq(ndev->msix[i].vector, &ndev->vec[i]);
765*4882a593Smuzhiyun pci_disable_msix(pdev);
766*4882a593Smuzhiyun err_msix_enable:
767*4882a593Smuzhiyun kfree(ndev->msix);
768*4882a593Smuzhiyun err_msix_alloc:
769*4882a593Smuzhiyun kfree(ndev->vec);
770*4882a593Smuzhiyun err_msix_vec_alloc:
771*4882a593Smuzhiyun ndev->msix = NULL;
772*4882a593Smuzhiyun ndev->vec = NULL;
773*4882a593Smuzhiyun
774*4882a593Smuzhiyun /* Try to set up msi irq */
775*4882a593Smuzhiyun rc = pci_enable_msi(pdev);
776*4882a593Smuzhiyun if (rc)
777*4882a593Smuzhiyun goto err_msi_enable;
778*4882a593Smuzhiyun
779*4882a593Smuzhiyun rc = request_irq(pdev->irq, ndev_irq_isr, 0,
780*4882a593Smuzhiyun "ndev_irq_isr", ndev);
781*4882a593Smuzhiyun if (rc)
782*4882a593Smuzhiyun goto err_msi_request;
783*4882a593Smuzhiyun
784*4882a593Smuzhiyun dev_dbg(&pdev->dev, "Using msi interrupts\n");
785*4882a593Smuzhiyun ndev->db_count = 1;
786*4882a593Smuzhiyun ndev->msix_vec_count = 1;
787*4882a593Smuzhiyun return 0;
788*4882a593Smuzhiyun
789*4882a593Smuzhiyun err_msi_request:
790*4882a593Smuzhiyun pci_disable_msi(pdev);
791*4882a593Smuzhiyun err_msi_enable:
792*4882a593Smuzhiyun
793*4882a593Smuzhiyun /* Try to set up intx irq */
794*4882a593Smuzhiyun pci_intx(pdev, 1);
795*4882a593Smuzhiyun
796*4882a593Smuzhiyun rc = request_irq(pdev->irq, ndev_irq_isr, IRQF_SHARED,
797*4882a593Smuzhiyun "ndev_irq_isr", ndev);
798*4882a593Smuzhiyun if (rc)
799*4882a593Smuzhiyun goto err_intx_request;
800*4882a593Smuzhiyun
801*4882a593Smuzhiyun dev_dbg(&pdev->dev, "Using intx interrupts\n");
802*4882a593Smuzhiyun ndev->db_count = 1;
803*4882a593Smuzhiyun ndev->msix_vec_count = 1;
804*4882a593Smuzhiyun return 0;
805*4882a593Smuzhiyun
806*4882a593Smuzhiyun err_intx_request:
807*4882a593Smuzhiyun return rc;
808*4882a593Smuzhiyun }
809*4882a593Smuzhiyun
ndev_deinit_isr(struct amd_ntb_dev * ndev)810*4882a593Smuzhiyun static void ndev_deinit_isr(struct amd_ntb_dev *ndev)
811*4882a593Smuzhiyun {
812*4882a593Smuzhiyun struct pci_dev *pdev;
813*4882a593Smuzhiyun void __iomem *mmio = ndev->self_mmio;
814*4882a593Smuzhiyun int i;
815*4882a593Smuzhiyun
816*4882a593Smuzhiyun pdev = ndev->ntb.pdev;
817*4882a593Smuzhiyun
818*4882a593Smuzhiyun /* Mask all doorbell interrupts */
819*4882a593Smuzhiyun ndev->db_mask = ndev->db_valid_mask;
820*4882a593Smuzhiyun writel(ndev->db_mask, mmio + AMD_DBMASK_OFFSET);
821*4882a593Smuzhiyun
822*4882a593Smuzhiyun if (ndev->msix) {
823*4882a593Smuzhiyun i = ndev->msix_vec_count;
824*4882a593Smuzhiyun while (i--)
825*4882a593Smuzhiyun free_irq(ndev->msix[i].vector, &ndev->vec[i]);
826*4882a593Smuzhiyun pci_disable_msix(pdev);
827*4882a593Smuzhiyun kfree(ndev->msix);
828*4882a593Smuzhiyun kfree(ndev->vec);
829*4882a593Smuzhiyun } else {
830*4882a593Smuzhiyun free_irq(pdev->irq, ndev);
831*4882a593Smuzhiyun if (pci_dev_msi_enabled(pdev))
832*4882a593Smuzhiyun pci_disable_msi(pdev);
833*4882a593Smuzhiyun else
834*4882a593Smuzhiyun pci_intx(pdev, 0);
835*4882a593Smuzhiyun }
836*4882a593Smuzhiyun }
837*4882a593Smuzhiyun
ndev_debugfs_read(struct file * filp,char __user * ubuf,size_t count,loff_t * offp)838*4882a593Smuzhiyun static ssize_t ndev_debugfs_read(struct file *filp, char __user *ubuf,
839*4882a593Smuzhiyun size_t count, loff_t *offp)
840*4882a593Smuzhiyun {
841*4882a593Smuzhiyun struct amd_ntb_dev *ndev;
842*4882a593Smuzhiyun void __iomem *mmio;
843*4882a593Smuzhiyun char *buf;
844*4882a593Smuzhiyun size_t buf_size;
845*4882a593Smuzhiyun ssize_t ret, off;
846*4882a593Smuzhiyun union { u64 v64; u32 v32; u16 v16; } u;
847*4882a593Smuzhiyun
848*4882a593Smuzhiyun ndev = filp->private_data;
849*4882a593Smuzhiyun mmio = ndev->self_mmio;
850*4882a593Smuzhiyun
851*4882a593Smuzhiyun buf_size = min(count, 0x800ul);
852*4882a593Smuzhiyun
853*4882a593Smuzhiyun buf = kmalloc(buf_size, GFP_KERNEL);
854*4882a593Smuzhiyun if (!buf)
855*4882a593Smuzhiyun return -ENOMEM;
856*4882a593Smuzhiyun
857*4882a593Smuzhiyun off = 0;
858*4882a593Smuzhiyun
859*4882a593Smuzhiyun off += scnprintf(buf + off, buf_size - off,
860*4882a593Smuzhiyun "NTB Device Information:\n");
861*4882a593Smuzhiyun
862*4882a593Smuzhiyun off += scnprintf(buf + off, buf_size - off,
863*4882a593Smuzhiyun "Connection Topology -\t%s\n",
864*4882a593Smuzhiyun ntb_topo_string(ndev->ntb.topo));
865*4882a593Smuzhiyun
866*4882a593Smuzhiyun off += scnprintf(buf + off, buf_size - off,
867*4882a593Smuzhiyun "LNK STA -\t\t%#06x\n", ndev->lnk_sta);
868*4882a593Smuzhiyun
869*4882a593Smuzhiyun if (!amd_link_is_up(ndev)) {
870*4882a593Smuzhiyun off += scnprintf(buf + off, buf_size - off,
871*4882a593Smuzhiyun "Link Status -\t\tDown\n");
872*4882a593Smuzhiyun } else {
873*4882a593Smuzhiyun off += scnprintf(buf + off, buf_size - off,
874*4882a593Smuzhiyun "Link Status -\t\tUp\n");
875*4882a593Smuzhiyun off += scnprintf(buf + off, buf_size - off,
876*4882a593Smuzhiyun "Link Speed -\t\tPCI-E Gen %u\n",
877*4882a593Smuzhiyun NTB_LNK_STA_SPEED(ndev->lnk_sta));
878*4882a593Smuzhiyun off += scnprintf(buf + off, buf_size - off,
879*4882a593Smuzhiyun "Link Width -\t\tx%u\n",
880*4882a593Smuzhiyun NTB_LNK_STA_WIDTH(ndev->lnk_sta));
881*4882a593Smuzhiyun }
882*4882a593Smuzhiyun
883*4882a593Smuzhiyun off += scnprintf(buf + off, buf_size - off,
884*4882a593Smuzhiyun "Memory Window Count -\t%u\n", ndev->mw_count);
885*4882a593Smuzhiyun off += scnprintf(buf + off, buf_size - off,
886*4882a593Smuzhiyun "Scratchpad Count -\t%u\n", ndev->spad_count);
887*4882a593Smuzhiyun off += scnprintf(buf + off, buf_size - off,
888*4882a593Smuzhiyun "Doorbell Count -\t%u\n", ndev->db_count);
889*4882a593Smuzhiyun off += scnprintf(buf + off, buf_size - off,
890*4882a593Smuzhiyun "MSIX Vector Count -\t%u\n", ndev->msix_vec_count);
891*4882a593Smuzhiyun
892*4882a593Smuzhiyun off += scnprintf(buf + off, buf_size - off,
893*4882a593Smuzhiyun "Doorbell Valid Mask -\t%#llx\n", ndev->db_valid_mask);
894*4882a593Smuzhiyun
895*4882a593Smuzhiyun u.v32 = readl(ndev->self_mmio + AMD_DBMASK_OFFSET);
896*4882a593Smuzhiyun off += scnprintf(buf + off, buf_size - off,
897*4882a593Smuzhiyun "Doorbell Mask -\t\t\t%#06x\n", u.v32);
898*4882a593Smuzhiyun
899*4882a593Smuzhiyun u.v32 = readl(mmio + AMD_DBSTAT_OFFSET);
900*4882a593Smuzhiyun off += scnprintf(buf + off, buf_size - off,
901*4882a593Smuzhiyun "Doorbell Bell -\t\t\t%#06x\n", u.v32);
902*4882a593Smuzhiyun
903*4882a593Smuzhiyun off += scnprintf(buf + off, buf_size - off,
904*4882a593Smuzhiyun "\nNTB Incoming XLAT:\n");
905*4882a593Smuzhiyun
906*4882a593Smuzhiyun u.v64 = read64(mmio + AMD_BAR1XLAT_OFFSET);
907*4882a593Smuzhiyun off += scnprintf(buf + off, buf_size - off,
908*4882a593Smuzhiyun "XLAT1 -\t\t%#018llx\n", u.v64);
909*4882a593Smuzhiyun
910*4882a593Smuzhiyun u.v64 = read64(ndev->self_mmio + AMD_BAR23XLAT_OFFSET);
911*4882a593Smuzhiyun off += scnprintf(buf + off, buf_size - off,
912*4882a593Smuzhiyun "XLAT23 -\t\t%#018llx\n", u.v64);
913*4882a593Smuzhiyun
914*4882a593Smuzhiyun u.v64 = read64(ndev->self_mmio + AMD_BAR45XLAT_OFFSET);
915*4882a593Smuzhiyun off += scnprintf(buf + off, buf_size - off,
916*4882a593Smuzhiyun "XLAT45 -\t\t%#018llx\n", u.v64);
917*4882a593Smuzhiyun
918*4882a593Smuzhiyun u.v32 = readl(mmio + AMD_BAR1LMT_OFFSET);
919*4882a593Smuzhiyun off += scnprintf(buf + off, buf_size - off,
920*4882a593Smuzhiyun "LMT1 -\t\t\t%#06x\n", u.v32);
921*4882a593Smuzhiyun
922*4882a593Smuzhiyun u.v64 = read64(ndev->self_mmio + AMD_BAR23LMT_OFFSET);
923*4882a593Smuzhiyun off += scnprintf(buf + off, buf_size - off,
924*4882a593Smuzhiyun "LMT23 -\t\t\t%#018llx\n", u.v64);
925*4882a593Smuzhiyun
926*4882a593Smuzhiyun u.v64 = read64(ndev->self_mmio + AMD_BAR45LMT_OFFSET);
927*4882a593Smuzhiyun off += scnprintf(buf + off, buf_size - off,
928*4882a593Smuzhiyun "LMT45 -\t\t\t%#018llx\n", u.v64);
929*4882a593Smuzhiyun
930*4882a593Smuzhiyun ret = simple_read_from_buffer(ubuf, count, offp, buf, off);
931*4882a593Smuzhiyun kfree(buf);
932*4882a593Smuzhiyun return ret;
933*4882a593Smuzhiyun }
934*4882a593Smuzhiyun
ndev_init_debugfs(struct amd_ntb_dev * ndev)935*4882a593Smuzhiyun static void ndev_init_debugfs(struct amd_ntb_dev *ndev)
936*4882a593Smuzhiyun {
937*4882a593Smuzhiyun if (!debugfs_dir) {
938*4882a593Smuzhiyun ndev->debugfs_dir = NULL;
939*4882a593Smuzhiyun ndev->debugfs_info = NULL;
940*4882a593Smuzhiyun } else {
941*4882a593Smuzhiyun ndev->debugfs_dir =
942*4882a593Smuzhiyun debugfs_create_dir(pci_name(ndev->ntb.pdev),
943*4882a593Smuzhiyun debugfs_dir);
944*4882a593Smuzhiyun if (!ndev->debugfs_dir)
945*4882a593Smuzhiyun ndev->debugfs_info = NULL;
946*4882a593Smuzhiyun else
947*4882a593Smuzhiyun ndev->debugfs_info =
948*4882a593Smuzhiyun debugfs_create_file("info", S_IRUSR,
949*4882a593Smuzhiyun ndev->debugfs_dir, ndev,
950*4882a593Smuzhiyun &amd_ntb_debugfs_info);
951*4882a593Smuzhiyun }
952*4882a593Smuzhiyun }
953*4882a593Smuzhiyun
ndev_deinit_debugfs(struct amd_ntb_dev * ndev)954*4882a593Smuzhiyun static void ndev_deinit_debugfs(struct amd_ntb_dev *ndev)
955*4882a593Smuzhiyun {
956*4882a593Smuzhiyun debugfs_remove_recursive(ndev->debugfs_dir);
957*4882a593Smuzhiyun }
958*4882a593Smuzhiyun
ndev_init_struct(struct amd_ntb_dev * ndev,struct pci_dev * pdev)959*4882a593Smuzhiyun static inline void ndev_init_struct(struct amd_ntb_dev *ndev,
960*4882a593Smuzhiyun struct pci_dev *pdev)
961*4882a593Smuzhiyun {
962*4882a593Smuzhiyun ndev->ntb.pdev = pdev;
963*4882a593Smuzhiyun ndev->ntb.topo = NTB_TOPO_NONE;
964*4882a593Smuzhiyun ndev->ntb.ops = &amd_ntb_ops;
965*4882a593Smuzhiyun ndev->int_mask = AMD_EVENT_INTMASK;
966*4882a593Smuzhiyun spin_lock_init(&ndev->db_mask_lock);
967*4882a593Smuzhiyun }
968*4882a593Smuzhiyun
amd_poll_link(struct amd_ntb_dev * ndev)969*4882a593Smuzhiyun static int amd_poll_link(struct amd_ntb_dev *ndev)
970*4882a593Smuzhiyun {
971*4882a593Smuzhiyun void __iomem *mmio = ndev->peer_mmio;
972*4882a593Smuzhiyun u32 reg;
973*4882a593Smuzhiyun
974*4882a593Smuzhiyun reg = readl(mmio + AMD_SIDEINFO_OFFSET);
975*4882a593Smuzhiyun reg &= AMD_SIDE_READY;
976*4882a593Smuzhiyun
977*4882a593Smuzhiyun dev_dbg(&ndev->ntb.pdev->dev, "%s: reg_val = 0x%x.\n", __func__, reg);
978*4882a593Smuzhiyun
979*4882a593Smuzhiyun ndev->cntl_sta = reg;
980*4882a593Smuzhiyun
981*4882a593Smuzhiyun amd_ntb_get_link_status(ndev);
982*4882a593Smuzhiyun
983*4882a593Smuzhiyun return ndev->cntl_sta;
984*4882a593Smuzhiyun }
985*4882a593Smuzhiyun
amd_link_hb(struct work_struct * work)986*4882a593Smuzhiyun static void amd_link_hb(struct work_struct *work)
987*4882a593Smuzhiyun {
988*4882a593Smuzhiyun struct amd_ntb_dev *ndev = hb_ndev(work);
989*4882a593Smuzhiyun
990*4882a593Smuzhiyun if (amd_poll_link(ndev))
991*4882a593Smuzhiyun ntb_link_event(&ndev->ntb);
992*4882a593Smuzhiyun
993*4882a593Smuzhiyun if (!amd_link_is_up(ndev))
994*4882a593Smuzhiyun schedule_delayed_work(&ndev->hb_timer, AMD_LINK_HB_TIMEOUT);
995*4882a593Smuzhiyun }
996*4882a593Smuzhiyun
amd_init_isr(struct amd_ntb_dev * ndev)997*4882a593Smuzhiyun static int amd_init_isr(struct amd_ntb_dev *ndev)
998*4882a593Smuzhiyun {
999*4882a593Smuzhiyun return ndev_init_isr(ndev, AMD_DB_CNT, AMD_MSIX_VECTOR_CNT);
1000*4882a593Smuzhiyun }
1001*4882a593Smuzhiyun
amd_set_side_info_reg(struct amd_ntb_dev * ndev,bool peer)1002*4882a593Smuzhiyun static void amd_set_side_info_reg(struct amd_ntb_dev *ndev, bool peer)
1003*4882a593Smuzhiyun {
1004*4882a593Smuzhiyun void __iomem *mmio = NULL;
1005*4882a593Smuzhiyun unsigned int reg;
1006*4882a593Smuzhiyun
1007*4882a593Smuzhiyun if (peer)
1008*4882a593Smuzhiyun mmio = ndev->peer_mmio;
1009*4882a593Smuzhiyun else
1010*4882a593Smuzhiyun mmio = ndev->self_mmio;
1011*4882a593Smuzhiyun
1012*4882a593Smuzhiyun reg = readl(mmio + AMD_SIDEINFO_OFFSET);
1013*4882a593Smuzhiyun if (!(reg & AMD_SIDE_READY)) {
1014*4882a593Smuzhiyun reg |= AMD_SIDE_READY;
1015*4882a593Smuzhiyun writel(reg, mmio + AMD_SIDEINFO_OFFSET);
1016*4882a593Smuzhiyun }
1017*4882a593Smuzhiyun }
1018*4882a593Smuzhiyun
amd_clear_side_info_reg(struct amd_ntb_dev * ndev,bool peer)1019*4882a593Smuzhiyun static void amd_clear_side_info_reg(struct amd_ntb_dev *ndev, bool peer)
1020*4882a593Smuzhiyun {
1021*4882a593Smuzhiyun void __iomem *mmio = NULL;
1022*4882a593Smuzhiyun unsigned int reg;
1023*4882a593Smuzhiyun
1024*4882a593Smuzhiyun if (peer)
1025*4882a593Smuzhiyun mmio = ndev->peer_mmio;
1026*4882a593Smuzhiyun else
1027*4882a593Smuzhiyun mmio = ndev->self_mmio;
1028*4882a593Smuzhiyun
1029*4882a593Smuzhiyun reg = readl(mmio + AMD_SIDEINFO_OFFSET);
1030*4882a593Smuzhiyun if (reg & AMD_SIDE_READY) {
1031*4882a593Smuzhiyun reg &= ~AMD_SIDE_READY;
1032*4882a593Smuzhiyun writel(reg, mmio + AMD_SIDEINFO_OFFSET);
1033*4882a593Smuzhiyun readl(mmio + AMD_SIDEINFO_OFFSET);
1034*4882a593Smuzhiyun }
1035*4882a593Smuzhiyun }
1036*4882a593Smuzhiyun
amd_init_side_info(struct amd_ntb_dev * ndev)1037*4882a593Smuzhiyun static void amd_init_side_info(struct amd_ntb_dev *ndev)
1038*4882a593Smuzhiyun {
1039*4882a593Smuzhiyun void __iomem *mmio = ndev->self_mmio;
1040*4882a593Smuzhiyun u32 ntb_ctl;
1041*4882a593Smuzhiyun
1042*4882a593Smuzhiyun amd_set_side_info_reg(ndev, false);
1043*4882a593Smuzhiyun
1044*4882a593Smuzhiyun ntb_ctl = readl(mmio + AMD_CNTL_OFFSET);
1045*4882a593Smuzhiyun ntb_ctl |= (PMM_REG_CTL | SMM_REG_CTL);
1046*4882a593Smuzhiyun writel(ntb_ctl, mmio + AMD_CNTL_OFFSET);
1047*4882a593Smuzhiyun }
1048*4882a593Smuzhiyun
amd_deinit_side_info(struct amd_ntb_dev * ndev)1049*4882a593Smuzhiyun static void amd_deinit_side_info(struct amd_ntb_dev *ndev)
1050*4882a593Smuzhiyun {
1051*4882a593Smuzhiyun void __iomem *mmio = ndev->self_mmio;
1052*4882a593Smuzhiyun u32 ntb_ctl;
1053*4882a593Smuzhiyun
1054*4882a593Smuzhiyun amd_clear_side_info_reg(ndev, false);
1055*4882a593Smuzhiyun
1056*4882a593Smuzhiyun ntb_ctl = readl(mmio + AMD_CNTL_OFFSET);
1057*4882a593Smuzhiyun ntb_ctl &= ~(PMM_REG_CTL | SMM_REG_CTL);
1058*4882a593Smuzhiyun writel(ntb_ctl, mmio + AMD_CNTL_OFFSET);
1059*4882a593Smuzhiyun }
1060*4882a593Smuzhiyun
amd_init_ntb(struct amd_ntb_dev * ndev)1061*4882a593Smuzhiyun static int amd_init_ntb(struct amd_ntb_dev *ndev)
1062*4882a593Smuzhiyun {
1063*4882a593Smuzhiyun void __iomem *mmio = ndev->self_mmio;
1064*4882a593Smuzhiyun
1065*4882a593Smuzhiyun ndev->mw_count = ndev->dev_data->mw_count;
1066*4882a593Smuzhiyun ndev->spad_count = AMD_SPADS_CNT;
1067*4882a593Smuzhiyun ndev->db_count = AMD_DB_CNT;
1068*4882a593Smuzhiyun
1069*4882a593Smuzhiyun switch (ndev->ntb.topo) {
1070*4882a593Smuzhiyun case NTB_TOPO_PRI:
1071*4882a593Smuzhiyun case NTB_TOPO_SEC:
1072*4882a593Smuzhiyun ndev->spad_count >>= 1;
1073*4882a593Smuzhiyun if (ndev->ntb.topo == NTB_TOPO_PRI) {
1074*4882a593Smuzhiyun ndev->self_spad = 0;
1075*4882a593Smuzhiyun ndev->peer_spad = 0x20;
1076*4882a593Smuzhiyun } else {
1077*4882a593Smuzhiyun ndev->self_spad = 0x20;
1078*4882a593Smuzhiyun ndev->peer_spad = 0;
1079*4882a593Smuzhiyun }
1080*4882a593Smuzhiyun
1081*4882a593Smuzhiyun INIT_DELAYED_WORK(&ndev->hb_timer, amd_link_hb);
1082*4882a593Smuzhiyun schedule_delayed_work(&ndev->hb_timer, AMD_LINK_HB_TIMEOUT);
1083*4882a593Smuzhiyun
1084*4882a593Smuzhiyun break;
1085*4882a593Smuzhiyun default:
1086*4882a593Smuzhiyun dev_err(&ndev->ntb.pdev->dev,
1087*4882a593Smuzhiyun "AMD NTB does not support B2B mode.\n");
1088*4882a593Smuzhiyun return -EINVAL;
1089*4882a593Smuzhiyun }
1090*4882a593Smuzhiyun
1091*4882a593Smuzhiyun /* Mask event interrupts */
1092*4882a593Smuzhiyun writel(ndev->int_mask, mmio + AMD_INTMASK_OFFSET);
1093*4882a593Smuzhiyun
1094*4882a593Smuzhiyun return 0;
1095*4882a593Smuzhiyun }
1096*4882a593Smuzhiyun
amd_get_topo(struct amd_ntb_dev * ndev)1097*4882a593Smuzhiyun static enum ntb_topo amd_get_topo(struct amd_ntb_dev *ndev)
1098*4882a593Smuzhiyun {
1099*4882a593Smuzhiyun void __iomem *mmio = ndev->self_mmio;
1100*4882a593Smuzhiyun u32 info;
1101*4882a593Smuzhiyun
1102*4882a593Smuzhiyun info = readl(mmio + AMD_SIDEINFO_OFFSET);
1103*4882a593Smuzhiyun if (info & AMD_SIDE_MASK)
1104*4882a593Smuzhiyun return NTB_TOPO_SEC;
1105*4882a593Smuzhiyun else
1106*4882a593Smuzhiyun return NTB_TOPO_PRI;
1107*4882a593Smuzhiyun }
1108*4882a593Smuzhiyun
amd_init_dev(struct amd_ntb_dev * ndev)1109*4882a593Smuzhiyun static int amd_init_dev(struct amd_ntb_dev *ndev)
1110*4882a593Smuzhiyun {
1111*4882a593Smuzhiyun void __iomem *mmio = ndev->self_mmio;
1112*4882a593Smuzhiyun struct pci_dev *pdev;
1113*4882a593Smuzhiyun int rc = 0;
1114*4882a593Smuzhiyun
1115*4882a593Smuzhiyun pdev = ndev->ntb.pdev;
1116*4882a593Smuzhiyun
1117*4882a593Smuzhiyun ndev->ntb.topo = amd_get_topo(ndev);
1118*4882a593Smuzhiyun dev_dbg(&pdev->dev, "AMD NTB topo is %s\n",
1119*4882a593Smuzhiyun ntb_topo_string(ndev->ntb.topo));
1120*4882a593Smuzhiyun
1121*4882a593Smuzhiyun rc = amd_init_ntb(ndev);
1122*4882a593Smuzhiyun if (rc)
1123*4882a593Smuzhiyun return rc;
1124*4882a593Smuzhiyun
1125*4882a593Smuzhiyun rc = amd_init_isr(ndev);
1126*4882a593Smuzhiyun if (rc) {
1127*4882a593Smuzhiyun dev_err(&pdev->dev, "fail to init isr.\n");
1128*4882a593Smuzhiyun return rc;
1129*4882a593Smuzhiyun }
1130*4882a593Smuzhiyun
1131*4882a593Smuzhiyun ndev->db_valid_mask = BIT_ULL(ndev->db_count) - 1;
1132*4882a593Smuzhiyun /*
1133*4882a593Smuzhiyun * We reserve the highest order bit of the DB register which will
1134*4882a593Smuzhiyun * be used to notify peer when the driver on this side is being
1135*4882a593Smuzhiyun * un-loaded.
1136*4882a593Smuzhiyun */
1137*4882a593Smuzhiyun ndev->db_last_bit =
1138*4882a593Smuzhiyun find_last_bit((unsigned long *)&ndev->db_valid_mask,
1139*4882a593Smuzhiyun hweight64(ndev->db_valid_mask));
1140*4882a593Smuzhiyun writew((u16)~BIT(ndev->db_last_bit), mmio + AMD_DBMASK_OFFSET);
1141*4882a593Smuzhiyun /*
1142*4882a593Smuzhiyun * Since now there is one less bit to account for, the DB count
1143*4882a593Smuzhiyun * and DB mask should be adjusted accordingly.
1144*4882a593Smuzhiyun */
1145*4882a593Smuzhiyun ndev->db_count -= 1;
1146*4882a593Smuzhiyun ndev->db_valid_mask = BIT_ULL(ndev->db_count) - 1;
1147*4882a593Smuzhiyun
1148*4882a593Smuzhiyun /* Enable Link-Up and Link-Down event interrupts */
1149*4882a593Smuzhiyun ndev->int_mask &= ~(AMD_LINK_UP_EVENT | AMD_LINK_DOWN_EVENT);
1150*4882a593Smuzhiyun writel(ndev->int_mask, mmio + AMD_INTMASK_OFFSET);
1151*4882a593Smuzhiyun
1152*4882a593Smuzhiyun return 0;
1153*4882a593Smuzhiyun }
1154*4882a593Smuzhiyun
amd_deinit_dev(struct amd_ntb_dev * ndev)1155*4882a593Smuzhiyun static void amd_deinit_dev(struct amd_ntb_dev *ndev)
1156*4882a593Smuzhiyun {
1157*4882a593Smuzhiyun cancel_delayed_work_sync(&ndev->hb_timer);
1158*4882a593Smuzhiyun
1159*4882a593Smuzhiyun ndev_deinit_isr(ndev);
1160*4882a593Smuzhiyun }
1161*4882a593Smuzhiyun
amd_ntb_init_pci(struct amd_ntb_dev * ndev,struct pci_dev * pdev)1162*4882a593Smuzhiyun static int amd_ntb_init_pci(struct amd_ntb_dev *ndev,
1163*4882a593Smuzhiyun struct pci_dev *pdev)
1164*4882a593Smuzhiyun {
1165*4882a593Smuzhiyun int rc;
1166*4882a593Smuzhiyun
1167*4882a593Smuzhiyun pci_set_drvdata(pdev, ndev);
1168*4882a593Smuzhiyun
1169*4882a593Smuzhiyun rc = pci_enable_device(pdev);
1170*4882a593Smuzhiyun if (rc)
1171*4882a593Smuzhiyun goto err_pci_enable;
1172*4882a593Smuzhiyun
1173*4882a593Smuzhiyun rc = pci_request_regions(pdev, NTB_NAME);
1174*4882a593Smuzhiyun if (rc)
1175*4882a593Smuzhiyun goto err_pci_regions;
1176*4882a593Smuzhiyun
1177*4882a593Smuzhiyun pci_set_master(pdev);
1178*4882a593Smuzhiyun
1179*4882a593Smuzhiyun rc = pci_set_dma_mask(pdev, DMA_BIT_MASK(64));
1180*4882a593Smuzhiyun if (rc) {
1181*4882a593Smuzhiyun rc = pci_set_dma_mask(pdev, DMA_BIT_MASK(32));
1182*4882a593Smuzhiyun if (rc)
1183*4882a593Smuzhiyun goto err_dma_mask;
1184*4882a593Smuzhiyun dev_warn(&pdev->dev, "Cannot DMA highmem\n");
1185*4882a593Smuzhiyun }
1186*4882a593Smuzhiyun
1187*4882a593Smuzhiyun rc = pci_set_consistent_dma_mask(pdev, DMA_BIT_MASK(64));
1188*4882a593Smuzhiyun if (rc) {
1189*4882a593Smuzhiyun rc = pci_set_consistent_dma_mask(pdev, DMA_BIT_MASK(32));
1190*4882a593Smuzhiyun if (rc)
1191*4882a593Smuzhiyun goto err_dma_mask;
1192*4882a593Smuzhiyun dev_warn(&pdev->dev, "Cannot DMA consistent highmem\n");
1193*4882a593Smuzhiyun }
1194*4882a593Smuzhiyun
1195*4882a593Smuzhiyun ndev->self_mmio = pci_iomap(pdev, 0, 0);
1196*4882a593Smuzhiyun if (!ndev->self_mmio) {
1197*4882a593Smuzhiyun rc = -EIO;
1198*4882a593Smuzhiyun goto err_dma_mask;
1199*4882a593Smuzhiyun }
1200*4882a593Smuzhiyun ndev->peer_mmio = ndev->self_mmio + AMD_PEER_OFFSET;
1201*4882a593Smuzhiyun
1202*4882a593Smuzhiyun return 0;
1203*4882a593Smuzhiyun
1204*4882a593Smuzhiyun err_dma_mask:
1205*4882a593Smuzhiyun pci_clear_master(pdev);
1206*4882a593Smuzhiyun pci_release_regions(pdev);
1207*4882a593Smuzhiyun err_pci_regions:
1208*4882a593Smuzhiyun pci_disable_device(pdev);
1209*4882a593Smuzhiyun err_pci_enable:
1210*4882a593Smuzhiyun pci_set_drvdata(pdev, NULL);
1211*4882a593Smuzhiyun return rc;
1212*4882a593Smuzhiyun }
1213*4882a593Smuzhiyun
amd_ntb_deinit_pci(struct amd_ntb_dev * ndev)1214*4882a593Smuzhiyun static void amd_ntb_deinit_pci(struct amd_ntb_dev *ndev)
1215*4882a593Smuzhiyun {
1216*4882a593Smuzhiyun struct pci_dev *pdev = ndev->ntb.pdev;
1217*4882a593Smuzhiyun
1218*4882a593Smuzhiyun pci_iounmap(pdev, ndev->self_mmio);
1219*4882a593Smuzhiyun
1220*4882a593Smuzhiyun pci_clear_master(pdev);
1221*4882a593Smuzhiyun pci_release_regions(pdev);
1222*4882a593Smuzhiyun pci_disable_device(pdev);
1223*4882a593Smuzhiyun pci_set_drvdata(pdev, NULL);
1224*4882a593Smuzhiyun }
1225*4882a593Smuzhiyun
amd_ntb_pci_probe(struct pci_dev * pdev,const struct pci_device_id * id)1226*4882a593Smuzhiyun static int amd_ntb_pci_probe(struct pci_dev *pdev,
1227*4882a593Smuzhiyun const struct pci_device_id *id)
1228*4882a593Smuzhiyun {
1229*4882a593Smuzhiyun struct amd_ntb_dev *ndev;
1230*4882a593Smuzhiyun int rc, node;
1231*4882a593Smuzhiyun
1232*4882a593Smuzhiyun node = dev_to_node(&pdev->dev);
1233*4882a593Smuzhiyun
1234*4882a593Smuzhiyun ndev = kzalloc_node(sizeof(*ndev), GFP_KERNEL, node);
1235*4882a593Smuzhiyun if (!ndev) {
1236*4882a593Smuzhiyun rc = -ENOMEM;
1237*4882a593Smuzhiyun goto err_ndev;
1238*4882a593Smuzhiyun }
1239*4882a593Smuzhiyun
1240*4882a593Smuzhiyun ndev->dev_data = (struct ntb_dev_data *)id->driver_data;
1241*4882a593Smuzhiyun
1242*4882a593Smuzhiyun ndev_init_struct(ndev, pdev);
1243*4882a593Smuzhiyun
1244*4882a593Smuzhiyun rc = amd_ntb_init_pci(ndev, pdev);
1245*4882a593Smuzhiyun if (rc)
1246*4882a593Smuzhiyun goto err_init_pci;
1247*4882a593Smuzhiyun
1248*4882a593Smuzhiyun rc = amd_init_dev(ndev);
1249*4882a593Smuzhiyun if (rc)
1250*4882a593Smuzhiyun goto err_init_dev;
1251*4882a593Smuzhiyun
1252*4882a593Smuzhiyun /* write side info */
1253*4882a593Smuzhiyun amd_init_side_info(ndev);
1254*4882a593Smuzhiyun
1255*4882a593Smuzhiyun amd_poll_link(ndev);
1256*4882a593Smuzhiyun
1257*4882a593Smuzhiyun ndev_init_debugfs(ndev);
1258*4882a593Smuzhiyun
1259*4882a593Smuzhiyun rc = ntb_register_device(&ndev->ntb);
1260*4882a593Smuzhiyun if (rc)
1261*4882a593Smuzhiyun goto err_register;
1262*4882a593Smuzhiyun
1263*4882a593Smuzhiyun dev_info(&pdev->dev, "NTB device registered.\n");
1264*4882a593Smuzhiyun
1265*4882a593Smuzhiyun return 0;
1266*4882a593Smuzhiyun
1267*4882a593Smuzhiyun err_register:
1268*4882a593Smuzhiyun ndev_deinit_debugfs(ndev);
1269*4882a593Smuzhiyun amd_deinit_dev(ndev);
1270*4882a593Smuzhiyun err_init_dev:
1271*4882a593Smuzhiyun amd_ntb_deinit_pci(ndev);
1272*4882a593Smuzhiyun err_init_pci:
1273*4882a593Smuzhiyun kfree(ndev);
1274*4882a593Smuzhiyun err_ndev:
1275*4882a593Smuzhiyun return rc;
1276*4882a593Smuzhiyun }
1277*4882a593Smuzhiyun
amd_ntb_pci_remove(struct pci_dev * pdev)1278*4882a593Smuzhiyun static void amd_ntb_pci_remove(struct pci_dev *pdev)
1279*4882a593Smuzhiyun {
1280*4882a593Smuzhiyun struct amd_ntb_dev *ndev = pci_get_drvdata(pdev);
1281*4882a593Smuzhiyun
1282*4882a593Smuzhiyun /*
1283*4882a593Smuzhiyun * Clear the READY bit in SIDEINFO register before sending DB event
1284*4882a593Smuzhiyun * to the peer. This will make sure that when the peer handles the
1285*4882a593Smuzhiyun * DB event, it correctly reads this bit as being 0.
1286*4882a593Smuzhiyun */
1287*4882a593Smuzhiyun amd_deinit_side_info(ndev);
1288*4882a593Smuzhiyun ntb_peer_db_set(&ndev->ntb, BIT_ULL(ndev->db_last_bit));
1289*4882a593Smuzhiyun ntb_unregister_device(&ndev->ntb);
1290*4882a593Smuzhiyun ndev_deinit_debugfs(ndev);
1291*4882a593Smuzhiyun amd_deinit_dev(ndev);
1292*4882a593Smuzhiyun amd_ntb_deinit_pci(ndev);
1293*4882a593Smuzhiyun kfree(ndev);
1294*4882a593Smuzhiyun }
1295*4882a593Smuzhiyun
amd_ntb_pci_shutdown(struct pci_dev * pdev)1296*4882a593Smuzhiyun static void amd_ntb_pci_shutdown(struct pci_dev *pdev)
1297*4882a593Smuzhiyun {
1298*4882a593Smuzhiyun struct amd_ntb_dev *ndev = pci_get_drvdata(pdev);
1299*4882a593Smuzhiyun
1300*4882a593Smuzhiyun /* Send link down notification */
1301*4882a593Smuzhiyun ntb_link_event(&ndev->ntb);
1302*4882a593Smuzhiyun
1303*4882a593Smuzhiyun amd_deinit_side_info(ndev);
1304*4882a593Smuzhiyun ntb_peer_db_set(&ndev->ntb, BIT_ULL(ndev->db_last_bit));
1305*4882a593Smuzhiyun ntb_unregister_device(&ndev->ntb);
1306*4882a593Smuzhiyun ndev_deinit_debugfs(ndev);
1307*4882a593Smuzhiyun amd_deinit_dev(ndev);
1308*4882a593Smuzhiyun amd_ntb_deinit_pci(ndev);
1309*4882a593Smuzhiyun kfree(ndev);
1310*4882a593Smuzhiyun }
1311*4882a593Smuzhiyun
1312*4882a593Smuzhiyun static const struct file_operations amd_ntb_debugfs_info = {
1313*4882a593Smuzhiyun .owner = THIS_MODULE,
1314*4882a593Smuzhiyun .open = simple_open,
1315*4882a593Smuzhiyun .read = ndev_debugfs_read,
1316*4882a593Smuzhiyun };
1317*4882a593Smuzhiyun
1318*4882a593Smuzhiyun static const struct ntb_dev_data dev_data[] = {
1319*4882a593Smuzhiyun { /* for device 145b */
1320*4882a593Smuzhiyun .mw_count = 3,
1321*4882a593Smuzhiyun .mw_idx = 1,
1322*4882a593Smuzhiyun },
1323*4882a593Smuzhiyun { /* for device 148b */
1324*4882a593Smuzhiyun .mw_count = 2,
1325*4882a593Smuzhiyun .mw_idx = 2,
1326*4882a593Smuzhiyun },
1327*4882a593Smuzhiyun };
1328*4882a593Smuzhiyun
1329*4882a593Smuzhiyun static const struct pci_device_id amd_ntb_pci_tbl[] = {
1330*4882a593Smuzhiyun { PCI_VDEVICE(AMD, 0x145b), (kernel_ulong_t)&dev_data[0] },
1331*4882a593Smuzhiyun { PCI_VDEVICE(AMD, 0x148b), (kernel_ulong_t)&dev_data[1] },
1332*4882a593Smuzhiyun { PCI_VDEVICE(HYGON, 0x145b), (kernel_ulong_t)&dev_data[0] },
1333*4882a593Smuzhiyun { 0, }
1334*4882a593Smuzhiyun };
1335*4882a593Smuzhiyun MODULE_DEVICE_TABLE(pci, amd_ntb_pci_tbl);
1336*4882a593Smuzhiyun
1337*4882a593Smuzhiyun static struct pci_driver amd_ntb_pci_driver = {
1338*4882a593Smuzhiyun .name = KBUILD_MODNAME,
1339*4882a593Smuzhiyun .id_table = amd_ntb_pci_tbl,
1340*4882a593Smuzhiyun .probe = amd_ntb_pci_probe,
1341*4882a593Smuzhiyun .remove = amd_ntb_pci_remove,
1342*4882a593Smuzhiyun .shutdown = amd_ntb_pci_shutdown,
1343*4882a593Smuzhiyun };
1344*4882a593Smuzhiyun
amd_ntb_pci_driver_init(void)1345*4882a593Smuzhiyun static int __init amd_ntb_pci_driver_init(void)
1346*4882a593Smuzhiyun {
1347*4882a593Smuzhiyun pr_info("%s %s\n", NTB_DESC, NTB_VER);
1348*4882a593Smuzhiyun
1349*4882a593Smuzhiyun if (debugfs_initialized())
1350*4882a593Smuzhiyun debugfs_dir = debugfs_create_dir(KBUILD_MODNAME, NULL);
1351*4882a593Smuzhiyun
1352*4882a593Smuzhiyun return pci_register_driver(&amd_ntb_pci_driver);
1353*4882a593Smuzhiyun }
1354*4882a593Smuzhiyun module_init(amd_ntb_pci_driver_init);
1355*4882a593Smuzhiyun
amd_ntb_pci_driver_exit(void)1356*4882a593Smuzhiyun static void __exit amd_ntb_pci_driver_exit(void)
1357*4882a593Smuzhiyun {
1358*4882a593Smuzhiyun pci_unregister_driver(&amd_ntb_pci_driver);
1359*4882a593Smuzhiyun debugfs_remove_recursive(debugfs_dir);
1360*4882a593Smuzhiyun }
1361*4882a593Smuzhiyun module_exit(amd_ntb_pci_driver_exit);
1362