1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun * Low-Level PCI Express Support for the SH7786
4*4882a593Smuzhiyun *
5*4882a593Smuzhiyun * Copyright (C) 2009 - 2011 Paul Mundt
6*4882a593Smuzhiyun */
7*4882a593Smuzhiyun #define pr_fmt(fmt) "PCI: " fmt
8*4882a593Smuzhiyun
9*4882a593Smuzhiyun #include <linux/pci.h>
10*4882a593Smuzhiyun #include <linux/init.h>
11*4882a593Smuzhiyun #include <linux/kernel.h>
12*4882a593Smuzhiyun #include <linux/io.h>
13*4882a593Smuzhiyun #include <linux/async.h>
14*4882a593Smuzhiyun #include <linux/delay.h>
15*4882a593Smuzhiyun #include <linux/dma-mapping.h>
16*4882a593Smuzhiyun #include <linux/slab.h>
17*4882a593Smuzhiyun #include <linux/clk.h>
18*4882a593Smuzhiyun #include <linux/sh_clk.h>
19*4882a593Smuzhiyun #include <linux/sh_intc.h>
20*4882a593Smuzhiyun #include <cpu/sh7786.h>
21*4882a593Smuzhiyun #include "pcie-sh7786.h"
22*4882a593Smuzhiyun #include <linux/sizes.h>
23*4882a593Smuzhiyun
24*4882a593Smuzhiyun struct sh7786_pcie_port {
25*4882a593Smuzhiyun struct pci_channel *hose;
26*4882a593Smuzhiyun struct clk *fclk, phy_clk;
27*4882a593Smuzhiyun unsigned int index;
28*4882a593Smuzhiyun int endpoint;
29*4882a593Smuzhiyun int link;
30*4882a593Smuzhiyun };
31*4882a593Smuzhiyun
32*4882a593Smuzhiyun static struct sh7786_pcie_port *sh7786_pcie_ports;
33*4882a593Smuzhiyun static unsigned int nr_ports;
34*4882a593Smuzhiyun static unsigned long dma_pfn_offset;
35*4882a593Smuzhiyun size_t memsize;
36*4882a593Smuzhiyun u64 memstart;
37*4882a593Smuzhiyun
38*4882a593Smuzhiyun static struct sh7786_pcie_hwops {
39*4882a593Smuzhiyun int (*core_init)(void);
40*4882a593Smuzhiyun async_func_t port_init_hw;
41*4882a593Smuzhiyun } *sh7786_pcie_hwops;
42*4882a593Smuzhiyun
43*4882a593Smuzhiyun static struct resource sh7786_pci0_resources[] = {
44*4882a593Smuzhiyun {
45*4882a593Smuzhiyun .name = "PCIe0 MEM 0",
46*4882a593Smuzhiyun .start = 0xfd000000,
47*4882a593Smuzhiyun .end = 0xfd000000 + SZ_8M - 1,
48*4882a593Smuzhiyun .flags = IORESOURCE_MEM,
49*4882a593Smuzhiyun }, {
50*4882a593Smuzhiyun .name = "PCIe0 MEM 1",
51*4882a593Smuzhiyun .start = 0xc0000000,
52*4882a593Smuzhiyun .end = 0xc0000000 + SZ_512M - 1,
53*4882a593Smuzhiyun .flags = IORESOURCE_MEM | IORESOURCE_MEM_32BIT,
54*4882a593Smuzhiyun }, {
55*4882a593Smuzhiyun .name = "PCIe0 MEM 2",
56*4882a593Smuzhiyun .start = 0x10000000,
57*4882a593Smuzhiyun .end = 0x10000000 + SZ_64M - 1,
58*4882a593Smuzhiyun .flags = IORESOURCE_MEM,
59*4882a593Smuzhiyun }, {
60*4882a593Smuzhiyun .name = "PCIe0 IO",
61*4882a593Smuzhiyun .start = 0xfe100000,
62*4882a593Smuzhiyun .end = 0xfe100000 + SZ_1M - 1,
63*4882a593Smuzhiyun .flags = IORESOURCE_IO,
64*4882a593Smuzhiyun },
65*4882a593Smuzhiyun };
66*4882a593Smuzhiyun
67*4882a593Smuzhiyun static struct resource sh7786_pci1_resources[] = {
68*4882a593Smuzhiyun {
69*4882a593Smuzhiyun .name = "PCIe1 MEM 0",
70*4882a593Smuzhiyun .start = 0xfd800000,
71*4882a593Smuzhiyun .end = 0xfd800000 + SZ_8M - 1,
72*4882a593Smuzhiyun .flags = IORESOURCE_MEM,
73*4882a593Smuzhiyun }, {
74*4882a593Smuzhiyun .name = "PCIe1 MEM 1",
75*4882a593Smuzhiyun .start = 0xa0000000,
76*4882a593Smuzhiyun .end = 0xa0000000 + SZ_512M - 1,
77*4882a593Smuzhiyun .flags = IORESOURCE_MEM | IORESOURCE_MEM_32BIT,
78*4882a593Smuzhiyun }, {
79*4882a593Smuzhiyun .name = "PCIe1 MEM 2",
80*4882a593Smuzhiyun .start = 0x30000000,
81*4882a593Smuzhiyun .end = 0x30000000 + SZ_256M - 1,
82*4882a593Smuzhiyun .flags = IORESOURCE_MEM | IORESOURCE_MEM_32BIT,
83*4882a593Smuzhiyun }, {
84*4882a593Smuzhiyun .name = "PCIe1 IO",
85*4882a593Smuzhiyun .start = 0xfe300000,
86*4882a593Smuzhiyun .end = 0xfe300000 + SZ_1M - 1,
87*4882a593Smuzhiyun .flags = IORESOURCE_IO,
88*4882a593Smuzhiyun },
89*4882a593Smuzhiyun };
90*4882a593Smuzhiyun
91*4882a593Smuzhiyun static struct resource sh7786_pci2_resources[] = {
92*4882a593Smuzhiyun {
93*4882a593Smuzhiyun .name = "PCIe2 MEM 0",
94*4882a593Smuzhiyun .start = 0xfc800000,
95*4882a593Smuzhiyun .end = 0xfc800000 + SZ_4M - 1,
96*4882a593Smuzhiyun .flags = IORESOURCE_MEM,
97*4882a593Smuzhiyun }, {
98*4882a593Smuzhiyun .name = "PCIe2 MEM 1",
99*4882a593Smuzhiyun .start = 0x80000000,
100*4882a593Smuzhiyun .end = 0x80000000 + SZ_512M - 1,
101*4882a593Smuzhiyun .flags = IORESOURCE_MEM | IORESOURCE_MEM_32BIT,
102*4882a593Smuzhiyun }, {
103*4882a593Smuzhiyun .name = "PCIe2 MEM 2",
104*4882a593Smuzhiyun .start = 0x20000000,
105*4882a593Smuzhiyun .end = 0x20000000 + SZ_256M - 1,
106*4882a593Smuzhiyun .flags = IORESOURCE_MEM | IORESOURCE_MEM_32BIT,
107*4882a593Smuzhiyun }, {
108*4882a593Smuzhiyun .name = "PCIe2 IO",
109*4882a593Smuzhiyun .start = 0xfcd00000,
110*4882a593Smuzhiyun .end = 0xfcd00000 + SZ_1M - 1,
111*4882a593Smuzhiyun .flags = IORESOURCE_IO,
112*4882a593Smuzhiyun },
113*4882a593Smuzhiyun };
114*4882a593Smuzhiyun
115*4882a593Smuzhiyun extern struct pci_ops sh7786_pci_ops;
116*4882a593Smuzhiyun
117*4882a593Smuzhiyun #define DEFINE_CONTROLLER(start, idx) \
118*4882a593Smuzhiyun { \
119*4882a593Smuzhiyun .pci_ops = &sh7786_pci_ops, \
120*4882a593Smuzhiyun .resources = sh7786_pci##idx##_resources, \
121*4882a593Smuzhiyun .nr_resources = ARRAY_SIZE(sh7786_pci##idx##_resources), \
122*4882a593Smuzhiyun .reg_base = start, \
123*4882a593Smuzhiyun .mem_offset = 0, \
124*4882a593Smuzhiyun .io_offset = 0, \
125*4882a593Smuzhiyun }
126*4882a593Smuzhiyun
127*4882a593Smuzhiyun static struct pci_channel sh7786_pci_channels[] = {
128*4882a593Smuzhiyun DEFINE_CONTROLLER(0xfe000000, 0),
129*4882a593Smuzhiyun DEFINE_CONTROLLER(0xfe200000, 1),
130*4882a593Smuzhiyun DEFINE_CONTROLLER(0xfcc00000, 2),
131*4882a593Smuzhiyun };
132*4882a593Smuzhiyun
133*4882a593Smuzhiyun static struct clk fixed_pciexclkp = {
134*4882a593Smuzhiyun .rate = 100000000, /* 100 MHz reference clock */
135*4882a593Smuzhiyun };
136*4882a593Smuzhiyun
sh7786_pci_fixup(struct pci_dev * dev)137*4882a593Smuzhiyun static void sh7786_pci_fixup(struct pci_dev *dev)
138*4882a593Smuzhiyun {
139*4882a593Smuzhiyun /*
140*4882a593Smuzhiyun * Prevent enumeration of root complex resources.
141*4882a593Smuzhiyun */
142*4882a593Smuzhiyun if (pci_is_root_bus(dev->bus) && dev->devfn == 0) {
143*4882a593Smuzhiyun int i;
144*4882a593Smuzhiyun
145*4882a593Smuzhiyun for (i = 0; i < DEVICE_COUNT_RESOURCE; i++) {
146*4882a593Smuzhiyun dev->resource[i].start = 0;
147*4882a593Smuzhiyun dev->resource[i].end = 0;
148*4882a593Smuzhiyun dev->resource[i].flags = 0;
149*4882a593Smuzhiyun }
150*4882a593Smuzhiyun }
151*4882a593Smuzhiyun }
152*4882a593Smuzhiyun DECLARE_PCI_FIXUP_HEADER(PCI_VENDOR_ID_RENESAS, PCI_DEVICE_ID_RENESAS_SH7786,
153*4882a593Smuzhiyun sh7786_pci_fixup);
154*4882a593Smuzhiyun
phy_wait_for_ack(struct pci_channel * chan)155*4882a593Smuzhiyun static int __init phy_wait_for_ack(struct pci_channel *chan)
156*4882a593Smuzhiyun {
157*4882a593Smuzhiyun unsigned int timeout = 100;
158*4882a593Smuzhiyun
159*4882a593Smuzhiyun while (timeout--) {
160*4882a593Smuzhiyun if (pci_read_reg(chan, SH4A_PCIEPHYADRR) & (1 << BITS_ACK))
161*4882a593Smuzhiyun return 0;
162*4882a593Smuzhiyun
163*4882a593Smuzhiyun udelay(100);
164*4882a593Smuzhiyun }
165*4882a593Smuzhiyun
166*4882a593Smuzhiyun return -ETIMEDOUT;
167*4882a593Smuzhiyun }
168*4882a593Smuzhiyun
pci_wait_for_irq(struct pci_channel * chan,unsigned int mask)169*4882a593Smuzhiyun static int __init pci_wait_for_irq(struct pci_channel *chan, unsigned int mask)
170*4882a593Smuzhiyun {
171*4882a593Smuzhiyun unsigned int timeout = 100;
172*4882a593Smuzhiyun
173*4882a593Smuzhiyun while (timeout--) {
174*4882a593Smuzhiyun if ((pci_read_reg(chan, SH4A_PCIEINTR) & mask) == mask)
175*4882a593Smuzhiyun return 0;
176*4882a593Smuzhiyun
177*4882a593Smuzhiyun udelay(100);
178*4882a593Smuzhiyun }
179*4882a593Smuzhiyun
180*4882a593Smuzhiyun return -ETIMEDOUT;
181*4882a593Smuzhiyun }
182*4882a593Smuzhiyun
phy_write_reg(struct pci_channel * chan,unsigned int addr,unsigned int lane,unsigned int data)183*4882a593Smuzhiyun static void __init phy_write_reg(struct pci_channel *chan, unsigned int addr,
184*4882a593Smuzhiyun unsigned int lane, unsigned int data)
185*4882a593Smuzhiyun {
186*4882a593Smuzhiyun unsigned long phyaddr;
187*4882a593Smuzhiyun
188*4882a593Smuzhiyun phyaddr = (1 << BITS_CMD) + ((lane & 0xf) << BITS_LANE) +
189*4882a593Smuzhiyun ((addr & 0xff) << BITS_ADR);
190*4882a593Smuzhiyun
191*4882a593Smuzhiyun /* Set write data */
192*4882a593Smuzhiyun pci_write_reg(chan, data, SH4A_PCIEPHYDOUTR);
193*4882a593Smuzhiyun pci_write_reg(chan, phyaddr, SH4A_PCIEPHYADRR);
194*4882a593Smuzhiyun
195*4882a593Smuzhiyun phy_wait_for_ack(chan);
196*4882a593Smuzhiyun
197*4882a593Smuzhiyun /* Clear command */
198*4882a593Smuzhiyun pci_write_reg(chan, 0, SH4A_PCIEPHYDOUTR);
199*4882a593Smuzhiyun pci_write_reg(chan, 0, SH4A_PCIEPHYADRR);
200*4882a593Smuzhiyun
201*4882a593Smuzhiyun phy_wait_for_ack(chan);
202*4882a593Smuzhiyun }
203*4882a593Smuzhiyun
pcie_clk_init(struct sh7786_pcie_port * port)204*4882a593Smuzhiyun static int __init pcie_clk_init(struct sh7786_pcie_port *port)
205*4882a593Smuzhiyun {
206*4882a593Smuzhiyun struct pci_channel *chan = port->hose;
207*4882a593Smuzhiyun struct clk *clk;
208*4882a593Smuzhiyun char fclk_name[16];
209*4882a593Smuzhiyun int ret;
210*4882a593Smuzhiyun
211*4882a593Smuzhiyun /*
212*4882a593Smuzhiyun * First register the fixed clock
213*4882a593Smuzhiyun */
214*4882a593Smuzhiyun ret = clk_register(&fixed_pciexclkp);
215*4882a593Smuzhiyun if (unlikely(ret != 0))
216*4882a593Smuzhiyun return ret;
217*4882a593Smuzhiyun
218*4882a593Smuzhiyun /*
219*4882a593Smuzhiyun * Grab the port's function clock, which the PHY clock depends
220*4882a593Smuzhiyun * on. clock lookups don't help us much at this point, since no
221*4882a593Smuzhiyun * dev_id is available this early. Lame.
222*4882a593Smuzhiyun */
223*4882a593Smuzhiyun snprintf(fclk_name, sizeof(fclk_name), "pcie%d_fck", port->index);
224*4882a593Smuzhiyun
225*4882a593Smuzhiyun port->fclk = clk_get(NULL, fclk_name);
226*4882a593Smuzhiyun if (IS_ERR(port->fclk)) {
227*4882a593Smuzhiyun ret = PTR_ERR(port->fclk);
228*4882a593Smuzhiyun goto err_fclk;
229*4882a593Smuzhiyun }
230*4882a593Smuzhiyun
231*4882a593Smuzhiyun clk_enable(port->fclk);
232*4882a593Smuzhiyun
233*4882a593Smuzhiyun /*
234*4882a593Smuzhiyun * And now, set up the PHY clock
235*4882a593Smuzhiyun */
236*4882a593Smuzhiyun clk = &port->phy_clk;
237*4882a593Smuzhiyun
238*4882a593Smuzhiyun memset(clk, 0, sizeof(struct clk));
239*4882a593Smuzhiyun
240*4882a593Smuzhiyun clk->parent = &fixed_pciexclkp;
241*4882a593Smuzhiyun clk->enable_reg = (void __iomem *)(chan->reg_base + SH4A_PCIEPHYCTLR);
242*4882a593Smuzhiyun clk->enable_bit = BITS_CKE;
243*4882a593Smuzhiyun
244*4882a593Smuzhiyun ret = sh_clk_mstp_register(clk, 1);
245*4882a593Smuzhiyun if (unlikely(ret < 0))
246*4882a593Smuzhiyun goto err_phy;
247*4882a593Smuzhiyun
248*4882a593Smuzhiyun return 0;
249*4882a593Smuzhiyun
250*4882a593Smuzhiyun err_phy:
251*4882a593Smuzhiyun clk_disable(port->fclk);
252*4882a593Smuzhiyun clk_put(port->fclk);
253*4882a593Smuzhiyun err_fclk:
254*4882a593Smuzhiyun clk_unregister(&fixed_pciexclkp);
255*4882a593Smuzhiyun
256*4882a593Smuzhiyun return ret;
257*4882a593Smuzhiyun }
258*4882a593Smuzhiyun
phy_init(struct sh7786_pcie_port * port)259*4882a593Smuzhiyun static int __init phy_init(struct sh7786_pcie_port *port)
260*4882a593Smuzhiyun {
261*4882a593Smuzhiyun struct pci_channel *chan = port->hose;
262*4882a593Smuzhiyun unsigned int timeout = 100;
263*4882a593Smuzhiyun
264*4882a593Smuzhiyun clk_enable(&port->phy_clk);
265*4882a593Smuzhiyun
266*4882a593Smuzhiyun /* Initialize the phy */
267*4882a593Smuzhiyun phy_write_reg(chan, 0x60, 0xf, 0x004b008b);
268*4882a593Smuzhiyun phy_write_reg(chan, 0x61, 0xf, 0x00007b41);
269*4882a593Smuzhiyun phy_write_reg(chan, 0x64, 0xf, 0x00ff4f00);
270*4882a593Smuzhiyun phy_write_reg(chan, 0x65, 0xf, 0x09070907);
271*4882a593Smuzhiyun phy_write_reg(chan, 0x66, 0xf, 0x00000010);
272*4882a593Smuzhiyun phy_write_reg(chan, 0x74, 0xf, 0x0007001c);
273*4882a593Smuzhiyun phy_write_reg(chan, 0x79, 0xf, 0x01fc000d);
274*4882a593Smuzhiyun phy_write_reg(chan, 0xb0, 0xf, 0x00000610);
275*4882a593Smuzhiyun
276*4882a593Smuzhiyun /* Deassert Standby */
277*4882a593Smuzhiyun phy_write_reg(chan, 0x67, 0x1, 0x00000400);
278*4882a593Smuzhiyun
279*4882a593Smuzhiyun /* Disable clock */
280*4882a593Smuzhiyun clk_disable(&port->phy_clk);
281*4882a593Smuzhiyun
282*4882a593Smuzhiyun while (timeout--) {
283*4882a593Smuzhiyun if (pci_read_reg(chan, SH4A_PCIEPHYSR))
284*4882a593Smuzhiyun return 0;
285*4882a593Smuzhiyun
286*4882a593Smuzhiyun udelay(100);
287*4882a593Smuzhiyun }
288*4882a593Smuzhiyun
289*4882a593Smuzhiyun return -ETIMEDOUT;
290*4882a593Smuzhiyun }
291*4882a593Smuzhiyun
pcie_reset(struct sh7786_pcie_port * port)292*4882a593Smuzhiyun static void __init pcie_reset(struct sh7786_pcie_port *port)
293*4882a593Smuzhiyun {
294*4882a593Smuzhiyun struct pci_channel *chan = port->hose;
295*4882a593Smuzhiyun
296*4882a593Smuzhiyun pci_write_reg(chan, 1, SH4A_PCIESRSTR);
297*4882a593Smuzhiyun pci_write_reg(chan, 0, SH4A_PCIETCTLR);
298*4882a593Smuzhiyun pci_write_reg(chan, 0, SH4A_PCIESRSTR);
299*4882a593Smuzhiyun pci_write_reg(chan, 0, SH4A_PCIETXVC0SR);
300*4882a593Smuzhiyun }
301*4882a593Smuzhiyun
pcie_init(struct sh7786_pcie_port * port)302*4882a593Smuzhiyun static int __init pcie_init(struct sh7786_pcie_port *port)
303*4882a593Smuzhiyun {
304*4882a593Smuzhiyun struct pci_channel *chan = port->hose;
305*4882a593Smuzhiyun unsigned int data;
306*4882a593Smuzhiyun phys_addr_t memstart, memend;
307*4882a593Smuzhiyun int ret, i, win;
308*4882a593Smuzhiyun
309*4882a593Smuzhiyun /* Begin initialization */
310*4882a593Smuzhiyun pcie_reset(port);
311*4882a593Smuzhiyun
312*4882a593Smuzhiyun /*
313*4882a593Smuzhiyun * Initial header for port config space is type 1, set the device
314*4882a593Smuzhiyun * class to match. Hardware takes care of propagating the IDSETR
315*4882a593Smuzhiyun * settings, so there is no need to bother with a quirk.
316*4882a593Smuzhiyun */
317*4882a593Smuzhiyun pci_write_reg(chan, PCI_CLASS_BRIDGE_PCI << 16, SH4A_PCIEIDSETR1);
318*4882a593Smuzhiyun
319*4882a593Smuzhiyun /* Initialize default capabilities. */
320*4882a593Smuzhiyun data = pci_read_reg(chan, SH4A_PCIEEXPCAP0);
321*4882a593Smuzhiyun data &= ~(PCI_EXP_FLAGS_TYPE << 16);
322*4882a593Smuzhiyun
323*4882a593Smuzhiyun if (port->endpoint)
324*4882a593Smuzhiyun data |= PCI_EXP_TYPE_ENDPOINT << 20;
325*4882a593Smuzhiyun else
326*4882a593Smuzhiyun data |= PCI_EXP_TYPE_ROOT_PORT << 20;
327*4882a593Smuzhiyun
328*4882a593Smuzhiyun data |= PCI_CAP_ID_EXP;
329*4882a593Smuzhiyun pci_write_reg(chan, data, SH4A_PCIEEXPCAP0);
330*4882a593Smuzhiyun
331*4882a593Smuzhiyun /* Enable data link layer active state reporting */
332*4882a593Smuzhiyun pci_write_reg(chan, PCI_EXP_LNKCAP_DLLLARC, SH4A_PCIEEXPCAP3);
333*4882a593Smuzhiyun
334*4882a593Smuzhiyun /* Enable extended sync and ASPM L0s support */
335*4882a593Smuzhiyun data = pci_read_reg(chan, SH4A_PCIEEXPCAP4);
336*4882a593Smuzhiyun data &= ~PCI_EXP_LNKCTL_ASPMC;
337*4882a593Smuzhiyun data |= PCI_EXP_LNKCTL_ES | 1;
338*4882a593Smuzhiyun pci_write_reg(chan, data, SH4A_PCIEEXPCAP4);
339*4882a593Smuzhiyun
340*4882a593Smuzhiyun /* Write out the physical slot number */
341*4882a593Smuzhiyun data = pci_read_reg(chan, SH4A_PCIEEXPCAP5);
342*4882a593Smuzhiyun data &= ~PCI_EXP_SLTCAP_PSN;
343*4882a593Smuzhiyun data |= (port->index + 1) << 19;
344*4882a593Smuzhiyun pci_write_reg(chan, data, SH4A_PCIEEXPCAP5);
345*4882a593Smuzhiyun
346*4882a593Smuzhiyun /* Set the completion timer timeout to the maximum 32ms. */
347*4882a593Smuzhiyun data = pci_read_reg(chan, SH4A_PCIETLCTLR);
348*4882a593Smuzhiyun data &= ~0x3f00;
349*4882a593Smuzhiyun data |= 0x32 << 8;
350*4882a593Smuzhiyun pci_write_reg(chan, data, SH4A_PCIETLCTLR);
351*4882a593Smuzhiyun
352*4882a593Smuzhiyun /*
353*4882a593Smuzhiyun * Set fast training sequences to the maximum 255,
354*4882a593Smuzhiyun * and enable MAC data scrambling.
355*4882a593Smuzhiyun */
356*4882a593Smuzhiyun data = pci_read_reg(chan, SH4A_PCIEMACCTLR);
357*4882a593Smuzhiyun data &= ~PCIEMACCTLR_SCR_DIS;
358*4882a593Smuzhiyun data |= (0xff << 16);
359*4882a593Smuzhiyun pci_write_reg(chan, data, SH4A_PCIEMACCTLR);
360*4882a593Smuzhiyun
361*4882a593Smuzhiyun memstart = __pa(memory_start);
362*4882a593Smuzhiyun memend = __pa(memory_end);
363*4882a593Smuzhiyun memsize = roundup_pow_of_two(memend - memstart);
364*4882a593Smuzhiyun
365*4882a593Smuzhiyun /*
366*4882a593Smuzhiyun * The start address must be aligned on its size. So we round
367*4882a593Smuzhiyun * it down, and then recalculate the size so that it covers
368*4882a593Smuzhiyun * the entire memory.
369*4882a593Smuzhiyun */
370*4882a593Smuzhiyun memstart = ALIGN_DOWN(memstart, memsize);
371*4882a593Smuzhiyun memsize = roundup_pow_of_two(memend - memstart);
372*4882a593Smuzhiyun
373*4882a593Smuzhiyun /*
374*4882a593Smuzhiyun * If there's more than 512MB of memory, we need to roll over to
375*4882a593Smuzhiyun * LAR1/LAMR1.
376*4882a593Smuzhiyun */
377*4882a593Smuzhiyun if (memsize > SZ_512M) {
378*4882a593Smuzhiyun pci_write_reg(chan, memstart + SZ_512M, SH4A_PCIELAR1);
379*4882a593Smuzhiyun pci_write_reg(chan, ((memsize - SZ_512M) - SZ_256) | 1,
380*4882a593Smuzhiyun SH4A_PCIELAMR1);
381*4882a593Smuzhiyun memsize = SZ_512M;
382*4882a593Smuzhiyun } else {
383*4882a593Smuzhiyun /*
384*4882a593Smuzhiyun * Otherwise just zero it out and disable it.
385*4882a593Smuzhiyun */
386*4882a593Smuzhiyun pci_write_reg(chan, 0, SH4A_PCIELAR1);
387*4882a593Smuzhiyun pci_write_reg(chan, 0, SH4A_PCIELAMR1);
388*4882a593Smuzhiyun }
389*4882a593Smuzhiyun
390*4882a593Smuzhiyun /*
391*4882a593Smuzhiyun * LAR0/LAMR0 covers up to the first 512MB, which is enough to
392*4882a593Smuzhiyun * cover all of lowmem on most platforms.
393*4882a593Smuzhiyun */
394*4882a593Smuzhiyun pci_write_reg(chan, memstart, SH4A_PCIELAR0);
395*4882a593Smuzhiyun pci_write_reg(chan, (memsize - SZ_256) | 1, SH4A_PCIELAMR0);
396*4882a593Smuzhiyun
397*4882a593Smuzhiyun /* Finish initialization */
398*4882a593Smuzhiyun data = pci_read_reg(chan, SH4A_PCIETCTLR);
399*4882a593Smuzhiyun data |= 0x1;
400*4882a593Smuzhiyun pci_write_reg(chan, data, SH4A_PCIETCTLR);
401*4882a593Smuzhiyun
402*4882a593Smuzhiyun /* Let things settle down a bit.. */
403*4882a593Smuzhiyun mdelay(100);
404*4882a593Smuzhiyun
405*4882a593Smuzhiyun /* Enable DL_Active Interrupt generation */
406*4882a593Smuzhiyun data = pci_read_reg(chan, SH4A_PCIEDLINTENR);
407*4882a593Smuzhiyun data |= PCIEDLINTENR_DLL_ACT_ENABLE;
408*4882a593Smuzhiyun pci_write_reg(chan, data, SH4A_PCIEDLINTENR);
409*4882a593Smuzhiyun
410*4882a593Smuzhiyun /* Disable MAC data scrambling. */
411*4882a593Smuzhiyun data = pci_read_reg(chan, SH4A_PCIEMACCTLR);
412*4882a593Smuzhiyun data |= PCIEMACCTLR_SCR_DIS | (0xff << 16);
413*4882a593Smuzhiyun pci_write_reg(chan, data, SH4A_PCIEMACCTLR);
414*4882a593Smuzhiyun
415*4882a593Smuzhiyun /*
416*4882a593Smuzhiyun * This will timeout if we don't have a link, but we permit the
417*4882a593Smuzhiyun * port to register anyways in order to support hotplug on future
418*4882a593Smuzhiyun * hardware.
419*4882a593Smuzhiyun */
420*4882a593Smuzhiyun ret = pci_wait_for_irq(chan, MASK_INT_TX_CTRL);
421*4882a593Smuzhiyun
422*4882a593Smuzhiyun data = pci_read_reg(chan, SH4A_PCIEPCICONF1);
423*4882a593Smuzhiyun data &= ~(PCI_STATUS_DEVSEL_MASK << 16);
424*4882a593Smuzhiyun data |= PCI_COMMAND_IO | PCI_COMMAND_MEMORY | PCI_COMMAND_MASTER |
425*4882a593Smuzhiyun (PCI_STATUS_CAP_LIST | PCI_STATUS_DEVSEL_FAST) << 16;
426*4882a593Smuzhiyun pci_write_reg(chan, data, SH4A_PCIEPCICONF1);
427*4882a593Smuzhiyun
428*4882a593Smuzhiyun pci_write_reg(chan, 0x80888000, SH4A_PCIETXVC0DCTLR);
429*4882a593Smuzhiyun pci_write_reg(chan, 0x00222000, SH4A_PCIERXVC0DCTLR);
430*4882a593Smuzhiyun
431*4882a593Smuzhiyun wmb();
432*4882a593Smuzhiyun
433*4882a593Smuzhiyun if (ret == 0) {
434*4882a593Smuzhiyun data = pci_read_reg(chan, SH4A_PCIEMACSR);
435*4882a593Smuzhiyun printk(KERN_NOTICE "PCI: PCIe#%d x%d link detected\n",
436*4882a593Smuzhiyun port->index, (data >> 20) & 0x3f);
437*4882a593Smuzhiyun } else
438*4882a593Smuzhiyun printk(KERN_NOTICE "PCI: PCIe#%d link down\n",
439*4882a593Smuzhiyun port->index);
440*4882a593Smuzhiyun
441*4882a593Smuzhiyun for (i = win = 0; i < chan->nr_resources; i++) {
442*4882a593Smuzhiyun struct resource *res = chan->resources + i;
443*4882a593Smuzhiyun resource_size_t size;
444*4882a593Smuzhiyun u32 mask;
445*4882a593Smuzhiyun
446*4882a593Smuzhiyun /*
447*4882a593Smuzhiyun * We can't use the 32-bit mode windows in legacy 29-bit
448*4882a593Smuzhiyun * mode, so just skip them entirely.
449*4882a593Smuzhiyun */
450*4882a593Smuzhiyun if ((res->flags & IORESOURCE_MEM_32BIT) && __in_29bit_mode())
451*4882a593Smuzhiyun res->flags |= IORESOURCE_DISABLED;
452*4882a593Smuzhiyun
453*4882a593Smuzhiyun if (res->flags & IORESOURCE_DISABLED)
454*4882a593Smuzhiyun continue;
455*4882a593Smuzhiyun
456*4882a593Smuzhiyun pci_write_reg(chan, 0x00000000, SH4A_PCIEPTCTLR(win));
457*4882a593Smuzhiyun
458*4882a593Smuzhiyun /*
459*4882a593Smuzhiyun * The PAMR mask is calculated in units of 256kB, which
460*4882a593Smuzhiyun * keeps things pretty simple.
461*4882a593Smuzhiyun */
462*4882a593Smuzhiyun size = resource_size(res);
463*4882a593Smuzhiyun mask = (roundup_pow_of_two(size) / SZ_256K) - 1;
464*4882a593Smuzhiyun pci_write_reg(chan, mask << 18, SH4A_PCIEPAMR(win));
465*4882a593Smuzhiyun
466*4882a593Smuzhiyun pci_write_reg(chan, upper_32_bits(res->start),
467*4882a593Smuzhiyun SH4A_PCIEPARH(win));
468*4882a593Smuzhiyun pci_write_reg(chan, lower_32_bits(res->start),
469*4882a593Smuzhiyun SH4A_PCIEPARL(win));
470*4882a593Smuzhiyun
471*4882a593Smuzhiyun mask = MASK_PARE;
472*4882a593Smuzhiyun if (res->flags & IORESOURCE_IO)
473*4882a593Smuzhiyun mask |= MASK_SPC;
474*4882a593Smuzhiyun
475*4882a593Smuzhiyun pci_write_reg(chan, mask, SH4A_PCIEPTCTLR(win));
476*4882a593Smuzhiyun
477*4882a593Smuzhiyun win++;
478*4882a593Smuzhiyun }
479*4882a593Smuzhiyun
480*4882a593Smuzhiyun return 0;
481*4882a593Smuzhiyun }
482*4882a593Smuzhiyun
pcibios_map_platform_irq(const struct pci_dev * pdev,u8 slot,u8 pin)483*4882a593Smuzhiyun int pcibios_map_platform_irq(const struct pci_dev *pdev, u8 slot, u8 pin)
484*4882a593Smuzhiyun {
485*4882a593Smuzhiyun return evt2irq(0xae0);
486*4882a593Smuzhiyun }
487*4882a593Smuzhiyun
pcibios_bus_add_device(struct pci_dev * pdev)488*4882a593Smuzhiyun void pcibios_bus_add_device(struct pci_dev *pdev)
489*4882a593Smuzhiyun {
490*4882a593Smuzhiyun dma_direct_set_offset(&pdev->dev, __pa(memory_start),
491*4882a593Smuzhiyun __pa(memory_start) - memstart, memsize);
492*4882a593Smuzhiyun }
493*4882a593Smuzhiyun
sh7786_pcie_core_init(void)494*4882a593Smuzhiyun static int __init sh7786_pcie_core_init(void)
495*4882a593Smuzhiyun {
496*4882a593Smuzhiyun /* Return the number of ports */
497*4882a593Smuzhiyun return test_mode_pin(MODE_PIN12) ? 3 : 2;
498*4882a593Smuzhiyun }
499*4882a593Smuzhiyun
sh7786_pcie_init_hw(void * data,async_cookie_t cookie)500*4882a593Smuzhiyun static void __init sh7786_pcie_init_hw(void *data, async_cookie_t cookie)
501*4882a593Smuzhiyun {
502*4882a593Smuzhiyun struct sh7786_pcie_port *port = data;
503*4882a593Smuzhiyun int ret;
504*4882a593Smuzhiyun
505*4882a593Smuzhiyun /*
506*4882a593Smuzhiyun * Check if we are configured in endpoint or root complex mode,
507*4882a593Smuzhiyun * this is a fixed pin setting that applies to all PCIe ports.
508*4882a593Smuzhiyun */
509*4882a593Smuzhiyun port->endpoint = test_mode_pin(MODE_PIN11);
510*4882a593Smuzhiyun
511*4882a593Smuzhiyun /*
512*4882a593Smuzhiyun * Setup clocks, needed both for PHY and PCIe registers.
513*4882a593Smuzhiyun */
514*4882a593Smuzhiyun ret = pcie_clk_init(port);
515*4882a593Smuzhiyun if (unlikely(ret < 0)) {
516*4882a593Smuzhiyun pr_err("clock initialization failed for port#%d\n",
517*4882a593Smuzhiyun port->index);
518*4882a593Smuzhiyun return;
519*4882a593Smuzhiyun }
520*4882a593Smuzhiyun
521*4882a593Smuzhiyun ret = phy_init(port);
522*4882a593Smuzhiyun if (unlikely(ret < 0)) {
523*4882a593Smuzhiyun pr_err("phy initialization failed for port#%d\n",
524*4882a593Smuzhiyun port->index);
525*4882a593Smuzhiyun return;
526*4882a593Smuzhiyun }
527*4882a593Smuzhiyun
528*4882a593Smuzhiyun ret = pcie_init(port);
529*4882a593Smuzhiyun if (unlikely(ret < 0)) {
530*4882a593Smuzhiyun pr_err("core initialization failed for port#%d\n",
531*4882a593Smuzhiyun port->index);
532*4882a593Smuzhiyun return;
533*4882a593Smuzhiyun }
534*4882a593Smuzhiyun
535*4882a593Smuzhiyun /* In the interest of preserving device ordering, synchronize */
536*4882a593Smuzhiyun async_synchronize_cookie(cookie);
537*4882a593Smuzhiyun
538*4882a593Smuzhiyun register_pci_controller(port->hose);
539*4882a593Smuzhiyun }
540*4882a593Smuzhiyun
541*4882a593Smuzhiyun static struct sh7786_pcie_hwops sh7786_65nm_pcie_hwops __initdata = {
542*4882a593Smuzhiyun .core_init = sh7786_pcie_core_init,
543*4882a593Smuzhiyun .port_init_hw = sh7786_pcie_init_hw,
544*4882a593Smuzhiyun };
545*4882a593Smuzhiyun
sh7786_pcie_init(void)546*4882a593Smuzhiyun static int __init sh7786_pcie_init(void)
547*4882a593Smuzhiyun {
548*4882a593Smuzhiyun struct clk *platclk;
549*4882a593Smuzhiyun u32 mm_sel;
550*4882a593Smuzhiyun int i;
551*4882a593Smuzhiyun
552*4882a593Smuzhiyun printk(KERN_NOTICE "PCI: Starting initialization.\n");
553*4882a593Smuzhiyun
554*4882a593Smuzhiyun sh7786_pcie_hwops = &sh7786_65nm_pcie_hwops;
555*4882a593Smuzhiyun
556*4882a593Smuzhiyun nr_ports = sh7786_pcie_hwops->core_init();
557*4882a593Smuzhiyun BUG_ON(nr_ports > ARRAY_SIZE(sh7786_pci_channels));
558*4882a593Smuzhiyun
559*4882a593Smuzhiyun if (unlikely(nr_ports == 0))
560*4882a593Smuzhiyun return -ENODEV;
561*4882a593Smuzhiyun
562*4882a593Smuzhiyun sh7786_pcie_ports = kcalloc(nr_ports, sizeof(struct sh7786_pcie_port),
563*4882a593Smuzhiyun GFP_KERNEL);
564*4882a593Smuzhiyun if (unlikely(!sh7786_pcie_ports))
565*4882a593Smuzhiyun return -ENOMEM;
566*4882a593Smuzhiyun
567*4882a593Smuzhiyun /*
568*4882a593Smuzhiyun * Fetch any optional platform clock associated with this block.
569*4882a593Smuzhiyun *
570*4882a593Smuzhiyun * This is a rather nasty hack for boards with spec-mocking FPGAs
571*4882a593Smuzhiyun * that have a secondary set of clocks outside of the on-chip
572*4882a593Smuzhiyun * ones that need to be accounted for before there is any chance
573*4882a593Smuzhiyun * of touching the existing MSTP bits or CPG clocks.
574*4882a593Smuzhiyun */
575*4882a593Smuzhiyun platclk = clk_get(NULL, "pcie_plat_clk");
576*4882a593Smuzhiyun if (IS_ERR(platclk)) {
577*4882a593Smuzhiyun /* Sane hardware should probably get a WARN_ON.. */
578*4882a593Smuzhiyun platclk = NULL;
579*4882a593Smuzhiyun }
580*4882a593Smuzhiyun
581*4882a593Smuzhiyun clk_enable(platclk);
582*4882a593Smuzhiyun
583*4882a593Smuzhiyun mm_sel = sh7786_mm_sel();
584*4882a593Smuzhiyun
585*4882a593Smuzhiyun /*
586*4882a593Smuzhiyun * Depending on the MMSELR register value, the PCIe0 MEM 1
587*4882a593Smuzhiyun * area may not be available. See Table 13.11 of the SH7786
588*4882a593Smuzhiyun * datasheet.
589*4882a593Smuzhiyun */
590*4882a593Smuzhiyun if (mm_sel != 1 && mm_sel != 2 && mm_sel != 5 && mm_sel != 6)
591*4882a593Smuzhiyun sh7786_pci0_resources[2].flags |= IORESOURCE_DISABLED;
592*4882a593Smuzhiyun
593*4882a593Smuzhiyun printk(KERN_NOTICE "PCI: probing %d ports.\n", nr_ports);
594*4882a593Smuzhiyun
595*4882a593Smuzhiyun for (i = 0; i < nr_ports; i++) {
596*4882a593Smuzhiyun struct sh7786_pcie_port *port = sh7786_pcie_ports + i;
597*4882a593Smuzhiyun
598*4882a593Smuzhiyun port->index = i;
599*4882a593Smuzhiyun port->hose = sh7786_pci_channels + i;
600*4882a593Smuzhiyun port->hose->io_map_base = port->hose->resources[0].start;
601*4882a593Smuzhiyun
602*4882a593Smuzhiyun async_schedule(sh7786_pcie_hwops->port_init_hw, port);
603*4882a593Smuzhiyun }
604*4882a593Smuzhiyun
605*4882a593Smuzhiyun async_synchronize_full();
606*4882a593Smuzhiyun
607*4882a593Smuzhiyun return 0;
608*4882a593Smuzhiyun }
609*4882a593Smuzhiyun arch_initcall(sh7786_pcie_init);
610