1*4882a593Smuzhiyun /*
2*4882a593Smuzhiyun * This code was extracted from:
3*4882a593Smuzhiyun * git://github.com/gonzoua/u-boot-pi.git master
4*4882a593Smuzhiyun * and hence presumably (C) 2012 Oleksandr Tymoshenko
5*4882a593Smuzhiyun *
6*4882a593Smuzhiyun * Tweaks for U-Boot upstreaming
7*4882a593Smuzhiyun * (C) 2012 Stephen Warren
8*4882a593Smuzhiyun *
9*4882a593Smuzhiyun * Portions (e.g. read/write macros, concepts for back-to-back register write
10*4882a593Smuzhiyun * timing workarounds) obviously extracted from the Linux kernel at:
11*4882a593Smuzhiyun * https://github.com/raspberrypi/linux.git rpi-3.6.y
12*4882a593Smuzhiyun *
13*4882a593Smuzhiyun * The Linux kernel code has the following (c) and license, which is hence
14*4882a593Smuzhiyun * propagated to Oleksandr's tree and here:
15*4882a593Smuzhiyun *
16*4882a593Smuzhiyun * Support for SDHCI device on 2835
17*4882a593Smuzhiyun * Based on sdhci-bcm2708.c (c) 2010 Broadcom
18*4882a593Smuzhiyun *
19*4882a593Smuzhiyun * This program is free software; you can redistribute it and/or modify
20*4882a593Smuzhiyun * it under the terms of the GNU General Public License version 2 as
21*4882a593Smuzhiyun * published by the Free Software Foundation.
22*4882a593Smuzhiyun *
23*4882a593Smuzhiyun * This program is distributed in the hope that it will be useful,
24*4882a593Smuzhiyun * but WITHOUT ANY WARRANTY; without even the implied warranty of
25*4882a593Smuzhiyun * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
26*4882a593Smuzhiyun * GNU General Public License for more details.
27*4882a593Smuzhiyun *
28*4882a593Smuzhiyun * You should have received a copy of the GNU General Public License
29*4882a593Smuzhiyun * along with this program; if not, write to the Free Software
30*4882a593Smuzhiyun * Foundation, Inc., 675 Mass Ave, Cambridge, MA 02139, USA.
31*4882a593Smuzhiyun */
32*4882a593Smuzhiyun
33*4882a593Smuzhiyun /* Supports:
34*4882a593Smuzhiyun * SDHCI platform device - Arasan SD controller in BCM2708
35*4882a593Smuzhiyun *
36*4882a593Smuzhiyun * Inspired by sdhci-pci.c, by Pierre Ossman
37*4882a593Smuzhiyun */
38*4882a593Smuzhiyun
39*4882a593Smuzhiyun #include <common.h>
40*4882a593Smuzhiyun #include <dm.h>
41*4882a593Smuzhiyun #include <malloc.h>
42*4882a593Smuzhiyun #include <memalign.h>
43*4882a593Smuzhiyun #include <sdhci.h>
44*4882a593Smuzhiyun #include <asm/arch/msg.h>
45*4882a593Smuzhiyun #include <asm/arch/mbox.h>
46*4882a593Smuzhiyun #include <mach/sdhci.h>
47*4882a593Smuzhiyun #include <mach/timer.h>
48*4882a593Smuzhiyun
49*4882a593Smuzhiyun /* 400KHz is max freq for card ID etc. Use that as min */
50*4882a593Smuzhiyun #define MIN_FREQ 400000
51*4882a593Smuzhiyun #define SDHCI_BUFFER 0x20
52*4882a593Smuzhiyun
53*4882a593Smuzhiyun struct bcm2835_sdhci_host {
54*4882a593Smuzhiyun struct sdhci_host host;
55*4882a593Smuzhiyun uint twoticks_delay;
56*4882a593Smuzhiyun ulong last_write;
57*4882a593Smuzhiyun };
58*4882a593Smuzhiyun
to_bcm(struct sdhci_host * host)59*4882a593Smuzhiyun static inline struct bcm2835_sdhci_host *to_bcm(struct sdhci_host *host)
60*4882a593Smuzhiyun {
61*4882a593Smuzhiyun return (struct bcm2835_sdhci_host *)host;
62*4882a593Smuzhiyun }
63*4882a593Smuzhiyun
bcm2835_sdhci_raw_writel(struct sdhci_host * host,u32 val,int reg)64*4882a593Smuzhiyun static inline void bcm2835_sdhci_raw_writel(struct sdhci_host *host, u32 val,
65*4882a593Smuzhiyun int reg)
66*4882a593Smuzhiyun {
67*4882a593Smuzhiyun struct bcm2835_sdhci_host *bcm_host = to_bcm(host);
68*4882a593Smuzhiyun
69*4882a593Smuzhiyun /*
70*4882a593Smuzhiyun * The Arasan has a bugette whereby it may lose the content of
71*4882a593Smuzhiyun * successive writes to registers that are within two SD-card clock
72*4882a593Smuzhiyun * cycles of each other (a clock domain crossing problem).
73*4882a593Smuzhiyun * It seems, however, that the data register does not have this problem.
74*4882a593Smuzhiyun * (Which is just as well - otherwise we'd have to nobble the DMA engine
75*4882a593Smuzhiyun * too)
76*4882a593Smuzhiyun */
77*4882a593Smuzhiyun if (reg != SDHCI_BUFFER) {
78*4882a593Smuzhiyun while (timer_get_us() - bcm_host->last_write < bcm_host->twoticks_delay)
79*4882a593Smuzhiyun ;
80*4882a593Smuzhiyun }
81*4882a593Smuzhiyun
82*4882a593Smuzhiyun writel(val, host->ioaddr + reg);
83*4882a593Smuzhiyun bcm_host->last_write = timer_get_us();
84*4882a593Smuzhiyun }
85*4882a593Smuzhiyun
bcm2835_sdhci_raw_readl(struct sdhci_host * host,int reg)86*4882a593Smuzhiyun static inline u32 bcm2835_sdhci_raw_readl(struct sdhci_host *host, int reg)
87*4882a593Smuzhiyun {
88*4882a593Smuzhiyun return readl(host->ioaddr + reg);
89*4882a593Smuzhiyun }
90*4882a593Smuzhiyun
bcm2835_sdhci_writel(struct sdhci_host * host,u32 val,int reg)91*4882a593Smuzhiyun static void bcm2835_sdhci_writel(struct sdhci_host *host, u32 val, int reg)
92*4882a593Smuzhiyun {
93*4882a593Smuzhiyun bcm2835_sdhci_raw_writel(host, val, reg);
94*4882a593Smuzhiyun }
95*4882a593Smuzhiyun
bcm2835_sdhci_writew(struct sdhci_host * host,u16 val,int reg)96*4882a593Smuzhiyun static void bcm2835_sdhci_writew(struct sdhci_host *host, u16 val, int reg)
97*4882a593Smuzhiyun {
98*4882a593Smuzhiyun static u32 shadow;
99*4882a593Smuzhiyun u32 oldval = (reg == SDHCI_COMMAND) ? shadow :
100*4882a593Smuzhiyun bcm2835_sdhci_raw_readl(host, reg & ~3);
101*4882a593Smuzhiyun u32 word_num = (reg >> 1) & 1;
102*4882a593Smuzhiyun u32 word_shift = word_num * 16;
103*4882a593Smuzhiyun u32 mask = 0xffff << word_shift;
104*4882a593Smuzhiyun u32 newval = (oldval & ~mask) | (val << word_shift);
105*4882a593Smuzhiyun
106*4882a593Smuzhiyun if (reg == SDHCI_TRANSFER_MODE)
107*4882a593Smuzhiyun shadow = newval;
108*4882a593Smuzhiyun else
109*4882a593Smuzhiyun bcm2835_sdhci_raw_writel(host, newval, reg & ~3);
110*4882a593Smuzhiyun }
111*4882a593Smuzhiyun
bcm2835_sdhci_writeb(struct sdhci_host * host,u8 val,int reg)112*4882a593Smuzhiyun static void bcm2835_sdhci_writeb(struct sdhci_host *host, u8 val, int reg)
113*4882a593Smuzhiyun {
114*4882a593Smuzhiyun u32 oldval = bcm2835_sdhci_raw_readl(host, reg & ~3);
115*4882a593Smuzhiyun u32 byte_num = reg & 3;
116*4882a593Smuzhiyun u32 byte_shift = byte_num * 8;
117*4882a593Smuzhiyun u32 mask = 0xff << byte_shift;
118*4882a593Smuzhiyun u32 newval = (oldval & ~mask) | (val << byte_shift);
119*4882a593Smuzhiyun
120*4882a593Smuzhiyun bcm2835_sdhci_raw_writel(host, newval, reg & ~3);
121*4882a593Smuzhiyun }
122*4882a593Smuzhiyun
bcm2835_sdhci_readl(struct sdhci_host * host,int reg)123*4882a593Smuzhiyun static u32 bcm2835_sdhci_readl(struct sdhci_host *host, int reg)
124*4882a593Smuzhiyun {
125*4882a593Smuzhiyun u32 val = bcm2835_sdhci_raw_readl(host, reg);
126*4882a593Smuzhiyun
127*4882a593Smuzhiyun return val;
128*4882a593Smuzhiyun }
129*4882a593Smuzhiyun
bcm2835_sdhci_readw(struct sdhci_host * host,int reg)130*4882a593Smuzhiyun static u16 bcm2835_sdhci_readw(struct sdhci_host *host, int reg)
131*4882a593Smuzhiyun {
132*4882a593Smuzhiyun u32 val = bcm2835_sdhci_raw_readl(host, (reg & ~3));
133*4882a593Smuzhiyun u32 word_num = (reg >> 1) & 1;
134*4882a593Smuzhiyun u32 word_shift = word_num * 16;
135*4882a593Smuzhiyun u32 word = (val >> word_shift) & 0xffff;
136*4882a593Smuzhiyun
137*4882a593Smuzhiyun return word;
138*4882a593Smuzhiyun }
139*4882a593Smuzhiyun
bcm2835_sdhci_readb(struct sdhci_host * host,int reg)140*4882a593Smuzhiyun static u8 bcm2835_sdhci_readb(struct sdhci_host *host, int reg)
141*4882a593Smuzhiyun {
142*4882a593Smuzhiyun u32 val = bcm2835_sdhci_raw_readl(host, (reg & ~3));
143*4882a593Smuzhiyun u32 byte_num = reg & 3;
144*4882a593Smuzhiyun u32 byte_shift = byte_num * 8;
145*4882a593Smuzhiyun u32 byte = (val >> byte_shift) & 0xff;
146*4882a593Smuzhiyun
147*4882a593Smuzhiyun return byte;
148*4882a593Smuzhiyun }
149*4882a593Smuzhiyun
150*4882a593Smuzhiyun static const struct sdhci_ops bcm2835_ops = {
151*4882a593Smuzhiyun .write_l = bcm2835_sdhci_writel,
152*4882a593Smuzhiyun .write_w = bcm2835_sdhci_writew,
153*4882a593Smuzhiyun .write_b = bcm2835_sdhci_writeb,
154*4882a593Smuzhiyun .read_l = bcm2835_sdhci_readl,
155*4882a593Smuzhiyun .read_w = bcm2835_sdhci_readw,
156*4882a593Smuzhiyun .read_b = bcm2835_sdhci_readb,
157*4882a593Smuzhiyun };
158*4882a593Smuzhiyun
bcm2835_sdhci_bind(struct udevice * dev)159*4882a593Smuzhiyun static int bcm2835_sdhci_bind(struct udevice *dev)
160*4882a593Smuzhiyun {
161*4882a593Smuzhiyun struct bcm2835_sdhci_plat *plat = dev_get_platdata(dev);
162*4882a593Smuzhiyun
163*4882a593Smuzhiyun return sdhci_bind(dev, &plat->mmc, &plat->cfg);
164*4882a593Smuzhiyun }
165*4882a593Smuzhiyun
bcm2835_sdhci_probe(struct udevice * dev)166*4882a593Smuzhiyun static int bcm2835_sdhci_probe(struct udevice *dev)
167*4882a593Smuzhiyun {
168*4882a593Smuzhiyun struct mmc_uclass_priv *upriv = dev_get_uclass_priv(dev);
169*4882a593Smuzhiyun struct bcm2835_sdhci_plat *plat = dev_get_platdata(dev);
170*4882a593Smuzhiyun struct bcm2835_sdhci_host *priv = dev_get_priv(dev);
171*4882a593Smuzhiyun struct sdhci_host *host = &priv->host;
172*4882a593Smuzhiyun fdt_addr_t base;
173*4882a593Smuzhiyun int emmc_freq;
174*4882a593Smuzhiyun int ret;
175*4882a593Smuzhiyun
176*4882a593Smuzhiyun base = devfdt_get_addr(dev);
177*4882a593Smuzhiyun if (base == FDT_ADDR_T_NONE)
178*4882a593Smuzhiyun return -EINVAL;
179*4882a593Smuzhiyun
180*4882a593Smuzhiyun ret = bcm2835_get_mmc_clock();
181*4882a593Smuzhiyun if (ret < 0) {
182*4882a593Smuzhiyun debug("%s: Failed to set MMC clock (err=%d)\n", __func__, ret);
183*4882a593Smuzhiyun return ret;
184*4882a593Smuzhiyun }
185*4882a593Smuzhiyun emmc_freq = ret;
186*4882a593Smuzhiyun
187*4882a593Smuzhiyun /*
188*4882a593Smuzhiyun * See the comments in bcm2835_sdhci_raw_writel().
189*4882a593Smuzhiyun *
190*4882a593Smuzhiyun * This should probably be dynamically calculated based on the actual
191*4882a593Smuzhiyun * frequency. However, this is the longest we'll have to wait, and
192*4882a593Smuzhiyun * doesn't seem to slow access down too much, so the added complexity
193*4882a593Smuzhiyun * doesn't seem worth it for now.
194*4882a593Smuzhiyun *
195*4882a593Smuzhiyun * 1/MIN_FREQ is (max) time per tick of eMMC clock.
196*4882a593Smuzhiyun * 2/MIN_FREQ is time for two ticks.
197*4882a593Smuzhiyun * Multiply by 1000000 to get uS per two ticks.
198*4882a593Smuzhiyun * +1 for hack rounding.
199*4882a593Smuzhiyun */
200*4882a593Smuzhiyun priv->twoticks_delay = ((2 * 1000000) / MIN_FREQ) + 1;
201*4882a593Smuzhiyun priv->last_write = 0;
202*4882a593Smuzhiyun
203*4882a593Smuzhiyun host->name = dev->name;
204*4882a593Smuzhiyun host->ioaddr = (void *)base;
205*4882a593Smuzhiyun host->quirks = SDHCI_QUIRK_BROKEN_VOLTAGE | SDHCI_QUIRK_BROKEN_R1B |
206*4882a593Smuzhiyun SDHCI_QUIRK_WAIT_SEND_CMD | SDHCI_QUIRK_NO_HISPD_BIT;
207*4882a593Smuzhiyun host->max_clk = emmc_freq;
208*4882a593Smuzhiyun host->voltages = MMC_VDD_32_33 | MMC_VDD_33_34 | MMC_VDD_165_195;
209*4882a593Smuzhiyun host->ops = &bcm2835_ops;
210*4882a593Smuzhiyun
211*4882a593Smuzhiyun ret = sdhci_setup_cfg(&plat->cfg, host, emmc_freq, MIN_FREQ);
212*4882a593Smuzhiyun if (ret) {
213*4882a593Smuzhiyun debug("%s: Failed to setup SDHCI (err=%d)\n", __func__, ret);
214*4882a593Smuzhiyun return ret;
215*4882a593Smuzhiyun }
216*4882a593Smuzhiyun
217*4882a593Smuzhiyun upriv->mmc = &plat->mmc;
218*4882a593Smuzhiyun host->mmc = &plat->mmc;
219*4882a593Smuzhiyun host->mmc->priv = host;
220*4882a593Smuzhiyun
221*4882a593Smuzhiyun return sdhci_probe(dev);
222*4882a593Smuzhiyun }
223*4882a593Smuzhiyun
224*4882a593Smuzhiyun static const struct udevice_id bcm2835_sdhci_match[] = {
225*4882a593Smuzhiyun { .compatible = "brcm,bcm2835-sdhci" },
226*4882a593Smuzhiyun { /* sentinel */ }
227*4882a593Smuzhiyun };
228*4882a593Smuzhiyun
229*4882a593Smuzhiyun U_BOOT_DRIVER(sdhci_cdns) = {
230*4882a593Smuzhiyun .name = "sdhci-bcm2835",
231*4882a593Smuzhiyun .id = UCLASS_MMC,
232*4882a593Smuzhiyun .of_match = bcm2835_sdhci_match,
233*4882a593Smuzhiyun .bind = bcm2835_sdhci_bind,
234*4882a593Smuzhiyun .probe = bcm2835_sdhci_probe,
235*4882a593Smuzhiyun .priv_auto_alloc_size = sizeof(struct bcm2835_sdhci_host),
236*4882a593Smuzhiyun .platdata_auto_alloc_size = sizeof(struct bcm2835_sdhci_plat),
237*4882a593Smuzhiyun .ops = &sdhci_ops,
238*4882a593Smuzhiyun };
239