1*4882a593Smuzhiyun /*
2*4882a593Smuzhiyun * For documentation on the i460 AGP interface, see Chapter 7 (AGP Subsystem) of
3*4882a593Smuzhiyun * the "Intel 460GTX Chipset Software Developer's Manual":
4*4882a593Smuzhiyun * http://www.intel.com/design/archives/itanium/downloads/248704.htm
5*4882a593Smuzhiyun */
6*4882a593Smuzhiyun /*
7*4882a593Smuzhiyun * 460GX support by Chris Ahna <christopher.j.ahna@intel.com>
8*4882a593Smuzhiyun * Clean up & simplification by David Mosberger-Tang <davidm@hpl.hp.com>
9*4882a593Smuzhiyun */
10*4882a593Smuzhiyun #include <linux/module.h>
11*4882a593Smuzhiyun #include <linux/pci.h>
12*4882a593Smuzhiyun #include <linux/init.h>
13*4882a593Smuzhiyun #include <linux/string.h>
14*4882a593Smuzhiyun #include <linux/slab.h>
15*4882a593Smuzhiyun #include <linux/agp_backend.h>
16*4882a593Smuzhiyun #include <linux/log2.h>
17*4882a593Smuzhiyun
18*4882a593Smuzhiyun #include "agp.h"
19*4882a593Smuzhiyun
20*4882a593Smuzhiyun #define INTEL_I460_BAPBASE 0x98
21*4882a593Smuzhiyun #define INTEL_I460_GXBCTL 0xa0
22*4882a593Smuzhiyun #define INTEL_I460_AGPSIZ 0xa2
23*4882a593Smuzhiyun #define INTEL_I460_ATTBASE 0xfe200000
24*4882a593Smuzhiyun #define INTEL_I460_GATT_VALID (1UL << 24)
25*4882a593Smuzhiyun #define INTEL_I460_GATT_COHERENT (1UL << 25)
26*4882a593Smuzhiyun
27*4882a593Smuzhiyun /*
28*4882a593Smuzhiyun * The i460 can operate with large (4MB) pages, but there is no sane way to support this
29*4882a593Smuzhiyun * within the current kernel/DRM environment, so we disable the relevant code for now.
30*4882a593Smuzhiyun * See also comments in ia64_alloc_page()...
31*4882a593Smuzhiyun */
32*4882a593Smuzhiyun #define I460_LARGE_IO_PAGES 0
33*4882a593Smuzhiyun
34*4882a593Smuzhiyun #if I460_LARGE_IO_PAGES
35*4882a593Smuzhiyun # define I460_IO_PAGE_SHIFT i460.io_page_shift
36*4882a593Smuzhiyun #else
37*4882a593Smuzhiyun # define I460_IO_PAGE_SHIFT 12
38*4882a593Smuzhiyun #endif
39*4882a593Smuzhiyun
40*4882a593Smuzhiyun #define I460_IOPAGES_PER_KPAGE (PAGE_SIZE >> I460_IO_PAGE_SHIFT)
41*4882a593Smuzhiyun #define I460_KPAGES_PER_IOPAGE (1 << (I460_IO_PAGE_SHIFT - PAGE_SHIFT))
42*4882a593Smuzhiyun #define I460_SRAM_IO_DISABLE (1 << 4)
43*4882a593Smuzhiyun #define I460_BAPBASE_ENABLE (1 << 3)
44*4882a593Smuzhiyun #define I460_AGPSIZ_MASK 0x7
45*4882a593Smuzhiyun #define I460_4M_PS (1 << 1)
46*4882a593Smuzhiyun
47*4882a593Smuzhiyun /* Control bits for Out-Of-GART coherency and Burst Write Combining */
48*4882a593Smuzhiyun #define I460_GXBCTL_OOG (1UL << 0)
49*4882a593Smuzhiyun #define I460_GXBCTL_BWC (1UL << 2)
50*4882a593Smuzhiyun
51*4882a593Smuzhiyun /*
52*4882a593Smuzhiyun * gatt_table entries are 32-bits wide on the i460; the generic code ought to declare the
53*4882a593Smuzhiyun * gatt_table and gatt_table_real pointers a "void *"...
54*4882a593Smuzhiyun */
55*4882a593Smuzhiyun #define RD_GATT(index) readl((u32 *) i460.gatt + (index))
56*4882a593Smuzhiyun #define WR_GATT(index, val) writel((val), (u32 *) i460.gatt + (index))
57*4882a593Smuzhiyun /*
58*4882a593Smuzhiyun * The 460 spec says we have to read the last location written to make sure that all
59*4882a593Smuzhiyun * writes have taken effect
60*4882a593Smuzhiyun */
61*4882a593Smuzhiyun #define WR_FLUSH_GATT(index) RD_GATT(index)
62*4882a593Smuzhiyun
63*4882a593Smuzhiyun static unsigned long i460_mask_memory (struct agp_bridge_data *bridge,
64*4882a593Smuzhiyun dma_addr_t addr, int type);
65*4882a593Smuzhiyun
66*4882a593Smuzhiyun static struct {
67*4882a593Smuzhiyun void *gatt; /* ioremap'd GATT area */
68*4882a593Smuzhiyun
69*4882a593Smuzhiyun /* i460 supports multiple GART page sizes, so GART pageshift is dynamic: */
70*4882a593Smuzhiyun u8 io_page_shift;
71*4882a593Smuzhiyun
72*4882a593Smuzhiyun /* BIOS configures chipset to one of 2 possible apbase values: */
73*4882a593Smuzhiyun u8 dynamic_apbase;
74*4882a593Smuzhiyun
75*4882a593Smuzhiyun /* structure for tracking partial use of 4MB GART pages: */
76*4882a593Smuzhiyun struct lp_desc {
77*4882a593Smuzhiyun unsigned long *alloced_map; /* bitmap of kernel-pages in use */
78*4882a593Smuzhiyun int refcount; /* number of kernel pages using the large page */
79*4882a593Smuzhiyun u64 paddr; /* physical address of large page */
80*4882a593Smuzhiyun struct page *page; /* page pointer */
81*4882a593Smuzhiyun } *lp_desc;
82*4882a593Smuzhiyun } i460;
83*4882a593Smuzhiyun
84*4882a593Smuzhiyun static const struct aper_size_info_8 i460_sizes[3] =
85*4882a593Smuzhiyun {
86*4882a593Smuzhiyun /*
87*4882a593Smuzhiyun * The 32GB aperture is only available with a 4M GART page size. Due to the
88*4882a593Smuzhiyun * dynamic GART page size, we can't figure out page_order or num_entries until
89*4882a593Smuzhiyun * runtime.
90*4882a593Smuzhiyun */
91*4882a593Smuzhiyun {32768, 0, 0, 4},
92*4882a593Smuzhiyun {1024, 0, 0, 2},
93*4882a593Smuzhiyun {256, 0, 0, 1}
94*4882a593Smuzhiyun };
95*4882a593Smuzhiyun
96*4882a593Smuzhiyun static struct gatt_mask i460_masks[] =
97*4882a593Smuzhiyun {
98*4882a593Smuzhiyun {
99*4882a593Smuzhiyun .mask = INTEL_I460_GATT_VALID | INTEL_I460_GATT_COHERENT,
100*4882a593Smuzhiyun .type = 0
101*4882a593Smuzhiyun }
102*4882a593Smuzhiyun };
103*4882a593Smuzhiyun
i460_fetch_size(void)104*4882a593Smuzhiyun static int i460_fetch_size (void)
105*4882a593Smuzhiyun {
106*4882a593Smuzhiyun int i;
107*4882a593Smuzhiyun u8 temp;
108*4882a593Smuzhiyun struct aper_size_info_8 *values;
109*4882a593Smuzhiyun
110*4882a593Smuzhiyun /* Determine the GART page size */
111*4882a593Smuzhiyun pci_read_config_byte(agp_bridge->dev, INTEL_I460_GXBCTL, &temp);
112*4882a593Smuzhiyun i460.io_page_shift = (temp & I460_4M_PS) ? 22 : 12;
113*4882a593Smuzhiyun pr_debug("i460_fetch_size: io_page_shift=%d\n", i460.io_page_shift);
114*4882a593Smuzhiyun
115*4882a593Smuzhiyun if (i460.io_page_shift != I460_IO_PAGE_SHIFT) {
116*4882a593Smuzhiyun printk(KERN_ERR PFX
117*4882a593Smuzhiyun "I/O (GART) page-size %luKB doesn't match expected "
118*4882a593Smuzhiyun "size %luKB\n",
119*4882a593Smuzhiyun 1UL << (i460.io_page_shift - 10),
120*4882a593Smuzhiyun 1UL << (I460_IO_PAGE_SHIFT));
121*4882a593Smuzhiyun return 0;
122*4882a593Smuzhiyun }
123*4882a593Smuzhiyun
124*4882a593Smuzhiyun values = A_SIZE_8(agp_bridge->driver->aperture_sizes);
125*4882a593Smuzhiyun
126*4882a593Smuzhiyun pci_read_config_byte(agp_bridge->dev, INTEL_I460_AGPSIZ, &temp);
127*4882a593Smuzhiyun
128*4882a593Smuzhiyun /* Exit now if the IO drivers for the GART SRAMS are turned off */
129*4882a593Smuzhiyun if (temp & I460_SRAM_IO_DISABLE) {
130*4882a593Smuzhiyun printk(KERN_ERR PFX "GART SRAMS disabled on 460GX chipset\n");
131*4882a593Smuzhiyun printk(KERN_ERR PFX "AGPGART operation not possible\n");
132*4882a593Smuzhiyun return 0;
133*4882a593Smuzhiyun }
134*4882a593Smuzhiyun
135*4882a593Smuzhiyun /* Make sure we don't try to create an 2 ^ 23 entry GATT */
136*4882a593Smuzhiyun if ((i460.io_page_shift == 0) && ((temp & I460_AGPSIZ_MASK) == 4)) {
137*4882a593Smuzhiyun printk(KERN_ERR PFX "We can't have a 32GB aperture with 4KB GART pages\n");
138*4882a593Smuzhiyun return 0;
139*4882a593Smuzhiyun }
140*4882a593Smuzhiyun
141*4882a593Smuzhiyun /* Determine the proper APBASE register */
142*4882a593Smuzhiyun if (temp & I460_BAPBASE_ENABLE)
143*4882a593Smuzhiyun i460.dynamic_apbase = INTEL_I460_BAPBASE;
144*4882a593Smuzhiyun else
145*4882a593Smuzhiyun i460.dynamic_apbase = AGP_APBASE;
146*4882a593Smuzhiyun
147*4882a593Smuzhiyun for (i = 0; i < agp_bridge->driver->num_aperture_sizes; i++) {
148*4882a593Smuzhiyun /*
149*4882a593Smuzhiyun * Dynamically calculate the proper num_entries and page_order values for
150*4882a593Smuzhiyun * the define aperture sizes. Take care not to shift off the end of
151*4882a593Smuzhiyun * values[i].size.
152*4882a593Smuzhiyun */
153*4882a593Smuzhiyun values[i].num_entries = (values[i].size << 8) >> (I460_IO_PAGE_SHIFT - 12);
154*4882a593Smuzhiyun values[i].page_order = ilog2((sizeof(u32)*values[i].num_entries) >> PAGE_SHIFT);
155*4882a593Smuzhiyun }
156*4882a593Smuzhiyun
157*4882a593Smuzhiyun for (i = 0; i < agp_bridge->driver->num_aperture_sizes; i++) {
158*4882a593Smuzhiyun /* Neglect control bits when matching up size_value */
159*4882a593Smuzhiyun if ((temp & I460_AGPSIZ_MASK) == values[i].size_value) {
160*4882a593Smuzhiyun agp_bridge->previous_size = agp_bridge->current_size = (void *) (values + i);
161*4882a593Smuzhiyun agp_bridge->aperture_size_idx = i;
162*4882a593Smuzhiyun return values[i].size;
163*4882a593Smuzhiyun }
164*4882a593Smuzhiyun }
165*4882a593Smuzhiyun
166*4882a593Smuzhiyun return 0;
167*4882a593Smuzhiyun }
168*4882a593Smuzhiyun
169*4882a593Smuzhiyun /* There isn't anything to do here since 460 has no GART TLB. */
i460_tlb_flush(struct agp_memory * mem)170*4882a593Smuzhiyun static void i460_tlb_flush (struct agp_memory *mem)
171*4882a593Smuzhiyun {
172*4882a593Smuzhiyun return;
173*4882a593Smuzhiyun }
174*4882a593Smuzhiyun
175*4882a593Smuzhiyun /*
176*4882a593Smuzhiyun * This utility function is needed to prevent corruption of the control bits
177*4882a593Smuzhiyun * which are stored along with the aperture size in 460's AGPSIZ register
178*4882a593Smuzhiyun */
i460_write_agpsiz(u8 size_value)179*4882a593Smuzhiyun static void i460_write_agpsiz (u8 size_value)
180*4882a593Smuzhiyun {
181*4882a593Smuzhiyun u8 temp;
182*4882a593Smuzhiyun
183*4882a593Smuzhiyun pci_read_config_byte(agp_bridge->dev, INTEL_I460_AGPSIZ, &temp);
184*4882a593Smuzhiyun pci_write_config_byte(agp_bridge->dev, INTEL_I460_AGPSIZ,
185*4882a593Smuzhiyun ((temp & ~I460_AGPSIZ_MASK) | size_value));
186*4882a593Smuzhiyun }
187*4882a593Smuzhiyun
i460_cleanup(void)188*4882a593Smuzhiyun static void i460_cleanup (void)
189*4882a593Smuzhiyun {
190*4882a593Smuzhiyun struct aper_size_info_8 *previous_size;
191*4882a593Smuzhiyun
192*4882a593Smuzhiyun previous_size = A_SIZE_8(agp_bridge->previous_size);
193*4882a593Smuzhiyun i460_write_agpsiz(previous_size->size_value);
194*4882a593Smuzhiyun
195*4882a593Smuzhiyun if (I460_IO_PAGE_SHIFT > PAGE_SHIFT)
196*4882a593Smuzhiyun kfree(i460.lp_desc);
197*4882a593Smuzhiyun }
198*4882a593Smuzhiyun
i460_configure(void)199*4882a593Smuzhiyun static int i460_configure (void)
200*4882a593Smuzhiyun {
201*4882a593Smuzhiyun union {
202*4882a593Smuzhiyun u32 small[2];
203*4882a593Smuzhiyun u64 large;
204*4882a593Smuzhiyun } temp;
205*4882a593Smuzhiyun size_t size;
206*4882a593Smuzhiyun u8 scratch;
207*4882a593Smuzhiyun struct aper_size_info_8 *current_size;
208*4882a593Smuzhiyun
209*4882a593Smuzhiyun temp.large = 0;
210*4882a593Smuzhiyun
211*4882a593Smuzhiyun current_size = A_SIZE_8(agp_bridge->current_size);
212*4882a593Smuzhiyun i460_write_agpsiz(current_size->size_value);
213*4882a593Smuzhiyun
214*4882a593Smuzhiyun /*
215*4882a593Smuzhiyun * Do the necessary rigmarole to read all eight bytes of APBASE.
216*4882a593Smuzhiyun * This has to be done since the AGP aperture can be above 4GB on
217*4882a593Smuzhiyun * 460 based systems.
218*4882a593Smuzhiyun */
219*4882a593Smuzhiyun pci_read_config_dword(agp_bridge->dev, i460.dynamic_apbase, &(temp.small[0]));
220*4882a593Smuzhiyun pci_read_config_dword(agp_bridge->dev, i460.dynamic_apbase + 4, &(temp.small[1]));
221*4882a593Smuzhiyun
222*4882a593Smuzhiyun /* Clear BAR control bits */
223*4882a593Smuzhiyun agp_bridge->gart_bus_addr = temp.large & ~((1UL << 3) - 1);
224*4882a593Smuzhiyun
225*4882a593Smuzhiyun pci_read_config_byte(agp_bridge->dev, INTEL_I460_GXBCTL, &scratch);
226*4882a593Smuzhiyun pci_write_config_byte(agp_bridge->dev, INTEL_I460_GXBCTL,
227*4882a593Smuzhiyun (scratch & 0x02) | I460_GXBCTL_OOG | I460_GXBCTL_BWC);
228*4882a593Smuzhiyun
229*4882a593Smuzhiyun /*
230*4882a593Smuzhiyun * Initialize partial allocation trackers if a GART page is bigger than a kernel
231*4882a593Smuzhiyun * page.
232*4882a593Smuzhiyun */
233*4882a593Smuzhiyun if (I460_IO_PAGE_SHIFT > PAGE_SHIFT) {
234*4882a593Smuzhiyun size = current_size->num_entries * sizeof(i460.lp_desc[0]);
235*4882a593Smuzhiyun i460.lp_desc = kzalloc(size, GFP_KERNEL);
236*4882a593Smuzhiyun if (!i460.lp_desc)
237*4882a593Smuzhiyun return -ENOMEM;
238*4882a593Smuzhiyun }
239*4882a593Smuzhiyun return 0;
240*4882a593Smuzhiyun }
241*4882a593Smuzhiyun
i460_create_gatt_table(struct agp_bridge_data * bridge)242*4882a593Smuzhiyun static int i460_create_gatt_table (struct agp_bridge_data *bridge)
243*4882a593Smuzhiyun {
244*4882a593Smuzhiyun int page_order, num_entries, i;
245*4882a593Smuzhiyun void *temp;
246*4882a593Smuzhiyun
247*4882a593Smuzhiyun /*
248*4882a593Smuzhiyun * Load up the fixed address of the GART SRAMS which hold our GATT table.
249*4882a593Smuzhiyun */
250*4882a593Smuzhiyun temp = agp_bridge->current_size;
251*4882a593Smuzhiyun page_order = A_SIZE_8(temp)->page_order;
252*4882a593Smuzhiyun num_entries = A_SIZE_8(temp)->num_entries;
253*4882a593Smuzhiyun
254*4882a593Smuzhiyun i460.gatt = ioremap(INTEL_I460_ATTBASE, PAGE_SIZE << page_order);
255*4882a593Smuzhiyun if (!i460.gatt) {
256*4882a593Smuzhiyun printk(KERN_ERR PFX "ioremap failed\n");
257*4882a593Smuzhiyun return -ENOMEM;
258*4882a593Smuzhiyun }
259*4882a593Smuzhiyun
260*4882a593Smuzhiyun /* These are no good, the should be removed from the agp_bridge strucure... */
261*4882a593Smuzhiyun agp_bridge->gatt_table_real = NULL;
262*4882a593Smuzhiyun agp_bridge->gatt_table = NULL;
263*4882a593Smuzhiyun agp_bridge->gatt_bus_addr = 0;
264*4882a593Smuzhiyun
265*4882a593Smuzhiyun for (i = 0; i < num_entries; ++i)
266*4882a593Smuzhiyun WR_GATT(i, 0);
267*4882a593Smuzhiyun WR_FLUSH_GATT(i - 1);
268*4882a593Smuzhiyun return 0;
269*4882a593Smuzhiyun }
270*4882a593Smuzhiyun
i460_free_gatt_table(struct agp_bridge_data * bridge)271*4882a593Smuzhiyun static int i460_free_gatt_table (struct agp_bridge_data *bridge)
272*4882a593Smuzhiyun {
273*4882a593Smuzhiyun int num_entries, i;
274*4882a593Smuzhiyun void *temp;
275*4882a593Smuzhiyun
276*4882a593Smuzhiyun temp = agp_bridge->current_size;
277*4882a593Smuzhiyun
278*4882a593Smuzhiyun num_entries = A_SIZE_8(temp)->num_entries;
279*4882a593Smuzhiyun
280*4882a593Smuzhiyun for (i = 0; i < num_entries; ++i)
281*4882a593Smuzhiyun WR_GATT(i, 0);
282*4882a593Smuzhiyun WR_FLUSH_GATT(num_entries - 1);
283*4882a593Smuzhiyun
284*4882a593Smuzhiyun iounmap(i460.gatt);
285*4882a593Smuzhiyun return 0;
286*4882a593Smuzhiyun }
287*4882a593Smuzhiyun
288*4882a593Smuzhiyun /*
289*4882a593Smuzhiyun * The following functions are called when the I/O (GART) page size is smaller than
290*4882a593Smuzhiyun * PAGE_SIZE.
291*4882a593Smuzhiyun */
292*4882a593Smuzhiyun
i460_insert_memory_small_io_page(struct agp_memory * mem,off_t pg_start,int type)293*4882a593Smuzhiyun static int i460_insert_memory_small_io_page (struct agp_memory *mem,
294*4882a593Smuzhiyun off_t pg_start, int type)
295*4882a593Smuzhiyun {
296*4882a593Smuzhiyun unsigned long paddr, io_pg_start, io_page_size;
297*4882a593Smuzhiyun int i, j, k, num_entries;
298*4882a593Smuzhiyun void *temp;
299*4882a593Smuzhiyun
300*4882a593Smuzhiyun pr_debug("i460_insert_memory_small_io_page(mem=%p, pg_start=%ld, type=%d, paddr0=0x%lx)\n",
301*4882a593Smuzhiyun mem, pg_start, type, page_to_phys(mem->pages[0]));
302*4882a593Smuzhiyun
303*4882a593Smuzhiyun if (type >= AGP_USER_TYPES || mem->type >= AGP_USER_TYPES)
304*4882a593Smuzhiyun return -EINVAL;
305*4882a593Smuzhiyun
306*4882a593Smuzhiyun io_pg_start = I460_IOPAGES_PER_KPAGE * pg_start;
307*4882a593Smuzhiyun
308*4882a593Smuzhiyun temp = agp_bridge->current_size;
309*4882a593Smuzhiyun num_entries = A_SIZE_8(temp)->num_entries;
310*4882a593Smuzhiyun
311*4882a593Smuzhiyun if ((io_pg_start + I460_IOPAGES_PER_KPAGE * mem->page_count) > num_entries) {
312*4882a593Smuzhiyun printk(KERN_ERR PFX "Looks like we're out of AGP memory\n");
313*4882a593Smuzhiyun return -EINVAL;
314*4882a593Smuzhiyun }
315*4882a593Smuzhiyun
316*4882a593Smuzhiyun j = io_pg_start;
317*4882a593Smuzhiyun while (j < (io_pg_start + I460_IOPAGES_PER_KPAGE * mem->page_count)) {
318*4882a593Smuzhiyun if (!PGE_EMPTY(agp_bridge, RD_GATT(j))) {
319*4882a593Smuzhiyun pr_debug("i460_insert_memory_small_io_page: GATT[%d]=0x%x is busy\n",
320*4882a593Smuzhiyun j, RD_GATT(j));
321*4882a593Smuzhiyun return -EBUSY;
322*4882a593Smuzhiyun }
323*4882a593Smuzhiyun j++;
324*4882a593Smuzhiyun }
325*4882a593Smuzhiyun
326*4882a593Smuzhiyun io_page_size = 1UL << I460_IO_PAGE_SHIFT;
327*4882a593Smuzhiyun for (i = 0, j = io_pg_start; i < mem->page_count; i++) {
328*4882a593Smuzhiyun paddr = page_to_phys(mem->pages[i]);
329*4882a593Smuzhiyun for (k = 0; k < I460_IOPAGES_PER_KPAGE; k++, j++, paddr += io_page_size)
330*4882a593Smuzhiyun WR_GATT(j, i460_mask_memory(agp_bridge, paddr, mem->type));
331*4882a593Smuzhiyun }
332*4882a593Smuzhiyun WR_FLUSH_GATT(j - 1);
333*4882a593Smuzhiyun return 0;
334*4882a593Smuzhiyun }
335*4882a593Smuzhiyun
i460_remove_memory_small_io_page(struct agp_memory * mem,off_t pg_start,int type)336*4882a593Smuzhiyun static int i460_remove_memory_small_io_page(struct agp_memory *mem,
337*4882a593Smuzhiyun off_t pg_start, int type)
338*4882a593Smuzhiyun {
339*4882a593Smuzhiyun int i;
340*4882a593Smuzhiyun
341*4882a593Smuzhiyun pr_debug("i460_remove_memory_small_io_page(mem=%p, pg_start=%ld, type=%d)\n",
342*4882a593Smuzhiyun mem, pg_start, type);
343*4882a593Smuzhiyun
344*4882a593Smuzhiyun pg_start = I460_IOPAGES_PER_KPAGE * pg_start;
345*4882a593Smuzhiyun
346*4882a593Smuzhiyun for (i = pg_start; i < (pg_start + I460_IOPAGES_PER_KPAGE * mem->page_count); i++)
347*4882a593Smuzhiyun WR_GATT(i, 0);
348*4882a593Smuzhiyun WR_FLUSH_GATT(i - 1);
349*4882a593Smuzhiyun return 0;
350*4882a593Smuzhiyun }
351*4882a593Smuzhiyun
352*4882a593Smuzhiyun #if I460_LARGE_IO_PAGES
353*4882a593Smuzhiyun
354*4882a593Smuzhiyun /*
355*4882a593Smuzhiyun * These functions are called when the I/O (GART) page size exceeds PAGE_SIZE.
356*4882a593Smuzhiyun *
357*4882a593Smuzhiyun * This situation is interesting since AGP memory allocations that are smaller than a
358*4882a593Smuzhiyun * single GART page are possible. The i460.lp_desc array tracks partial allocation of the
359*4882a593Smuzhiyun * large GART pages to work around this issue.
360*4882a593Smuzhiyun *
361*4882a593Smuzhiyun * i460.lp_desc[pg_num].refcount tracks the number of kernel pages in use within GART page
362*4882a593Smuzhiyun * pg_num. i460.lp_desc[pg_num].paddr is the physical address of the large page and
363*4882a593Smuzhiyun * i460.lp_desc[pg_num].alloced_map is a bitmap of kernel pages that are in use (allocated).
364*4882a593Smuzhiyun */
365*4882a593Smuzhiyun
i460_alloc_large_page(struct lp_desc * lp)366*4882a593Smuzhiyun static int i460_alloc_large_page (struct lp_desc *lp)
367*4882a593Smuzhiyun {
368*4882a593Smuzhiyun unsigned long order = I460_IO_PAGE_SHIFT - PAGE_SHIFT;
369*4882a593Smuzhiyun size_t map_size;
370*4882a593Smuzhiyun
371*4882a593Smuzhiyun lp->page = alloc_pages(GFP_KERNEL, order);
372*4882a593Smuzhiyun if (!lp->page) {
373*4882a593Smuzhiyun printk(KERN_ERR PFX "Couldn't alloc 4M GART page...\n");
374*4882a593Smuzhiyun return -ENOMEM;
375*4882a593Smuzhiyun }
376*4882a593Smuzhiyun
377*4882a593Smuzhiyun map_size = ((I460_KPAGES_PER_IOPAGE + BITS_PER_LONG - 1) & -BITS_PER_LONG)/8;
378*4882a593Smuzhiyun lp->alloced_map = kzalloc(map_size, GFP_KERNEL);
379*4882a593Smuzhiyun if (!lp->alloced_map) {
380*4882a593Smuzhiyun __free_pages(lp->page, order);
381*4882a593Smuzhiyun printk(KERN_ERR PFX "Out of memory, we're in trouble...\n");
382*4882a593Smuzhiyun return -ENOMEM;
383*4882a593Smuzhiyun }
384*4882a593Smuzhiyun
385*4882a593Smuzhiyun lp->paddr = page_to_phys(lp->page);
386*4882a593Smuzhiyun lp->refcount = 0;
387*4882a593Smuzhiyun atomic_add(I460_KPAGES_PER_IOPAGE, &agp_bridge->current_memory_agp);
388*4882a593Smuzhiyun return 0;
389*4882a593Smuzhiyun }
390*4882a593Smuzhiyun
i460_free_large_page(struct lp_desc * lp)391*4882a593Smuzhiyun static void i460_free_large_page (struct lp_desc *lp)
392*4882a593Smuzhiyun {
393*4882a593Smuzhiyun kfree(lp->alloced_map);
394*4882a593Smuzhiyun lp->alloced_map = NULL;
395*4882a593Smuzhiyun
396*4882a593Smuzhiyun __free_pages(lp->page, I460_IO_PAGE_SHIFT - PAGE_SHIFT);
397*4882a593Smuzhiyun atomic_sub(I460_KPAGES_PER_IOPAGE, &agp_bridge->current_memory_agp);
398*4882a593Smuzhiyun }
399*4882a593Smuzhiyun
i460_insert_memory_large_io_page(struct agp_memory * mem,off_t pg_start,int type)400*4882a593Smuzhiyun static int i460_insert_memory_large_io_page (struct agp_memory *mem,
401*4882a593Smuzhiyun off_t pg_start, int type)
402*4882a593Smuzhiyun {
403*4882a593Smuzhiyun int i, start_offset, end_offset, idx, pg, num_entries;
404*4882a593Smuzhiyun struct lp_desc *start, *end, *lp;
405*4882a593Smuzhiyun void *temp;
406*4882a593Smuzhiyun
407*4882a593Smuzhiyun if (type >= AGP_USER_TYPES || mem->type >= AGP_USER_TYPES)
408*4882a593Smuzhiyun return -EINVAL;
409*4882a593Smuzhiyun
410*4882a593Smuzhiyun temp = agp_bridge->current_size;
411*4882a593Smuzhiyun num_entries = A_SIZE_8(temp)->num_entries;
412*4882a593Smuzhiyun
413*4882a593Smuzhiyun /* Figure out what pg_start means in terms of our large GART pages */
414*4882a593Smuzhiyun start = &i460.lp_desc[pg_start / I460_KPAGES_PER_IOPAGE];
415*4882a593Smuzhiyun end = &i460.lp_desc[(pg_start + mem->page_count - 1) / I460_KPAGES_PER_IOPAGE];
416*4882a593Smuzhiyun start_offset = pg_start % I460_KPAGES_PER_IOPAGE;
417*4882a593Smuzhiyun end_offset = (pg_start + mem->page_count - 1) % I460_KPAGES_PER_IOPAGE;
418*4882a593Smuzhiyun
419*4882a593Smuzhiyun if (end > i460.lp_desc + num_entries) {
420*4882a593Smuzhiyun printk(KERN_ERR PFX "Looks like we're out of AGP memory\n");
421*4882a593Smuzhiyun return -EINVAL;
422*4882a593Smuzhiyun }
423*4882a593Smuzhiyun
424*4882a593Smuzhiyun /* Check if the requested region of the aperture is free */
425*4882a593Smuzhiyun for (lp = start; lp <= end; ++lp) {
426*4882a593Smuzhiyun if (!lp->alloced_map)
427*4882a593Smuzhiyun continue; /* OK, the entire large page is available... */
428*4882a593Smuzhiyun
429*4882a593Smuzhiyun for (idx = ((lp == start) ? start_offset : 0);
430*4882a593Smuzhiyun idx < ((lp == end) ? (end_offset + 1) : I460_KPAGES_PER_IOPAGE);
431*4882a593Smuzhiyun idx++)
432*4882a593Smuzhiyun {
433*4882a593Smuzhiyun if (test_bit(idx, lp->alloced_map))
434*4882a593Smuzhiyun return -EBUSY;
435*4882a593Smuzhiyun }
436*4882a593Smuzhiyun }
437*4882a593Smuzhiyun
438*4882a593Smuzhiyun for (lp = start, i = 0; lp <= end; ++lp) {
439*4882a593Smuzhiyun if (!lp->alloced_map) {
440*4882a593Smuzhiyun /* Allocate new GART pages... */
441*4882a593Smuzhiyun if (i460_alloc_large_page(lp) < 0)
442*4882a593Smuzhiyun return -ENOMEM;
443*4882a593Smuzhiyun pg = lp - i460.lp_desc;
444*4882a593Smuzhiyun WR_GATT(pg, i460_mask_memory(agp_bridge,
445*4882a593Smuzhiyun lp->paddr, 0));
446*4882a593Smuzhiyun WR_FLUSH_GATT(pg);
447*4882a593Smuzhiyun }
448*4882a593Smuzhiyun
449*4882a593Smuzhiyun for (idx = ((lp == start) ? start_offset : 0);
450*4882a593Smuzhiyun idx < ((lp == end) ? (end_offset + 1) : I460_KPAGES_PER_IOPAGE);
451*4882a593Smuzhiyun idx++, i++)
452*4882a593Smuzhiyun {
453*4882a593Smuzhiyun mem->pages[i] = lp->page;
454*4882a593Smuzhiyun __set_bit(idx, lp->alloced_map);
455*4882a593Smuzhiyun ++lp->refcount;
456*4882a593Smuzhiyun }
457*4882a593Smuzhiyun }
458*4882a593Smuzhiyun return 0;
459*4882a593Smuzhiyun }
460*4882a593Smuzhiyun
i460_remove_memory_large_io_page(struct agp_memory * mem,off_t pg_start,int type)461*4882a593Smuzhiyun static int i460_remove_memory_large_io_page (struct agp_memory *mem,
462*4882a593Smuzhiyun off_t pg_start, int type)
463*4882a593Smuzhiyun {
464*4882a593Smuzhiyun int i, pg, start_offset, end_offset, idx, num_entries;
465*4882a593Smuzhiyun struct lp_desc *start, *end, *lp;
466*4882a593Smuzhiyun void *temp;
467*4882a593Smuzhiyun
468*4882a593Smuzhiyun temp = agp_bridge->current_size;
469*4882a593Smuzhiyun num_entries = A_SIZE_8(temp)->num_entries;
470*4882a593Smuzhiyun
471*4882a593Smuzhiyun /* Figure out what pg_start means in terms of our large GART pages */
472*4882a593Smuzhiyun start = &i460.lp_desc[pg_start / I460_KPAGES_PER_IOPAGE];
473*4882a593Smuzhiyun end = &i460.lp_desc[(pg_start + mem->page_count - 1) / I460_KPAGES_PER_IOPAGE];
474*4882a593Smuzhiyun start_offset = pg_start % I460_KPAGES_PER_IOPAGE;
475*4882a593Smuzhiyun end_offset = (pg_start + mem->page_count - 1) % I460_KPAGES_PER_IOPAGE;
476*4882a593Smuzhiyun
477*4882a593Smuzhiyun for (i = 0, lp = start; lp <= end; ++lp) {
478*4882a593Smuzhiyun for (idx = ((lp == start) ? start_offset : 0);
479*4882a593Smuzhiyun idx < ((lp == end) ? (end_offset + 1) : I460_KPAGES_PER_IOPAGE);
480*4882a593Smuzhiyun idx++, i++)
481*4882a593Smuzhiyun {
482*4882a593Smuzhiyun mem->pages[i] = NULL;
483*4882a593Smuzhiyun __clear_bit(idx, lp->alloced_map);
484*4882a593Smuzhiyun --lp->refcount;
485*4882a593Smuzhiyun }
486*4882a593Smuzhiyun
487*4882a593Smuzhiyun /* Free GART pages if they are unused */
488*4882a593Smuzhiyun if (lp->refcount == 0) {
489*4882a593Smuzhiyun pg = lp - i460.lp_desc;
490*4882a593Smuzhiyun WR_GATT(pg, 0);
491*4882a593Smuzhiyun WR_FLUSH_GATT(pg);
492*4882a593Smuzhiyun i460_free_large_page(lp);
493*4882a593Smuzhiyun }
494*4882a593Smuzhiyun }
495*4882a593Smuzhiyun return 0;
496*4882a593Smuzhiyun }
497*4882a593Smuzhiyun
498*4882a593Smuzhiyun /* Wrapper routines to call the approriate {small_io_page,large_io_page} function */
499*4882a593Smuzhiyun
i460_insert_memory(struct agp_memory * mem,off_t pg_start,int type)500*4882a593Smuzhiyun static int i460_insert_memory (struct agp_memory *mem,
501*4882a593Smuzhiyun off_t pg_start, int type)
502*4882a593Smuzhiyun {
503*4882a593Smuzhiyun if (I460_IO_PAGE_SHIFT <= PAGE_SHIFT)
504*4882a593Smuzhiyun return i460_insert_memory_small_io_page(mem, pg_start, type);
505*4882a593Smuzhiyun else
506*4882a593Smuzhiyun return i460_insert_memory_large_io_page(mem, pg_start, type);
507*4882a593Smuzhiyun }
508*4882a593Smuzhiyun
i460_remove_memory(struct agp_memory * mem,off_t pg_start,int type)509*4882a593Smuzhiyun static int i460_remove_memory (struct agp_memory *mem,
510*4882a593Smuzhiyun off_t pg_start, int type)
511*4882a593Smuzhiyun {
512*4882a593Smuzhiyun if (I460_IO_PAGE_SHIFT <= PAGE_SHIFT)
513*4882a593Smuzhiyun return i460_remove_memory_small_io_page(mem, pg_start, type);
514*4882a593Smuzhiyun else
515*4882a593Smuzhiyun return i460_remove_memory_large_io_page(mem, pg_start, type);
516*4882a593Smuzhiyun }
517*4882a593Smuzhiyun
518*4882a593Smuzhiyun /*
519*4882a593Smuzhiyun * If the I/O (GART) page size is bigger than the kernel page size, we don't want to
520*4882a593Smuzhiyun * allocate memory until we know where it is to be bound in the aperture (a
521*4882a593Smuzhiyun * multi-kernel-page alloc might fit inside of an already allocated GART page).
522*4882a593Smuzhiyun *
523*4882a593Smuzhiyun * Let's just hope nobody counts on the allocated AGP memory being there before bind time
524*4882a593Smuzhiyun * (I don't think current drivers do)...
525*4882a593Smuzhiyun */
i460_alloc_page(struct agp_bridge_data * bridge)526*4882a593Smuzhiyun static struct page *i460_alloc_page (struct agp_bridge_data *bridge)
527*4882a593Smuzhiyun {
528*4882a593Smuzhiyun void *page;
529*4882a593Smuzhiyun
530*4882a593Smuzhiyun if (I460_IO_PAGE_SHIFT <= PAGE_SHIFT) {
531*4882a593Smuzhiyun page = agp_generic_alloc_page(agp_bridge);
532*4882a593Smuzhiyun } else
533*4882a593Smuzhiyun /* Returning NULL would cause problems */
534*4882a593Smuzhiyun /* AK: really dubious code. */
535*4882a593Smuzhiyun page = (void *)~0UL;
536*4882a593Smuzhiyun return page;
537*4882a593Smuzhiyun }
538*4882a593Smuzhiyun
i460_destroy_page(struct page * page,int flags)539*4882a593Smuzhiyun static void i460_destroy_page (struct page *page, int flags)
540*4882a593Smuzhiyun {
541*4882a593Smuzhiyun if (I460_IO_PAGE_SHIFT <= PAGE_SHIFT) {
542*4882a593Smuzhiyun agp_generic_destroy_page(page, flags);
543*4882a593Smuzhiyun }
544*4882a593Smuzhiyun }
545*4882a593Smuzhiyun
546*4882a593Smuzhiyun #endif /* I460_LARGE_IO_PAGES */
547*4882a593Smuzhiyun
i460_mask_memory(struct agp_bridge_data * bridge,dma_addr_t addr,int type)548*4882a593Smuzhiyun static unsigned long i460_mask_memory (struct agp_bridge_data *bridge,
549*4882a593Smuzhiyun dma_addr_t addr, int type)
550*4882a593Smuzhiyun {
551*4882a593Smuzhiyun /* Make sure the returned address is a valid GATT entry */
552*4882a593Smuzhiyun return bridge->driver->masks[0].mask
553*4882a593Smuzhiyun | (((addr & ~((1 << I460_IO_PAGE_SHIFT) - 1)) & 0xfffff000) >> 12);
554*4882a593Smuzhiyun }
555*4882a593Smuzhiyun
556*4882a593Smuzhiyun const struct agp_bridge_driver intel_i460_driver = {
557*4882a593Smuzhiyun .owner = THIS_MODULE,
558*4882a593Smuzhiyun .aperture_sizes = i460_sizes,
559*4882a593Smuzhiyun .size_type = U8_APER_SIZE,
560*4882a593Smuzhiyun .num_aperture_sizes = 3,
561*4882a593Smuzhiyun .configure = i460_configure,
562*4882a593Smuzhiyun .fetch_size = i460_fetch_size,
563*4882a593Smuzhiyun .cleanup = i460_cleanup,
564*4882a593Smuzhiyun .tlb_flush = i460_tlb_flush,
565*4882a593Smuzhiyun .mask_memory = i460_mask_memory,
566*4882a593Smuzhiyun .masks = i460_masks,
567*4882a593Smuzhiyun .agp_enable = agp_generic_enable,
568*4882a593Smuzhiyun .cache_flush = global_cache_flush,
569*4882a593Smuzhiyun .create_gatt_table = i460_create_gatt_table,
570*4882a593Smuzhiyun .free_gatt_table = i460_free_gatt_table,
571*4882a593Smuzhiyun #if I460_LARGE_IO_PAGES
572*4882a593Smuzhiyun .insert_memory = i460_insert_memory,
573*4882a593Smuzhiyun .remove_memory = i460_remove_memory,
574*4882a593Smuzhiyun .agp_alloc_page = i460_alloc_page,
575*4882a593Smuzhiyun .agp_destroy_page = i460_destroy_page,
576*4882a593Smuzhiyun #else
577*4882a593Smuzhiyun .insert_memory = i460_insert_memory_small_io_page,
578*4882a593Smuzhiyun .remove_memory = i460_remove_memory_small_io_page,
579*4882a593Smuzhiyun .agp_alloc_page = agp_generic_alloc_page,
580*4882a593Smuzhiyun .agp_alloc_pages = agp_generic_alloc_pages,
581*4882a593Smuzhiyun .agp_destroy_page = agp_generic_destroy_page,
582*4882a593Smuzhiyun .agp_destroy_pages = agp_generic_destroy_pages,
583*4882a593Smuzhiyun #endif
584*4882a593Smuzhiyun .alloc_by_type = agp_generic_alloc_by_type,
585*4882a593Smuzhiyun .free_by_type = agp_generic_free_by_type,
586*4882a593Smuzhiyun .agp_type_to_mask_type = agp_generic_type_to_mask_type,
587*4882a593Smuzhiyun .cant_use_aperture = true,
588*4882a593Smuzhiyun };
589*4882a593Smuzhiyun
agp_intel_i460_probe(struct pci_dev * pdev,const struct pci_device_id * ent)590*4882a593Smuzhiyun static int agp_intel_i460_probe(struct pci_dev *pdev,
591*4882a593Smuzhiyun const struct pci_device_id *ent)
592*4882a593Smuzhiyun {
593*4882a593Smuzhiyun struct agp_bridge_data *bridge;
594*4882a593Smuzhiyun u8 cap_ptr;
595*4882a593Smuzhiyun
596*4882a593Smuzhiyun cap_ptr = pci_find_capability(pdev, PCI_CAP_ID_AGP);
597*4882a593Smuzhiyun if (!cap_ptr)
598*4882a593Smuzhiyun return -ENODEV;
599*4882a593Smuzhiyun
600*4882a593Smuzhiyun bridge = agp_alloc_bridge();
601*4882a593Smuzhiyun if (!bridge)
602*4882a593Smuzhiyun return -ENOMEM;
603*4882a593Smuzhiyun
604*4882a593Smuzhiyun bridge->driver = &intel_i460_driver;
605*4882a593Smuzhiyun bridge->dev = pdev;
606*4882a593Smuzhiyun bridge->capndx = cap_ptr;
607*4882a593Smuzhiyun
608*4882a593Smuzhiyun printk(KERN_INFO PFX "Detected Intel 460GX chipset\n");
609*4882a593Smuzhiyun
610*4882a593Smuzhiyun pci_set_drvdata(pdev, bridge);
611*4882a593Smuzhiyun return agp_add_bridge(bridge);
612*4882a593Smuzhiyun }
613*4882a593Smuzhiyun
agp_intel_i460_remove(struct pci_dev * pdev)614*4882a593Smuzhiyun static void agp_intel_i460_remove(struct pci_dev *pdev)
615*4882a593Smuzhiyun {
616*4882a593Smuzhiyun struct agp_bridge_data *bridge = pci_get_drvdata(pdev);
617*4882a593Smuzhiyun
618*4882a593Smuzhiyun agp_remove_bridge(bridge);
619*4882a593Smuzhiyun agp_put_bridge(bridge);
620*4882a593Smuzhiyun }
621*4882a593Smuzhiyun
622*4882a593Smuzhiyun static struct pci_device_id agp_intel_i460_pci_table[] = {
623*4882a593Smuzhiyun {
624*4882a593Smuzhiyun .class = (PCI_CLASS_BRIDGE_HOST << 8),
625*4882a593Smuzhiyun .class_mask = ~0,
626*4882a593Smuzhiyun .vendor = PCI_VENDOR_ID_INTEL,
627*4882a593Smuzhiyun .device = PCI_DEVICE_ID_INTEL_84460GX,
628*4882a593Smuzhiyun .subvendor = PCI_ANY_ID,
629*4882a593Smuzhiyun .subdevice = PCI_ANY_ID,
630*4882a593Smuzhiyun },
631*4882a593Smuzhiyun { }
632*4882a593Smuzhiyun };
633*4882a593Smuzhiyun
634*4882a593Smuzhiyun MODULE_DEVICE_TABLE(pci, agp_intel_i460_pci_table);
635*4882a593Smuzhiyun
636*4882a593Smuzhiyun static struct pci_driver agp_intel_i460_pci_driver = {
637*4882a593Smuzhiyun .name = "agpgart-intel-i460",
638*4882a593Smuzhiyun .id_table = agp_intel_i460_pci_table,
639*4882a593Smuzhiyun .probe = agp_intel_i460_probe,
640*4882a593Smuzhiyun .remove = agp_intel_i460_remove,
641*4882a593Smuzhiyun };
642*4882a593Smuzhiyun
agp_intel_i460_init(void)643*4882a593Smuzhiyun static int __init agp_intel_i460_init(void)
644*4882a593Smuzhiyun {
645*4882a593Smuzhiyun if (agp_off)
646*4882a593Smuzhiyun return -EINVAL;
647*4882a593Smuzhiyun return pci_register_driver(&agp_intel_i460_pci_driver);
648*4882a593Smuzhiyun }
649*4882a593Smuzhiyun
agp_intel_i460_cleanup(void)650*4882a593Smuzhiyun static void __exit agp_intel_i460_cleanup(void)
651*4882a593Smuzhiyun {
652*4882a593Smuzhiyun pci_unregister_driver(&agp_intel_i460_pci_driver);
653*4882a593Smuzhiyun }
654*4882a593Smuzhiyun
655*4882a593Smuzhiyun module_init(agp_intel_i460_init);
656*4882a593Smuzhiyun module_exit(agp_intel_i460_cleanup);
657*4882a593Smuzhiyun
658*4882a593Smuzhiyun MODULE_AUTHOR("Chris Ahna <Christopher.J.Ahna@intel.com>");
659*4882a593Smuzhiyun MODULE_LICENSE("GPL and additional rights");
660