xref: /OK3568_Linux_fs/kernel/drivers/gpu/drm/gma500/gtt.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0-only
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun  * Copyright (c) 2007, Intel Corporation.
4*4882a593Smuzhiyun  * All Rights Reserved.
5*4882a593Smuzhiyun  *
6*4882a593Smuzhiyun  * Authors: Thomas Hellstrom <thomas-at-tungstengraphics.com>
7*4882a593Smuzhiyun  *	    Alan Cox <alan@linux.intel.com>
8*4882a593Smuzhiyun  */
9*4882a593Smuzhiyun 
10*4882a593Smuzhiyun #include <linux/shmem_fs.h>
11*4882a593Smuzhiyun 
12*4882a593Smuzhiyun #include <asm/set_memory.h>
13*4882a593Smuzhiyun 
14*4882a593Smuzhiyun #include "blitter.h"
15*4882a593Smuzhiyun #include "psb_drv.h"
16*4882a593Smuzhiyun 
17*4882a593Smuzhiyun 
18*4882a593Smuzhiyun /*
19*4882a593Smuzhiyun  *	GTT resource allocator - manage page mappings in GTT space
20*4882a593Smuzhiyun  */
21*4882a593Smuzhiyun 
22*4882a593Smuzhiyun /**
23*4882a593Smuzhiyun  *	psb_gtt_mask_pte	-	generate GTT pte entry
24*4882a593Smuzhiyun  *	@pfn: page number to encode
25*4882a593Smuzhiyun  *	@type: type of memory in the GTT
26*4882a593Smuzhiyun  *
27*4882a593Smuzhiyun  *	Set the GTT entry for the appropriate memory type.
28*4882a593Smuzhiyun  */
psb_gtt_mask_pte(uint32_t pfn,int type)29*4882a593Smuzhiyun static inline uint32_t psb_gtt_mask_pte(uint32_t pfn, int type)
30*4882a593Smuzhiyun {
31*4882a593Smuzhiyun 	uint32_t mask = PSB_PTE_VALID;
32*4882a593Smuzhiyun 
33*4882a593Smuzhiyun 	/* Ensure we explode rather than put an invalid low mapping of
34*4882a593Smuzhiyun 	   a high mapping page into the gtt */
35*4882a593Smuzhiyun 	BUG_ON(pfn & ~(0xFFFFFFFF >> PAGE_SHIFT));
36*4882a593Smuzhiyun 
37*4882a593Smuzhiyun 	if (type & PSB_MMU_CACHED_MEMORY)
38*4882a593Smuzhiyun 		mask |= PSB_PTE_CACHED;
39*4882a593Smuzhiyun 	if (type & PSB_MMU_RO_MEMORY)
40*4882a593Smuzhiyun 		mask |= PSB_PTE_RO;
41*4882a593Smuzhiyun 	if (type & PSB_MMU_WO_MEMORY)
42*4882a593Smuzhiyun 		mask |= PSB_PTE_WO;
43*4882a593Smuzhiyun 
44*4882a593Smuzhiyun 	return (pfn << PAGE_SHIFT) | mask;
45*4882a593Smuzhiyun }
46*4882a593Smuzhiyun 
47*4882a593Smuzhiyun /**
48*4882a593Smuzhiyun  *	psb_gtt_entry		-	find the GTT entries for a gtt_range
49*4882a593Smuzhiyun  *	@dev: our DRM device
50*4882a593Smuzhiyun  *	@r: our GTT range
51*4882a593Smuzhiyun  *
52*4882a593Smuzhiyun  *	Given a gtt_range object return the GTT offset of the page table
53*4882a593Smuzhiyun  *	entries for this gtt_range
54*4882a593Smuzhiyun  */
psb_gtt_entry(struct drm_device * dev,struct gtt_range * r)55*4882a593Smuzhiyun static u32 __iomem *psb_gtt_entry(struct drm_device *dev, struct gtt_range *r)
56*4882a593Smuzhiyun {
57*4882a593Smuzhiyun 	struct drm_psb_private *dev_priv = dev->dev_private;
58*4882a593Smuzhiyun 	unsigned long offset;
59*4882a593Smuzhiyun 
60*4882a593Smuzhiyun 	offset = r->resource.start - dev_priv->gtt_mem->start;
61*4882a593Smuzhiyun 
62*4882a593Smuzhiyun 	return dev_priv->gtt_map + (offset >> PAGE_SHIFT);
63*4882a593Smuzhiyun }
64*4882a593Smuzhiyun 
65*4882a593Smuzhiyun /**
66*4882a593Smuzhiyun  *	psb_gtt_insert	-	put an object into the GTT
67*4882a593Smuzhiyun  *	@dev: our DRM device
68*4882a593Smuzhiyun  *	@r: our GTT range
69*4882a593Smuzhiyun  *	@resume: on resume
70*4882a593Smuzhiyun  *
71*4882a593Smuzhiyun  *	Take our preallocated GTT range and insert the GEM object into
72*4882a593Smuzhiyun  *	the GTT. This is protected via the gtt mutex which the caller
73*4882a593Smuzhiyun  *	must hold.
74*4882a593Smuzhiyun  */
psb_gtt_insert(struct drm_device * dev,struct gtt_range * r,int resume)75*4882a593Smuzhiyun static int psb_gtt_insert(struct drm_device *dev, struct gtt_range *r,
76*4882a593Smuzhiyun 			  int resume)
77*4882a593Smuzhiyun {
78*4882a593Smuzhiyun 	u32 __iomem *gtt_slot;
79*4882a593Smuzhiyun 	u32 pte;
80*4882a593Smuzhiyun 	struct page **pages;
81*4882a593Smuzhiyun 	int i;
82*4882a593Smuzhiyun 
83*4882a593Smuzhiyun 	if (r->pages == NULL) {
84*4882a593Smuzhiyun 		WARN_ON(1);
85*4882a593Smuzhiyun 		return -EINVAL;
86*4882a593Smuzhiyun 	}
87*4882a593Smuzhiyun 
88*4882a593Smuzhiyun 	WARN_ON(r->stolen);	/* refcount these maybe ? */
89*4882a593Smuzhiyun 
90*4882a593Smuzhiyun 	gtt_slot = psb_gtt_entry(dev, r);
91*4882a593Smuzhiyun 	pages = r->pages;
92*4882a593Smuzhiyun 
93*4882a593Smuzhiyun 	if (!resume) {
94*4882a593Smuzhiyun 		/* Make sure changes are visible to the GPU */
95*4882a593Smuzhiyun 		set_pages_array_wc(pages, r->npage);
96*4882a593Smuzhiyun 	}
97*4882a593Smuzhiyun 
98*4882a593Smuzhiyun 	/* Write our page entries into the GTT itself */
99*4882a593Smuzhiyun 	for (i = r->roll; i < r->npage; i++) {
100*4882a593Smuzhiyun 		pte = psb_gtt_mask_pte(page_to_pfn(r->pages[i]),
101*4882a593Smuzhiyun 				       PSB_MMU_CACHED_MEMORY);
102*4882a593Smuzhiyun 		iowrite32(pte, gtt_slot++);
103*4882a593Smuzhiyun 	}
104*4882a593Smuzhiyun 	for (i = 0; i < r->roll; i++) {
105*4882a593Smuzhiyun 		pte = psb_gtt_mask_pte(page_to_pfn(r->pages[i]),
106*4882a593Smuzhiyun 				       PSB_MMU_CACHED_MEMORY);
107*4882a593Smuzhiyun 		iowrite32(pte, gtt_slot++);
108*4882a593Smuzhiyun 	}
109*4882a593Smuzhiyun 	/* Make sure all the entries are set before we return */
110*4882a593Smuzhiyun 	ioread32(gtt_slot - 1);
111*4882a593Smuzhiyun 
112*4882a593Smuzhiyun 	return 0;
113*4882a593Smuzhiyun }
114*4882a593Smuzhiyun 
115*4882a593Smuzhiyun /**
116*4882a593Smuzhiyun  *	psb_gtt_remove	-	remove an object from the GTT
117*4882a593Smuzhiyun  *	@dev: our DRM device
118*4882a593Smuzhiyun  *	@r: our GTT range
119*4882a593Smuzhiyun  *
120*4882a593Smuzhiyun  *	Remove a preallocated GTT range from the GTT. Overwrite all the
121*4882a593Smuzhiyun  *	page table entries with the dummy page. This is protected via the gtt
122*4882a593Smuzhiyun  *	mutex which the caller must hold.
123*4882a593Smuzhiyun  */
psb_gtt_remove(struct drm_device * dev,struct gtt_range * r)124*4882a593Smuzhiyun static void psb_gtt_remove(struct drm_device *dev, struct gtt_range *r)
125*4882a593Smuzhiyun {
126*4882a593Smuzhiyun 	struct drm_psb_private *dev_priv = dev->dev_private;
127*4882a593Smuzhiyun 	u32 __iomem *gtt_slot;
128*4882a593Smuzhiyun 	u32 pte;
129*4882a593Smuzhiyun 	int i;
130*4882a593Smuzhiyun 
131*4882a593Smuzhiyun 	WARN_ON(r->stolen);
132*4882a593Smuzhiyun 
133*4882a593Smuzhiyun 	gtt_slot = psb_gtt_entry(dev, r);
134*4882a593Smuzhiyun 	pte = psb_gtt_mask_pte(page_to_pfn(dev_priv->scratch_page),
135*4882a593Smuzhiyun 			       PSB_MMU_CACHED_MEMORY);
136*4882a593Smuzhiyun 
137*4882a593Smuzhiyun 	for (i = 0; i < r->npage; i++)
138*4882a593Smuzhiyun 		iowrite32(pte, gtt_slot++);
139*4882a593Smuzhiyun 	ioread32(gtt_slot - 1);
140*4882a593Smuzhiyun 	set_pages_array_wb(r->pages, r->npage);
141*4882a593Smuzhiyun }
142*4882a593Smuzhiyun 
143*4882a593Smuzhiyun /**
144*4882a593Smuzhiyun  *	psb_gtt_roll	-	set scrolling position
145*4882a593Smuzhiyun  *	@dev: our DRM device
146*4882a593Smuzhiyun  *	@r: the gtt mapping we are using
147*4882a593Smuzhiyun  *	@roll: roll offset
148*4882a593Smuzhiyun  *
149*4882a593Smuzhiyun  *	Roll an existing pinned mapping by moving the pages through the GTT.
150*4882a593Smuzhiyun  *	This allows us to implement hardware scrolling on the consoles without
151*4882a593Smuzhiyun  *	a 2D engine
152*4882a593Smuzhiyun  */
psb_gtt_roll(struct drm_device * dev,struct gtt_range * r,int roll)153*4882a593Smuzhiyun void psb_gtt_roll(struct drm_device *dev, struct gtt_range *r, int roll)
154*4882a593Smuzhiyun {
155*4882a593Smuzhiyun 	u32 __iomem *gtt_slot;
156*4882a593Smuzhiyun 	u32 pte;
157*4882a593Smuzhiyun 	int i;
158*4882a593Smuzhiyun 
159*4882a593Smuzhiyun 	if (roll >= r->npage) {
160*4882a593Smuzhiyun 		WARN_ON(1);
161*4882a593Smuzhiyun 		return;
162*4882a593Smuzhiyun 	}
163*4882a593Smuzhiyun 
164*4882a593Smuzhiyun 	r->roll = roll;
165*4882a593Smuzhiyun 
166*4882a593Smuzhiyun 	/* Not currently in the GTT - no worry we will write the mapping at
167*4882a593Smuzhiyun 	   the right position when it gets pinned */
168*4882a593Smuzhiyun 	if (!r->stolen && !r->in_gart)
169*4882a593Smuzhiyun 		return;
170*4882a593Smuzhiyun 
171*4882a593Smuzhiyun 	gtt_slot = psb_gtt_entry(dev, r);
172*4882a593Smuzhiyun 
173*4882a593Smuzhiyun 	for (i = r->roll; i < r->npage; i++) {
174*4882a593Smuzhiyun 		pte = psb_gtt_mask_pte(page_to_pfn(r->pages[i]),
175*4882a593Smuzhiyun 				       PSB_MMU_CACHED_MEMORY);
176*4882a593Smuzhiyun 		iowrite32(pte, gtt_slot++);
177*4882a593Smuzhiyun 	}
178*4882a593Smuzhiyun 	for (i = 0; i < r->roll; i++) {
179*4882a593Smuzhiyun 		pte = psb_gtt_mask_pte(page_to_pfn(r->pages[i]),
180*4882a593Smuzhiyun 				       PSB_MMU_CACHED_MEMORY);
181*4882a593Smuzhiyun 		iowrite32(pte, gtt_slot++);
182*4882a593Smuzhiyun 	}
183*4882a593Smuzhiyun 	ioread32(gtt_slot - 1);
184*4882a593Smuzhiyun }
185*4882a593Smuzhiyun 
186*4882a593Smuzhiyun /**
187*4882a593Smuzhiyun  *	psb_gtt_attach_pages	-	attach and pin GEM pages
188*4882a593Smuzhiyun  *	@gt: the gtt range
189*4882a593Smuzhiyun  *
190*4882a593Smuzhiyun  *	Pin and build an in kernel list of the pages that back our GEM object.
191*4882a593Smuzhiyun  *	While we hold this the pages cannot be swapped out. This is protected
192*4882a593Smuzhiyun  *	via the gtt mutex which the caller must hold.
193*4882a593Smuzhiyun  */
psb_gtt_attach_pages(struct gtt_range * gt)194*4882a593Smuzhiyun static int psb_gtt_attach_pages(struct gtt_range *gt)
195*4882a593Smuzhiyun {
196*4882a593Smuzhiyun 	struct page **pages;
197*4882a593Smuzhiyun 
198*4882a593Smuzhiyun 	WARN_ON(gt->pages);
199*4882a593Smuzhiyun 
200*4882a593Smuzhiyun 	pages = drm_gem_get_pages(&gt->gem);
201*4882a593Smuzhiyun 	if (IS_ERR(pages))
202*4882a593Smuzhiyun 		return PTR_ERR(pages);
203*4882a593Smuzhiyun 
204*4882a593Smuzhiyun 	gt->npage = gt->gem.size / PAGE_SIZE;
205*4882a593Smuzhiyun 	gt->pages = pages;
206*4882a593Smuzhiyun 
207*4882a593Smuzhiyun 	return 0;
208*4882a593Smuzhiyun }
209*4882a593Smuzhiyun 
210*4882a593Smuzhiyun /**
211*4882a593Smuzhiyun  *	psb_gtt_detach_pages	-	attach and pin GEM pages
212*4882a593Smuzhiyun  *	@gt: the gtt range
213*4882a593Smuzhiyun  *
214*4882a593Smuzhiyun  *	Undo the effect of psb_gtt_attach_pages. At this point the pages
215*4882a593Smuzhiyun  *	must have been removed from the GTT as they could now be paged out
216*4882a593Smuzhiyun  *	and move bus address. This is protected via the gtt mutex which the
217*4882a593Smuzhiyun  *	caller must hold.
218*4882a593Smuzhiyun  */
psb_gtt_detach_pages(struct gtt_range * gt)219*4882a593Smuzhiyun static void psb_gtt_detach_pages(struct gtt_range *gt)
220*4882a593Smuzhiyun {
221*4882a593Smuzhiyun 	drm_gem_put_pages(&gt->gem, gt->pages, true, false);
222*4882a593Smuzhiyun 	gt->pages = NULL;
223*4882a593Smuzhiyun }
224*4882a593Smuzhiyun 
225*4882a593Smuzhiyun /**
226*4882a593Smuzhiyun  *	psb_gtt_pin		-	pin pages into the GTT
227*4882a593Smuzhiyun  *	@gt: range to pin
228*4882a593Smuzhiyun  *
229*4882a593Smuzhiyun  *	Pin a set of pages into the GTT. The pins are refcounted so that
230*4882a593Smuzhiyun  *	multiple pins need multiple unpins to undo.
231*4882a593Smuzhiyun  *
232*4882a593Smuzhiyun  *	Non GEM backed objects treat this as a no-op as they are always GTT
233*4882a593Smuzhiyun  *	backed objects.
234*4882a593Smuzhiyun  */
psb_gtt_pin(struct gtt_range * gt)235*4882a593Smuzhiyun int psb_gtt_pin(struct gtt_range *gt)
236*4882a593Smuzhiyun {
237*4882a593Smuzhiyun 	int ret = 0;
238*4882a593Smuzhiyun 	struct drm_device *dev = gt->gem.dev;
239*4882a593Smuzhiyun 	struct drm_psb_private *dev_priv = dev->dev_private;
240*4882a593Smuzhiyun 	u32 gpu_base = dev_priv->gtt.gatt_start;
241*4882a593Smuzhiyun 
242*4882a593Smuzhiyun 	mutex_lock(&dev_priv->gtt_mutex);
243*4882a593Smuzhiyun 
244*4882a593Smuzhiyun 	if (gt->in_gart == 0 && gt->stolen == 0) {
245*4882a593Smuzhiyun 		ret = psb_gtt_attach_pages(gt);
246*4882a593Smuzhiyun 		if (ret < 0)
247*4882a593Smuzhiyun 			goto out;
248*4882a593Smuzhiyun 		ret = psb_gtt_insert(dev, gt, 0);
249*4882a593Smuzhiyun 		if (ret < 0) {
250*4882a593Smuzhiyun 			psb_gtt_detach_pages(gt);
251*4882a593Smuzhiyun 			goto out;
252*4882a593Smuzhiyun 		}
253*4882a593Smuzhiyun 		psb_mmu_insert_pages(psb_mmu_get_default_pd(dev_priv->mmu),
254*4882a593Smuzhiyun 				     gt->pages, (gpu_base + gt->offset),
255*4882a593Smuzhiyun 				     gt->npage, 0, 0, PSB_MMU_CACHED_MEMORY);
256*4882a593Smuzhiyun 	}
257*4882a593Smuzhiyun 	gt->in_gart++;
258*4882a593Smuzhiyun out:
259*4882a593Smuzhiyun 	mutex_unlock(&dev_priv->gtt_mutex);
260*4882a593Smuzhiyun 	return ret;
261*4882a593Smuzhiyun }
262*4882a593Smuzhiyun 
263*4882a593Smuzhiyun /**
264*4882a593Smuzhiyun  *	psb_gtt_unpin		-	Drop a GTT pin requirement
265*4882a593Smuzhiyun  *	@gt: range to pin
266*4882a593Smuzhiyun  *
267*4882a593Smuzhiyun  *	Undoes the effect of psb_gtt_pin. On the last drop the GEM object
268*4882a593Smuzhiyun  *	will be removed from the GTT which will also drop the page references
269*4882a593Smuzhiyun  *	and allow the VM to clean up or page stuff.
270*4882a593Smuzhiyun  *
271*4882a593Smuzhiyun  *	Non GEM backed objects treat this as a no-op as they are always GTT
272*4882a593Smuzhiyun  *	backed objects.
273*4882a593Smuzhiyun  */
psb_gtt_unpin(struct gtt_range * gt)274*4882a593Smuzhiyun void psb_gtt_unpin(struct gtt_range *gt)
275*4882a593Smuzhiyun {
276*4882a593Smuzhiyun 	struct drm_device *dev = gt->gem.dev;
277*4882a593Smuzhiyun 	struct drm_psb_private *dev_priv = dev->dev_private;
278*4882a593Smuzhiyun 	u32 gpu_base = dev_priv->gtt.gatt_start;
279*4882a593Smuzhiyun 	int ret;
280*4882a593Smuzhiyun 
281*4882a593Smuzhiyun 	/* While holding the gtt_mutex no new blits can be initiated */
282*4882a593Smuzhiyun 	mutex_lock(&dev_priv->gtt_mutex);
283*4882a593Smuzhiyun 
284*4882a593Smuzhiyun 	/* Wait for any possible usage of the memory to be finished */
285*4882a593Smuzhiyun 	ret = gma_blt_wait_idle(dev_priv);
286*4882a593Smuzhiyun 	if (ret) {
287*4882a593Smuzhiyun 		DRM_ERROR("Failed to idle the blitter, unpin failed!");
288*4882a593Smuzhiyun 		goto out;
289*4882a593Smuzhiyun 	}
290*4882a593Smuzhiyun 
291*4882a593Smuzhiyun 	WARN_ON(!gt->in_gart);
292*4882a593Smuzhiyun 
293*4882a593Smuzhiyun 	gt->in_gart--;
294*4882a593Smuzhiyun 	if (gt->in_gart == 0 && gt->stolen == 0) {
295*4882a593Smuzhiyun 		psb_mmu_remove_pages(psb_mmu_get_default_pd(dev_priv->mmu),
296*4882a593Smuzhiyun 				     (gpu_base + gt->offset), gt->npage, 0, 0);
297*4882a593Smuzhiyun 		psb_gtt_remove(dev, gt);
298*4882a593Smuzhiyun 		psb_gtt_detach_pages(gt);
299*4882a593Smuzhiyun 	}
300*4882a593Smuzhiyun 
301*4882a593Smuzhiyun out:
302*4882a593Smuzhiyun 	mutex_unlock(&dev_priv->gtt_mutex);
303*4882a593Smuzhiyun }
304*4882a593Smuzhiyun 
305*4882a593Smuzhiyun /*
306*4882a593Smuzhiyun  *	GTT resource allocator - allocate and manage GTT address space
307*4882a593Smuzhiyun  */
308*4882a593Smuzhiyun 
309*4882a593Smuzhiyun /**
310*4882a593Smuzhiyun  *	psb_gtt_alloc_range	-	allocate GTT address space
311*4882a593Smuzhiyun  *	@dev: Our DRM device
312*4882a593Smuzhiyun  *	@len: length (bytes) of address space required
313*4882a593Smuzhiyun  *	@name: resource name
314*4882a593Smuzhiyun  *	@backed: resource should be backed by stolen pages
315*4882a593Smuzhiyun  *	@align: requested alignment
316*4882a593Smuzhiyun  *
317*4882a593Smuzhiyun  *	Ask the kernel core to find us a suitable range of addresses
318*4882a593Smuzhiyun  *	to use for a GTT mapping.
319*4882a593Smuzhiyun  *
320*4882a593Smuzhiyun  *	Returns a gtt_range structure describing the object, or NULL on
321*4882a593Smuzhiyun  *	error. On successful return the resource is both allocated and marked
322*4882a593Smuzhiyun  *	as in use.
323*4882a593Smuzhiyun  */
psb_gtt_alloc_range(struct drm_device * dev,int len,const char * name,int backed,u32 align)324*4882a593Smuzhiyun struct gtt_range *psb_gtt_alloc_range(struct drm_device *dev, int len,
325*4882a593Smuzhiyun 				      const char *name, int backed, u32 align)
326*4882a593Smuzhiyun {
327*4882a593Smuzhiyun 	struct drm_psb_private *dev_priv = dev->dev_private;
328*4882a593Smuzhiyun 	struct gtt_range *gt;
329*4882a593Smuzhiyun 	struct resource *r = dev_priv->gtt_mem;
330*4882a593Smuzhiyun 	int ret;
331*4882a593Smuzhiyun 	unsigned long start, end;
332*4882a593Smuzhiyun 
333*4882a593Smuzhiyun 	if (backed) {
334*4882a593Smuzhiyun 		/* The start of the GTT is the stolen pages */
335*4882a593Smuzhiyun 		start = r->start;
336*4882a593Smuzhiyun 		end = r->start + dev_priv->gtt.stolen_size - 1;
337*4882a593Smuzhiyun 	} else {
338*4882a593Smuzhiyun 		/* The rest we will use for GEM backed objects */
339*4882a593Smuzhiyun 		start = r->start + dev_priv->gtt.stolen_size;
340*4882a593Smuzhiyun 		end = r->end;
341*4882a593Smuzhiyun 	}
342*4882a593Smuzhiyun 
343*4882a593Smuzhiyun 	gt = kzalloc(sizeof(struct gtt_range), GFP_KERNEL);
344*4882a593Smuzhiyun 	if (gt == NULL)
345*4882a593Smuzhiyun 		return NULL;
346*4882a593Smuzhiyun 	gt->resource.name = name;
347*4882a593Smuzhiyun 	gt->stolen = backed;
348*4882a593Smuzhiyun 	gt->in_gart = backed;
349*4882a593Smuzhiyun 	gt->roll = 0;
350*4882a593Smuzhiyun 	/* Ensure this is set for non GEM objects */
351*4882a593Smuzhiyun 	gt->gem.dev = dev;
352*4882a593Smuzhiyun 	ret = allocate_resource(dev_priv->gtt_mem, &gt->resource,
353*4882a593Smuzhiyun 				len, start, end, align, NULL, NULL);
354*4882a593Smuzhiyun 	if (ret == 0) {
355*4882a593Smuzhiyun 		gt->offset = gt->resource.start - r->start;
356*4882a593Smuzhiyun 		return gt;
357*4882a593Smuzhiyun 	}
358*4882a593Smuzhiyun 	kfree(gt);
359*4882a593Smuzhiyun 	return NULL;
360*4882a593Smuzhiyun }
361*4882a593Smuzhiyun 
362*4882a593Smuzhiyun /**
363*4882a593Smuzhiyun  *	psb_gtt_free_range	-	release GTT address space
364*4882a593Smuzhiyun  *	@dev: our DRM device
365*4882a593Smuzhiyun  *	@gt: a mapping created with psb_gtt_alloc_range
366*4882a593Smuzhiyun  *
367*4882a593Smuzhiyun  *	Release a resource that was allocated with psb_gtt_alloc_range. If the
368*4882a593Smuzhiyun  *	object has been pinned by mmap users we clean this up here currently.
369*4882a593Smuzhiyun  */
psb_gtt_free_range(struct drm_device * dev,struct gtt_range * gt)370*4882a593Smuzhiyun void psb_gtt_free_range(struct drm_device *dev, struct gtt_range *gt)
371*4882a593Smuzhiyun {
372*4882a593Smuzhiyun 	/* Undo the mmap pin if we are destroying the object */
373*4882a593Smuzhiyun 	if (gt->mmapping) {
374*4882a593Smuzhiyun 		psb_gtt_unpin(gt);
375*4882a593Smuzhiyun 		gt->mmapping = 0;
376*4882a593Smuzhiyun 	}
377*4882a593Smuzhiyun 	WARN_ON(gt->in_gart && !gt->stolen);
378*4882a593Smuzhiyun 	release_resource(&gt->resource);
379*4882a593Smuzhiyun 	kfree(gt);
380*4882a593Smuzhiyun }
381*4882a593Smuzhiyun 
psb_gtt_alloc(struct drm_device * dev)382*4882a593Smuzhiyun static void psb_gtt_alloc(struct drm_device *dev)
383*4882a593Smuzhiyun {
384*4882a593Smuzhiyun 	struct drm_psb_private *dev_priv = dev->dev_private;
385*4882a593Smuzhiyun 	init_rwsem(&dev_priv->gtt.sem);
386*4882a593Smuzhiyun }
387*4882a593Smuzhiyun 
psb_gtt_takedown(struct drm_device * dev)388*4882a593Smuzhiyun void psb_gtt_takedown(struct drm_device *dev)
389*4882a593Smuzhiyun {
390*4882a593Smuzhiyun 	struct drm_psb_private *dev_priv = dev->dev_private;
391*4882a593Smuzhiyun 
392*4882a593Smuzhiyun 	if (dev_priv->gtt_map) {
393*4882a593Smuzhiyun 		iounmap(dev_priv->gtt_map);
394*4882a593Smuzhiyun 		dev_priv->gtt_map = NULL;
395*4882a593Smuzhiyun 	}
396*4882a593Smuzhiyun 	if (dev_priv->gtt_initialized) {
397*4882a593Smuzhiyun 		pci_write_config_word(dev->pdev, PSB_GMCH_CTRL,
398*4882a593Smuzhiyun 				      dev_priv->gmch_ctrl);
399*4882a593Smuzhiyun 		PSB_WVDC32(dev_priv->pge_ctl, PSB_PGETBL_CTL);
400*4882a593Smuzhiyun 		(void) PSB_RVDC32(PSB_PGETBL_CTL);
401*4882a593Smuzhiyun 	}
402*4882a593Smuzhiyun 	if (dev_priv->vram_addr)
403*4882a593Smuzhiyun 		iounmap(dev_priv->gtt_map);
404*4882a593Smuzhiyun }
405*4882a593Smuzhiyun 
psb_gtt_init(struct drm_device * dev,int resume)406*4882a593Smuzhiyun int psb_gtt_init(struct drm_device *dev, int resume)
407*4882a593Smuzhiyun {
408*4882a593Smuzhiyun 	struct drm_psb_private *dev_priv = dev->dev_private;
409*4882a593Smuzhiyun 	unsigned gtt_pages;
410*4882a593Smuzhiyun 	unsigned long stolen_size, vram_stolen_size;
411*4882a593Smuzhiyun 	unsigned i, num_pages;
412*4882a593Smuzhiyun 	unsigned pfn_base;
413*4882a593Smuzhiyun 	struct psb_gtt *pg;
414*4882a593Smuzhiyun 
415*4882a593Smuzhiyun 	int ret = 0;
416*4882a593Smuzhiyun 	uint32_t pte;
417*4882a593Smuzhiyun 
418*4882a593Smuzhiyun 	if (!resume) {
419*4882a593Smuzhiyun 		mutex_init(&dev_priv->gtt_mutex);
420*4882a593Smuzhiyun 		mutex_init(&dev_priv->mmap_mutex);
421*4882a593Smuzhiyun 		psb_gtt_alloc(dev);
422*4882a593Smuzhiyun 	}
423*4882a593Smuzhiyun 
424*4882a593Smuzhiyun 	pg = &dev_priv->gtt;
425*4882a593Smuzhiyun 
426*4882a593Smuzhiyun 	/* Enable the GTT */
427*4882a593Smuzhiyun 	pci_read_config_word(dev->pdev, PSB_GMCH_CTRL, &dev_priv->gmch_ctrl);
428*4882a593Smuzhiyun 	pci_write_config_word(dev->pdev, PSB_GMCH_CTRL,
429*4882a593Smuzhiyun 			      dev_priv->gmch_ctrl | _PSB_GMCH_ENABLED);
430*4882a593Smuzhiyun 
431*4882a593Smuzhiyun 	dev_priv->pge_ctl = PSB_RVDC32(PSB_PGETBL_CTL);
432*4882a593Smuzhiyun 	PSB_WVDC32(dev_priv->pge_ctl | _PSB_PGETBL_ENABLED, PSB_PGETBL_CTL);
433*4882a593Smuzhiyun 	(void) PSB_RVDC32(PSB_PGETBL_CTL);
434*4882a593Smuzhiyun 
435*4882a593Smuzhiyun 	/* The root resource we allocate address space from */
436*4882a593Smuzhiyun 	dev_priv->gtt_initialized = 1;
437*4882a593Smuzhiyun 
438*4882a593Smuzhiyun 	pg->gtt_phys_start = dev_priv->pge_ctl & PAGE_MASK;
439*4882a593Smuzhiyun 
440*4882a593Smuzhiyun 	/*
441*4882a593Smuzhiyun 	 *	The video mmu has a hw bug when accessing 0x0D0000000.
442*4882a593Smuzhiyun 	 *	Make gatt start at 0x0e000,0000. This doesn't actually
443*4882a593Smuzhiyun 	 *	matter for us but may do if the video acceleration ever
444*4882a593Smuzhiyun 	 *	gets opened up.
445*4882a593Smuzhiyun 	 */
446*4882a593Smuzhiyun 	pg->mmu_gatt_start = 0xE0000000;
447*4882a593Smuzhiyun 
448*4882a593Smuzhiyun 	pg->gtt_start = pci_resource_start(dev->pdev, PSB_GTT_RESOURCE);
449*4882a593Smuzhiyun 	gtt_pages = pci_resource_len(dev->pdev, PSB_GTT_RESOURCE)
450*4882a593Smuzhiyun 								>> PAGE_SHIFT;
451*4882a593Smuzhiyun 	/* CDV doesn't report this. In which case the system has 64 gtt pages */
452*4882a593Smuzhiyun 	if (pg->gtt_start == 0 || gtt_pages == 0) {
453*4882a593Smuzhiyun 		dev_dbg(dev->dev, "GTT PCI BAR not initialized.\n");
454*4882a593Smuzhiyun 		gtt_pages = 64;
455*4882a593Smuzhiyun 		pg->gtt_start = dev_priv->pge_ctl;
456*4882a593Smuzhiyun 	}
457*4882a593Smuzhiyun 
458*4882a593Smuzhiyun 	pg->gatt_start = pci_resource_start(dev->pdev, PSB_GATT_RESOURCE);
459*4882a593Smuzhiyun 	pg->gatt_pages = pci_resource_len(dev->pdev, PSB_GATT_RESOURCE)
460*4882a593Smuzhiyun 								>> PAGE_SHIFT;
461*4882a593Smuzhiyun 	dev_priv->gtt_mem = &dev->pdev->resource[PSB_GATT_RESOURCE];
462*4882a593Smuzhiyun 
463*4882a593Smuzhiyun 	if (pg->gatt_pages == 0 || pg->gatt_start == 0) {
464*4882a593Smuzhiyun 		static struct resource fudge;	/* Preferably peppermint */
465*4882a593Smuzhiyun 		/* This can occur on CDV systems. Fudge it in this case.
466*4882a593Smuzhiyun 		   We really don't care what imaginary space is being allocated
467*4882a593Smuzhiyun 		   at this point */
468*4882a593Smuzhiyun 		dev_dbg(dev->dev, "GATT PCI BAR not initialized.\n");
469*4882a593Smuzhiyun 		pg->gatt_start = 0x40000000;
470*4882a593Smuzhiyun 		pg->gatt_pages = (128 * 1024 * 1024) >> PAGE_SHIFT;
471*4882a593Smuzhiyun 		/* This is a little confusing but in fact the GTT is providing
472*4882a593Smuzhiyun 		   a view from the GPU into memory and not vice versa. As such
473*4882a593Smuzhiyun 		   this is really allocating space that is not the same as the
474*4882a593Smuzhiyun 		   CPU address space on CDV */
475*4882a593Smuzhiyun 		fudge.start = 0x40000000;
476*4882a593Smuzhiyun 		fudge.end = 0x40000000 + 128 * 1024 * 1024 - 1;
477*4882a593Smuzhiyun 		fudge.name = "fudge";
478*4882a593Smuzhiyun 		fudge.flags = IORESOURCE_MEM;
479*4882a593Smuzhiyun 		dev_priv->gtt_mem = &fudge;
480*4882a593Smuzhiyun 	}
481*4882a593Smuzhiyun 
482*4882a593Smuzhiyun 	pci_read_config_dword(dev->pdev, PSB_BSM, &dev_priv->stolen_base);
483*4882a593Smuzhiyun 	vram_stolen_size = pg->gtt_phys_start - dev_priv->stolen_base
484*4882a593Smuzhiyun 								- PAGE_SIZE;
485*4882a593Smuzhiyun 
486*4882a593Smuzhiyun 	stolen_size = vram_stolen_size;
487*4882a593Smuzhiyun 
488*4882a593Smuzhiyun 	dev_dbg(dev->dev, "Stolen memory base 0x%x, size %luK\n",
489*4882a593Smuzhiyun 			dev_priv->stolen_base, vram_stolen_size / 1024);
490*4882a593Smuzhiyun 
491*4882a593Smuzhiyun 	if (resume && (gtt_pages != pg->gtt_pages) &&
492*4882a593Smuzhiyun 	    (stolen_size != pg->stolen_size)) {
493*4882a593Smuzhiyun 		dev_err(dev->dev, "GTT resume error.\n");
494*4882a593Smuzhiyun 		ret = -EINVAL;
495*4882a593Smuzhiyun 		goto out_err;
496*4882a593Smuzhiyun 	}
497*4882a593Smuzhiyun 
498*4882a593Smuzhiyun 	pg->gtt_pages = gtt_pages;
499*4882a593Smuzhiyun 	pg->stolen_size = stolen_size;
500*4882a593Smuzhiyun 	dev_priv->vram_stolen_size = vram_stolen_size;
501*4882a593Smuzhiyun 
502*4882a593Smuzhiyun 	/*
503*4882a593Smuzhiyun 	 *	Map the GTT and the stolen memory area
504*4882a593Smuzhiyun 	 */
505*4882a593Smuzhiyun 	if (!resume)
506*4882a593Smuzhiyun 		dev_priv->gtt_map = ioremap(pg->gtt_phys_start,
507*4882a593Smuzhiyun 						gtt_pages << PAGE_SHIFT);
508*4882a593Smuzhiyun 	if (!dev_priv->gtt_map) {
509*4882a593Smuzhiyun 		dev_err(dev->dev, "Failure to map gtt.\n");
510*4882a593Smuzhiyun 		ret = -ENOMEM;
511*4882a593Smuzhiyun 		goto out_err;
512*4882a593Smuzhiyun 	}
513*4882a593Smuzhiyun 
514*4882a593Smuzhiyun 	if (!resume)
515*4882a593Smuzhiyun 		dev_priv->vram_addr = ioremap_wc(dev_priv->stolen_base,
516*4882a593Smuzhiyun 						 stolen_size);
517*4882a593Smuzhiyun 
518*4882a593Smuzhiyun 	if (!dev_priv->vram_addr) {
519*4882a593Smuzhiyun 		dev_err(dev->dev, "Failure to map stolen base.\n");
520*4882a593Smuzhiyun 		ret = -ENOMEM;
521*4882a593Smuzhiyun 		goto out_err;
522*4882a593Smuzhiyun 	}
523*4882a593Smuzhiyun 
524*4882a593Smuzhiyun 	/*
525*4882a593Smuzhiyun 	 * Insert vram stolen pages into the GTT
526*4882a593Smuzhiyun 	 */
527*4882a593Smuzhiyun 
528*4882a593Smuzhiyun 	pfn_base = dev_priv->stolen_base >> PAGE_SHIFT;
529*4882a593Smuzhiyun 	num_pages = vram_stolen_size >> PAGE_SHIFT;
530*4882a593Smuzhiyun 	dev_dbg(dev->dev, "Set up %d stolen pages starting at 0x%08x, GTT offset %dK\n",
531*4882a593Smuzhiyun 		num_pages, pfn_base << PAGE_SHIFT, 0);
532*4882a593Smuzhiyun 	for (i = 0; i < num_pages; ++i) {
533*4882a593Smuzhiyun 		pte = psb_gtt_mask_pte(pfn_base + i, PSB_MMU_CACHED_MEMORY);
534*4882a593Smuzhiyun 		iowrite32(pte, dev_priv->gtt_map + i);
535*4882a593Smuzhiyun 	}
536*4882a593Smuzhiyun 
537*4882a593Smuzhiyun 	/*
538*4882a593Smuzhiyun 	 * Init rest of GTT to the scratch page to avoid accidents or scribbles
539*4882a593Smuzhiyun 	 */
540*4882a593Smuzhiyun 
541*4882a593Smuzhiyun 	pfn_base = page_to_pfn(dev_priv->scratch_page);
542*4882a593Smuzhiyun 	pte = psb_gtt_mask_pte(pfn_base, PSB_MMU_CACHED_MEMORY);
543*4882a593Smuzhiyun 	for (; i < gtt_pages; ++i)
544*4882a593Smuzhiyun 		iowrite32(pte, dev_priv->gtt_map + i);
545*4882a593Smuzhiyun 
546*4882a593Smuzhiyun 	(void) ioread32(dev_priv->gtt_map + i - 1);
547*4882a593Smuzhiyun 	return 0;
548*4882a593Smuzhiyun 
549*4882a593Smuzhiyun out_err:
550*4882a593Smuzhiyun 	psb_gtt_takedown(dev);
551*4882a593Smuzhiyun 	return ret;
552*4882a593Smuzhiyun }
553*4882a593Smuzhiyun 
psb_gtt_restore(struct drm_device * dev)554*4882a593Smuzhiyun int psb_gtt_restore(struct drm_device *dev)
555*4882a593Smuzhiyun {
556*4882a593Smuzhiyun 	struct drm_psb_private *dev_priv = dev->dev_private;
557*4882a593Smuzhiyun 	struct resource *r = dev_priv->gtt_mem->child;
558*4882a593Smuzhiyun 	struct gtt_range *range;
559*4882a593Smuzhiyun 	unsigned int restored = 0, total = 0, size = 0;
560*4882a593Smuzhiyun 
561*4882a593Smuzhiyun 	/* On resume, the gtt_mutex is already initialized */
562*4882a593Smuzhiyun 	mutex_lock(&dev_priv->gtt_mutex);
563*4882a593Smuzhiyun 	psb_gtt_init(dev, 1);
564*4882a593Smuzhiyun 
565*4882a593Smuzhiyun 	while (r != NULL) {
566*4882a593Smuzhiyun 		range = container_of(r, struct gtt_range, resource);
567*4882a593Smuzhiyun 		if (range->pages) {
568*4882a593Smuzhiyun 			psb_gtt_insert(dev, range, 1);
569*4882a593Smuzhiyun 			size += range->resource.end - range->resource.start;
570*4882a593Smuzhiyun 			restored++;
571*4882a593Smuzhiyun 		}
572*4882a593Smuzhiyun 		r = r->sibling;
573*4882a593Smuzhiyun 		total++;
574*4882a593Smuzhiyun 	}
575*4882a593Smuzhiyun 	mutex_unlock(&dev_priv->gtt_mutex);
576*4882a593Smuzhiyun 	DRM_DEBUG_DRIVER("Restored %u of %u gtt ranges (%u KB)", restored,
577*4882a593Smuzhiyun 			 total, (size / 1024));
578*4882a593Smuzhiyun 
579*4882a593Smuzhiyun 	return 0;
580*4882a593Smuzhiyun }
581