1*4882a593Smuzhiyun /***************************************************************************\
2*4882a593Smuzhiyun |* *|
3*4882a593Smuzhiyun |* Copyright 1993-1999 NVIDIA, Corporation. All rights reserved. *|
4*4882a593Smuzhiyun |* *|
5*4882a593Smuzhiyun |* NOTICE TO USER: The source code is copyrighted under U.S. and *|
6*4882a593Smuzhiyun |* international laws. Users and possessors of this source code are *|
7*4882a593Smuzhiyun |* hereby granted a nonexclusive, royalty-free copyright license to *|
8*4882a593Smuzhiyun |* use this code in individual and commercial software. *|
9*4882a593Smuzhiyun |* *|
10*4882a593Smuzhiyun |* Any use of this source code must include, in the user documenta- *|
11*4882a593Smuzhiyun |* tion and internal comments to the code, notices to the end user *|
12*4882a593Smuzhiyun |* as follows: *|
13*4882a593Smuzhiyun |* *|
14*4882a593Smuzhiyun |* Copyright 1993-1999 NVIDIA, Corporation. All rights reserved. *|
15*4882a593Smuzhiyun |* *|
16*4882a593Smuzhiyun |* NVIDIA, CORPORATION MAKES NO REPRESENTATION ABOUT THE SUITABILITY *|
17*4882a593Smuzhiyun |* OF THIS SOURCE CODE FOR ANY PURPOSE. IT IS PROVIDED "AS IS" *|
18*4882a593Smuzhiyun |* WITHOUT EXPRESS OR IMPLIED WARRANTY OF ANY KIND. NVIDIA, CORPOR- *|
19*4882a593Smuzhiyun |* ATION DISCLAIMS ALL WARRANTIES WITH REGARD TO THIS SOURCE CODE, *|
20*4882a593Smuzhiyun |* INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY, NONINFRINGE- *|
21*4882a593Smuzhiyun |* MENT, AND FITNESS FOR A PARTICULAR PURPOSE. IN NO EVENT SHALL *|
22*4882a593Smuzhiyun |* NVIDIA, CORPORATION BE LIABLE FOR ANY SPECIAL, INDIRECT, INCI- *|
23*4882a593Smuzhiyun |* DENTAL, OR CONSEQUENTIAL DAMAGES, OR ANY DAMAGES WHATSOEVER RE- *|
24*4882a593Smuzhiyun |* SULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION *|
25*4882a593Smuzhiyun |* OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF *|
26*4882a593Smuzhiyun |* OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOURCE CODE. *|
27*4882a593Smuzhiyun |* *|
28*4882a593Smuzhiyun |* U.S. Government End Users. This source code is a "commercial *|
29*4882a593Smuzhiyun |* item," as that term is defined at 48 C.F.R. 2.101 (OCT 1995), *|
30*4882a593Smuzhiyun |* consisting of "commercial computer software" and "commercial *|
31*4882a593Smuzhiyun |* computer software documentation," as such terms are used in *|
32*4882a593Smuzhiyun |* 48 C.F.R. 12.212 (SEPT 1995) and is provided to the U.S. Govern- *|
33*4882a593Smuzhiyun |* ment only as a commercial end item. Consistent with 48 C.F.R. *|
34*4882a593Smuzhiyun |* 12.212 and 48 C.F.R. 227.7202-1 through 227.7202-4 (JUNE 1995), *|
35*4882a593Smuzhiyun |* all U.S. Government End Users acquire the source code with only *|
36*4882a593Smuzhiyun |* those rights set forth herein. *|
37*4882a593Smuzhiyun |* *|
38*4882a593Smuzhiyun \***************************************************************************/
39*4882a593Smuzhiyun
40*4882a593Smuzhiyun /*
41*4882a593Smuzhiyun * GPL licensing note -- nVidia is allowing a liberal interpretation of
42*4882a593Smuzhiyun * the documentation restriction above, to merely say that this nVidia's
43*4882a593Smuzhiyun * copyright and disclaimer should be included with all code derived
44*4882a593Smuzhiyun * from this source. -- Jeff Garzik <jgarzik@pobox.com>, 01/Nov/99
45*4882a593Smuzhiyun */
46*4882a593Smuzhiyun
47*4882a593Smuzhiyun /* $XFree86: xc/programs/Xserver/hw/xfree86/drivers/nv/riva_hw.c,v 1.33 2002/08/05 20:47:06 mvojkovi Exp $ */
48*4882a593Smuzhiyun
49*4882a593Smuzhiyun #include <linux/kernel.h>
50*4882a593Smuzhiyun #include <linux/pci.h>
51*4882a593Smuzhiyun #include <linux/pci_ids.h>
52*4882a593Smuzhiyun #include "riva_hw.h"
53*4882a593Smuzhiyun #include "riva_tbl.h"
54*4882a593Smuzhiyun #include "nv_type.h"
55*4882a593Smuzhiyun
56*4882a593Smuzhiyun /*
57*4882a593Smuzhiyun * This file is an OS-agnostic file used to make RIVA 128 and RIVA TNT
58*4882a593Smuzhiyun * operate identically (except TNT has more memory and better 3D quality.
59*4882a593Smuzhiyun */
nv3Busy(RIVA_HW_INST * chip)60*4882a593Smuzhiyun static int nv3Busy
61*4882a593Smuzhiyun (
62*4882a593Smuzhiyun RIVA_HW_INST *chip
63*4882a593Smuzhiyun )
64*4882a593Smuzhiyun {
65*4882a593Smuzhiyun return ((NV_RD32(&chip->Rop->FifoFree, 0) < chip->FifoEmptyCount) ||
66*4882a593Smuzhiyun NV_RD32(&chip->PGRAPH[0x000006B0/4], 0) & 0x01);
67*4882a593Smuzhiyun }
nv4Busy(RIVA_HW_INST * chip)68*4882a593Smuzhiyun static int nv4Busy
69*4882a593Smuzhiyun (
70*4882a593Smuzhiyun RIVA_HW_INST *chip
71*4882a593Smuzhiyun )
72*4882a593Smuzhiyun {
73*4882a593Smuzhiyun return ((NV_RD32(&chip->Rop->FifoFree, 0) < chip->FifoEmptyCount) ||
74*4882a593Smuzhiyun NV_RD32(&chip->PGRAPH[0x00000700/4], 0) & 0x01);
75*4882a593Smuzhiyun }
nv10Busy(RIVA_HW_INST * chip)76*4882a593Smuzhiyun static int nv10Busy
77*4882a593Smuzhiyun (
78*4882a593Smuzhiyun RIVA_HW_INST *chip
79*4882a593Smuzhiyun )
80*4882a593Smuzhiyun {
81*4882a593Smuzhiyun return ((NV_RD32(&chip->Rop->FifoFree, 0) < chip->FifoEmptyCount) ||
82*4882a593Smuzhiyun NV_RD32(&chip->PGRAPH[0x00000700/4], 0) & 0x01);
83*4882a593Smuzhiyun }
84*4882a593Smuzhiyun
vgaLockUnlock(RIVA_HW_INST * chip,int Lock)85*4882a593Smuzhiyun static void vgaLockUnlock
86*4882a593Smuzhiyun (
87*4882a593Smuzhiyun RIVA_HW_INST *chip,
88*4882a593Smuzhiyun int Lock
89*4882a593Smuzhiyun )
90*4882a593Smuzhiyun {
91*4882a593Smuzhiyun U008 cr11;
92*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x3D4, 0x11);
93*4882a593Smuzhiyun cr11 = VGA_RD08(chip->PCIO, 0x3D5);
94*4882a593Smuzhiyun if(Lock) cr11 |= 0x80;
95*4882a593Smuzhiyun else cr11 &= ~0x80;
96*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x3D5, cr11);
97*4882a593Smuzhiyun }
nv3LockUnlock(RIVA_HW_INST * chip,int Lock)98*4882a593Smuzhiyun static void nv3LockUnlock
99*4882a593Smuzhiyun (
100*4882a593Smuzhiyun RIVA_HW_INST *chip,
101*4882a593Smuzhiyun int Lock
102*4882a593Smuzhiyun )
103*4882a593Smuzhiyun {
104*4882a593Smuzhiyun VGA_WR08(chip->PVIO, 0x3C4, 0x06);
105*4882a593Smuzhiyun VGA_WR08(chip->PVIO, 0x3C5, Lock ? 0x99 : 0x57);
106*4882a593Smuzhiyun vgaLockUnlock(chip, Lock);
107*4882a593Smuzhiyun }
nv4LockUnlock(RIVA_HW_INST * chip,int Lock)108*4882a593Smuzhiyun static void nv4LockUnlock
109*4882a593Smuzhiyun (
110*4882a593Smuzhiyun RIVA_HW_INST *chip,
111*4882a593Smuzhiyun int Lock
112*4882a593Smuzhiyun )
113*4882a593Smuzhiyun {
114*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x3D4, 0x1F);
115*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x3D5, Lock ? 0x99 : 0x57);
116*4882a593Smuzhiyun vgaLockUnlock(chip, Lock);
117*4882a593Smuzhiyun }
118*4882a593Smuzhiyun
ShowHideCursor(RIVA_HW_INST * chip,int ShowHide)119*4882a593Smuzhiyun static int ShowHideCursor
120*4882a593Smuzhiyun (
121*4882a593Smuzhiyun RIVA_HW_INST *chip,
122*4882a593Smuzhiyun int ShowHide
123*4882a593Smuzhiyun )
124*4882a593Smuzhiyun {
125*4882a593Smuzhiyun int cursor;
126*4882a593Smuzhiyun cursor = chip->CurrentState->cursor1;
127*4882a593Smuzhiyun chip->CurrentState->cursor1 = (chip->CurrentState->cursor1 & 0xFE) |
128*4882a593Smuzhiyun (ShowHide & 0x01);
129*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x3D4, 0x31);
130*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x3D5, chip->CurrentState->cursor1);
131*4882a593Smuzhiyun return (cursor & 0x01);
132*4882a593Smuzhiyun }
133*4882a593Smuzhiyun
134*4882a593Smuzhiyun /****************************************************************************\
135*4882a593Smuzhiyun * *
136*4882a593Smuzhiyun * The video arbitration routines calculate some "magic" numbers. Fixes *
137*4882a593Smuzhiyun * the snow seen when accessing the framebuffer without it. *
138*4882a593Smuzhiyun * It just works (I hope). *
139*4882a593Smuzhiyun * *
140*4882a593Smuzhiyun \****************************************************************************/
141*4882a593Smuzhiyun
142*4882a593Smuzhiyun #define DEFAULT_GR_LWM 100
143*4882a593Smuzhiyun #define DEFAULT_VID_LWM 100
144*4882a593Smuzhiyun #define DEFAULT_GR_BURST_SIZE 256
145*4882a593Smuzhiyun #define DEFAULT_VID_BURST_SIZE 128
146*4882a593Smuzhiyun #define VIDEO 0
147*4882a593Smuzhiyun #define GRAPHICS 1
148*4882a593Smuzhiyun #define MPORT 2
149*4882a593Smuzhiyun #define ENGINE 3
150*4882a593Smuzhiyun #define GFIFO_SIZE 320
151*4882a593Smuzhiyun #define GFIFO_SIZE_128 256
152*4882a593Smuzhiyun #define MFIFO_SIZE 120
153*4882a593Smuzhiyun #define VFIFO_SIZE 256
154*4882a593Smuzhiyun
155*4882a593Smuzhiyun typedef struct {
156*4882a593Smuzhiyun int gdrain_rate;
157*4882a593Smuzhiyun int vdrain_rate;
158*4882a593Smuzhiyun int mdrain_rate;
159*4882a593Smuzhiyun int gburst_size;
160*4882a593Smuzhiyun int vburst_size;
161*4882a593Smuzhiyun char vid_en;
162*4882a593Smuzhiyun char gr_en;
163*4882a593Smuzhiyun int wcmocc, wcgocc, wcvocc, wcvlwm, wcglwm;
164*4882a593Smuzhiyun int by_gfacc;
165*4882a593Smuzhiyun char vid_only_once;
166*4882a593Smuzhiyun char gr_only_once;
167*4882a593Smuzhiyun char first_vacc;
168*4882a593Smuzhiyun char first_gacc;
169*4882a593Smuzhiyun char first_macc;
170*4882a593Smuzhiyun int vocc;
171*4882a593Smuzhiyun int gocc;
172*4882a593Smuzhiyun int mocc;
173*4882a593Smuzhiyun char cur;
174*4882a593Smuzhiyun char engine_en;
175*4882a593Smuzhiyun char converged;
176*4882a593Smuzhiyun int priority;
177*4882a593Smuzhiyun } nv3_arb_info;
178*4882a593Smuzhiyun typedef struct {
179*4882a593Smuzhiyun int graphics_lwm;
180*4882a593Smuzhiyun int video_lwm;
181*4882a593Smuzhiyun int graphics_burst_size;
182*4882a593Smuzhiyun int video_burst_size;
183*4882a593Smuzhiyun int graphics_hi_priority;
184*4882a593Smuzhiyun int media_hi_priority;
185*4882a593Smuzhiyun int rtl_values;
186*4882a593Smuzhiyun int valid;
187*4882a593Smuzhiyun } nv3_fifo_info;
188*4882a593Smuzhiyun typedef struct {
189*4882a593Smuzhiyun char pix_bpp;
190*4882a593Smuzhiyun char enable_video;
191*4882a593Smuzhiyun char gr_during_vid;
192*4882a593Smuzhiyun char enable_mp;
193*4882a593Smuzhiyun int memory_width;
194*4882a593Smuzhiyun int video_scale;
195*4882a593Smuzhiyun int pclk_khz;
196*4882a593Smuzhiyun int mclk_khz;
197*4882a593Smuzhiyun int mem_page_miss;
198*4882a593Smuzhiyun int mem_latency;
199*4882a593Smuzhiyun char mem_aligned;
200*4882a593Smuzhiyun } nv3_sim_state;
201*4882a593Smuzhiyun typedef struct {
202*4882a593Smuzhiyun int graphics_lwm;
203*4882a593Smuzhiyun int video_lwm;
204*4882a593Smuzhiyun int graphics_burst_size;
205*4882a593Smuzhiyun int video_burst_size;
206*4882a593Smuzhiyun int valid;
207*4882a593Smuzhiyun } nv4_fifo_info;
208*4882a593Smuzhiyun typedef struct {
209*4882a593Smuzhiyun int pclk_khz;
210*4882a593Smuzhiyun int mclk_khz;
211*4882a593Smuzhiyun int nvclk_khz;
212*4882a593Smuzhiyun char mem_page_miss;
213*4882a593Smuzhiyun char mem_latency;
214*4882a593Smuzhiyun int memory_width;
215*4882a593Smuzhiyun char enable_video;
216*4882a593Smuzhiyun char gr_during_vid;
217*4882a593Smuzhiyun char pix_bpp;
218*4882a593Smuzhiyun char mem_aligned;
219*4882a593Smuzhiyun char enable_mp;
220*4882a593Smuzhiyun } nv4_sim_state;
221*4882a593Smuzhiyun typedef struct {
222*4882a593Smuzhiyun int graphics_lwm;
223*4882a593Smuzhiyun int video_lwm;
224*4882a593Smuzhiyun int graphics_burst_size;
225*4882a593Smuzhiyun int video_burst_size;
226*4882a593Smuzhiyun int valid;
227*4882a593Smuzhiyun } nv10_fifo_info;
228*4882a593Smuzhiyun typedef struct {
229*4882a593Smuzhiyun int pclk_khz;
230*4882a593Smuzhiyun int mclk_khz;
231*4882a593Smuzhiyun int nvclk_khz;
232*4882a593Smuzhiyun char mem_page_miss;
233*4882a593Smuzhiyun char mem_latency;
234*4882a593Smuzhiyun u32 memory_type;
235*4882a593Smuzhiyun int memory_width;
236*4882a593Smuzhiyun char enable_video;
237*4882a593Smuzhiyun char gr_during_vid;
238*4882a593Smuzhiyun char pix_bpp;
239*4882a593Smuzhiyun char mem_aligned;
240*4882a593Smuzhiyun char enable_mp;
241*4882a593Smuzhiyun } nv10_sim_state;
nv3_iterate(nv3_fifo_info * res_info,nv3_sim_state * state,nv3_arb_info * ainfo)242*4882a593Smuzhiyun static int nv3_iterate(nv3_fifo_info *res_info, nv3_sim_state * state, nv3_arb_info *ainfo)
243*4882a593Smuzhiyun {
244*4882a593Smuzhiyun int iter = 0;
245*4882a593Smuzhiyun int tmp;
246*4882a593Smuzhiyun int vfsize, mfsize, gfsize;
247*4882a593Smuzhiyun int mburst_size = 32;
248*4882a593Smuzhiyun int mmisses, gmisses, vmisses;
249*4882a593Smuzhiyun int misses;
250*4882a593Smuzhiyun int vlwm, glwm, mlwm;
251*4882a593Smuzhiyun int last, next, cur;
252*4882a593Smuzhiyun int max_gfsize ;
253*4882a593Smuzhiyun long ns;
254*4882a593Smuzhiyun
255*4882a593Smuzhiyun vlwm = 0;
256*4882a593Smuzhiyun glwm = 0;
257*4882a593Smuzhiyun mlwm = 0;
258*4882a593Smuzhiyun vfsize = 0;
259*4882a593Smuzhiyun gfsize = 0;
260*4882a593Smuzhiyun cur = ainfo->cur;
261*4882a593Smuzhiyun mmisses = 2;
262*4882a593Smuzhiyun gmisses = 2;
263*4882a593Smuzhiyun vmisses = 2;
264*4882a593Smuzhiyun if (ainfo->gburst_size == 128) max_gfsize = GFIFO_SIZE_128;
265*4882a593Smuzhiyun else max_gfsize = GFIFO_SIZE;
266*4882a593Smuzhiyun max_gfsize = GFIFO_SIZE;
267*4882a593Smuzhiyun while (1)
268*4882a593Smuzhiyun {
269*4882a593Smuzhiyun if (ainfo->vid_en)
270*4882a593Smuzhiyun {
271*4882a593Smuzhiyun if (ainfo->wcvocc > ainfo->vocc) ainfo->wcvocc = ainfo->vocc;
272*4882a593Smuzhiyun if (ainfo->wcvlwm > vlwm) ainfo->wcvlwm = vlwm ;
273*4882a593Smuzhiyun ns = 1000000 * ainfo->vburst_size/(state->memory_width/8)/state->mclk_khz;
274*4882a593Smuzhiyun vfsize = ns * ainfo->vdrain_rate / 1000000;
275*4882a593Smuzhiyun vfsize = ainfo->wcvlwm - ainfo->vburst_size + vfsize;
276*4882a593Smuzhiyun }
277*4882a593Smuzhiyun if (state->enable_mp)
278*4882a593Smuzhiyun {
279*4882a593Smuzhiyun if (ainfo->wcmocc > ainfo->mocc) ainfo->wcmocc = ainfo->mocc;
280*4882a593Smuzhiyun }
281*4882a593Smuzhiyun if (ainfo->gr_en)
282*4882a593Smuzhiyun {
283*4882a593Smuzhiyun if (ainfo->wcglwm > glwm) ainfo->wcglwm = glwm ;
284*4882a593Smuzhiyun if (ainfo->wcgocc > ainfo->gocc) ainfo->wcgocc = ainfo->gocc;
285*4882a593Smuzhiyun ns = 1000000 * (ainfo->gburst_size/(state->memory_width/8))/state->mclk_khz;
286*4882a593Smuzhiyun gfsize = (ns * (long) ainfo->gdrain_rate)/1000000;
287*4882a593Smuzhiyun gfsize = ainfo->wcglwm - ainfo->gburst_size + gfsize;
288*4882a593Smuzhiyun }
289*4882a593Smuzhiyun mfsize = 0;
290*4882a593Smuzhiyun if (!state->gr_during_vid && ainfo->vid_en)
291*4882a593Smuzhiyun if (ainfo->vid_en && (ainfo->vocc < 0) && !ainfo->vid_only_once)
292*4882a593Smuzhiyun next = VIDEO;
293*4882a593Smuzhiyun else if (ainfo->mocc < 0)
294*4882a593Smuzhiyun next = MPORT;
295*4882a593Smuzhiyun else if (ainfo->gocc< ainfo->by_gfacc)
296*4882a593Smuzhiyun next = GRAPHICS;
297*4882a593Smuzhiyun else return (0);
298*4882a593Smuzhiyun else switch (ainfo->priority)
299*4882a593Smuzhiyun {
300*4882a593Smuzhiyun case VIDEO:
301*4882a593Smuzhiyun if (ainfo->vid_en && ainfo->vocc<0 && !ainfo->vid_only_once)
302*4882a593Smuzhiyun next = VIDEO;
303*4882a593Smuzhiyun else if (ainfo->gr_en && ainfo->gocc<0 && !ainfo->gr_only_once)
304*4882a593Smuzhiyun next = GRAPHICS;
305*4882a593Smuzhiyun else if (ainfo->mocc<0)
306*4882a593Smuzhiyun next = MPORT;
307*4882a593Smuzhiyun else return (0);
308*4882a593Smuzhiyun break;
309*4882a593Smuzhiyun case GRAPHICS:
310*4882a593Smuzhiyun if (ainfo->gr_en && ainfo->gocc<0 && !ainfo->gr_only_once)
311*4882a593Smuzhiyun next = GRAPHICS;
312*4882a593Smuzhiyun else if (ainfo->vid_en && ainfo->vocc<0 && !ainfo->vid_only_once)
313*4882a593Smuzhiyun next = VIDEO;
314*4882a593Smuzhiyun else if (ainfo->mocc<0)
315*4882a593Smuzhiyun next = MPORT;
316*4882a593Smuzhiyun else return (0);
317*4882a593Smuzhiyun break;
318*4882a593Smuzhiyun default:
319*4882a593Smuzhiyun if (ainfo->mocc<0)
320*4882a593Smuzhiyun next = MPORT;
321*4882a593Smuzhiyun else if (ainfo->gr_en && ainfo->gocc<0 && !ainfo->gr_only_once)
322*4882a593Smuzhiyun next = GRAPHICS;
323*4882a593Smuzhiyun else if (ainfo->vid_en && ainfo->vocc<0 && !ainfo->vid_only_once)
324*4882a593Smuzhiyun next = VIDEO;
325*4882a593Smuzhiyun else return (0);
326*4882a593Smuzhiyun break;
327*4882a593Smuzhiyun }
328*4882a593Smuzhiyun last = cur;
329*4882a593Smuzhiyun cur = next;
330*4882a593Smuzhiyun iter++;
331*4882a593Smuzhiyun switch (cur)
332*4882a593Smuzhiyun {
333*4882a593Smuzhiyun case VIDEO:
334*4882a593Smuzhiyun if (last==cur) misses = 0;
335*4882a593Smuzhiyun else if (ainfo->first_vacc) misses = vmisses;
336*4882a593Smuzhiyun else misses = 1;
337*4882a593Smuzhiyun ainfo->first_vacc = 0;
338*4882a593Smuzhiyun if (last!=cur)
339*4882a593Smuzhiyun {
340*4882a593Smuzhiyun ns = 1000000 * (vmisses*state->mem_page_miss + state->mem_latency)/state->mclk_khz;
341*4882a593Smuzhiyun vlwm = ns * ainfo->vdrain_rate/ 1000000;
342*4882a593Smuzhiyun vlwm = ainfo->vocc - vlwm;
343*4882a593Smuzhiyun }
344*4882a593Smuzhiyun ns = 1000000*(misses*state->mem_page_miss + ainfo->vburst_size)/(state->memory_width/8)/state->mclk_khz;
345*4882a593Smuzhiyun ainfo->vocc = ainfo->vocc + ainfo->vburst_size - ns*ainfo->vdrain_rate/1000000;
346*4882a593Smuzhiyun ainfo->gocc = ainfo->gocc - ns*ainfo->gdrain_rate/1000000;
347*4882a593Smuzhiyun ainfo->mocc = ainfo->mocc - ns*ainfo->mdrain_rate/1000000;
348*4882a593Smuzhiyun break;
349*4882a593Smuzhiyun case GRAPHICS:
350*4882a593Smuzhiyun if (last==cur) misses = 0;
351*4882a593Smuzhiyun else if (ainfo->first_gacc) misses = gmisses;
352*4882a593Smuzhiyun else misses = 1;
353*4882a593Smuzhiyun ainfo->first_gacc = 0;
354*4882a593Smuzhiyun if (last!=cur)
355*4882a593Smuzhiyun {
356*4882a593Smuzhiyun ns = 1000000*(gmisses*state->mem_page_miss + state->mem_latency)/state->mclk_khz ;
357*4882a593Smuzhiyun glwm = ns * ainfo->gdrain_rate/1000000;
358*4882a593Smuzhiyun glwm = ainfo->gocc - glwm;
359*4882a593Smuzhiyun }
360*4882a593Smuzhiyun ns = 1000000*(misses*state->mem_page_miss + ainfo->gburst_size/(state->memory_width/8))/state->mclk_khz;
361*4882a593Smuzhiyun ainfo->vocc = ainfo->vocc + 0 - ns*ainfo->vdrain_rate/1000000;
362*4882a593Smuzhiyun ainfo->gocc = ainfo->gocc + ainfo->gburst_size - ns*ainfo->gdrain_rate/1000000;
363*4882a593Smuzhiyun ainfo->mocc = ainfo->mocc + 0 - ns*ainfo->mdrain_rate/1000000;
364*4882a593Smuzhiyun break;
365*4882a593Smuzhiyun default:
366*4882a593Smuzhiyun if (last==cur) misses = 0;
367*4882a593Smuzhiyun else if (ainfo->first_macc) misses = mmisses;
368*4882a593Smuzhiyun else misses = 1;
369*4882a593Smuzhiyun ainfo->first_macc = 0;
370*4882a593Smuzhiyun ns = 1000000*(misses*state->mem_page_miss + mburst_size/(state->memory_width/8))/state->mclk_khz;
371*4882a593Smuzhiyun ainfo->vocc = ainfo->vocc + 0 - ns*ainfo->vdrain_rate/1000000;
372*4882a593Smuzhiyun ainfo->gocc = ainfo->gocc + 0 - ns*ainfo->gdrain_rate/1000000;
373*4882a593Smuzhiyun ainfo->mocc = ainfo->mocc + mburst_size - ns*ainfo->mdrain_rate/1000000;
374*4882a593Smuzhiyun break;
375*4882a593Smuzhiyun }
376*4882a593Smuzhiyun if (iter>100)
377*4882a593Smuzhiyun {
378*4882a593Smuzhiyun ainfo->converged = 0;
379*4882a593Smuzhiyun return (1);
380*4882a593Smuzhiyun }
381*4882a593Smuzhiyun ns = 1000000*ainfo->gburst_size/(state->memory_width/8)/state->mclk_khz;
382*4882a593Smuzhiyun tmp = ns * ainfo->gdrain_rate/1000000;
383*4882a593Smuzhiyun if (abs(ainfo->gburst_size) + ((abs(ainfo->wcglwm) + 16 ) & ~0x7) - tmp > max_gfsize)
384*4882a593Smuzhiyun {
385*4882a593Smuzhiyun ainfo->converged = 0;
386*4882a593Smuzhiyun return (1);
387*4882a593Smuzhiyun }
388*4882a593Smuzhiyun ns = 1000000*ainfo->vburst_size/(state->memory_width/8)/state->mclk_khz;
389*4882a593Smuzhiyun tmp = ns * ainfo->vdrain_rate/1000000;
390*4882a593Smuzhiyun if (abs(ainfo->vburst_size) + (abs(ainfo->wcvlwm + 32) & ~0xf) - tmp> VFIFO_SIZE)
391*4882a593Smuzhiyun {
392*4882a593Smuzhiyun ainfo->converged = 0;
393*4882a593Smuzhiyun return (1);
394*4882a593Smuzhiyun }
395*4882a593Smuzhiyun if (abs(ainfo->gocc) > max_gfsize)
396*4882a593Smuzhiyun {
397*4882a593Smuzhiyun ainfo->converged = 0;
398*4882a593Smuzhiyun return (1);
399*4882a593Smuzhiyun }
400*4882a593Smuzhiyun if (abs(ainfo->vocc) > VFIFO_SIZE)
401*4882a593Smuzhiyun {
402*4882a593Smuzhiyun ainfo->converged = 0;
403*4882a593Smuzhiyun return (1);
404*4882a593Smuzhiyun }
405*4882a593Smuzhiyun if (abs(ainfo->mocc) > MFIFO_SIZE)
406*4882a593Smuzhiyun {
407*4882a593Smuzhiyun ainfo->converged = 0;
408*4882a593Smuzhiyun return (1);
409*4882a593Smuzhiyun }
410*4882a593Smuzhiyun if (abs(vfsize) > VFIFO_SIZE)
411*4882a593Smuzhiyun {
412*4882a593Smuzhiyun ainfo->converged = 0;
413*4882a593Smuzhiyun return (1);
414*4882a593Smuzhiyun }
415*4882a593Smuzhiyun if (abs(gfsize) > max_gfsize)
416*4882a593Smuzhiyun {
417*4882a593Smuzhiyun ainfo->converged = 0;
418*4882a593Smuzhiyun return (1);
419*4882a593Smuzhiyun }
420*4882a593Smuzhiyun if (abs(mfsize) > MFIFO_SIZE)
421*4882a593Smuzhiyun {
422*4882a593Smuzhiyun ainfo->converged = 0;
423*4882a593Smuzhiyun return (1);
424*4882a593Smuzhiyun }
425*4882a593Smuzhiyun }
426*4882a593Smuzhiyun }
nv3_arb(nv3_fifo_info * res_info,nv3_sim_state * state,nv3_arb_info * ainfo)427*4882a593Smuzhiyun static char nv3_arb(nv3_fifo_info * res_info, nv3_sim_state * state, nv3_arb_info *ainfo)
428*4882a593Smuzhiyun {
429*4882a593Smuzhiyun long ens, vns, mns, gns;
430*4882a593Smuzhiyun int mmisses, gmisses, vmisses, eburst_size, mburst_size;
431*4882a593Smuzhiyun int refresh_cycle;
432*4882a593Smuzhiyun
433*4882a593Smuzhiyun refresh_cycle = 2*(state->mclk_khz/state->pclk_khz) + 5;
434*4882a593Smuzhiyun mmisses = 2;
435*4882a593Smuzhiyun if (state->mem_aligned) gmisses = 2;
436*4882a593Smuzhiyun else gmisses = 3;
437*4882a593Smuzhiyun vmisses = 2;
438*4882a593Smuzhiyun eburst_size = state->memory_width * 1;
439*4882a593Smuzhiyun mburst_size = 32;
440*4882a593Smuzhiyun gns = 1000000 * (gmisses*state->mem_page_miss + state->mem_latency)/state->mclk_khz;
441*4882a593Smuzhiyun ainfo->by_gfacc = gns*ainfo->gdrain_rate/1000000;
442*4882a593Smuzhiyun ainfo->wcmocc = 0;
443*4882a593Smuzhiyun ainfo->wcgocc = 0;
444*4882a593Smuzhiyun ainfo->wcvocc = 0;
445*4882a593Smuzhiyun ainfo->wcvlwm = 0;
446*4882a593Smuzhiyun ainfo->wcglwm = 0;
447*4882a593Smuzhiyun ainfo->engine_en = 1;
448*4882a593Smuzhiyun ainfo->converged = 1;
449*4882a593Smuzhiyun if (ainfo->engine_en)
450*4882a593Smuzhiyun {
451*4882a593Smuzhiyun ens = 1000000*(state->mem_page_miss + eburst_size/(state->memory_width/8) +refresh_cycle)/state->mclk_khz;
452*4882a593Smuzhiyun ainfo->mocc = state->enable_mp ? 0-ens*ainfo->mdrain_rate/1000000 : 0;
453*4882a593Smuzhiyun ainfo->vocc = ainfo->vid_en ? 0-ens*ainfo->vdrain_rate/1000000 : 0;
454*4882a593Smuzhiyun ainfo->gocc = ainfo->gr_en ? 0-ens*ainfo->gdrain_rate/1000000 : 0;
455*4882a593Smuzhiyun ainfo->cur = ENGINE;
456*4882a593Smuzhiyun ainfo->first_vacc = 1;
457*4882a593Smuzhiyun ainfo->first_gacc = 1;
458*4882a593Smuzhiyun ainfo->first_macc = 1;
459*4882a593Smuzhiyun nv3_iterate(res_info, state,ainfo);
460*4882a593Smuzhiyun }
461*4882a593Smuzhiyun if (state->enable_mp)
462*4882a593Smuzhiyun {
463*4882a593Smuzhiyun mns = 1000000 * (mmisses*state->mem_page_miss + mburst_size/(state->memory_width/8) + refresh_cycle)/state->mclk_khz;
464*4882a593Smuzhiyun ainfo->mocc = state->enable_mp ? 0 : mburst_size - mns*ainfo->mdrain_rate/1000000;
465*4882a593Smuzhiyun ainfo->vocc = ainfo->vid_en ? 0 : 0- mns*ainfo->vdrain_rate/1000000;
466*4882a593Smuzhiyun ainfo->gocc = ainfo->gr_en ? 0: 0- mns*ainfo->gdrain_rate/1000000;
467*4882a593Smuzhiyun ainfo->cur = MPORT;
468*4882a593Smuzhiyun ainfo->first_vacc = 1;
469*4882a593Smuzhiyun ainfo->first_gacc = 1;
470*4882a593Smuzhiyun ainfo->first_macc = 0;
471*4882a593Smuzhiyun nv3_iterate(res_info, state,ainfo);
472*4882a593Smuzhiyun }
473*4882a593Smuzhiyun if (ainfo->gr_en)
474*4882a593Smuzhiyun {
475*4882a593Smuzhiyun ainfo->first_vacc = 1;
476*4882a593Smuzhiyun ainfo->first_gacc = 0;
477*4882a593Smuzhiyun ainfo->first_macc = 1;
478*4882a593Smuzhiyun gns = 1000000*(gmisses*state->mem_page_miss + ainfo->gburst_size/(state->memory_width/8) + refresh_cycle)/state->mclk_khz;
479*4882a593Smuzhiyun ainfo->gocc = ainfo->gburst_size - gns*ainfo->gdrain_rate/1000000;
480*4882a593Smuzhiyun ainfo->vocc = ainfo->vid_en? 0-gns*ainfo->vdrain_rate/1000000 : 0;
481*4882a593Smuzhiyun ainfo->mocc = state->enable_mp ? 0-gns*ainfo->mdrain_rate/1000000: 0;
482*4882a593Smuzhiyun ainfo->cur = GRAPHICS;
483*4882a593Smuzhiyun nv3_iterate(res_info, state,ainfo);
484*4882a593Smuzhiyun }
485*4882a593Smuzhiyun if (ainfo->vid_en)
486*4882a593Smuzhiyun {
487*4882a593Smuzhiyun ainfo->first_vacc = 0;
488*4882a593Smuzhiyun ainfo->first_gacc = 1;
489*4882a593Smuzhiyun ainfo->first_macc = 1;
490*4882a593Smuzhiyun vns = 1000000*(vmisses*state->mem_page_miss + ainfo->vburst_size/(state->memory_width/8) + refresh_cycle)/state->mclk_khz;
491*4882a593Smuzhiyun ainfo->vocc = ainfo->vburst_size - vns*ainfo->vdrain_rate/1000000;
492*4882a593Smuzhiyun ainfo->gocc = ainfo->gr_en? (0-vns*ainfo->gdrain_rate/1000000) : 0;
493*4882a593Smuzhiyun ainfo->mocc = state->enable_mp? 0-vns*ainfo->mdrain_rate/1000000 :0 ;
494*4882a593Smuzhiyun ainfo->cur = VIDEO;
495*4882a593Smuzhiyun nv3_iterate(res_info, state, ainfo);
496*4882a593Smuzhiyun }
497*4882a593Smuzhiyun if (ainfo->converged)
498*4882a593Smuzhiyun {
499*4882a593Smuzhiyun res_info->graphics_lwm = (int)abs(ainfo->wcglwm) + 16;
500*4882a593Smuzhiyun res_info->video_lwm = (int)abs(ainfo->wcvlwm) + 32;
501*4882a593Smuzhiyun res_info->graphics_burst_size = ainfo->gburst_size;
502*4882a593Smuzhiyun res_info->video_burst_size = ainfo->vburst_size;
503*4882a593Smuzhiyun res_info->graphics_hi_priority = (ainfo->priority == GRAPHICS);
504*4882a593Smuzhiyun res_info->media_hi_priority = (ainfo->priority == MPORT);
505*4882a593Smuzhiyun if (res_info->video_lwm > 160)
506*4882a593Smuzhiyun {
507*4882a593Smuzhiyun res_info->graphics_lwm = 256;
508*4882a593Smuzhiyun res_info->video_lwm = 128;
509*4882a593Smuzhiyun res_info->graphics_burst_size = 64;
510*4882a593Smuzhiyun res_info->video_burst_size = 64;
511*4882a593Smuzhiyun res_info->graphics_hi_priority = 0;
512*4882a593Smuzhiyun res_info->media_hi_priority = 0;
513*4882a593Smuzhiyun ainfo->converged = 0;
514*4882a593Smuzhiyun return (0);
515*4882a593Smuzhiyun }
516*4882a593Smuzhiyun if (res_info->video_lwm > 128)
517*4882a593Smuzhiyun {
518*4882a593Smuzhiyun res_info->video_lwm = 128;
519*4882a593Smuzhiyun }
520*4882a593Smuzhiyun return (1);
521*4882a593Smuzhiyun }
522*4882a593Smuzhiyun else
523*4882a593Smuzhiyun {
524*4882a593Smuzhiyun res_info->graphics_lwm = 256;
525*4882a593Smuzhiyun res_info->video_lwm = 128;
526*4882a593Smuzhiyun res_info->graphics_burst_size = 64;
527*4882a593Smuzhiyun res_info->video_burst_size = 64;
528*4882a593Smuzhiyun res_info->graphics_hi_priority = 0;
529*4882a593Smuzhiyun res_info->media_hi_priority = 0;
530*4882a593Smuzhiyun return (0);
531*4882a593Smuzhiyun }
532*4882a593Smuzhiyun }
nv3_get_param(nv3_fifo_info * res_info,nv3_sim_state * state,nv3_arb_info * ainfo)533*4882a593Smuzhiyun static char nv3_get_param(nv3_fifo_info *res_info, nv3_sim_state * state, nv3_arb_info *ainfo)
534*4882a593Smuzhiyun {
535*4882a593Smuzhiyun int done, g,v, p;
536*4882a593Smuzhiyun
537*4882a593Smuzhiyun done = 0;
538*4882a593Smuzhiyun for (p=0; p < 2; p++)
539*4882a593Smuzhiyun {
540*4882a593Smuzhiyun for (g=128 ; g > 32; g= g>> 1)
541*4882a593Smuzhiyun {
542*4882a593Smuzhiyun for (v=128; v >=32; v = v>> 1)
543*4882a593Smuzhiyun {
544*4882a593Smuzhiyun ainfo->priority = p;
545*4882a593Smuzhiyun ainfo->gburst_size = g;
546*4882a593Smuzhiyun ainfo->vburst_size = v;
547*4882a593Smuzhiyun done = nv3_arb(res_info, state,ainfo);
548*4882a593Smuzhiyun if (done && (g==128))
549*4882a593Smuzhiyun if ((res_info->graphics_lwm + g) > 256)
550*4882a593Smuzhiyun done = 0;
551*4882a593Smuzhiyun if (done)
552*4882a593Smuzhiyun goto Done;
553*4882a593Smuzhiyun }
554*4882a593Smuzhiyun }
555*4882a593Smuzhiyun }
556*4882a593Smuzhiyun
557*4882a593Smuzhiyun Done:
558*4882a593Smuzhiyun return done;
559*4882a593Smuzhiyun }
nv3CalcArbitration(nv3_fifo_info * res_info,nv3_sim_state * state)560*4882a593Smuzhiyun static void nv3CalcArbitration
561*4882a593Smuzhiyun (
562*4882a593Smuzhiyun nv3_fifo_info * res_info,
563*4882a593Smuzhiyun nv3_sim_state * state
564*4882a593Smuzhiyun )
565*4882a593Smuzhiyun {
566*4882a593Smuzhiyun nv3_fifo_info save_info;
567*4882a593Smuzhiyun nv3_arb_info ainfo;
568*4882a593Smuzhiyun char res_gr, res_vid;
569*4882a593Smuzhiyun
570*4882a593Smuzhiyun ainfo.gr_en = 1;
571*4882a593Smuzhiyun ainfo.vid_en = state->enable_video;
572*4882a593Smuzhiyun ainfo.vid_only_once = 0;
573*4882a593Smuzhiyun ainfo.gr_only_once = 0;
574*4882a593Smuzhiyun ainfo.gdrain_rate = (int) state->pclk_khz * (state->pix_bpp/8);
575*4882a593Smuzhiyun ainfo.vdrain_rate = (int) state->pclk_khz * 2;
576*4882a593Smuzhiyun if (state->video_scale != 0)
577*4882a593Smuzhiyun ainfo.vdrain_rate = ainfo.vdrain_rate/state->video_scale;
578*4882a593Smuzhiyun ainfo.mdrain_rate = 33000;
579*4882a593Smuzhiyun res_info->rtl_values = 0;
580*4882a593Smuzhiyun if (!state->gr_during_vid && state->enable_video)
581*4882a593Smuzhiyun {
582*4882a593Smuzhiyun ainfo.gr_only_once = 1;
583*4882a593Smuzhiyun ainfo.gr_en = 1;
584*4882a593Smuzhiyun ainfo.gdrain_rate = 0;
585*4882a593Smuzhiyun res_vid = nv3_get_param(res_info, state, &ainfo);
586*4882a593Smuzhiyun res_vid = ainfo.converged;
587*4882a593Smuzhiyun save_info.video_lwm = res_info->video_lwm;
588*4882a593Smuzhiyun save_info.video_burst_size = res_info->video_burst_size;
589*4882a593Smuzhiyun ainfo.vid_en = 1;
590*4882a593Smuzhiyun ainfo.vid_only_once = 1;
591*4882a593Smuzhiyun ainfo.gr_en = 1;
592*4882a593Smuzhiyun ainfo.gdrain_rate = (int) state->pclk_khz * (state->pix_bpp/8);
593*4882a593Smuzhiyun ainfo.vdrain_rate = 0;
594*4882a593Smuzhiyun res_gr = nv3_get_param(res_info, state, &ainfo);
595*4882a593Smuzhiyun res_gr = ainfo.converged;
596*4882a593Smuzhiyun res_info->video_lwm = save_info.video_lwm;
597*4882a593Smuzhiyun res_info->video_burst_size = save_info.video_burst_size;
598*4882a593Smuzhiyun res_info->valid = res_gr & res_vid;
599*4882a593Smuzhiyun }
600*4882a593Smuzhiyun else
601*4882a593Smuzhiyun {
602*4882a593Smuzhiyun if (!ainfo.gr_en) ainfo.gdrain_rate = 0;
603*4882a593Smuzhiyun if (!ainfo.vid_en) ainfo.vdrain_rate = 0;
604*4882a593Smuzhiyun res_gr = nv3_get_param(res_info, state, &ainfo);
605*4882a593Smuzhiyun res_info->valid = ainfo.converged;
606*4882a593Smuzhiyun }
607*4882a593Smuzhiyun }
nv3UpdateArbitrationSettings(unsigned VClk,unsigned pixelDepth,unsigned * burst,unsigned * lwm,RIVA_HW_INST * chip)608*4882a593Smuzhiyun static void nv3UpdateArbitrationSettings
609*4882a593Smuzhiyun (
610*4882a593Smuzhiyun unsigned VClk,
611*4882a593Smuzhiyun unsigned pixelDepth,
612*4882a593Smuzhiyun unsigned *burst,
613*4882a593Smuzhiyun unsigned *lwm,
614*4882a593Smuzhiyun RIVA_HW_INST *chip
615*4882a593Smuzhiyun )
616*4882a593Smuzhiyun {
617*4882a593Smuzhiyun nv3_fifo_info fifo_data;
618*4882a593Smuzhiyun nv3_sim_state sim_data;
619*4882a593Smuzhiyun unsigned int M, N, P, pll, MClk;
620*4882a593Smuzhiyun
621*4882a593Smuzhiyun pll = NV_RD32(&chip->PRAMDAC0[0x00000504/4], 0);
622*4882a593Smuzhiyun M = (pll >> 0) & 0xFF; N = (pll >> 8) & 0xFF; P = (pll >> 16) & 0x0F;
623*4882a593Smuzhiyun MClk = (N * chip->CrystalFreqKHz / M) >> P;
624*4882a593Smuzhiyun sim_data.pix_bpp = (char)pixelDepth;
625*4882a593Smuzhiyun sim_data.enable_video = 0;
626*4882a593Smuzhiyun sim_data.enable_mp = 0;
627*4882a593Smuzhiyun sim_data.video_scale = 1;
628*4882a593Smuzhiyun sim_data.memory_width = (NV_RD32(&chip->PEXTDEV[0x00000000/4], 0) & 0x10) ?
629*4882a593Smuzhiyun 128 : 64;
630*4882a593Smuzhiyun sim_data.memory_width = 128;
631*4882a593Smuzhiyun
632*4882a593Smuzhiyun sim_data.mem_latency = 9;
633*4882a593Smuzhiyun sim_data.mem_aligned = 1;
634*4882a593Smuzhiyun sim_data.mem_page_miss = 11;
635*4882a593Smuzhiyun sim_data.gr_during_vid = 0;
636*4882a593Smuzhiyun sim_data.pclk_khz = VClk;
637*4882a593Smuzhiyun sim_data.mclk_khz = MClk;
638*4882a593Smuzhiyun nv3CalcArbitration(&fifo_data, &sim_data);
639*4882a593Smuzhiyun if (fifo_data.valid)
640*4882a593Smuzhiyun {
641*4882a593Smuzhiyun int b = fifo_data.graphics_burst_size >> 4;
642*4882a593Smuzhiyun *burst = 0;
643*4882a593Smuzhiyun while (b >>= 1)
644*4882a593Smuzhiyun (*burst)++;
645*4882a593Smuzhiyun *lwm = fifo_data.graphics_lwm >> 3;
646*4882a593Smuzhiyun }
647*4882a593Smuzhiyun else
648*4882a593Smuzhiyun {
649*4882a593Smuzhiyun *lwm = 0x24;
650*4882a593Smuzhiyun *burst = 0x2;
651*4882a593Smuzhiyun }
652*4882a593Smuzhiyun }
nv4CalcArbitration(nv4_fifo_info * fifo,nv4_sim_state * arb)653*4882a593Smuzhiyun static void nv4CalcArbitration
654*4882a593Smuzhiyun (
655*4882a593Smuzhiyun nv4_fifo_info *fifo,
656*4882a593Smuzhiyun nv4_sim_state *arb
657*4882a593Smuzhiyun )
658*4882a593Smuzhiyun {
659*4882a593Smuzhiyun int data, pagemiss, cas,width, video_enable, color_key_enable, bpp, align;
660*4882a593Smuzhiyun int nvclks, mclks, pclks, vpagemiss, crtpagemiss, vbs;
661*4882a593Smuzhiyun int found, mclk_extra, mclk_loop, cbs, m1, p1;
662*4882a593Smuzhiyun int mclk_freq, pclk_freq, nvclk_freq, mp_enable;
663*4882a593Smuzhiyun int us_m, us_n, us_p, video_drain_rate, crtc_drain_rate;
664*4882a593Smuzhiyun int vpm_us, us_video, vlwm, video_fill_us, cpm_us, us_crt,clwm;
665*4882a593Smuzhiyun int craw, vraw;
666*4882a593Smuzhiyun
667*4882a593Smuzhiyun fifo->valid = 1;
668*4882a593Smuzhiyun pclk_freq = arb->pclk_khz;
669*4882a593Smuzhiyun mclk_freq = arb->mclk_khz;
670*4882a593Smuzhiyun nvclk_freq = arb->nvclk_khz;
671*4882a593Smuzhiyun pagemiss = arb->mem_page_miss;
672*4882a593Smuzhiyun cas = arb->mem_latency;
673*4882a593Smuzhiyun width = arb->memory_width >> 6;
674*4882a593Smuzhiyun video_enable = arb->enable_video;
675*4882a593Smuzhiyun color_key_enable = arb->gr_during_vid;
676*4882a593Smuzhiyun bpp = arb->pix_bpp;
677*4882a593Smuzhiyun align = arb->mem_aligned;
678*4882a593Smuzhiyun mp_enable = arb->enable_mp;
679*4882a593Smuzhiyun clwm = 0;
680*4882a593Smuzhiyun vlwm = 0;
681*4882a593Smuzhiyun cbs = 128;
682*4882a593Smuzhiyun pclks = 2;
683*4882a593Smuzhiyun nvclks = 2;
684*4882a593Smuzhiyun nvclks += 2;
685*4882a593Smuzhiyun nvclks += 1;
686*4882a593Smuzhiyun mclks = 5;
687*4882a593Smuzhiyun mclks += 3;
688*4882a593Smuzhiyun mclks += 1;
689*4882a593Smuzhiyun mclks += cas;
690*4882a593Smuzhiyun mclks += 1;
691*4882a593Smuzhiyun mclks += 1;
692*4882a593Smuzhiyun mclks += 1;
693*4882a593Smuzhiyun mclks += 1;
694*4882a593Smuzhiyun mclk_extra = 3;
695*4882a593Smuzhiyun nvclks += 2;
696*4882a593Smuzhiyun nvclks += 1;
697*4882a593Smuzhiyun nvclks += 1;
698*4882a593Smuzhiyun nvclks += 1;
699*4882a593Smuzhiyun if (mp_enable)
700*4882a593Smuzhiyun mclks+=4;
701*4882a593Smuzhiyun nvclks += 0;
702*4882a593Smuzhiyun pclks += 0;
703*4882a593Smuzhiyun found = 0;
704*4882a593Smuzhiyun vbs = 0;
705*4882a593Smuzhiyun while (found != 1)
706*4882a593Smuzhiyun {
707*4882a593Smuzhiyun fifo->valid = 1;
708*4882a593Smuzhiyun found = 1;
709*4882a593Smuzhiyun mclk_loop = mclks+mclk_extra;
710*4882a593Smuzhiyun us_m = mclk_loop *1000*1000 / mclk_freq;
711*4882a593Smuzhiyun us_n = nvclks*1000*1000 / nvclk_freq;
712*4882a593Smuzhiyun us_p = nvclks*1000*1000 / pclk_freq;
713*4882a593Smuzhiyun if (video_enable)
714*4882a593Smuzhiyun {
715*4882a593Smuzhiyun video_drain_rate = pclk_freq * 2;
716*4882a593Smuzhiyun crtc_drain_rate = pclk_freq * bpp/8;
717*4882a593Smuzhiyun vpagemiss = 2;
718*4882a593Smuzhiyun vpagemiss += 1;
719*4882a593Smuzhiyun crtpagemiss = 2;
720*4882a593Smuzhiyun vpm_us = (vpagemiss * pagemiss)*1000*1000/mclk_freq;
721*4882a593Smuzhiyun if (nvclk_freq * 2 > mclk_freq * width)
722*4882a593Smuzhiyun video_fill_us = cbs*1000*1000 / 16 / nvclk_freq ;
723*4882a593Smuzhiyun else
724*4882a593Smuzhiyun video_fill_us = cbs*1000*1000 / (8 * width) / mclk_freq;
725*4882a593Smuzhiyun us_video = vpm_us + us_m + us_n + us_p + video_fill_us;
726*4882a593Smuzhiyun vlwm = us_video * video_drain_rate/(1000*1000);
727*4882a593Smuzhiyun vlwm++;
728*4882a593Smuzhiyun vbs = 128;
729*4882a593Smuzhiyun if (vlwm > 128) vbs = 64;
730*4882a593Smuzhiyun if (vlwm > (256-64)) vbs = 32;
731*4882a593Smuzhiyun if (nvclk_freq * 2 > mclk_freq * width)
732*4882a593Smuzhiyun video_fill_us = vbs *1000*1000/ 16 / nvclk_freq ;
733*4882a593Smuzhiyun else
734*4882a593Smuzhiyun video_fill_us = vbs*1000*1000 / (8 * width) / mclk_freq;
735*4882a593Smuzhiyun cpm_us = crtpagemiss * pagemiss *1000*1000/ mclk_freq;
736*4882a593Smuzhiyun us_crt =
737*4882a593Smuzhiyun us_video
738*4882a593Smuzhiyun +video_fill_us
739*4882a593Smuzhiyun +cpm_us
740*4882a593Smuzhiyun +us_m + us_n +us_p
741*4882a593Smuzhiyun ;
742*4882a593Smuzhiyun clwm = us_crt * crtc_drain_rate/(1000*1000);
743*4882a593Smuzhiyun clwm++;
744*4882a593Smuzhiyun }
745*4882a593Smuzhiyun else
746*4882a593Smuzhiyun {
747*4882a593Smuzhiyun crtc_drain_rate = pclk_freq * bpp/8;
748*4882a593Smuzhiyun crtpagemiss = 2;
749*4882a593Smuzhiyun crtpagemiss += 1;
750*4882a593Smuzhiyun cpm_us = crtpagemiss * pagemiss *1000*1000/ mclk_freq;
751*4882a593Smuzhiyun us_crt = cpm_us + us_m + us_n + us_p ;
752*4882a593Smuzhiyun clwm = us_crt * crtc_drain_rate/(1000*1000);
753*4882a593Smuzhiyun clwm++;
754*4882a593Smuzhiyun }
755*4882a593Smuzhiyun m1 = clwm + cbs - 512;
756*4882a593Smuzhiyun p1 = m1 * pclk_freq / mclk_freq;
757*4882a593Smuzhiyun p1 = p1 * bpp / 8;
758*4882a593Smuzhiyun if ((p1 < m1) && (m1 > 0))
759*4882a593Smuzhiyun {
760*4882a593Smuzhiyun fifo->valid = 0;
761*4882a593Smuzhiyun found = 0;
762*4882a593Smuzhiyun if (mclk_extra ==0) found = 1;
763*4882a593Smuzhiyun mclk_extra--;
764*4882a593Smuzhiyun }
765*4882a593Smuzhiyun else if (video_enable)
766*4882a593Smuzhiyun {
767*4882a593Smuzhiyun if ((clwm > 511) || (vlwm > 255))
768*4882a593Smuzhiyun {
769*4882a593Smuzhiyun fifo->valid = 0;
770*4882a593Smuzhiyun found = 0;
771*4882a593Smuzhiyun if (mclk_extra ==0) found = 1;
772*4882a593Smuzhiyun mclk_extra--;
773*4882a593Smuzhiyun }
774*4882a593Smuzhiyun }
775*4882a593Smuzhiyun else
776*4882a593Smuzhiyun {
777*4882a593Smuzhiyun if (clwm > 519)
778*4882a593Smuzhiyun {
779*4882a593Smuzhiyun fifo->valid = 0;
780*4882a593Smuzhiyun found = 0;
781*4882a593Smuzhiyun if (mclk_extra ==0) found = 1;
782*4882a593Smuzhiyun mclk_extra--;
783*4882a593Smuzhiyun }
784*4882a593Smuzhiyun }
785*4882a593Smuzhiyun craw = clwm;
786*4882a593Smuzhiyun vraw = vlwm;
787*4882a593Smuzhiyun if (clwm < 384) clwm = 384;
788*4882a593Smuzhiyun if (vlwm < 128) vlwm = 128;
789*4882a593Smuzhiyun data = (int)(clwm);
790*4882a593Smuzhiyun fifo->graphics_lwm = data;
791*4882a593Smuzhiyun fifo->graphics_burst_size = 128;
792*4882a593Smuzhiyun data = (int)((vlwm+15));
793*4882a593Smuzhiyun fifo->video_lwm = data;
794*4882a593Smuzhiyun fifo->video_burst_size = vbs;
795*4882a593Smuzhiyun }
796*4882a593Smuzhiyun }
nv4UpdateArbitrationSettings(unsigned VClk,unsigned pixelDepth,unsigned * burst,unsigned * lwm,RIVA_HW_INST * chip)797*4882a593Smuzhiyun static void nv4UpdateArbitrationSettings
798*4882a593Smuzhiyun (
799*4882a593Smuzhiyun unsigned VClk,
800*4882a593Smuzhiyun unsigned pixelDepth,
801*4882a593Smuzhiyun unsigned *burst,
802*4882a593Smuzhiyun unsigned *lwm,
803*4882a593Smuzhiyun RIVA_HW_INST *chip
804*4882a593Smuzhiyun )
805*4882a593Smuzhiyun {
806*4882a593Smuzhiyun nv4_fifo_info fifo_data;
807*4882a593Smuzhiyun nv4_sim_state sim_data;
808*4882a593Smuzhiyun unsigned int M, N, P, pll, MClk, NVClk, cfg1;
809*4882a593Smuzhiyun
810*4882a593Smuzhiyun pll = NV_RD32(&chip->PRAMDAC0[0x00000504/4], 0);
811*4882a593Smuzhiyun M = (pll >> 0) & 0xFF; N = (pll >> 8) & 0xFF; P = (pll >> 16) & 0x0F;
812*4882a593Smuzhiyun MClk = (N * chip->CrystalFreqKHz / M) >> P;
813*4882a593Smuzhiyun pll = NV_RD32(&chip->PRAMDAC0[0x00000500/4], 0);
814*4882a593Smuzhiyun M = (pll >> 0) & 0xFF; N = (pll >> 8) & 0xFF; P = (pll >> 16) & 0x0F;
815*4882a593Smuzhiyun NVClk = (N * chip->CrystalFreqKHz / M) >> P;
816*4882a593Smuzhiyun cfg1 = NV_RD32(&chip->PFB[0x00000204/4], 0);
817*4882a593Smuzhiyun sim_data.pix_bpp = (char)pixelDepth;
818*4882a593Smuzhiyun sim_data.enable_video = 0;
819*4882a593Smuzhiyun sim_data.enable_mp = 0;
820*4882a593Smuzhiyun sim_data.memory_width = (NV_RD32(&chip->PEXTDEV[0x00000000/4], 0) & 0x10) ?
821*4882a593Smuzhiyun 128 : 64;
822*4882a593Smuzhiyun sim_data.mem_latency = (char)cfg1 & 0x0F;
823*4882a593Smuzhiyun sim_data.mem_aligned = 1;
824*4882a593Smuzhiyun sim_data.mem_page_miss = (char)(((cfg1 >> 4) &0x0F) + ((cfg1 >> 31) & 0x01));
825*4882a593Smuzhiyun sim_data.gr_during_vid = 0;
826*4882a593Smuzhiyun sim_data.pclk_khz = VClk;
827*4882a593Smuzhiyun sim_data.mclk_khz = MClk;
828*4882a593Smuzhiyun sim_data.nvclk_khz = NVClk;
829*4882a593Smuzhiyun nv4CalcArbitration(&fifo_data, &sim_data);
830*4882a593Smuzhiyun if (fifo_data.valid)
831*4882a593Smuzhiyun {
832*4882a593Smuzhiyun int b = fifo_data.graphics_burst_size >> 4;
833*4882a593Smuzhiyun *burst = 0;
834*4882a593Smuzhiyun while (b >>= 1)
835*4882a593Smuzhiyun (*burst)++;
836*4882a593Smuzhiyun *lwm = fifo_data.graphics_lwm >> 3;
837*4882a593Smuzhiyun }
838*4882a593Smuzhiyun }
nv10CalcArbitration(nv10_fifo_info * fifo,nv10_sim_state * arb)839*4882a593Smuzhiyun static void nv10CalcArbitration
840*4882a593Smuzhiyun (
841*4882a593Smuzhiyun nv10_fifo_info *fifo,
842*4882a593Smuzhiyun nv10_sim_state *arb
843*4882a593Smuzhiyun )
844*4882a593Smuzhiyun {
845*4882a593Smuzhiyun int data, pagemiss, cas,width, video_enable, color_key_enable, bpp, align;
846*4882a593Smuzhiyun int nvclks, mclks, pclks, vpagemiss, crtpagemiss, vbs;
847*4882a593Smuzhiyun int nvclk_fill, us_extra;
848*4882a593Smuzhiyun int found, mclk_extra, mclk_loop, cbs, m1;
849*4882a593Smuzhiyun int mclk_freq, pclk_freq, nvclk_freq, mp_enable;
850*4882a593Smuzhiyun int us_m, us_m_min, us_n, us_p, video_drain_rate, crtc_drain_rate;
851*4882a593Smuzhiyun int vus_m, vus_n, vus_p;
852*4882a593Smuzhiyun int vpm_us, us_video, vlwm, cpm_us, us_crt,clwm;
853*4882a593Smuzhiyun int clwm_rnd_down;
854*4882a593Smuzhiyun int craw, m2us, us_pipe, us_pipe_min, vus_pipe, p1clk, p2;
855*4882a593Smuzhiyun int pclks_2_top_fifo, min_mclk_extra;
856*4882a593Smuzhiyun int us_min_mclk_extra;
857*4882a593Smuzhiyun
858*4882a593Smuzhiyun fifo->valid = 1;
859*4882a593Smuzhiyun pclk_freq = arb->pclk_khz; /* freq in KHz */
860*4882a593Smuzhiyun mclk_freq = arb->mclk_khz;
861*4882a593Smuzhiyun nvclk_freq = arb->nvclk_khz;
862*4882a593Smuzhiyun pagemiss = arb->mem_page_miss;
863*4882a593Smuzhiyun cas = arb->mem_latency;
864*4882a593Smuzhiyun width = arb->memory_width/64;
865*4882a593Smuzhiyun video_enable = arb->enable_video;
866*4882a593Smuzhiyun color_key_enable = arb->gr_during_vid;
867*4882a593Smuzhiyun bpp = arb->pix_bpp;
868*4882a593Smuzhiyun align = arb->mem_aligned;
869*4882a593Smuzhiyun mp_enable = arb->enable_mp;
870*4882a593Smuzhiyun clwm = 0;
871*4882a593Smuzhiyun vlwm = 1024;
872*4882a593Smuzhiyun
873*4882a593Smuzhiyun cbs = 512;
874*4882a593Smuzhiyun vbs = 512;
875*4882a593Smuzhiyun
876*4882a593Smuzhiyun pclks = 4; /* lwm detect. */
877*4882a593Smuzhiyun
878*4882a593Smuzhiyun nvclks = 3; /* lwm -> sync. */
879*4882a593Smuzhiyun nvclks += 2; /* fbi bus cycles (1 req + 1 busy) */
880*4882a593Smuzhiyun
881*4882a593Smuzhiyun mclks = 1; /* 2 edge sync. may be very close to edge so just put one. */
882*4882a593Smuzhiyun
883*4882a593Smuzhiyun mclks += 1; /* arb_hp_req */
884*4882a593Smuzhiyun mclks += 5; /* ap_hp_req tiling pipeline */
885*4882a593Smuzhiyun
886*4882a593Smuzhiyun mclks += 2; /* tc_req latency fifo */
887*4882a593Smuzhiyun mclks += 2; /* fb_cas_n_ memory request to fbio block */
888*4882a593Smuzhiyun mclks += 7; /* sm_d_rdv data returned from fbio block */
889*4882a593Smuzhiyun
890*4882a593Smuzhiyun /* fb.rd.d.Put_gc need to accumulate 256 bits for read */
891*4882a593Smuzhiyun if (arb->memory_type == 0)
892*4882a593Smuzhiyun if (arb->memory_width == 64) /* 64 bit bus */
893*4882a593Smuzhiyun mclks += 4;
894*4882a593Smuzhiyun else
895*4882a593Smuzhiyun mclks += 2;
896*4882a593Smuzhiyun else
897*4882a593Smuzhiyun if (arb->memory_width == 64) /* 64 bit bus */
898*4882a593Smuzhiyun mclks += 2;
899*4882a593Smuzhiyun else
900*4882a593Smuzhiyun mclks += 1;
901*4882a593Smuzhiyun
902*4882a593Smuzhiyun if ((!video_enable) && (arb->memory_width == 128))
903*4882a593Smuzhiyun {
904*4882a593Smuzhiyun mclk_extra = (bpp == 32) ? 31 : 42; /* Margin of error */
905*4882a593Smuzhiyun min_mclk_extra = 17;
906*4882a593Smuzhiyun }
907*4882a593Smuzhiyun else
908*4882a593Smuzhiyun {
909*4882a593Smuzhiyun mclk_extra = (bpp == 32) ? 8 : 4; /* Margin of error */
910*4882a593Smuzhiyun /* mclk_extra = 4; */ /* Margin of error */
911*4882a593Smuzhiyun min_mclk_extra = 18;
912*4882a593Smuzhiyun }
913*4882a593Smuzhiyun
914*4882a593Smuzhiyun nvclks += 1; /* 2 edge sync. may be very close to edge so just put one. */
915*4882a593Smuzhiyun nvclks += 1; /* fbi_d_rdv_n */
916*4882a593Smuzhiyun nvclks += 1; /* Fbi_d_rdata */
917*4882a593Smuzhiyun nvclks += 1; /* crtfifo load */
918*4882a593Smuzhiyun
919*4882a593Smuzhiyun if(mp_enable)
920*4882a593Smuzhiyun mclks+=4; /* Mp can get in with a burst of 8. */
921*4882a593Smuzhiyun /* Extra clocks determined by heuristics */
922*4882a593Smuzhiyun
923*4882a593Smuzhiyun nvclks += 0;
924*4882a593Smuzhiyun pclks += 0;
925*4882a593Smuzhiyun found = 0;
926*4882a593Smuzhiyun while(found != 1) {
927*4882a593Smuzhiyun fifo->valid = 1;
928*4882a593Smuzhiyun found = 1;
929*4882a593Smuzhiyun mclk_loop = mclks+mclk_extra;
930*4882a593Smuzhiyun us_m = mclk_loop *1000*1000 / mclk_freq; /* Mclk latency in us */
931*4882a593Smuzhiyun us_m_min = mclks * 1000*1000 / mclk_freq; /* Minimum Mclk latency in us */
932*4882a593Smuzhiyun us_min_mclk_extra = min_mclk_extra *1000*1000 / mclk_freq;
933*4882a593Smuzhiyun us_n = nvclks*1000*1000 / nvclk_freq;/* nvclk latency in us */
934*4882a593Smuzhiyun us_p = pclks*1000*1000 / pclk_freq;/* nvclk latency in us */
935*4882a593Smuzhiyun us_pipe = us_m + us_n + us_p;
936*4882a593Smuzhiyun us_pipe_min = us_m_min + us_n + us_p;
937*4882a593Smuzhiyun us_extra = 0;
938*4882a593Smuzhiyun
939*4882a593Smuzhiyun vus_m = mclk_loop *1000*1000 / mclk_freq; /* Mclk latency in us */
940*4882a593Smuzhiyun vus_n = (4)*1000*1000 / nvclk_freq;/* nvclk latency in us */
941*4882a593Smuzhiyun vus_p = 0*1000*1000 / pclk_freq;/* pclk latency in us */
942*4882a593Smuzhiyun vus_pipe = vus_m + vus_n + vus_p;
943*4882a593Smuzhiyun
944*4882a593Smuzhiyun if(video_enable) {
945*4882a593Smuzhiyun video_drain_rate = pclk_freq * 4; /* MB/s */
946*4882a593Smuzhiyun crtc_drain_rate = pclk_freq * bpp/8; /* MB/s */
947*4882a593Smuzhiyun
948*4882a593Smuzhiyun vpagemiss = 1; /* self generating page miss */
949*4882a593Smuzhiyun vpagemiss += 1; /* One higher priority before */
950*4882a593Smuzhiyun
951*4882a593Smuzhiyun crtpagemiss = 2; /* self generating page miss */
952*4882a593Smuzhiyun if(mp_enable)
953*4882a593Smuzhiyun crtpagemiss += 1; /* if MA0 conflict */
954*4882a593Smuzhiyun
955*4882a593Smuzhiyun vpm_us = (vpagemiss * pagemiss)*1000*1000/mclk_freq;
956*4882a593Smuzhiyun
957*4882a593Smuzhiyun us_video = vpm_us + vus_m; /* Video has separate read return path */
958*4882a593Smuzhiyun
959*4882a593Smuzhiyun cpm_us = crtpagemiss * pagemiss *1000*1000/ mclk_freq;
960*4882a593Smuzhiyun us_crt =
961*4882a593Smuzhiyun us_video /* Wait for video */
962*4882a593Smuzhiyun +cpm_us /* CRT Page miss */
963*4882a593Smuzhiyun +us_m + us_n +us_p /* other latency */
964*4882a593Smuzhiyun ;
965*4882a593Smuzhiyun
966*4882a593Smuzhiyun clwm = us_crt * crtc_drain_rate/(1000*1000);
967*4882a593Smuzhiyun clwm++; /* fixed point <= float_point - 1. Fixes that */
968*4882a593Smuzhiyun } else {
969*4882a593Smuzhiyun crtc_drain_rate = pclk_freq * bpp/8; /* bpp * pclk/8 */
970*4882a593Smuzhiyun
971*4882a593Smuzhiyun crtpagemiss = 1; /* self generating page miss */
972*4882a593Smuzhiyun crtpagemiss += 1; /* MA0 page miss */
973*4882a593Smuzhiyun if(mp_enable)
974*4882a593Smuzhiyun crtpagemiss += 1; /* if MA0 conflict */
975*4882a593Smuzhiyun cpm_us = crtpagemiss * pagemiss *1000*1000/ mclk_freq;
976*4882a593Smuzhiyun us_crt = cpm_us + us_m + us_n + us_p ;
977*4882a593Smuzhiyun clwm = us_crt * crtc_drain_rate/(1000*1000);
978*4882a593Smuzhiyun clwm++; /* fixed point <= float_point - 1. Fixes that */
979*4882a593Smuzhiyun
980*4882a593Smuzhiyun /*
981*4882a593Smuzhiyun //
982*4882a593Smuzhiyun // Another concern, only for high pclks so don't do this
983*4882a593Smuzhiyun // with video:
984*4882a593Smuzhiyun // What happens if the latency to fetch the cbs is so large that
985*4882a593Smuzhiyun // fifo empties. In that case we need to have an alternate clwm value
986*4882a593Smuzhiyun // based off the total burst fetch
987*4882a593Smuzhiyun //
988*4882a593Smuzhiyun us_crt = (cbs * 1000 * 1000)/ (8*width)/mclk_freq ;
989*4882a593Smuzhiyun us_crt = us_crt + us_m + us_n + us_p + (4 * 1000 * 1000)/mclk_freq;
990*4882a593Smuzhiyun clwm_mt = us_crt * crtc_drain_rate/(1000*1000);
991*4882a593Smuzhiyun clwm_mt ++;
992*4882a593Smuzhiyun if(clwm_mt > clwm)
993*4882a593Smuzhiyun clwm = clwm_mt;
994*4882a593Smuzhiyun */
995*4882a593Smuzhiyun /* Finally, a heuristic check when width == 64 bits */
996*4882a593Smuzhiyun if(width == 1){
997*4882a593Smuzhiyun nvclk_fill = nvclk_freq * 8;
998*4882a593Smuzhiyun if(crtc_drain_rate * 100 >= nvclk_fill * 102)
999*4882a593Smuzhiyun clwm = 0xfff; /*Large number to fail */
1000*4882a593Smuzhiyun
1001*4882a593Smuzhiyun else if(crtc_drain_rate * 100 >= nvclk_fill * 98) {
1002*4882a593Smuzhiyun clwm = 1024;
1003*4882a593Smuzhiyun cbs = 512;
1004*4882a593Smuzhiyun us_extra = (cbs * 1000 * 1000)/ (8*width)/mclk_freq ;
1005*4882a593Smuzhiyun }
1006*4882a593Smuzhiyun }
1007*4882a593Smuzhiyun }
1008*4882a593Smuzhiyun
1009*4882a593Smuzhiyun
1010*4882a593Smuzhiyun /*
1011*4882a593Smuzhiyun Overfill check:
1012*4882a593Smuzhiyun
1013*4882a593Smuzhiyun */
1014*4882a593Smuzhiyun
1015*4882a593Smuzhiyun clwm_rnd_down = ((int)clwm/8)*8;
1016*4882a593Smuzhiyun if (clwm_rnd_down < clwm)
1017*4882a593Smuzhiyun clwm += 8;
1018*4882a593Smuzhiyun
1019*4882a593Smuzhiyun m1 = clwm + cbs - 1024; /* Amount of overfill */
1020*4882a593Smuzhiyun m2us = us_pipe_min + us_min_mclk_extra;
1021*4882a593Smuzhiyun pclks_2_top_fifo = (1024-clwm)/(8*width);
1022*4882a593Smuzhiyun
1023*4882a593Smuzhiyun /* pclk cycles to drain */
1024*4882a593Smuzhiyun p1clk = m2us * pclk_freq/(1000*1000);
1025*4882a593Smuzhiyun p2 = p1clk * bpp / 8; /* bytes drained. */
1026*4882a593Smuzhiyun
1027*4882a593Smuzhiyun if((p2 < m1) && (m1 > 0)) {
1028*4882a593Smuzhiyun fifo->valid = 0;
1029*4882a593Smuzhiyun found = 0;
1030*4882a593Smuzhiyun if(min_mclk_extra == 0) {
1031*4882a593Smuzhiyun if(cbs <= 32) {
1032*4882a593Smuzhiyun found = 1; /* Can't adjust anymore! */
1033*4882a593Smuzhiyun } else {
1034*4882a593Smuzhiyun cbs = cbs/2; /* reduce the burst size */
1035*4882a593Smuzhiyun }
1036*4882a593Smuzhiyun } else {
1037*4882a593Smuzhiyun min_mclk_extra--;
1038*4882a593Smuzhiyun }
1039*4882a593Smuzhiyun } else {
1040*4882a593Smuzhiyun if (clwm > 1023){ /* Have some margin */
1041*4882a593Smuzhiyun fifo->valid = 0;
1042*4882a593Smuzhiyun found = 0;
1043*4882a593Smuzhiyun if(min_mclk_extra == 0)
1044*4882a593Smuzhiyun found = 1; /* Can't adjust anymore! */
1045*4882a593Smuzhiyun else
1046*4882a593Smuzhiyun min_mclk_extra--;
1047*4882a593Smuzhiyun }
1048*4882a593Smuzhiyun }
1049*4882a593Smuzhiyun craw = clwm;
1050*4882a593Smuzhiyun
1051*4882a593Smuzhiyun if(clwm < (1024-cbs+8)) clwm = 1024-cbs+8;
1052*4882a593Smuzhiyun data = (int)(clwm);
1053*4882a593Smuzhiyun /* printf("CRT LWM: %f bytes, prog: 0x%x, bs: 256\n", clwm, data ); */
1054*4882a593Smuzhiyun fifo->graphics_lwm = data; fifo->graphics_burst_size = cbs;
1055*4882a593Smuzhiyun
1056*4882a593Smuzhiyun /* printf("VID LWM: %f bytes, prog: 0x%x, bs: %d\n, ", vlwm, data, vbs ); */
1057*4882a593Smuzhiyun fifo->video_lwm = 1024; fifo->video_burst_size = 512;
1058*4882a593Smuzhiyun }
1059*4882a593Smuzhiyun }
nv10UpdateArbitrationSettings(unsigned VClk,unsigned pixelDepth,unsigned * burst,unsigned * lwm,RIVA_HW_INST * chip)1060*4882a593Smuzhiyun static void nv10UpdateArbitrationSettings
1061*4882a593Smuzhiyun (
1062*4882a593Smuzhiyun unsigned VClk,
1063*4882a593Smuzhiyun unsigned pixelDepth,
1064*4882a593Smuzhiyun unsigned *burst,
1065*4882a593Smuzhiyun unsigned *lwm,
1066*4882a593Smuzhiyun RIVA_HW_INST *chip
1067*4882a593Smuzhiyun )
1068*4882a593Smuzhiyun {
1069*4882a593Smuzhiyun nv10_fifo_info fifo_data;
1070*4882a593Smuzhiyun nv10_sim_state sim_data;
1071*4882a593Smuzhiyun unsigned int M, N, P, pll, MClk, NVClk, cfg1;
1072*4882a593Smuzhiyun
1073*4882a593Smuzhiyun pll = NV_RD32(&chip->PRAMDAC0[0x00000504/4], 0);
1074*4882a593Smuzhiyun M = (pll >> 0) & 0xFF; N = (pll >> 8) & 0xFF; P = (pll >> 16) & 0x0F;
1075*4882a593Smuzhiyun MClk = (N * chip->CrystalFreqKHz / M) >> P;
1076*4882a593Smuzhiyun pll = NV_RD32(&chip->PRAMDAC0[0x00000500/4], 0);
1077*4882a593Smuzhiyun M = (pll >> 0) & 0xFF; N = (pll >> 8) & 0xFF; P = (pll >> 16) & 0x0F;
1078*4882a593Smuzhiyun NVClk = (N * chip->CrystalFreqKHz / M) >> P;
1079*4882a593Smuzhiyun cfg1 = NV_RD32(&chip->PFB[0x00000204/4], 0);
1080*4882a593Smuzhiyun sim_data.pix_bpp = (char)pixelDepth;
1081*4882a593Smuzhiyun sim_data.enable_video = 0;
1082*4882a593Smuzhiyun sim_data.enable_mp = 0;
1083*4882a593Smuzhiyun sim_data.memory_type = (NV_RD32(&chip->PFB[0x00000200/4], 0) & 0x01) ?
1084*4882a593Smuzhiyun 1 : 0;
1085*4882a593Smuzhiyun sim_data.memory_width = (NV_RD32(&chip->PEXTDEV[0x00000000/4], 0) & 0x10) ?
1086*4882a593Smuzhiyun 128 : 64;
1087*4882a593Smuzhiyun sim_data.mem_latency = (char)cfg1 & 0x0F;
1088*4882a593Smuzhiyun sim_data.mem_aligned = 1;
1089*4882a593Smuzhiyun sim_data.mem_page_miss = (char)(((cfg1 >> 4) &0x0F) + ((cfg1 >> 31) & 0x01));
1090*4882a593Smuzhiyun sim_data.gr_during_vid = 0;
1091*4882a593Smuzhiyun sim_data.pclk_khz = VClk;
1092*4882a593Smuzhiyun sim_data.mclk_khz = MClk;
1093*4882a593Smuzhiyun sim_data.nvclk_khz = NVClk;
1094*4882a593Smuzhiyun nv10CalcArbitration(&fifo_data, &sim_data);
1095*4882a593Smuzhiyun if (fifo_data.valid)
1096*4882a593Smuzhiyun {
1097*4882a593Smuzhiyun int b = fifo_data.graphics_burst_size >> 4;
1098*4882a593Smuzhiyun *burst = 0;
1099*4882a593Smuzhiyun while (b >>= 1)
1100*4882a593Smuzhiyun (*burst)++;
1101*4882a593Smuzhiyun *lwm = fifo_data.graphics_lwm >> 3;
1102*4882a593Smuzhiyun }
1103*4882a593Smuzhiyun }
1104*4882a593Smuzhiyun
nForceUpdateArbitrationSettings(unsigned VClk,unsigned pixelDepth,unsigned * burst,unsigned * lwm,RIVA_HW_INST * chip,struct pci_dev * pdev)1105*4882a593Smuzhiyun static void nForceUpdateArbitrationSettings
1106*4882a593Smuzhiyun (
1107*4882a593Smuzhiyun unsigned VClk,
1108*4882a593Smuzhiyun unsigned pixelDepth,
1109*4882a593Smuzhiyun unsigned *burst,
1110*4882a593Smuzhiyun unsigned *lwm,
1111*4882a593Smuzhiyun RIVA_HW_INST *chip,
1112*4882a593Smuzhiyun struct pci_dev *pdev
1113*4882a593Smuzhiyun )
1114*4882a593Smuzhiyun {
1115*4882a593Smuzhiyun nv10_fifo_info fifo_data;
1116*4882a593Smuzhiyun nv10_sim_state sim_data;
1117*4882a593Smuzhiyun unsigned int M, N, P, pll, MClk, NVClk;
1118*4882a593Smuzhiyun unsigned int uMClkPostDiv;
1119*4882a593Smuzhiyun struct pci_dev *dev;
1120*4882a593Smuzhiyun int domain = pci_domain_nr(pdev->bus);
1121*4882a593Smuzhiyun
1122*4882a593Smuzhiyun dev = pci_get_domain_bus_and_slot(domain, 0, 3);
1123*4882a593Smuzhiyun pci_read_config_dword(dev, 0x6C, &uMClkPostDiv);
1124*4882a593Smuzhiyun pci_dev_put(dev);
1125*4882a593Smuzhiyun uMClkPostDiv = (uMClkPostDiv >> 8) & 0xf;
1126*4882a593Smuzhiyun
1127*4882a593Smuzhiyun if(!uMClkPostDiv) uMClkPostDiv = 4;
1128*4882a593Smuzhiyun MClk = 400000 / uMClkPostDiv;
1129*4882a593Smuzhiyun
1130*4882a593Smuzhiyun pll = NV_RD32(&chip->PRAMDAC0[0x00000500/4], 0);
1131*4882a593Smuzhiyun M = (pll >> 0) & 0xFF; N = (pll >> 8) & 0xFF; P = (pll >> 16) & 0x0F;
1132*4882a593Smuzhiyun NVClk = (N * chip->CrystalFreqKHz / M) >> P;
1133*4882a593Smuzhiyun sim_data.pix_bpp = (char)pixelDepth;
1134*4882a593Smuzhiyun sim_data.enable_video = 0;
1135*4882a593Smuzhiyun sim_data.enable_mp = 0;
1136*4882a593Smuzhiyun
1137*4882a593Smuzhiyun dev = pci_get_domain_bus_and_slot(domain, 0, 1);
1138*4882a593Smuzhiyun pci_read_config_dword(dev, 0x7C, &sim_data.memory_type);
1139*4882a593Smuzhiyun pci_dev_put(dev);
1140*4882a593Smuzhiyun sim_data.memory_type = (sim_data.memory_type >> 12) & 1;
1141*4882a593Smuzhiyun
1142*4882a593Smuzhiyun sim_data.memory_width = 64;
1143*4882a593Smuzhiyun sim_data.mem_latency = 3;
1144*4882a593Smuzhiyun sim_data.mem_aligned = 1;
1145*4882a593Smuzhiyun sim_data.mem_page_miss = 10;
1146*4882a593Smuzhiyun sim_data.gr_during_vid = 0;
1147*4882a593Smuzhiyun sim_data.pclk_khz = VClk;
1148*4882a593Smuzhiyun sim_data.mclk_khz = MClk;
1149*4882a593Smuzhiyun sim_data.nvclk_khz = NVClk;
1150*4882a593Smuzhiyun nv10CalcArbitration(&fifo_data, &sim_data);
1151*4882a593Smuzhiyun if (fifo_data.valid)
1152*4882a593Smuzhiyun {
1153*4882a593Smuzhiyun int b = fifo_data.graphics_burst_size >> 4;
1154*4882a593Smuzhiyun *burst = 0;
1155*4882a593Smuzhiyun while (b >>= 1)
1156*4882a593Smuzhiyun (*burst)++;
1157*4882a593Smuzhiyun *lwm = fifo_data.graphics_lwm >> 3;
1158*4882a593Smuzhiyun }
1159*4882a593Smuzhiyun }
1160*4882a593Smuzhiyun
1161*4882a593Smuzhiyun /****************************************************************************\
1162*4882a593Smuzhiyun * *
1163*4882a593Smuzhiyun * RIVA Mode State Routines *
1164*4882a593Smuzhiyun * *
1165*4882a593Smuzhiyun \****************************************************************************/
1166*4882a593Smuzhiyun
1167*4882a593Smuzhiyun /*
1168*4882a593Smuzhiyun * Calculate the Video Clock parameters for the PLL.
1169*4882a593Smuzhiyun */
CalcVClock(int clockIn,int * clockOut,int * mOut,int * nOut,int * pOut,RIVA_HW_INST * chip)1170*4882a593Smuzhiyun static int CalcVClock
1171*4882a593Smuzhiyun (
1172*4882a593Smuzhiyun int clockIn,
1173*4882a593Smuzhiyun int *clockOut,
1174*4882a593Smuzhiyun int *mOut,
1175*4882a593Smuzhiyun int *nOut,
1176*4882a593Smuzhiyun int *pOut,
1177*4882a593Smuzhiyun RIVA_HW_INST *chip
1178*4882a593Smuzhiyun )
1179*4882a593Smuzhiyun {
1180*4882a593Smuzhiyun unsigned lowM, highM, highP;
1181*4882a593Smuzhiyun unsigned DeltaNew, DeltaOld;
1182*4882a593Smuzhiyun unsigned VClk, Freq;
1183*4882a593Smuzhiyun unsigned M, N, P;
1184*4882a593Smuzhiyun
1185*4882a593Smuzhiyun DeltaOld = 0xFFFFFFFF;
1186*4882a593Smuzhiyun
1187*4882a593Smuzhiyun VClk = (unsigned)clockIn;
1188*4882a593Smuzhiyun
1189*4882a593Smuzhiyun if (chip->CrystalFreqKHz == 13500)
1190*4882a593Smuzhiyun {
1191*4882a593Smuzhiyun lowM = 7;
1192*4882a593Smuzhiyun highM = 13 - (chip->Architecture == NV_ARCH_03);
1193*4882a593Smuzhiyun }
1194*4882a593Smuzhiyun else
1195*4882a593Smuzhiyun {
1196*4882a593Smuzhiyun lowM = 8;
1197*4882a593Smuzhiyun highM = 14 - (chip->Architecture == NV_ARCH_03);
1198*4882a593Smuzhiyun }
1199*4882a593Smuzhiyun
1200*4882a593Smuzhiyun highP = 4 - (chip->Architecture == NV_ARCH_03);
1201*4882a593Smuzhiyun for (P = 0; P <= highP; P ++)
1202*4882a593Smuzhiyun {
1203*4882a593Smuzhiyun Freq = VClk << P;
1204*4882a593Smuzhiyun if ((Freq >= 128000) && (Freq <= chip->MaxVClockFreqKHz))
1205*4882a593Smuzhiyun {
1206*4882a593Smuzhiyun for (M = lowM; M <= highM; M++)
1207*4882a593Smuzhiyun {
1208*4882a593Smuzhiyun N = (VClk << P) * M / chip->CrystalFreqKHz;
1209*4882a593Smuzhiyun if(N <= 255) {
1210*4882a593Smuzhiyun Freq = (chip->CrystalFreqKHz * N / M) >> P;
1211*4882a593Smuzhiyun if (Freq > VClk)
1212*4882a593Smuzhiyun DeltaNew = Freq - VClk;
1213*4882a593Smuzhiyun else
1214*4882a593Smuzhiyun DeltaNew = VClk - Freq;
1215*4882a593Smuzhiyun if (DeltaNew < DeltaOld)
1216*4882a593Smuzhiyun {
1217*4882a593Smuzhiyun *mOut = M;
1218*4882a593Smuzhiyun *nOut = N;
1219*4882a593Smuzhiyun *pOut = P;
1220*4882a593Smuzhiyun *clockOut = Freq;
1221*4882a593Smuzhiyun DeltaOld = DeltaNew;
1222*4882a593Smuzhiyun }
1223*4882a593Smuzhiyun }
1224*4882a593Smuzhiyun }
1225*4882a593Smuzhiyun }
1226*4882a593Smuzhiyun }
1227*4882a593Smuzhiyun
1228*4882a593Smuzhiyun /* non-zero: M/N/P/clock values assigned. zero: error (not set) */
1229*4882a593Smuzhiyun return (DeltaOld != 0xFFFFFFFF);
1230*4882a593Smuzhiyun }
1231*4882a593Smuzhiyun /*
1232*4882a593Smuzhiyun * Calculate extended mode parameters (SVGA) and save in a
1233*4882a593Smuzhiyun * mode state structure.
1234*4882a593Smuzhiyun */
CalcStateExt(RIVA_HW_INST * chip,RIVA_HW_STATE * state,struct pci_dev * pdev,int bpp,int width,int hDisplaySize,int height,int dotClock)1235*4882a593Smuzhiyun int CalcStateExt
1236*4882a593Smuzhiyun (
1237*4882a593Smuzhiyun RIVA_HW_INST *chip,
1238*4882a593Smuzhiyun RIVA_HW_STATE *state,
1239*4882a593Smuzhiyun struct pci_dev *pdev,
1240*4882a593Smuzhiyun int bpp,
1241*4882a593Smuzhiyun int width,
1242*4882a593Smuzhiyun int hDisplaySize,
1243*4882a593Smuzhiyun int height,
1244*4882a593Smuzhiyun int dotClock
1245*4882a593Smuzhiyun )
1246*4882a593Smuzhiyun {
1247*4882a593Smuzhiyun int pixelDepth;
1248*4882a593Smuzhiyun int VClk, m, n, p;
1249*4882a593Smuzhiyun
1250*4882a593Smuzhiyun /*
1251*4882a593Smuzhiyun * Save mode parameters.
1252*4882a593Smuzhiyun */
1253*4882a593Smuzhiyun state->bpp = bpp; /* this is not bitsPerPixel, it's 8,15,16,32 */
1254*4882a593Smuzhiyun state->width = width;
1255*4882a593Smuzhiyun state->height = height;
1256*4882a593Smuzhiyun /*
1257*4882a593Smuzhiyun * Extended RIVA registers.
1258*4882a593Smuzhiyun */
1259*4882a593Smuzhiyun pixelDepth = (bpp + 1)/8;
1260*4882a593Smuzhiyun if (!CalcVClock(dotClock, &VClk, &m, &n, &p, chip))
1261*4882a593Smuzhiyun return -EINVAL;
1262*4882a593Smuzhiyun
1263*4882a593Smuzhiyun switch (chip->Architecture)
1264*4882a593Smuzhiyun {
1265*4882a593Smuzhiyun case NV_ARCH_03:
1266*4882a593Smuzhiyun nv3UpdateArbitrationSettings(VClk,
1267*4882a593Smuzhiyun pixelDepth * 8,
1268*4882a593Smuzhiyun &(state->arbitration0),
1269*4882a593Smuzhiyun &(state->arbitration1),
1270*4882a593Smuzhiyun chip);
1271*4882a593Smuzhiyun state->cursor0 = 0x00;
1272*4882a593Smuzhiyun state->cursor1 = 0x78;
1273*4882a593Smuzhiyun state->cursor2 = 0x00000000;
1274*4882a593Smuzhiyun state->pllsel = 0x10010100;
1275*4882a593Smuzhiyun state->config = ((width + 31)/32)
1276*4882a593Smuzhiyun | (((pixelDepth > 2) ? 3 : pixelDepth) << 8)
1277*4882a593Smuzhiyun | 0x1000;
1278*4882a593Smuzhiyun state->general = 0x00100100;
1279*4882a593Smuzhiyun state->repaint1 = hDisplaySize < 1280 ? 0x06 : 0x02;
1280*4882a593Smuzhiyun break;
1281*4882a593Smuzhiyun case NV_ARCH_04:
1282*4882a593Smuzhiyun nv4UpdateArbitrationSettings(VClk,
1283*4882a593Smuzhiyun pixelDepth * 8,
1284*4882a593Smuzhiyun &(state->arbitration0),
1285*4882a593Smuzhiyun &(state->arbitration1),
1286*4882a593Smuzhiyun chip);
1287*4882a593Smuzhiyun state->cursor0 = 0x00;
1288*4882a593Smuzhiyun state->cursor1 = 0xFC;
1289*4882a593Smuzhiyun state->cursor2 = 0x00000000;
1290*4882a593Smuzhiyun state->pllsel = 0x10000700;
1291*4882a593Smuzhiyun state->config = 0x00001114;
1292*4882a593Smuzhiyun state->general = bpp == 16 ? 0x00101100 : 0x00100100;
1293*4882a593Smuzhiyun state->repaint1 = hDisplaySize < 1280 ? 0x04 : 0x00;
1294*4882a593Smuzhiyun break;
1295*4882a593Smuzhiyun case NV_ARCH_10:
1296*4882a593Smuzhiyun case NV_ARCH_20:
1297*4882a593Smuzhiyun case NV_ARCH_30:
1298*4882a593Smuzhiyun if((chip->Chipset == NV_CHIP_IGEFORCE2) ||
1299*4882a593Smuzhiyun (chip->Chipset == NV_CHIP_0x01F0))
1300*4882a593Smuzhiyun {
1301*4882a593Smuzhiyun nForceUpdateArbitrationSettings(VClk,
1302*4882a593Smuzhiyun pixelDepth * 8,
1303*4882a593Smuzhiyun &(state->arbitration0),
1304*4882a593Smuzhiyun &(state->arbitration1),
1305*4882a593Smuzhiyun chip, pdev);
1306*4882a593Smuzhiyun } else {
1307*4882a593Smuzhiyun nv10UpdateArbitrationSettings(VClk,
1308*4882a593Smuzhiyun pixelDepth * 8,
1309*4882a593Smuzhiyun &(state->arbitration0),
1310*4882a593Smuzhiyun &(state->arbitration1),
1311*4882a593Smuzhiyun chip);
1312*4882a593Smuzhiyun }
1313*4882a593Smuzhiyun state->cursor0 = 0x80 | (chip->CursorStart >> 17);
1314*4882a593Smuzhiyun state->cursor1 = (chip->CursorStart >> 11) << 2;
1315*4882a593Smuzhiyun state->cursor2 = chip->CursorStart >> 24;
1316*4882a593Smuzhiyun state->pllsel = 0x10000700;
1317*4882a593Smuzhiyun state->config = NV_RD32(&chip->PFB[0x00000200/4], 0);
1318*4882a593Smuzhiyun state->general = bpp == 16 ? 0x00101100 : 0x00100100;
1319*4882a593Smuzhiyun state->repaint1 = hDisplaySize < 1280 ? 0x04 : 0x00;
1320*4882a593Smuzhiyun break;
1321*4882a593Smuzhiyun }
1322*4882a593Smuzhiyun
1323*4882a593Smuzhiyun /* Paul Richards: below if block borks things in kernel for some reason */
1324*4882a593Smuzhiyun /* Tony: Below is needed to set hardware in DirectColor */
1325*4882a593Smuzhiyun if((bpp != 8) && (chip->Architecture != NV_ARCH_03))
1326*4882a593Smuzhiyun state->general |= 0x00000030;
1327*4882a593Smuzhiyun
1328*4882a593Smuzhiyun state->vpll = (p << 16) | (n << 8) | m;
1329*4882a593Smuzhiyun state->repaint0 = (((width/8)*pixelDepth) & 0x700) >> 3;
1330*4882a593Smuzhiyun state->pixel = pixelDepth > 2 ? 3 : pixelDepth;
1331*4882a593Smuzhiyun state->offset0 =
1332*4882a593Smuzhiyun state->offset1 =
1333*4882a593Smuzhiyun state->offset2 =
1334*4882a593Smuzhiyun state->offset3 = 0;
1335*4882a593Smuzhiyun state->pitch0 =
1336*4882a593Smuzhiyun state->pitch1 =
1337*4882a593Smuzhiyun state->pitch2 =
1338*4882a593Smuzhiyun state->pitch3 = pixelDepth * width;
1339*4882a593Smuzhiyun
1340*4882a593Smuzhiyun return 0;
1341*4882a593Smuzhiyun }
1342*4882a593Smuzhiyun /*
1343*4882a593Smuzhiyun * Load fixed function state and pre-calculated/stored state.
1344*4882a593Smuzhiyun */
1345*4882a593Smuzhiyun #define LOAD_FIXED_STATE(tbl,dev) \
1346*4882a593Smuzhiyun for (i = 0; i < sizeof(tbl##Table##dev)/8; i++) \
1347*4882a593Smuzhiyun NV_WR32(&chip->dev[tbl##Table##dev[i][0]], 0, tbl##Table##dev[i][1])
1348*4882a593Smuzhiyun #define LOAD_FIXED_STATE_8BPP(tbl,dev) \
1349*4882a593Smuzhiyun for (i = 0; i < sizeof(tbl##Table##dev##_8BPP)/8; i++) \
1350*4882a593Smuzhiyun NV_WR32(&chip->dev[tbl##Table##dev##_8BPP[i][0]], 0, tbl##Table##dev##_8BPP[i][1])
1351*4882a593Smuzhiyun #define LOAD_FIXED_STATE_15BPP(tbl,dev) \
1352*4882a593Smuzhiyun for (i = 0; i < sizeof(tbl##Table##dev##_15BPP)/8; i++) \
1353*4882a593Smuzhiyun NV_WR32(&chip->dev[tbl##Table##dev##_15BPP[i][0]], 0, tbl##Table##dev##_15BPP[i][1])
1354*4882a593Smuzhiyun #define LOAD_FIXED_STATE_16BPP(tbl,dev) \
1355*4882a593Smuzhiyun for (i = 0; i < sizeof(tbl##Table##dev##_16BPP)/8; i++) \
1356*4882a593Smuzhiyun NV_WR32(&chip->dev[tbl##Table##dev##_16BPP[i][0]], 0, tbl##Table##dev##_16BPP[i][1])
1357*4882a593Smuzhiyun #define LOAD_FIXED_STATE_32BPP(tbl,dev) \
1358*4882a593Smuzhiyun for (i = 0; i < sizeof(tbl##Table##dev##_32BPP)/8; i++) \
1359*4882a593Smuzhiyun NV_WR32(&chip->dev[tbl##Table##dev##_32BPP[i][0]], 0, tbl##Table##dev##_32BPP[i][1])
1360*4882a593Smuzhiyun
UpdateFifoState(RIVA_HW_INST * chip)1361*4882a593Smuzhiyun static void UpdateFifoState
1362*4882a593Smuzhiyun (
1363*4882a593Smuzhiyun RIVA_HW_INST *chip
1364*4882a593Smuzhiyun )
1365*4882a593Smuzhiyun {
1366*4882a593Smuzhiyun int i;
1367*4882a593Smuzhiyun
1368*4882a593Smuzhiyun switch (chip->Architecture)
1369*4882a593Smuzhiyun {
1370*4882a593Smuzhiyun case NV_ARCH_04:
1371*4882a593Smuzhiyun LOAD_FIXED_STATE(nv4,FIFO);
1372*4882a593Smuzhiyun chip->Tri03 = NULL;
1373*4882a593Smuzhiyun chip->Tri05 = (RivaTexturedTriangle05 __iomem *)&(chip->FIFO[0x0000E000/4]);
1374*4882a593Smuzhiyun break;
1375*4882a593Smuzhiyun case NV_ARCH_10:
1376*4882a593Smuzhiyun case NV_ARCH_20:
1377*4882a593Smuzhiyun case NV_ARCH_30:
1378*4882a593Smuzhiyun /*
1379*4882a593Smuzhiyun * Initialize state for the RivaTriangle3D05 routines.
1380*4882a593Smuzhiyun */
1381*4882a593Smuzhiyun LOAD_FIXED_STATE(nv10tri05,PGRAPH);
1382*4882a593Smuzhiyun LOAD_FIXED_STATE(nv10,FIFO);
1383*4882a593Smuzhiyun chip->Tri03 = NULL;
1384*4882a593Smuzhiyun chip->Tri05 = (RivaTexturedTriangle05 __iomem *)&(chip->FIFO[0x0000E000/4]);
1385*4882a593Smuzhiyun break;
1386*4882a593Smuzhiyun }
1387*4882a593Smuzhiyun }
LoadStateExt(RIVA_HW_INST * chip,RIVA_HW_STATE * state)1388*4882a593Smuzhiyun static void LoadStateExt
1389*4882a593Smuzhiyun (
1390*4882a593Smuzhiyun RIVA_HW_INST *chip,
1391*4882a593Smuzhiyun RIVA_HW_STATE *state
1392*4882a593Smuzhiyun )
1393*4882a593Smuzhiyun {
1394*4882a593Smuzhiyun int i;
1395*4882a593Smuzhiyun
1396*4882a593Smuzhiyun /*
1397*4882a593Smuzhiyun * Load HW fixed function state.
1398*4882a593Smuzhiyun */
1399*4882a593Smuzhiyun LOAD_FIXED_STATE(Riva,PMC);
1400*4882a593Smuzhiyun LOAD_FIXED_STATE(Riva,PTIMER);
1401*4882a593Smuzhiyun switch (chip->Architecture)
1402*4882a593Smuzhiyun {
1403*4882a593Smuzhiyun case NV_ARCH_03:
1404*4882a593Smuzhiyun /*
1405*4882a593Smuzhiyun * Make sure frame buffer config gets set before loading PRAMIN.
1406*4882a593Smuzhiyun */
1407*4882a593Smuzhiyun NV_WR32(chip->PFB, 0x00000200, state->config);
1408*4882a593Smuzhiyun LOAD_FIXED_STATE(nv3,PFIFO);
1409*4882a593Smuzhiyun LOAD_FIXED_STATE(nv3,PRAMIN);
1410*4882a593Smuzhiyun LOAD_FIXED_STATE(nv3,PGRAPH);
1411*4882a593Smuzhiyun switch (state->bpp)
1412*4882a593Smuzhiyun {
1413*4882a593Smuzhiyun case 15:
1414*4882a593Smuzhiyun case 16:
1415*4882a593Smuzhiyun LOAD_FIXED_STATE_15BPP(nv3,PRAMIN);
1416*4882a593Smuzhiyun LOAD_FIXED_STATE_15BPP(nv3,PGRAPH);
1417*4882a593Smuzhiyun chip->Tri03 = (RivaTexturedTriangle03 __iomem *)&(chip->FIFO[0x0000E000/4]);
1418*4882a593Smuzhiyun break;
1419*4882a593Smuzhiyun case 24:
1420*4882a593Smuzhiyun case 32:
1421*4882a593Smuzhiyun LOAD_FIXED_STATE_32BPP(nv3,PRAMIN);
1422*4882a593Smuzhiyun LOAD_FIXED_STATE_32BPP(nv3,PGRAPH);
1423*4882a593Smuzhiyun chip->Tri03 = NULL;
1424*4882a593Smuzhiyun break;
1425*4882a593Smuzhiyun case 8:
1426*4882a593Smuzhiyun default:
1427*4882a593Smuzhiyun LOAD_FIXED_STATE_8BPP(nv3,PRAMIN);
1428*4882a593Smuzhiyun LOAD_FIXED_STATE_8BPP(nv3,PGRAPH);
1429*4882a593Smuzhiyun chip->Tri03 = NULL;
1430*4882a593Smuzhiyun break;
1431*4882a593Smuzhiyun }
1432*4882a593Smuzhiyun for (i = 0x00000; i < 0x00800; i++)
1433*4882a593Smuzhiyun NV_WR32(&chip->PRAMIN[0x00000502 + i], 0, (i << 12) | 0x03);
1434*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000630, state->offset0);
1435*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000634, state->offset1);
1436*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000638, state->offset2);
1437*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x0000063C, state->offset3);
1438*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000650, state->pitch0);
1439*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000654, state->pitch1);
1440*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000658, state->pitch2);
1441*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x0000065C, state->pitch3);
1442*4882a593Smuzhiyun break;
1443*4882a593Smuzhiyun case NV_ARCH_04:
1444*4882a593Smuzhiyun /*
1445*4882a593Smuzhiyun * Make sure frame buffer config gets set before loading PRAMIN.
1446*4882a593Smuzhiyun */
1447*4882a593Smuzhiyun NV_WR32(chip->PFB, 0x00000200, state->config);
1448*4882a593Smuzhiyun LOAD_FIXED_STATE(nv4,PFIFO);
1449*4882a593Smuzhiyun LOAD_FIXED_STATE(nv4,PRAMIN);
1450*4882a593Smuzhiyun LOAD_FIXED_STATE(nv4,PGRAPH);
1451*4882a593Smuzhiyun switch (state->bpp)
1452*4882a593Smuzhiyun {
1453*4882a593Smuzhiyun case 15:
1454*4882a593Smuzhiyun LOAD_FIXED_STATE_15BPP(nv4,PRAMIN);
1455*4882a593Smuzhiyun LOAD_FIXED_STATE_15BPP(nv4,PGRAPH);
1456*4882a593Smuzhiyun chip->Tri03 = (RivaTexturedTriangle03 __iomem *)&(chip->FIFO[0x0000E000/4]);
1457*4882a593Smuzhiyun break;
1458*4882a593Smuzhiyun case 16:
1459*4882a593Smuzhiyun LOAD_FIXED_STATE_16BPP(nv4,PRAMIN);
1460*4882a593Smuzhiyun LOAD_FIXED_STATE_16BPP(nv4,PGRAPH);
1461*4882a593Smuzhiyun chip->Tri03 = (RivaTexturedTriangle03 __iomem *)&(chip->FIFO[0x0000E000/4]);
1462*4882a593Smuzhiyun break;
1463*4882a593Smuzhiyun case 24:
1464*4882a593Smuzhiyun case 32:
1465*4882a593Smuzhiyun LOAD_FIXED_STATE_32BPP(nv4,PRAMIN);
1466*4882a593Smuzhiyun LOAD_FIXED_STATE_32BPP(nv4,PGRAPH);
1467*4882a593Smuzhiyun chip->Tri03 = NULL;
1468*4882a593Smuzhiyun break;
1469*4882a593Smuzhiyun case 8:
1470*4882a593Smuzhiyun default:
1471*4882a593Smuzhiyun LOAD_FIXED_STATE_8BPP(nv4,PRAMIN);
1472*4882a593Smuzhiyun LOAD_FIXED_STATE_8BPP(nv4,PGRAPH);
1473*4882a593Smuzhiyun chip->Tri03 = NULL;
1474*4882a593Smuzhiyun break;
1475*4882a593Smuzhiyun }
1476*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000640, state->offset0);
1477*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000644, state->offset1);
1478*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000648, state->offset2);
1479*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x0000064C, state->offset3);
1480*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000670, state->pitch0);
1481*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000674, state->pitch1);
1482*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000678, state->pitch2);
1483*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x0000067C, state->pitch3);
1484*4882a593Smuzhiyun break;
1485*4882a593Smuzhiyun case NV_ARCH_10:
1486*4882a593Smuzhiyun case NV_ARCH_20:
1487*4882a593Smuzhiyun case NV_ARCH_30:
1488*4882a593Smuzhiyun if(chip->twoHeads) {
1489*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D4, 0x44);
1490*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D5, state->crtcOwner);
1491*4882a593Smuzhiyun chip->LockUnlock(chip, 0);
1492*4882a593Smuzhiyun }
1493*4882a593Smuzhiyun
1494*4882a593Smuzhiyun LOAD_FIXED_STATE(nv10,PFIFO);
1495*4882a593Smuzhiyun LOAD_FIXED_STATE(nv10,PRAMIN);
1496*4882a593Smuzhiyun LOAD_FIXED_STATE(nv10,PGRAPH);
1497*4882a593Smuzhiyun switch (state->bpp)
1498*4882a593Smuzhiyun {
1499*4882a593Smuzhiyun case 15:
1500*4882a593Smuzhiyun LOAD_FIXED_STATE_15BPP(nv10,PRAMIN);
1501*4882a593Smuzhiyun LOAD_FIXED_STATE_15BPP(nv10,PGRAPH);
1502*4882a593Smuzhiyun chip->Tri03 = (RivaTexturedTriangle03 __iomem *)&(chip->FIFO[0x0000E000/4]);
1503*4882a593Smuzhiyun break;
1504*4882a593Smuzhiyun case 16:
1505*4882a593Smuzhiyun LOAD_FIXED_STATE_16BPP(nv10,PRAMIN);
1506*4882a593Smuzhiyun LOAD_FIXED_STATE_16BPP(nv10,PGRAPH);
1507*4882a593Smuzhiyun chip->Tri03 = (RivaTexturedTriangle03 __iomem *)&(chip->FIFO[0x0000E000/4]);
1508*4882a593Smuzhiyun break;
1509*4882a593Smuzhiyun case 24:
1510*4882a593Smuzhiyun case 32:
1511*4882a593Smuzhiyun LOAD_FIXED_STATE_32BPP(nv10,PRAMIN);
1512*4882a593Smuzhiyun LOAD_FIXED_STATE_32BPP(nv10,PGRAPH);
1513*4882a593Smuzhiyun chip->Tri03 = NULL;
1514*4882a593Smuzhiyun break;
1515*4882a593Smuzhiyun case 8:
1516*4882a593Smuzhiyun default:
1517*4882a593Smuzhiyun LOAD_FIXED_STATE_8BPP(nv10,PRAMIN);
1518*4882a593Smuzhiyun LOAD_FIXED_STATE_8BPP(nv10,PGRAPH);
1519*4882a593Smuzhiyun chip->Tri03 = NULL;
1520*4882a593Smuzhiyun break;
1521*4882a593Smuzhiyun }
1522*4882a593Smuzhiyun
1523*4882a593Smuzhiyun if(chip->Architecture == NV_ARCH_10) {
1524*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000640, state->offset0);
1525*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000644, state->offset1);
1526*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000648, state->offset2);
1527*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x0000064C, state->offset3);
1528*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000670, state->pitch0);
1529*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000674, state->pitch1);
1530*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000678, state->pitch2);
1531*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x0000067C, state->pitch3);
1532*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000680, state->pitch3);
1533*4882a593Smuzhiyun } else {
1534*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000820, state->offset0);
1535*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000824, state->offset1);
1536*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000828, state->offset2);
1537*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x0000082C, state->offset3);
1538*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000850, state->pitch0);
1539*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000854, state->pitch1);
1540*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000858, state->pitch2);
1541*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x0000085C, state->pitch3);
1542*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000860, state->pitch3);
1543*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000864, state->pitch3);
1544*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x000009A4, NV_RD32(chip->PFB, 0x00000200));
1545*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x000009A8, NV_RD32(chip->PFB, 0x00000204));
1546*4882a593Smuzhiyun }
1547*4882a593Smuzhiyun if(chip->twoHeads) {
1548*4882a593Smuzhiyun NV_WR32(chip->PCRTC0, 0x00000860, state->head);
1549*4882a593Smuzhiyun NV_WR32(chip->PCRTC0, 0x00002860, state->head2);
1550*4882a593Smuzhiyun }
1551*4882a593Smuzhiyun NV_WR32(chip->PRAMDAC, 0x00000404, NV_RD32(chip->PRAMDAC, 0x00000404) | (1 << 25));
1552*4882a593Smuzhiyun
1553*4882a593Smuzhiyun NV_WR32(chip->PMC, 0x00008704, 1);
1554*4882a593Smuzhiyun NV_WR32(chip->PMC, 0x00008140, 0);
1555*4882a593Smuzhiyun NV_WR32(chip->PMC, 0x00008920, 0);
1556*4882a593Smuzhiyun NV_WR32(chip->PMC, 0x00008924, 0);
1557*4882a593Smuzhiyun NV_WR32(chip->PMC, 0x00008908, 0x01ffffff);
1558*4882a593Smuzhiyun NV_WR32(chip->PMC, 0x0000890C, 0x01ffffff);
1559*4882a593Smuzhiyun NV_WR32(chip->PMC, 0x00001588, 0);
1560*4882a593Smuzhiyun
1561*4882a593Smuzhiyun NV_WR32(chip->PFB, 0x00000240, 0);
1562*4882a593Smuzhiyun NV_WR32(chip->PFB, 0x00000250, 0);
1563*4882a593Smuzhiyun NV_WR32(chip->PFB, 0x00000260, 0);
1564*4882a593Smuzhiyun NV_WR32(chip->PFB, 0x00000270, 0);
1565*4882a593Smuzhiyun NV_WR32(chip->PFB, 0x00000280, 0);
1566*4882a593Smuzhiyun NV_WR32(chip->PFB, 0x00000290, 0);
1567*4882a593Smuzhiyun NV_WR32(chip->PFB, 0x000002A0, 0);
1568*4882a593Smuzhiyun NV_WR32(chip->PFB, 0x000002B0, 0);
1569*4882a593Smuzhiyun
1570*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B00, NV_RD32(chip->PFB, 0x00000240));
1571*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B04, NV_RD32(chip->PFB, 0x00000244));
1572*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B08, NV_RD32(chip->PFB, 0x00000248));
1573*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B0C, NV_RD32(chip->PFB, 0x0000024C));
1574*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B10, NV_RD32(chip->PFB, 0x00000250));
1575*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B14, NV_RD32(chip->PFB, 0x00000254));
1576*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B18, NV_RD32(chip->PFB, 0x00000258));
1577*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B1C, NV_RD32(chip->PFB, 0x0000025C));
1578*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B20, NV_RD32(chip->PFB, 0x00000260));
1579*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B24, NV_RD32(chip->PFB, 0x00000264));
1580*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B28, NV_RD32(chip->PFB, 0x00000268));
1581*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B2C, NV_RD32(chip->PFB, 0x0000026C));
1582*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B30, NV_RD32(chip->PFB, 0x00000270));
1583*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B34, NV_RD32(chip->PFB, 0x00000274));
1584*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B38, NV_RD32(chip->PFB, 0x00000278));
1585*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B3C, NV_RD32(chip->PFB, 0x0000027C));
1586*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B40, NV_RD32(chip->PFB, 0x00000280));
1587*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B44, NV_RD32(chip->PFB, 0x00000284));
1588*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B48, NV_RD32(chip->PFB, 0x00000288));
1589*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B4C, NV_RD32(chip->PFB, 0x0000028C));
1590*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B50, NV_RD32(chip->PFB, 0x00000290));
1591*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B54, NV_RD32(chip->PFB, 0x00000294));
1592*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B58, NV_RD32(chip->PFB, 0x00000298));
1593*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B5C, NV_RD32(chip->PFB, 0x0000029C));
1594*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B60, NV_RD32(chip->PFB, 0x000002A0));
1595*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B64, NV_RD32(chip->PFB, 0x000002A4));
1596*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B68, NV_RD32(chip->PFB, 0x000002A8));
1597*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B6C, NV_RD32(chip->PFB, 0x000002AC));
1598*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B70, NV_RD32(chip->PFB, 0x000002B0));
1599*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B74, NV_RD32(chip->PFB, 0x000002B4));
1600*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B78, NV_RD32(chip->PFB, 0x000002B8));
1601*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000B7C, NV_RD32(chip->PFB, 0x000002BC));
1602*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F40, 0x10000000);
1603*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F44, 0x00000000);
1604*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F50, 0x00000040);
1605*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000008);
1606*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F50, 0x00000200);
1607*4882a593Smuzhiyun for (i = 0; i < (3*16); i++)
1608*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
1609*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F50, 0x00000040);
1610*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
1611*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F50, 0x00000800);
1612*4882a593Smuzhiyun for (i = 0; i < (16*16); i++)
1613*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
1614*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F40, 0x30000000);
1615*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F44, 0x00000004);
1616*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F50, 0x00006400);
1617*4882a593Smuzhiyun for (i = 0; i < (59*4); i++)
1618*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
1619*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F50, 0x00006800);
1620*4882a593Smuzhiyun for (i = 0; i < (47*4); i++)
1621*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
1622*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F50, 0x00006C00);
1623*4882a593Smuzhiyun for (i = 0; i < (3*4); i++)
1624*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
1625*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F50, 0x00007000);
1626*4882a593Smuzhiyun for (i = 0; i < (19*4); i++)
1627*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
1628*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F50, 0x00007400);
1629*4882a593Smuzhiyun for (i = 0; i < (12*4); i++)
1630*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
1631*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F50, 0x00007800);
1632*4882a593Smuzhiyun for (i = 0; i < (12*4); i++)
1633*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
1634*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F50, 0x00004400);
1635*4882a593Smuzhiyun for (i = 0; i < (8*4); i++)
1636*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
1637*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F50, 0x00000000);
1638*4882a593Smuzhiyun for (i = 0; i < 16; i++)
1639*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
1640*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F50, 0x00000040);
1641*4882a593Smuzhiyun for (i = 0; i < 4; i++)
1642*4882a593Smuzhiyun NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
1643*4882a593Smuzhiyun
1644*4882a593Smuzhiyun NV_WR32(chip->PCRTC, 0x00000810, state->cursorConfig);
1645*4882a593Smuzhiyun
1646*4882a593Smuzhiyun if(chip->flatPanel) {
1647*4882a593Smuzhiyun if((chip->Chipset & 0x0ff0) == 0x0110) {
1648*4882a593Smuzhiyun NV_WR32(chip->PRAMDAC, 0x0528, state->dither);
1649*4882a593Smuzhiyun } else
1650*4882a593Smuzhiyun if((chip->Chipset & 0x0ff0) >= 0x0170) {
1651*4882a593Smuzhiyun NV_WR32(chip->PRAMDAC, 0x083C, state->dither);
1652*4882a593Smuzhiyun }
1653*4882a593Smuzhiyun
1654*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D4, 0x53);
1655*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D5, 0);
1656*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D4, 0x54);
1657*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D5, 0);
1658*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D4, 0x21);
1659*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D5, 0xfa);
1660*4882a593Smuzhiyun }
1661*4882a593Smuzhiyun
1662*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D4, 0x41);
1663*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D5, state->extra);
1664*4882a593Smuzhiyun }
1665*4882a593Smuzhiyun LOAD_FIXED_STATE(Riva,FIFO);
1666*4882a593Smuzhiyun UpdateFifoState(chip);
1667*4882a593Smuzhiyun /*
1668*4882a593Smuzhiyun * Load HW mode state.
1669*4882a593Smuzhiyun */
1670*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D4, 0x19);
1671*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D5, state->repaint0);
1672*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D4, 0x1A);
1673*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D5, state->repaint1);
1674*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D4, 0x25);
1675*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D5, state->screen);
1676*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D4, 0x28);
1677*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D5, state->pixel);
1678*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D4, 0x2D);
1679*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D5, state->horiz);
1680*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D4, 0x1B);
1681*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D5, state->arbitration0);
1682*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D4, 0x20);
1683*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D5, state->arbitration1);
1684*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D4, 0x30);
1685*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D5, state->cursor0);
1686*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D4, 0x31);
1687*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D5, state->cursor1);
1688*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D4, 0x2F);
1689*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D5, state->cursor2);
1690*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D4, 0x39);
1691*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D5, state->interlace);
1692*4882a593Smuzhiyun
1693*4882a593Smuzhiyun if(!chip->flatPanel) {
1694*4882a593Smuzhiyun NV_WR32(chip->PRAMDAC0, 0x00000508, state->vpll);
1695*4882a593Smuzhiyun NV_WR32(chip->PRAMDAC0, 0x0000050C, state->pllsel);
1696*4882a593Smuzhiyun if(chip->twoHeads)
1697*4882a593Smuzhiyun NV_WR32(chip->PRAMDAC0, 0x00000520, state->vpll2);
1698*4882a593Smuzhiyun } else {
1699*4882a593Smuzhiyun NV_WR32(chip->PRAMDAC, 0x00000848 , state->scale);
1700*4882a593Smuzhiyun }
1701*4882a593Smuzhiyun NV_WR32(chip->PRAMDAC, 0x00000600 , state->general);
1702*4882a593Smuzhiyun
1703*4882a593Smuzhiyun /*
1704*4882a593Smuzhiyun * Turn off VBlank enable and reset.
1705*4882a593Smuzhiyun */
1706*4882a593Smuzhiyun NV_WR32(chip->PCRTC, 0x00000140, 0);
1707*4882a593Smuzhiyun NV_WR32(chip->PCRTC, 0x00000100, chip->VBlankBit);
1708*4882a593Smuzhiyun /*
1709*4882a593Smuzhiyun * Set interrupt enable.
1710*4882a593Smuzhiyun */
1711*4882a593Smuzhiyun NV_WR32(chip->PMC, 0x00000140, chip->EnableIRQ & 0x01);
1712*4882a593Smuzhiyun /*
1713*4882a593Smuzhiyun * Set current state pointer.
1714*4882a593Smuzhiyun */
1715*4882a593Smuzhiyun chip->CurrentState = state;
1716*4882a593Smuzhiyun /*
1717*4882a593Smuzhiyun * Reset FIFO free and empty counts.
1718*4882a593Smuzhiyun */
1719*4882a593Smuzhiyun chip->FifoFreeCount = 0;
1720*4882a593Smuzhiyun /* Free count from first subchannel */
1721*4882a593Smuzhiyun chip->FifoEmptyCount = NV_RD32(&chip->Rop->FifoFree, 0);
1722*4882a593Smuzhiyun }
UnloadStateExt(RIVA_HW_INST * chip,RIVA_HW_STATE * state)1723*4882a593Smuzhiyun static void UnloadStateExt
1724*4882a593Smuzhiyun (
1725*4882a593Smuzhiyun RIVA_HW_INST *chip,
1726*4882a593Smuzhiyun RIVA_HW_STATE *state
1727*4882a593Smuzhiyun )
1728*4882a593Smuzhiyun {
1729*4882a593Smuzhiyun /*
1730*4882a593Smuzhiyun * Save current HW state.
1731*4882a593Smuzhiyun */
1732*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D4, 0x19);
1733*4882a593Smuzhiyun state->repaint0 = VGA_RD08(chip->PCIO, 0x03D5);
1734*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D4, 0x1A);
1735*4882a593Smuzhiyun state->repaint1 = VGA_RD08(chip->PCIO, 0x03D5);
1736*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D4, 0x25);
1737*4882a593Smuzhiyun state->screen = VGA_RD08(chip->PCIO, 0x03D5);
1738*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D4, 0x28);
1739*4882a593Smuzhiyun state->pixel = VGA_RD08(chip->PCIO, 0x03D5);
1740*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D4, 0x2D);
1741*4882a593Smuzhiyun state->horiz = VGA_RD08(chip->PCIO, 0x03D5);
1742*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D4, 0x1B);
1743*4882a593Smuzhiyun state->arbitration0 = VGA_RD08(chip->PCIO, 0x03D5);
1744*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D4, 0x20);
1745*4882a593Smuzhiyun state->arbitration1 = VGA_RD08(chip->PCIO, 0x03D5);
1746*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D4, 0x30);
1747*4882a593Smuzhiyun state->cursor0 = VGA_RD08(chip->PCIO, 0x03D5);
1748*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D4, 0x31);
1749*4882a593Smuzhiyun state->cursor1 = VGA_RD08(chip->PCIO, 0x03D5);
1750*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D4, 0x2F);
1751*4882a593Smuzhiyun state->cursor2 = VGA_RD08(chip->PCIO, 0x03D5);
1752*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D4, 0x39);
1753*4882a593Smuzhiyun state->interlace = VGA_RD08(chip->PCIO, 0x03D5);
1754*4882a593Smuzhiyun state->vpll = NV_RD32(chip->PRAMDAC0, 0x00000508);
1755*4882a593Smuzhiyun state->vpll2 = NV_RD32(chip->PRAMDAC0, 0x00000520);
1756*4882a593Smuzhiyun state->pllsel = NV_RD32(chip->PRAMDAC0, 0x0000050C);
1757*4882a593Smuzhiyun state->general = NV_RD32(chip->PRAMDAC, 0x00000600);
1758*4882a593Smuzhiyun state->scale = NV_RD32(chip->PRAMDAC, 0x00000848);
1759*4882a593Smuzhiyun state->config = NV_RD32(chip->PFB, 0x00000200);
1760*4882a593Smuzhiyun switch (chip->Architecture)
1761*4882a593Smuzhiyun {
1762*4882a593Smuzhiyun case NV_ARCH_03:
1763*4882a593Smuzhiyun state->offset0 = NV_RD32(chip->PGRAPH, 0x00000630);
1764*4882a593Smuzhiyun state->offset1 = NV_RD32(chip->PGRAPH, 0x00000634);
1765*4882a593Smuzhiyun state->offset2 = NV_RD32(chip->PGRAPH, 0x00000638);
1766*4882a593Smuzhiyun state->offset3 = NV_RD32(chip->PGRAPH, 0x0000063C);
1767*4882a593Smuzhiyun state->pitch0 = NV_RD32(chip->PGRAPH, 0x00000650);
1768*4882a593Smuzhiyun state->pitch1 = NV_RD32(chip->PGRAPH, 0x00000654);
1769*4882a593Smuzhiyun state->pitch2 = NV_RD32(chip->PGRAPH, 0x00000658);
1770*4882a593Smuzhiyun state->pitch3 = NV_RD32(chip->PGRAPH, 0x0000065C);
1771*4882a593Smuzhiyun break;
1772*4882a593Smuzhiyun case NV_ARCH_04:
1773*4882a593Smuzhiyun state->offset0 = NV_RD32(chip->PGRAPH, 0x00000640);
1774*4882a593Smuzhiyun state->offset1 = NV_RD32(chip->PGRAPH, 0x00000644);
1775*4882a593Smuzhiyun state->offset2 = NV_RD32(chip->PGRAPH, 0x00000648);
1776*4882a593Smuzhiyun state->offset3 = NV_RD32(chip->PGRAPH, 0x0000064C);
1777*4882a593Smuzhiyun state->pitch0 = NV_RD32(chip->PGRAPH, 0x00000670);
1778*4882a593Smuzhiyun state->pitch1 = NV_RD32(chip->PGRAPH, 0x00000674);
1779*4882a593Smuzhiyun state->pitch2 = NV_RD32(chip->PGRAPH, 0x00000678);
1780*4882a593Smuzhiyun state->pitch3 = NV_RD32(chip->PGRAPH, 0x0000067C);
1781*4882a593Smuzhiyun break;
1782*4882a593Smuzhiyun case NV_ARCH_10:
1783*4882a593Smuzhiyun case NV_ARCH_20:
1784*4882a593Smuzhiyun case NV_ARCH_30:
1785*4882a593Smuzhiyun state->offset0 = NV_RD32(chip->PGRAPH, 0x00000640);
1786*4882a593Smuzhiyun state->offset1 = NV_RD32(chip->PGRAPH, 0x00000644);
1787*4882a593Smuzhiyun state->offset2 = NV_RD32(chip->PGRAPH, 0x00000648);
1788*4882a593Smuzhiyun state->offset3 = NV_RD32(chip->PGRAPH, 0x0000064C);
1789*4882a593Smuzhiyun state->pitch0 = NV_RD32(chip->PGRAPH, 0x00000670);
1790*4882a593Smuzhiyun state->pitch1 = NV_RD32(chip->PGRAPH, 0x00000674);
1791*4882a593Smuzhiyun state->pitch2 = NV_RD32(chip->PGRAPH, 0x00000678);
1792*4882a593Smuzhiyun state->pitch3 = NV_RD32(chip->PGRAPH, 0x0000067C);
1793*4882a593Smuzhiyun if(chip->twoHeads) {
1794*4882a593Smuzhiyun state->head = NV_RD32(chip->PCRTC0, 0x00000860);
1795*4882a593Smuzhiyun state->head2 = NV_RD32(chip->PCRTC0, 0x00002860);
1796*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D4, 0x44);
1797*4882a593Smuzhiyun state->crtcOwner = VGA_RD08(chip->PCIO, 0x03D5);
1798*4882a593Smuzhiyun }
1799*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x03D4, 0x41);
1800*4882a593Smuzhiyun state->extra = VGA_RD08(chip->PCIO, 0x03D5);
1801*4882a593Smuzhiyun state->cursorConfig = NV_RD32(chip->PCRTC, 0x00000810);
1802*4882a593Smuzhiyun
1803*4882a593Smuzhiyun if((chip->Chipset & 0x0ff0) == 0x0110) {
1804*4882a593Smuzhiyun state->dither = NV_RD32(chip->PRAMDAC, 0x0528);
1805*4882a593Smuzhiyun } else
1806*4882a593Smuzhiyun if((chip->Chipset & 0x0ff0) >= 0x0170) {
1807*4882a593Smuzhiyun state->dither = NV_RD32(chip->PRAMDAC, 0x083C);
1808*4882a593Smuzhiyun }
1809*4882a593Smuzhiyun break;
1810*4882a593Smuzhiyun }
1811*4882a593Smuzhiyun }
SetStartAddress(RIVA_HW_INST * chip,unsigned start)1812*4882a593Smuzhiyun static void SetStartAddress
1813*4882a593Smuzhiyun (
1814*4882a593Smuzhiyun RIVA_HW_INST *chip,
1815*4882a593Smuzhiyun unsigned start
1816*4882a593Smuzhiyun )
1817*4882a593Smuzhiyun {
1818*4882a593Smuzhiyun NV_WR32(chip->PCRTC, 0x800, start);
1819*4882a593Smuzhiyun }
1820*4882a593Smuzhiyun
SetStartAddress3(RIVA_HW_INST * chip,unsigned start)1821*4882a593Smuzhiyun static void SetStartAddress3
1822*4882a593Smuzhiyun (
1823*4882a593Smuzhiyun RIVA_HW_INST *chip,
1824*4882a593Smuzhiyun unsigned start
1825*4882a593Smuzhiyun )
1826*4882a593Smuzhiyun {
1827*4882a593Smuzhiyun int offset = start >> 2;
1828*4882a593Smuzhiyun int pan = (start & 3) << 1;
1829*4882a593Smuzhiyun unsigned char tmp;
1830*4882a593Smuzhiyun
1831*4882a593Smuzhiyun /*
1832*4882a593Smuzhiyun * Unlock extended registers.
1833*4882a593Smuzhiyun */
1834*4882a593Smuzhiyun chip->LockUnlock(chip, 0);
1835*4882a593Smuzhiyun /*
1836*4882a593Smuzhiyun * Set start address.
1837*4882a593Smuzhiyun */
1838*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x3D4, 0x0D); VGA_WR08(chip->PCIO, 0x3D5, offset);
1839*4882a593Smuzhiyun offset >>= 8;
1840*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x3D4, 0x0C); VGA_WR08(chip->PCIO, 0x3D5, offset);
1841*4882a593Smuzhiyun offset >>= 8;
1842*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x3D4, 0x19); tmp = VGA_RD08(chip->PCIO, 0x3D5);
1843*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x3D5, (offset & 0x01F) | (tmp & ~0x1F));
1844*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x3D4, 0x2D); tmp = VGA_RD08(chip->PCIO, 0x3D5);
1845*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x3D5, (offset & 0x60) | (tmp & ~0x60));
1846*4882a593Smuzhiyun /*
1847*4882a593Smuzhiyun * 4 pixel pan register.
1848*4882a593Smuzhiyun */
1849*4882a593Smuzhiyun offset = VGA_RD08(chip->PCIO, chip->IO + 0x0A);
1850*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x3C0, 0x13);
1851*4882a593Smuzhiyun VGA_WR08(chip->PCIO, 0x3C0, pan);
1852*4882a593Smuzhiyun }
nv3SetSurfaces2D(RIVA_HW_INST * chip,unsigned surf0,unsigned surf1)1853*4882a593Smuzhiyun static void nv3SetSurfaces2D
1854*4882a593Smuzhiyun (
1855*4882a593Smuzhiyun RIVA_HW_INST *chip,
1856*4882a593Smuzhiyun unsigned surf0,
1857*4882a593Smuzhiyun unsigned surf1
1858*4882a593Smuzhiyun )
1859*4882a593Smuzhiyun {
1860*4882a593Smuzhiyun RivaSurface __iomem *Surface =
1861*4882a593Smuzhiyun (RivaSurface __iomem *)&(chip->FIFO[0x0000E000/4]);
1862*4882a593Smuzhiyun
1863*4882a593Smuzhiyun RIVA_FIFO_FREE(*chip,Tri03,5);
1864*4882a593Smuzhiyun NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000003);
1865*4882a593Smuzhiyun NV_WR32(&Surface->Offset, 0, surf0);
1866*4882a593Smuzhiyun NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000004);
1867*4882a593Smuzhiyun NV_WR32(&Surface->Offset, 0, surf1);
1868*4882a593Smuzhiyun NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000013);
1869*4882a593Smuzhiyun }
nv4SetSurfaces2D(RIVA_HW_INST * chip,unsigned surf0,unsigned surf1)1870*4882a593Smuzhiyun static void nv4SetSurfaces2D
1871*4882a593Smuzhiyun (
1872*4882a593Smuzhiyun RIVA_HW_INST *chip,
1873*4882a593Smuzhiyun unsigned surf0,
1874*4882a593Smuzhiyun unsigned surf1
1875*4882a593Smuzhiyun )
1876*4882a593Smuzhiyun {
1877*4882a593Smuzhiyun RivaSurface __iomem *Surface =
1878*4882a593Smuzhiyun (RivaSurface __iomem *)&(chip->FIFO[0x0000E000/4]);
1879*4882a593Smuzhiyun
1880*4882a593Smuzhiyun NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000003);
1881*4882a593Smuzhiyun NV_WR32(&Surface->Offset, 0, surf0);
1882*4882a593Smuzhiyun NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000004);
1883*4882a593Smuzhiyun NV_WR32(&Surface->Offset, 0, surf1);
1884*4882a593Smuzhiyun NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000014);
1885*4882a593Smuzhiyun }
nv10SetSurfaces2D(RIVA_HW_INST * chip,unsigned surf0,unsigned surf1)1886*4882a593Smuzhiyun static void nv10SetSurfaces2D
1887*4882a593Smuzhiyun (
1888*4882a593Smuzhiyun RIVA_HW_INST *chip,
1889*4882a593Smuzhiyun unsigned surf0,
1890*4882a593Smuzhiyun unsigned surf1
1891*4882a593Smuzhiyun )
1892*4882a593Smuzhiyun {
1893*4882a593Smuzhiyun RivaSurface __iomem *Surface =
1894*4882a593Smuzhiyun (RivaSurface __iomem *)&(chip->FIFO[0x0000E000/4]);
1895*4882a593Smuzhiyun
1896*4882a593Smuzhiyun NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000003);
1897*4882a593Smuzhiyun NV_WR32(&Surface->Offset, 0, surf0);
1898*4882a593Smuzhiyun NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000004);
1899*4882a593Smuzhiyun NV_WR32(&Surface->Offset, 0, surf1);
1900*4882a593Smuzhiyun NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000014);
1901*4882a593Smuzhiyun }
nv3SetSurfaces3D(RIVA_HW_INST * chip,unsigned surf0,unsigned surf1)1902*4882a593Smuzhiyun static void nv3SetSurfaces3D
1903*4882a593Smuzhiyun (
1904*4882a593Smuzhiyun RIVA_HW_INST *chip,
1905*4882a593Smuzhiyun unsigned surf0,
1906*4882a593Smuzhiyun unsigned surf1
1907*4882a593Smuzhiyun )
1908*4882a593Smuzhiyun {
1909*4882a593Smuzhiyun RivaSurface __iomem *Surface =
1910*4882a593Smuzhiyun (RivaSurface __iomem *)&(chip->FIFO[0x0000E000/4]);
1911*4882a593Smuzhiyun
1912*4882a593Smuzhiyun RIVA_FIFO_FREE(*chip,Tri03,5);
1913*4882a593Smuzhiyun NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000005);
1914*4882a593Smuzhiyun NV_WR32(&Surface->Offset, 0, surf0);
1915*4882a593Smuzhiyun NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000006);
1916*4882a593Smuzhiyun NV_WR32(&Surface->Offset, 0, surf1);
1917*4882a593Smuzhiyun NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000013);
1918*4882a593Smuzhiyun }
nv4SetSurfaces3D(RIVA_HW_INST * chip,unsigned surf0,unsigned surf1)1919*4882a593Smuzhiyun static void nv4SetSurfaces3D
1920*4882a593Smuzhiyun (
1921*4882a593Smuzhiyun RIVA_HW_INST *chip,
1922*4882a593Smuzhiyun unsigned surf0,
1923*4882a593Smuzhiyun unsigned surf1
1924*4882a593Smuzhiyun )
1925*4882a593Smuzhiyun {
1926*4882a593Smuzhiyun RivaSurface __iomem *Surface =
1927*4882a593Smuzhiyun (RivaSurface __iomem *)&(chip->FIFO[0x0000E000/4]);
1928*4882a593Smuzhiyun
1929*4882a593Smuzhiyun NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000005);
1930*4882a593Smuzhiyun NV_WR32(&Surface->Offset, 0, surf0);
1931*4882a593Smuzhiyun NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000006);
1932*4882a593Smuzhiyun NV_WR32(&Surface->Offset, 0, surf1);
1933*4882a593Smuzhiyun NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000014);
1934*4882a593Smuzhiyun }
nv10SetSurfaces3D(RIVA_HW_INST * chip,unsigned surf0,unsigned surf1)1935*4882a593Smuzhiyun static void nv10SetSurfaces3D
1936*4882a593Smuzhiyun (
1937*4882a593Smuzhiyun RIVA_HW_INST *chip,
1938*4882a593Smuzhiyun unsigned surf0,
1939*4882a593Smuzhiyun unsigned surf1
1940*4882a593Smuzhiyun )
1941*4882a593Smuzhiyun {
1942*4882a593Smuzhiyun RivaSurface3D __iomem *Surfaces3D =
1943*4882a593Smuzhiyun (RivaSurface3D __iomem *)&(chip->FIFO[0x0000E000/4]);
1944*4882a593Smuzhiyun
1945*4882a593Smuzhiyun RIVA_FIFO_FREE(*chip,Tri03,4);
1946*4882a593Smuzhiyun NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000007);
1947*4882a593Smuzhiyun NV_WR32(&Surfaces3D->RenderBufferOffset, 0, surf0);
1948*4882a593Smuzhiyun NV_WR32(&Surfaces3D->ZBufferOffset, 0, surf1);
1949*4882a593Smuzhiyun NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000014);
1950*4882a593Smuzhiyun }
1951*4882a593Smuzhiyun
1952*4882a593Smuzhiyun /****************************************************************************\
1953*4882a593Smuzhiyun * *
1954*4882a593Smuzhiyun * Probe RIVA Chip Configuration *
1955*4882a593Smuzhiyun * *
1956*4882a593Smuzhiyun \****************************************************************************/
1957*4882a593Smuzhiyun
nv3GetConfig(RIVA_HW_INST * chip)1958*4882a593Smuzhiyun static void nv3GetConfig
1959*4882a593Smuzhiyun (
1960*4882a593Smuzhiyun RIVA_HW_INST *chip
1961*4882a593Smuzhiyun )
1962*4882a593Smuzhiyun {
1963*4882a593Smuzhiyun /*
1964*4882a593Smuzhiyun * Fill in chip configuration.
1965*4882a593Smuzhiyun */
1966*4882a593Smuzhiyun if (NV_RD32(&chip->PFB[0x00000000/4], 0) & 0x00000020)
1967*4882a593Smuzhiyun {
1968*4882a593Smuzhiyun if (((NV_RD32(chip->PMC, 0x00000000) & 0xF0) == 0x20)
1969*4882a593Smuzhiyun && ((NV_RD32(chip->PMC, 0x00000000) & 0x0F) >= 0x02))
1970*4882a593Smuzhiyun {
1971*4882a593Smuzhiyun /*
1972*4882a593Smuzhiyun * SDRAM 128 ZX.
1973*4882a593Smuzhiyun */
1974*4882a593Smuzhiyun chip->RamBandwidthKBytesPerSec = 800000;
1975*4882a593Smuzhiyun switch (NV_RD32(chip->PFB, 0x00000000) & 0x03)
1976*4882a593Smuzhiyun {
1977*4882a593Smuzhiyun case 2:
1978*4882a593Smuzhiyun chip->RamAmountKBytes = 1024 * 4;
1979*4882a593Smuzhiyun break;
1980*4882a593Smuzhiyun case 1:
1981*4882a593Smuzhiyun chip->RamAmountKBytes = 1024 * 2;
1982*4882a593Smuzhiyun break;
1983*4882a593Smuzhiyun default:
1984*4882a593Smuzhiyun chip->RamAmountKBytes = 1024 * 8;
1985*4882a593Smuzhiyun break;
1986*4882a593Smuzhiyun }
1987*4882a593Smuzhiyun }
1988*4882a593Smuzhiyun else
1989*4882a593Smuzhiyun {
1990*4882a593Smuzhiyun chip->RamBandwidthKBytesPerSec = 1000000;
1991*4882a593Smuzhiyun chip->RamAmountKBytes = 1024 * 8;
1992*4882a593Smuzhiyun }
1993*4882a593Smuzhiyun }
1994*4882a593Smuzhiyun else
1995*4882a593Smuzhiyun {
1996*4882a593Smuzhiyun /*
1997*4882a593Smuzhiyun * SGRAM 128.
1998*4882a593Smuzhiyun */
1999*4882a593Smuzhiyun chip->RamBandwidthKBytesPerSec = 1000000;
2000*4882a593Smuzhiyun switch (NV_RD32(chip->PFB, 0x00000000) & 0x00000003)
2001*4882a593Smuzhiyun {
2002*4882a593Smuzhiyun case 0:
2003*4882a593Smuzhiyun chip->RamAmountKBytes = 1024 * 8;
2004*4882a593Smuzhiyun break;
2005*4882a593Smuzhiyun case 2:
2006*4882a593Smuzhiyun chip->RamAmountKBytes = 1024 * 4;
2007*4882a593Smuzhiyun break;
2008*4882a593Smuzhiyun default:
2009*4882a593Smuzhiyun chip->RamAmountKBytes = 1024 * 2;
2010*4882a593Smuzhiyun break;
2011*4882a593Smuzhiyun }
2012*4882a593Smuzhiyun }
2013*4882a593Smuzhiyun chip->CrystalFreqKHz = (NV_RD32(chip->PEXTDEV, 0x00000000) & 0x00000040) ? 14318 : 13500;
2014*4882a593Smuzhiyun chip->CURSOR = &(chip->PRAMIN[0x00008000/4 - 0x0800/4]);
2015*4882a593Smuzhiyun chip->VBlankBit = 0x00000100;
2016*4882a593Smuzhiyun chip->MaxVClockFreqKHz = 256000;
2017*4882a593Smuzhiyun /*
2018*4882a593Smuzhiyun * Set chip functions.
2019*4882a593Smuzhiyun */
2020*4882a593Smuzhiyun chip->Busy = nv3Busy;
2021*4882a593Smuzhiyun chip->ShowHideCursor = ShowHideCursor;
2022*4882a593Smuzhiyun chip->LoadStateExt = LoadStateExt;
2023*4882a593Smuzhiyun chip->UnloadStateExt = UnloadStateExt;
2024*4882a593Smuzhiyun chip->SetStartAddress = SetStartAddress3;
2025*4882a593Smuzhiyun chip->SetSurfaces2D = nv3SetSurfaces2D;
2026*4882a593Smuzhiyun chip->SetSurfaces3D = nv3SetSurfaces3D;
2027*4882a593Smuzhiyun chip->LockUnlock = nv3LockUnlock;
2028*4882a593Smuzhiyun }
nv4GetConfig(RIVA_HW_INST * chip)2029*4882a593Smuzhiyun static void nv4GetConfig
2030*4882a593Smuzhiyun (
2031*4882a593Smuzhiyun RIVA_HW_INST *chip
2032*4882a593Smuzhiyun )
2033*4882a593Smuzhiyun {
2034*4882a593Smuzhiyun /*
2035*4882a593Smuzhiyun * Fill in chip configuration.
2036*4882a593Smuzhiyun */
2037*4882a593Smuzhiyun if (NV_RD32(chip->PFB, 0x00000000) & 0x00000100)
2038*4882a593Smuzhiyun {
2039*4882a593Smuzhiyun chip->RamAmountKBytes = ((NV_RD32(chip->PFB, 0x00000000) >> 12) & 0x0F) * 1024 * 2
2040*4882a593Smuzhiyun + 1024 * 2;
2041*4882a593Smuzhiyun }
2042*4882a593Smuzhiyun else
2043*4882a593Smuzhiyun {
2044*4882a593Smuzhiyun switch (NV_RD32(chip->PFB, 0x00000000) & 0x00000003)
2045*4882a593Smuzhiyun {
2046*4882a593Smuzhiyun case 0:
2047*4882a593Smuzhiyun chip->RamAmountKBytes = 1024 * 32;
2048*4882a593Smuzhiyun break;
2049*4882a593Smuzhiyun case 1:
2050*4882a593Smuzhiyun chip->RamAmountKBytes = 1024 * 4;
2051*4882a593Smuzhiyun break;
2052*4882a593Smuzhiyun case 2:
2053*4882a593Smuzhiyun chip->RamAmountKBytes = 1024 * 8;
2054*4882a593Smuzhiyun break;
2055*4882a593Smuzhiyun case 3:
2056*4882a593Smuzhiyun default:
2057*4882a593Smuzhiyun chip->RamAmountKBytes = 1024 * 16;
2058*4882a593Smuzhiyun break;
2059*4882a593Smuzhiyun }
2060*4882a593Smuzhiyun }
2061*4882a593Smuzhiyun switch ((NV_RD32(chip->PFB, 0x00000000) >> 3) & 0x00000003)
2062*4882a593Smuzhiyun {
2063*4882a593Smuzhiyun case 3:
2064*4882a593Smuzhiyun chip->RamBandwidthKBytesPerSec = 800000;
2065*4882a593Smuzhiyun break;
2066*4882a593Smuzhiyun default:
2067*4882a593Smuzhiyun chip->RamBandwidthKBytesPerSec = 1000000;
2068*4882a593Smuzhiyun break;
2069*4882a593Smuzhiyun }
2070*4882a593Smuzhiyun chip->CrystalFreqKHz = (NV_RD32(chip->PEXTDEV, 0x00000000) & 0x00000040) ? 14318 : 13500;
2071*4882a593Smuzhiyun chip->CURSOR = &(chip->PRAMIN[0x00010000/4 - 0x0800/4]);
2072*4882a593Smuzhiyun chip->VBlankBit = 0x00000001;
2073*4882a593Smuzhiyun chip->MaxVClockFreqKHz = 350000;
2074*4882a593Smuzhiyun /*
2075*4882a593Smuzhiyun * Set chip functions.
2076*4882a593Smuzhiyun */
2077*4882a593Smuzhiyun chip->Busy = nv4Busy;
2078*4882a593Smuzhiyun chip->ShowHideCursor = ShowHideCursor;
2079*4882a593Smuzhiyun chip->LoadStateExt = LoadStateExt;
2080*4882a593Smuzhiyun chip->UnloadStateExt = UnloadStateExt;
2081*4882a593Smuzhiyun chip->SetStartAddress = SetStartAddress;
2082*4882a593Smuzhiyun chip->SetSurfaces2D = nv4SetSurfaces2D;
2083*4882a593Smuzhiyun chip->SetSurfaces3D = nv4SetSurfaces3D;
2084*4882a593Smuzhiyun chip->LockUnlock = nv4LockUnlock;
2085*4882a593Smuzhiyun }
nv10GetConfig(RIVA_HW_INST * chip,struct pci_dev * pdev,unsigned int chipset)2086*4882a593Smuzhiyun static void nv10GetConfig
2087*4882a593Smuzhiyun (
2088*4882a593Smuzhiyun RIVA_HW_INST *chip,
2089*4882a593Smuzhiyun struct pci_dev *pdev,
2090*4882a593Smuzhiyun unsigned int chipset
2091*4882a593Smuzhiyun )
2092*4882a593Smuzhiyun {
2093*4882a593Smuzhiyun struct pci_dev* dev;
2094*4882a593Smuzhiyun int domain = pci_domain_nr(pdev->bus);
2095*4882a593Smuzhiyun u32 amt;
2096*4882a593Smuzhiyun
2097*4882a593Smuzhiyun #ifdef __BIG_ENDIAN
2098*4882a593Smuzhiyun /* turn on big endian register access */
2099*4882a593Smuzhiyun if(!(NV_RD32(chip->PMC, 0x00000004) & 0x01000001))
2100*4882a593Smuzhiyun NV_WR32(chip->PMC, 0x00000004, 0x01000001);
2101*4882a593Smuzhiyun #endif
2102*4882a593Smuzhiyun
2103*4882a593Smuzhiyun /*
2104*4882a593Smuzhiyun * Fill in chip configuration.
2105*4882a593Smuzhiyun */
2106*4882a593Smuzhiyun if(chipset == NV_CHIP_IGEFORCE2) {
2107*4882a593Smuzhiyun dev = pci_get_domain_bus_and_slot(domain, 0, 1);
2108*4882a593Smuzhiyun pci_read_config_dword(dev, 0x7C, &amt);
2109*4882a593Smuzhiyun pci_dev_put(dev);
2110*4882a593Smuzhiyun chip->RamAmountKBytes = (((amt >> 6) & 31) + 1) * 1024;
2111*4882a593Smuzhiyun } else if(chipset == NV_CHIP_0x01F0) {
2112*4882a593Smuzhiyun dev = pci_get_domain_bus_and_slot(domain, 0, 1);
2113*4882a593Smuzhiyun pci_read_config_dword(dev, 0x84, &amt);
2114*4882a593Smuzhiyun pci_dev_put(dev);
2115*4882a593Smuzhiyun chip->RamAmountKBytes = (((amt >> 4) & 127) + 1) * 1024;
2116*4882a593Smuzhiyun } else {
2117*4882a593Smuzhiyun switch ((NV_RD32(chip->PFB, 0x0000020C) >> 20) & 0x000000FF)
2118*4882a593Smuzhiyun {
2119*4882a593Smuzhiyun case 0x02:
2120*4882a593Smuzhiyun chip->RamAmountKBytes = 1024 * 2;
2121*4882a593Smuzhiyun break;
2122*4882a593Smuzhiyun case 0x04:
2123*4882a593Smuzhiyun chip->RamAmountKBytes = 1024 * 4;
2124*4882a593Smuzhiyun break;
2125*4882a593Smuzhiyun case 0x08:
2126*4882a593Smuzhiyun chip->RamAmountKBytes = 1024 * 8;
2127*4882a593Smuzhiyun break;
2128*4882a593Smuzhiyun case 0x10:
2129*4882a593Smuzhiyun chip->RamAmountKBytes = 1024 * 16;
2130*4882a593Smuzhiyun break;
2131*4882a593Smuzhiyun case 0x20:
2132*4882a593Smuzhiyun chip->RamAmountKBytes = 1024 * 32;
2133*4882a593Smuzhiyun break;
2134*4882a593Smuzhiyun case 0x40:
2135*4882a593Smuzhiyun chip->RamAmountKBytes = 1024 * 64;
2136*4882a593Smuzhiyun break;
2137*4882a593Smuzhiyun case 0x80:
2138*4882a593Smuzhiyun chip->RamAmountKBytes = 1024 * 128;
2139*4882a593Smuzhiyun break;
2140*4882a593Smuzhiyun default:
2141*4882a593Smuzhiyun chip->RamAmountKBytes = 1024 * 16;
2142*4882a593Smuzhiyun break;
2143*4882a593Smuzhiyun }
2144*4882a593Smuzhiyun }
2145*4882a593Smuzhiyun switch ((NV_RD32(chip->PFB, 0x00000000) >> 3) & 0x00000003)
2146*4882a593Smuzhiyun {
2147*4882a593Smuzhiyun case 3:
2148*4882a593Smuzhiyun chip->RamBandwidthKBytesPerSec = 800000;
2149*4882a593Smuzhiyun break;
2150*4882a593Smuzhiyun default:
2151*4882a593Smuzhiyun chip->RamBandwidthKBytesPerSec = 1000000;
2152*4882a593Smuzhiyun break;
2153*4882a593Smuzhiyun }
2154*4882a593Smuzhiyun chip->CrystalFreqKHz = (NV_RD32(chip->PEXTDEV, 0x0000) & (1 << 6)) ?
2155*4882a593Smuzhiyun 14318 : 13500;
2156*4882a593Smuzhiyun
2157*4882a593Smuzhiyun switch (chipset & 0x0ff0) {
2158*4882a593Smuzhiyun case 0x0170:
2159*4882a593Smuzhiyun case 0x0180:
2160*4882a593Smuzhiyun case 0x01F0:
2161*4882a593Smuzhiyun case 0x0250:
2162*4882a593Smuzhiyun case 0x0280:
2163*4882a593Smuzhiyun case 0x0300:
2164*4882a593Smuzhiyun case 0x0310:
2165*4882a593Smuzhiyun case 0x0320:
2166*4882a593Smuzhiyun case 0x0330:
2167*4882a593Smuzhiyun case 0x0340:
2168*4882a593Smuzhiyun if(NV_RD32(chip->PEXTDEV, 0x0000) & (1 << 22))
2169*4882a593Smuzhiyun chip->CrystalFreqKHz = 27000;
2170*4882a593Smuzhiyun break;
2171*4882a593Smuzhiyun default:
2172*4882a593Smuzhiyun break;
2173*4882a593Smuzhiyun }
2174*4882a593Smuzhiyun
2175*4882a593Smuzhiyun chip->CursorStart = (chip->RamAmountKBytes - 128) * 1024;
2176*4882a593Smuzhiyun chip->CURSOR = NULL; /* can't set this here */
2177*4882a593Smuzhiyun chip->VBlankBit = 0x00000001;
2178*4882a593Smuzhiyun chip->MaxVClockFreqKHz = 350000;
2179*4882a593Smuzhiyun /*
2180*4882a593Smuzhiyun * Set chip functions.
2181*4882a593Smuzhiyun */
2182*4882a593Smuzhiyun chip->Busy = nv10Busy;
2183*4882a593Smuzhiyun chip->ShowHideCursor = ShowHideCursor;
2184*4882a593Smuzhiyun chip->LoadStateExt = LoadStateExt;
2185*4882a593Smuzhiyun chip->UnloadStateExt = UnloadStateExt;
2186*4882a593Smuzhiyun chip->SetStartAddress = SetStartAddress;
2187*4882a593Smuzhiyun chip->SetSurfaces2D = nv10SetSurfaces2D;
2188*4882a593Smuzhiyun chip->SetSurfaces3D = nv10SetSurfaces3D;
2189*4882a593Smuzhiyun chip->LockUnlock = nv4LockUnlock;
2190*4882a593Smuzhiyun
2191*4882a593Smuzhiyun switch(chipset & 0x0ff0) {
2192*4882a593Smuzhiyun case 0x0110:
2193*4882a593Smuzhiyun case 0x0170:
2194*4882a593Smuzhiyun case 0x0180:
2195*4882a593Smuzhiyun case 0x01F0:
2196*4882a593Smuzhiyun case 0x0250:
2197*4882a593Smuzhiyun case 0x0280:
2198*4882a593Smuzhiyun case 0x0300:
2199*4882a593Smuzhiyun case 0x0310:
2200*4882a593Smuzhiyun case 0x0320:
2201*4882a593Smuzhiyun case 0x0330:
2202*4882a593Smuzhiyun case 0x0340:
2203*4882a593Smuzhiyun chip->twoHeads = TRUE;
2204*4882a593Smuzhiyun break;
2205*4882a593Smuzhiyun default:
2206*4882a593Smuzhiyun chip->twoHeads = FALSE;
2207*4882a593Smuzhiyun break;
2208*4882a593Smuzhiyun }
2209*4882a593Smuzhiyun }
RivaGetConfig(RIVA_HW_INST * chip,struct pci_dev * pdev,unsigned int chipset)2210*4882a593Smuzhiyun int RivaGetConfig
2211*4882a593Smuzhiyun (
2212*4882a593Smuzhiyun RIVA_HW_INST *chip,
2213*4882a593Smuzhiyun struct pci_dev *pdev,
2214*4882a593Smuzhiyun unsigned int chipset
2215*4882a593Smuzhiyun )
2216*4882a593Smuzhiyun {
2217*4882a593Smuzhiyun /*
2218*4882a593Smuzhiyun * Save this so future SW know whats it's dealing with.
2219*4882a593Smuzhiyun */
2220*4882a593Smuzhiyun chip->Version = RIVA_SW_VERSION;
2221*4882a593Smuzhiyun /*
2222*4882a593Smuzhiyun * Chip specific configuration.
2223*4882a593Smuzhiyun */
2224*4882a593Smuzhiyun switch (chip->Architecture)
2225*4882a593Smuzhiyun {
2226*4882a593Smuzhiyun case NV_ARCH_03:
2227*4882a593Smuzhiyun nv3GetConfig(chip);
2228*4882a593Smuzhiyun break;
2229*4882a593Smuzhiyun case NV_ARCH_04:
2230*4882a593Smuzhiyun nv4GetConfig(chip);
2231*4882a593Smuzhiyun break;
2232*4882a593Smuzhiyun case NV_ARCH_10:
2233*4882a593Smuzhiyun case NV_ARCH_20:
2234*4882a593Smuzhiyun case NV_ARCH_30:
2235*4882a593Smuzhiyun nv10GetConfig(chip, pdev, chipset);
2236*4882a593Smuzhiyun break;
2237*4882a593Smuzhiyun default:
2238*4882a593Smuzhiyun return (-1);
2239*4882a593Smuzhiyun }
2240*4882a593Smuzhiyun chip->Chipset = chipset;
2241*4882a593Smuzhiyun /*
2242*4882a593Smuzhiyun * Fill in FIFO pointers.
2243*4882a593Smuzhiyun */
2244*4882a593Smuzhiyun chip->Rop = (RivaRop __iomem *)&(chip->FIFO[0x00000000/4]);
2245*4882a593Smuzhiyun chip->Clip = (RivaClip __iomem *)&(chip->FIFO[0x00002000/4]);
2246*4882a593Smuzhiyun chip->Patt = (RivaPattern __iomem *)&(chip->FIFO[0x00004000/4]);
2247*4882a593Smuzhiyun chip->Pixmap = (RivaPixmap __iomem *)&(chip->FIFO[0x00006000/4]);
2248*4882a593Smuzhiyun chip->Blt = (RivaScreenBlt __iomem *)&(chip->FIFO[0x00008000/4]);
2249*4882a593Smuzhiyun chip->Bitmap = (RivaBitmap __iomem *)&(chip->FIFO[0x0000A000/4]);
2250*4882a593Smuzhiyun chip->Line = (RivaLine __iomem *)&(chip->FIFO[0x0000C000/4]);
2251*4882a593Smuzhiyun chip->Tri03 = (RivaTexturedTriangle03 __iomem *)&(chip->FIFO[0x0000E000/4]);
2252*4882a593Smuzhiyun return (0);
2253*4882a593Smuzhiyun }
2254*4882a593Smuzhiyun
2255