xref: /openbmc/linux/drivers/video/fbdev/riva/riva_hw.c (revision 5c7ddcc8)
1  /***************************************************************************\
2 |*                                                                           *|
3 |*       Copyright 1993-1999 NVIDIA, Corporation.  All rights reserved.      *|
4 |*                                                                           *|
5 |*     NOTICE TO USER:   The source code  is copyrighted under  U.S. and     *|
6 |*     international laws.  Users and possessors of this source code are     *|
7 |*     hereby granted a nonexclusive,  royalty-free copyright license to     *|
8 |*     use this code in individual and commercial software.                  *|
9 |*                                                                           *|
10 |*     Any use of this source code must include,  in the user documenta-     *|
11 |*     tion and  internal comments to the code,  notices to the end user     *|
12 |*     as follows:                                                           *|
13 |*                                                                           *|
14 |*       Copyright 1993-1999 NVIDIA, Corporation.  All rights reserved.      *|
15 |*                                                                           *|
16 |*     NVIDIA, CORPORATION MAKES NO REPRESENTATION ABOUT THE SUITABILITY     *|
17 |*     OF  THIS SOURCE  CODE  FOR ANY PURPOSE.  IT IS  PROVIDED  "AS IS"     *|
18 |*     WITHOUT EXPRESS OR IMPLIED WARRANTY OF ANY KIND.  NVIDIA, CORPOR-     *|
19 |*     ATION DISCLAIMS ALL WARRANTIES  WITH REGARD  TO THIS SOURCE CODE,     *|
20 |*     INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY, NONINFRINGE-     *|
21 |*     MENT,  AND FITNESS  FOR A PARTICULAR PURPOSE.   IN NO EVENT SHALL     *|
22 |*     NVIDIA, CORPORATION  BE LIABLE FOR ANY SPECIAL,  INDIRECT,  INCI-     *|
23 |*     DENTAL, OR CONSEQUENTIAL DAMAGES,  OR ANY DAMAGES  WHATSOEVER RE-     *|
24 |*     SULTING FROM LOSS OF USE,  DATA OR PROFITS,  WHETHER IN AN ACTION     *|
25 |*     OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION,  ARISING OUT OF     *|
26 |*     OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOURCE CODE.     *|
27 |*                                                                           *|
28 |*     U.S. Government  End  Users.   This source code  is a "commercial     *|
29 |*     item,"  as that  term is  defined at  48 C.F.R. 2.101 (OCT 1995),     *|
30 |*     consisting  of "commercial  computer  software"  and  "commercial     *|
31 |*     computer  software  documentation,"  as such  terms  are  used in     *|
32 |*     48 C.F.R. 12.212 (SEPT 1995)  and is provided to the U.S. Govern-     *|
33 |*     ment only as  a commercial end item.   Consistent with  48 C.F.R.     *|
34 |*     12.212 and  48 C.F.R. 227.7202-1 through  227.7202-4 (JUNE 1995),     *|
35 |*     all U.S. Government End Users  acquire the source code  with only     *|
36 |*     those rights set forth herein.                                        *|
37 |*                                                                           *|
38  \***************************************************************************/
39 
40 /*
41  * GPL licensing note -- nVidia is allowing a liberal interpretation of
42  * the documentation restriction above, to merely say that this nVidia's
43  * copyright and disclaimer should be included with all code derived
44  * from this source.  -- Jeff Garzik <jgarzik@pobox.com>, 01/Nov/99
45  */
46 
47 /* $XFree86: xc/programs/Xserver/hw/xfree86/drivers/nv/riva_hw.c,v 1.33 2002/08/05 20:47:06 mvojkovi Exp $ */
48 
49 #include <linux/kernel.h>
50 #include <linux/pci.h>
51 #include <linux/pci_ids.h>
52 #include "riva_hw.h"
53 #include "riva_tbl.h"
54 #include "nv_type.h"
55 
56 /*
57  * This file is an OS-agnostic file used to make RIVA 128 and RIVA TNT
58  * operate identically (except TNT has more memory and better 3D quality.
59  */
nv3Busy(RIVA_HW_INST * chip)60 static int nv3Busy
61 (
62     RIVA_HW_INST *chip
63 )
64 {
65     return ((NV_RD32(&chip->Rop->FifoFree, 0) < chip->FifoEmptyCount) ||
66 	    NV_RD32(&chip->PGRAPH[0x000006B0/4], 0) & 0x01);
67 }
nv4Busy(RIVA_HW_INST * chip)68 static int nv4Busy
69 (
70     RIVA_HW_INST *chip
71 )
72 {
73     return ((NV_RD32(&chip->Rop->FifoFree, 0) < chip->FifoEmptyCount) ||
74 	    NV_RD32(&chip->PGRAPH[0x00000700/4], 0) & 0x01);
75 }
nv10Busy(RIVA_HW_INST * chip)76 static int nv10Busy
77 (
78     RIVA_HW_INST *chip
79 )
80 {
81     return ((NV_RD32(&chip->Rop->FifoFree, 0) < chip->FifoEmptyCount) ||
82 	    NV_RD32(&chip->PGRAPH[0x00000700/4], 0) & 0x01);
83 }
84 
vgaLockUnlock(RIVA_HW_INST * chip,int Lock)85 static void vgaLockUnlock
86 (
87     RIVA_HW_INST *chip,
88     int           Lock
89 )
90 {
91     U008 cr11;
92     VGA_WR08(chip->PCIO, 0x3D4, 0x11);
93     cr11 = VGA_RD08(chip->PCIO, 0x3D5);
94     if(Lock) cr11 |= 0x80;
95     else cr11 &= ~0x80;
96     VGA_WR08(chip->PCIO, 0x3D5, cr11);
97 }
nv3LockUnlock(RIVA_HW_INST * chip,int Lock)98 static void nv3LockUnlock
99 (
100     RIVA_HW_INST *chip,
101     int           Lock
102 )
103 {
104     VGA_WR08(chip->PVIO, 0x3C4, 0x06);
105     VGA_WR08(chip->PVIO, 0x3C5, Lock ? 0x99 : 0x57);
106     vgaLockUnlock(chip, Lock);
107 }
nv4LockUnlock(RIVA_HW_INST * chip,int Lock)108 static void nv4LockUnlock
109 (
110     RIVA_HW_INST *chip,
111     int           Lock
112 )
113 {
114     VGA_WR08(chip->PCIO, 0x3D4, 0x1F);
115     VGA_WR08(chip->PCIO, 0x3D5, Lock ? 0x99 : 0x57);
116     vgaLockUnlock(chip, Lock);
117 }
118 
ShowHideCursor(RIVA_HW_INST * chip,int ShowHide)119 static int ShowHideCursor
120 (
121     RIVA_HW_INST *chip,
122     int           ShowHide
123 )
124 {
125     int cursor;
126     cursor                      =  chip->CurrentState->cursor1;
127     chip->CurrentState->cursor1 = (chip->CurrentState->cursor1 & 0xFE) |
128                                   (ShowHide & 0x01);
129     VGA_WR08(chip->PCIO, 0x3D4, 0x31);
130     VGA_WR08(chip->PCIO, 0x3D5, chip->CurrentState->cursor1);
131     return (cursor & 0x01);
132 }
133 
134 /****************************************************************************\
135 *                                                                            *
136 * The video arbitration routines calculate some "magic" numbers.  Fixes      *
137 * the snow seen when accessing the framebuffer without it.                   *
138 * It just works (I hope).                                                    *
139 *                                                                            *
140 \****************************************************************************/
141 
142 #define DEFAULT_GR_LWM 100
143 #define DEFAULT_VID_LWM 100
144 #define DEFAULT_GR_BURST_SIZE 256
145 #define DEFAULT_VID_BURST_SIZE 128
146 #define VIDEO		0
147 #define GRAPHICS	1
148 #define MPORT		2
149 #define ENGINE		3
150 #define GFIFO_SIZE	320
151 #define GFIFO_SIZE_128	256
152 #define MFIFO_SIZE	120
153 #define VFIFO_SIZE	256
154 
155 typedef struct {
156   int gdrain_rate;
157   int vdrain_rate;
158   int mdrain_rate;
159   int gburst_size;
160   int vburst_size;
161   char vid_en;
162   char gr_en;
163   int wcmocc, wcgocc, wcvocc, wcvlwm, wcglwm;
164   int by_gfacc;
165   char vid_only_once;
166   char gr_only_once;
167   char first_vacc;
168   char first_gacc;
169   char first_macc;
170   int vocc;
171   int gocc;
172   int mocc;
173   char cur;
174   char engine_en;
175   char converged;
176   int priority;
177 } nv3_arb_info;
178 typedef struct {
179   int graphics_lwm;
180   int video_lwm;
181   int graphics_burst_size;
182   int video_burst_size;
183   int graphics_hi_priority;
184   int media_hi_priority;
185   int rtl_values;
186   int valid;
187 } nv3_fifo_info;
188 typedef struct {
189   char pix_bpp;
190   char enable_video;
191   char gr_during_vid;
192   char enable_mp;
193   int memory_width;
194   int video_scale;
195   int pclk_khz;
196   int mclk_khz;
197   int mem_page_miss;
198   int mem_latency;
199   char mem_aligned;
200 } nv3_sim_state;
201 typedef struct {
202   int graphics_lwm;
203   int video_lwm;
204   int graphics_burst_size;
205   int video_burst_size;
206   int valid;
207 } nv4_fifo_info;
208 typedef struct {
209   int pclk_khz;
210   int mclk_khz;
211   int nvclk_khz;
212   char mem_page_miss;
213   char mem_latency;
214   int memory_width;
215   char enable_video;
216   char gr_during_vid;
217   char pix_bpp;
218   char mem_aligned;
219   char enable_mp;
220 } nv4_sim_state;
221 typedef struct {
222   int graphics_lwm;
223   int video_lwm;
224   int graphics_burst_size;
225   int video_burst_size;
226   int valid;
227 } nv10_fifo_info;
228 typedef struct {
229   int pclk_khz;
230   int mclk_khz;
231   int nvclk_khz;
232   char mem_page_miss;
233   char mem_latency;
234   u32 memory_type;
235   int memory_width;
236   char enable_video;
237   char gr_during_vid;
238   char pix_bpp;
239   char mem_aligned;
240   char enable_mp;
241 } nv10_sim_state;
nv3_iterate(nv3_fifo_info * res_info,nv3_sim_state * state,nv3_arb_info * ainfo)242 static int nv3_iterate(nv3_fifo_info *res_info, nv3_sim_state * state, nv3_arb_info *ainfo)
243 {
244     int iter = 0;
245     int tmp;
246     int vfsize, mfsize, gfsize;
247     int mburst_size = 32;
248     int mmisses, gmisses, vmisses;
249     int misses;
250     int vlwm, glwm;
251     int last, next, cur;
252     int max_gfsize ;
253     long ns;
254 
255     vlwm = 0;
256     glwm = 0;
257     vfsize = 0;
258     gfsize = 0;
259     cur = ainfo->cur;
260     mmisses = 2;
261     gmisses = 2;
262     vmisses = 2;
263     if (ainfo->gburst_size == 128) max_gfsize = GFIFO_SIZE_128;
264     else  max_gfsize = GFIFO_SIZE;
265     max_gfsize = GFIFO_SIZE;
266     while (1)
267     {
268         if (ainfo->vid_en)
269         {
270             if (ainfo->wcvocc > ainfo->vocc) ainfo->wcvocc = ainfo->vocc;
271             if (ainfo->wcvlwm > vlwm) ainfo->wcvlwm = vlwm ;
272             ns = 1000000 * ainfo->vburst_size/(state->memory_width/8)/state->mclk_khz;
273             vfsize = ns * ainfo->vdrain_rate / 1000000;
274             vfsize =  ainfo->wcvlwm - ainfo->vburst_size + vfsize;
275         }
276         if (state->enable_mp)
277         {
278             if (ainfo->wcmocc > ainfo->mocc) ainfo->wcmocc = ainfo->mocc;
279         }
280         if (ainfo->gr_en)
281         {
282             if (ainfo->wcglwm > glwm) ainfo->wcglwm = glwm ;
283             if (ainfo->wcgocc > ainfo->gocc) ainfo->wcgocc = ainfo->gocc;
284             ns = 1000000 * (ainfo->gburst_size/(state->memory_width/8))/state->mclk_khz;
285             gfsize = (ns * (long) ainfo->gdrain_rate)/1000000;
286             gfsize = ainfo->wcglwm - ainfo->gburst_size + gfsize;
287         }
288         mfsize = 0;
289         if (!state->gr_during_vid && ainfo->vid_en)
290             if (ainfo->vid_en && (ainfo->vocc < 0) && !ainfo->vid_only_once)
291                 next = VIDEO;
292             else if (ainfo->mocc < 0)
293                 next = MPORT;
294             else if (ainfo->gocc< ainfo->by_gfacc)
295                 next = GRAPHICS;
296             else return (0);
297         else switch (ainfo->priority)
298             {
299                 case VIDEO:
300                     if (ainfo->vid_en && ainfo->vocc<0 && !ainfo->vid_only_once)
301                         next = VIDEO;
302                     else if (ainfo->gr_en && ainfo->gocc<0 && !ainfo->gr_only_once)
303                         next = GRAPHICS;
304                     else if (ainfo->mocc<0)
305                         next = MPORT;
306                     else    return (0);
307                     break;
308                 case GRAPHICS:
309                     if (ainfo->gr_en && ainfo->gocc<0 && !ainfo->gr_only_once)
310                         next = GRAPHICS;
311                     else if (ainfo->vid_en && ainfo->vocc<0 && !ainfo->vid_only_once)
312                         next = VIDEO;
313                     else if (ainfo->mocc<0)
314                         next = MPORT;
315                     else    return (0);
316                     break;
317                 default:
318                     if (ainfo->mocc<0)
319                         next = MPORT;
320                     else if (ainfo->gr_en && ainfo->gocc<0 && !ainfo->gr_only_once)
321                         next = GRAPHICS;
322                     else if (ainfo->vid_en && ainfo->vocc<0 && !ainfo->vid_only_once)
323                         next = VIDEO;
324                     else    return (0);
325                     break;
326             }
327         last = cur;
328         cur = next;
329         iter++;
330         switch (cur)
331         {
332             case VIDEO:
333                 if (last==cur)    misses = 0;
334                 else if (ainfo->first_vacc)   misses = vmisses;
335                 else    misses = 1;
336                 ainfo->first_vacc = 0;
337                 if (last!=cur)
338                 {
339                     ns =  1000000 * (vmisses*state->mem_page_miss + state->mem_latency)/state->mclk_khz;
340                     vlwm = ns * ainfo->vdrain_rate/ 1000000;
341                     vlwm = ainfo->vocc - vlwm;
342                 }
343                 ns = 1000000*(misses*state->mem_page_miss + ainfo->vburst_size)/(state->memory_width/8)/state->mclk_khz;
344                 ainfo->vocc = ainfo->vocc + ainfo->vburst_size - ns*ainfo->vdrain_rate/1000000;
345                 ainfo->gocc = ainfo->gocc - ns*ainfo->gdrain_rate/1000000;
346                 ainfo->mocc = ainfo->mocc - ns*ainfo->mdrain_rate/1000000;
347                 break;
348             case GRAPHICS:
349                 if (last==cur)    misses = 0;
350                 else if (ainfo->first_gacc)   misses = gmisses;
351                 else    misses = 1;
352                 ainfo->first_gacc = 0;
353                 if (last!=cur)
354                 {
355                     ns = 1000000*(gmisses*state->mem_page_miss + state->mem_latency)/state->mclk_khz ;
356                     glwm = ns * ainfo->gdrain_rate/1000000;
357                     glwm = ainfo->gocc - glwm;
358                 }
359                 ns = 1000000*(misses*state->mem_page_miss + ainfo->gburst_size/(state->memory_width/8))/state->mclk_khz;
360                 ainfo->vocc = ainfo->vocc + 0 - ns*ainfo->vdrain_rate/1000000;
361                 ainfo->gocc = ainfo->gocc + ainfo->gburst_size - ns*ainfo->gdrain_rate/1000000;
362                 ainfo->mocc = ainfo->mocc + 0 - ns*ainfo->mdrain_rate/1000000;
363                 break;
364             default:
365                 if (last==cur)    misses = 0;
366                 else if (ainfo->first_macc)   misses = mmisses;
367                 else    misses = 1;
368                 ainfo->first_macc = 0;
369                 ns = 1000000*(misses*state->mem_page_miss + mburst_size/(state->memory_width/8))/state->mclk_khz;
370                 ainfo->vocc = ainfo->vocc + 0 - ns*ainfo->vdrain_rate/1000000;
371                 ainfo->gocc = ainfo->gocc + 0 - ns*ainfo->gdrain_rate/1000000;
372                 ainfo->mocc = ainfo->mocc + mburst_size - ns*ainfo->mdrain_rate/1000000;
373                 break;
374         }
375         if (iter>100)
376         {
377             ainfo->converged = 0;
378             return (1);
379         }
380         ns = 1000000*ainfo->gburst_size/(state->memory_width/8)/state->mclk_khz;
381         tmp = ns * ainfo->gdrain_rate/1000000;
382         if (abs(ainfo->gburst_size) + ((abs(ainfo->wcglwm) + 16 ) & ~0x7) - tmp > max_gfsize)
383         {
384             ainfo->converged = 0;
385             return (1);
386         }
387         ns = 1000000*ainfo->vburst_size/(state->memory_width/8)/state->mclk_khz;
388         tmp = ns * ainfo->vdrain_rate/1000000;
389         if (abs(ainfo->vburst_size) + (abs(ainfo->wcvlwm + 32) & ~0xf)  - tmp> VFIFO_SIZE)
390         {
391             ainfo->converged = 0;
392             return (1);
393         }
394         if (abs(ainfo->gocc) > max_gfsize)
395         {
396             ainfo->converged = 0;
397             return (1);
398         }
399         if (abs(ainfo->vocc) > VFIFO_SIZE)
400         {
401             ainfo->converged = 0;
402             return (1);
403         }
404         if (abs(ainfo->mocc) > MFIFO_SIZE)
405         {
406             ainfo->converged = 0;
407             return (1);
408         }
409         if (abs(vfsize) > VFIFO_SIZE)
410         {
411             ainfo->converged = 0;
412             return (1);
413         }
414         if (abs(gfsize) > max_gfsize)
415         {
416             ainfo->converged = 0;
417             return (1);
418         }
419         if (abs(mfsize) > MFIFO_SIZE)
420         {
421             ainfo->converged = 0;
422             return (1);
423         }
424     }
425 }
nv3_arb(nv3_fifo_info * res_info,nv3_sim_state * state,nv3_arb_info * ainfo)426 static char nv3_arb(nv3_fifo_info * res_info, nv3_sim_state * state,  nv3_arb_info *ainfo)
427 {
428     long ens, vns, mns, gns;
429     int mmisses, gmisses, vmisses, eburst_size, mburst_size;
430     int refresh_cycle;
431 
432     refresh_cycle = 2*(state->mclk_khz/state->pclk_khz) + 5;
433     mmisses = 2;
434     if (state->mem_aligned) gmisses = 2;
435     else    gmisses = 3;
436     vmisses = 2;
437     eburst_size = state->memory_width * 1;
438     mburst_size = 32;
439     gns = 1000000 * (gmisses*state->mem_page_miss + state->mem_latency)/state->mclk_khz;
440     ainfo->by_gfacc = gns*ainfo->gdrain_rate/1000000;
441     ainfo->wcmocc = 0;
442     ainfo->wcgocc = 0;
443     ainfo->wcvocc = 0;
444     ainfo->wcvlwm = 0;
445     ainfo->wcglwm = 0;
446     ainfo->engine_en = 1;
447     ainfo->converged = 1;
448     if (ainfo->engine_en)
449     {
450         ens =  1000000*(state->mem_page_miss + eburst_size/(state->memory_width/8) +refresh_cycle)/state->mclk_khz;
451         ainfo->mocc = state->enable_mp ? 0-ens*ainfo->mdrain_rate/1000000 : 0;
452         ainfo->vocc = ainfo->vid_en ? 0-ens*ainfo->vdrain_rate/1000000 : 0;
453         ainfo->gocc = ainfo->gr_en ? 0-ens*ainfo->gdrain_rate/1000000 : 0;
454         ainfo->cur = ENGINE;
455         ainfo->first_vacc = 1;
456         ainfo->first_gacc = 1;
457         ainfo->first_macc = 1;
458         nv3_iterate(res_info, state,ainfo);
459     }
460     if (state->enable_mp)
461     {
462         mns = 1000000 * (mmisses*state->mem_page_miss + mburst_size/(state->memory_width/8) + refresh_cycle)/state->mclk_khz;
463         ainfo->mocc = state->enable_mp ? 0 : mburst_size - mns*ainfo->mdrain_rate/1000000;
464         ainfo->vocc = ainfo->vid_en ? 0 : 0- mns*ainfo->vdrain_rate/1000000;
465         ainfo->gocc = ainfo->gr_en ? 0: 0- mns*ainfo->gdrain_rate/1000000;
466         ainfo->cur = MPORT;
467         ainfo->first_vacc = 1;
468         ainfo->first_gacc = 1;
469         ainfo->first_macc = 0;
470         nv3_iterate(res_info, state,ainfo);
471     }
472     if (ainfo->gr_en)
473     {
474         ainfo->first_vacc = 1;
475         ainfo->first_gacc = 0;
476         ainfo->first_macc = 1;
477         gns = 1000000*(gmisses*state->mem_page_miss + ainfo->gburst_size/(state->memory_width/8) + refresh_cycle)/state->mclk_khz;
478         ainfo->gocc = ainfo->gburst_size - gns*ainfo->gdrain_rate/1000000;
479         ainfo->vocc = ainfo->vid_en? 0-gns*ainfo->vdrain_rate/1000000 : 0;
480         ainfo->mocc = state->enable_mp ?  0-gns*ainfo->mdrain_rate/1000000: 0;
481         ainfo->cur = GRAPHICS;
482         nv3_iterate(res_info, state,ainfo);
483     }
484     if (ainfo->vid_en)
485     {
486         ainfo->first_vacc = 0;
487         ainfo->first_gacc = 1;
488         ainfo->first_macc = 1;
489         vns = 1000000*(vmisses*state->mem_page_miss + ainfo->vburst_size/(state->memory_width/8) + refresh_cycle)/state->mclk_khz;
490         ainfo->vocc = ainfo->vburst_size - vns*ainfo->vdrain_rate/1000000;
491         ainfo->gocc = ainfo->gr_en? (0-vns*ainfo->gdrain_rate/1000000) : 0;
492         ainfo->mocc = state->enable_mp? 0-vns*ainfo->mdrain_rate/1000000 :0 ;
493         ainfo->cur = VIDEO;
494         nv3_iterate(res_info, state, ainfo);
495     }
496     if (ainfo->converged)
497     {
498         res_info->graphics_lwm = (int)abs(ainfo->wcglwm) + 16;
499         res_info->video_lwm = (int)abs(ainfo->wcvlwm) + 32;
500         res_info->graphics_burst_size = ainfo->gburst_size;
501         res_info->video_burst_size = ainfo->vburst_size;
502         res_info->graphics_hi_priority = (ainfo->priority == GRAPHICS);
503         res_info->media_hi_priority = (ainfo->priority == MPORT);
504         if (res_info->video_lwm > 160)
505         {
506             res_info->graphics_lwm = 256;
507             res_info->video_lwm = 128;
508             res_info->graphics_burst_size = 64;
509             res_info->video_burst_size = 64;
510             res_info->graphics_hi_priority = 0;
511             res_info->media_hi_priority = 0;
512             ainfo->converged = 0;
513             return (0);
514         }
515         if (res_info->video_lwm > 128)
516         {
517             res_info->video_lwm = 128;
518         }
519         return (1);
520     }
521     else
522     {
523         res_info->graphics_lwm = 256;
524         res_info->video_lwm = 128;
525         res_info->graphics_burst_size = 64;
526         res_info->video_burst_size = 64;
527         res_info->graphics_hi_priority = 0;
528         res_info->media_hi_priority = 0;
529         return (0);
530     }
531 }
nv3_get_param(nv3_fifo_info * res_info,nv3_sim_state * state,nv3_arb_info * ainfo)532 static char nv3_get_param(nv3_fifo_info *res_info, nv3_sim_state * state, nv3_arb_info *ainfo)
533 {
534     int done, g,v, p;
535 
536     done = 0;
537     for (p=0; p < 2; p++)
538     {
539         for (g=128 ; g > 32; g= g>> 1)
540         {
541             for (v=128; v >=32; v = v>> 1)
542             {
543                 ainfo->priority = p;
544                 ainfo->gburst_size = g;
545                 ainfo->vburst_size = v;
546                 done = nv3_arb(res_info, state,ainfo);
547                 if (done && (g==128))
548                     if ((res_info->graphics_lwm + g) > 256)
549                         done = 0;
550                 if (done)
551                     goto Done;
552             }
553         }
554     }
555 
556  Done:
557     return done;
558 }
nv3CalcArbitration(nv3_fifo_info * res_info,nv3_sim_state * state)559 static void nv3CalcArbitration
560 (
561     nv3_fifo_info * res_info,
562     nv3_sim_state * state
563 )
564 {
565     nv3_fifo_info save_info;
566     nv3_arb_info ainfo;
567     char   res_gr, res_vid;
568 
569     ainfo.gr_en = 1;
570     ainfo.vid_en = state->enable_video;
571     ainfo.vid_only_once = 0;
572     ainfo.gr_only_once = 0;
573     ainfo.gdrain_rate = (int) state->pclk_khz * (state->pix_bpp/8);
574     ainfo.vdrain_rate = (int) state->pclk_khz * 2;
575     if (state->video_scale != 0)
576         ainfo.vdrain_rate = ainfo.vdrain_rate/state->video_scale;
577     ainfo.mdrain_rate = 33000;
578     res_info->rtl_values = 0;
579     if (!state->gr_during_vid && state->enable_video)
580     {
581         ainfo.gr_only_once = 1;
582         ainfo.gr_en = 1;
583         ainfo.gdrain_rate = 0;
584         res_vid = nv3_get_param(res_info, state,  &ainfo);
585         res_vid = ainfo.converged;
586         save_info.video_lwm = res_info->video_lwm;
587         save_info.video_burst_size = res_info->video_burst_size;
588         ainfo.vid_en = 1;
589         ainfo.vid_only_once = 1;
590         ainfo.gr_en = 1;
591         ainfo.gdrain_rate = (int) state->pclk_khz * (state->pix_bpp/8);
592         ainfo.vdrain_rate = 0;
593         res_gr = nv3_get_param(res_info, state,  &ainfo);
594         res_gr = ainfo.converged;
595         res_info->video_lwm = save_info.video_lwm;
596         res_info->video_burst_size = save_info.video_burst_size;
597         res_info->valid = res_gr & res_vid;
598     }
599     else
600     {
601         if (!ainfo.gr_en) ainfo.gdrain_rate = 0;
602         if (!ainfo.vid_en) ainfo.vdrain_rate = 0;
603         res_gr = nv3_get_param(res_info, state,  &ainfo);
604         res_info->valid = ainfo.converged;
605     }
606 }
nv3UpdateArbitrationSettings(unsigned VClk,unsigned pixelDepth,unsigned * burst,unsigned * lwm,RIVA_HW_INST * chip)607 static void nv3UpdateArbitrationSettings
608 (
609     unsigned      VClk,
610     unsigned      pixelDepth,
611     unsigned     *burst,
612     unsigned     *lwm,
613     RIVA_HW_INST *chip
614 )
615 {
616     nv3_fifo_info fifo_data;
617     nv3_sim_state sim_data;
618     unsigned int M, N, P, pll, MClk;
619 
620     pll = NV_RD32(&chip->PRAMDAC0[0x00000504/4], 0);
621     M = (pll >> 0) & 0xFF; N = (pll >> 8) & 0xFF; P = (pll >> 16) & 0x0F;
622     MClk = (N * chip->CrystalFreqKHz / M) >> P;
623     sim_data.pix_bpp        = (char)pixelDepth;
624     sim_data.enable_video   = 0;
625     sim_data.enable_mp      = 0;
626     sim_data.video_scale    = 1;
627     sim_data.memory_width   = (NV_RD32(&chip->PEXTDEV[0x00000000/4], 0) & 0x10) ?
628 	128 : 64;
629     sim_data.memory_width   = 128;
630 
631     sim_data.mem_latency    = 9;
632     sim_data.mem_aligned    = 1;
633     sim_data.mem_page_miss  = 11;
634     sim_data.gr_during_vid  = 0;
635     sim_data.pclk_khz       = VClk;
636     sim_data.mclk_khz       = MClk;
637     nv3CalcArbitration(&fifo_data, &sim_data);
638     if (fifo_data.valid)
639     {
640         int  b = fifo_data.graphics_burst_size >> 4;
641         *burst = 0;
642         while (b >>= 1)
643 	    (*burst)++;
644         *lwm   = fifo_data.graphics_lwm >> 3;
645     }
646     else
647     {
648         *lwm   = 0x24;
649         *burst = 0x2;
650     }
651 }
nv4CalcArbitration(nv4_fifo_info * fifo,nv4_sim_state * arb)652 static void nv4CalcArbitration
653 (
654     nv4_fifo_info *fifo,
655     nv4_sim_state *arb
656 )
657 {
658     int data, pagemiss, cas,width, video_enable, bpp;
659     int nvclks, mclks, pclks, vpagemiss, crtpagemiss, vbs;
660     int found, mclk_extra, mclk_loop, cbs, m1, p1;
661     int mclk_freq, pclk_freq, nvclk_freq, mp_enable;
662     int us_m, us_n, us_p, video_drain_rate, crtc_drain_rate;
663     int vpm_us, us_video, vlwm, video_fill_us, cpm_us, us_crt,clwm;
664 
665     fifo->valid = 1;
666     pclk_freq = arb->pclk_khz;
667     mclk_freq = arb->mclk_khz;
668     nvclk_freq = arb->nvclk_khz;
669     pagemiss = arb->mem_page_miss;
670     cas = arb->mem_latency;
671     width = arb->memory_width >> 6;
672     video_enable = arb->enable_video;
673     bpp = arb->pix_bpp;
674     mp_enable = arb->enable_mp;
675     clwm = 0;
676     vlwm = 0;
677     cbs = 128;
678     pclks = 2;
679     nvclks = 2;
680     nvclks += 2;
681     nvclks += 1;
682     mclks = 5;
683     mclks += 3;
684     mclks += 1;
685     mclks += cas;
686     mclks += 1;
687     mclks += 1;
688     mclks += 1;
689     mclks += 1;
690     mclk_extra = 3;
691     nvclks += 2;
692     nvclks += 1;
693     nvclks += 1;
694     nvclks += 1;
695     if (mp_enable)
696         mclks+=4;
697     nvclks += 0;
698     pclks += 0;
699     found = 0;
700     vbs = 0;
701     while (found != 1)
702     {
703         fifo->valid = 1;
704         found = 1;
705         mclk_loop = mclks+mclk_extra;
706         us_m = mclk_loop *1000*1000 / mclk_freq;
707         us_n = nvclks*1000*1000 / nvclk_freq;
708         us_p = nvclks*1000*1000 / pclk_freq;
709         if (video_enable)
710         {
711             video_drain_rate = pclk_freq * 2;
712             crtc_drain_rate = pclk_freq * bpp/8;
713             vpagemiss = 2;
714             vpagemiss += 1;
715             crtpagemiss = 2;
716             vpm_us = (vpagemiss * pagemiss)*1000*1000/mclk_freq;
717             if (nvclk_freq * 2 > mclk_freq * width)
718                 video_fill_us = cbs*1000*1000 / 16 / nvclk_freq ;
719             else
720                 video_fill_us = cbs*1000*1000 / (8 * width) / mclk_freq;
721             us_video = vpm_us + us_m + us_n + us_p + video_fill_us;
722             vlwm = us_video * video_drain_rate/(1000*1000);
723             vlwm++;
724             vbs = 128;
725             if (vlwm > 128) vbs = 64;
726             if (vlwm > (256-64)) vbs = 32;
727             if (nvclk_freq * 2 > mclk_freq * width)
728                 video_fill_us = vbs *1000*1000/ 16 / nvclk_freq ;
729             else
730                 video_fill_us = vbs*1000*1000 / (8 * width) / mclk_freq;
731             cpm_us = crtpagemiss  * pagemiss *1000*1000/ mclk_freq;
732             us_crt =
733             us_video
734             +video_fill_us
735             +cpm_us
736             +us_m + us_n +us_p
737             ;
738             clwm = us_crt * crtc_drain_rate/(1000*1000);
739             clwm++;
740         }
741         else
742         {
743             crtc_drain_rate = pclk_freq * bpp/8;
744             crtpagemiss = 2;
745             crtpagemiss += 1;
746             cpm_us = crtpagemiss  * pagemiss *1000*1000/ mclk_freq;
747             us_crt =  cpm_us + us_m + us_n + us_p ;
748             clwm = us_crt * crtc_drain_rate/(1000*1000);
749             clwm++;
750         }
751         m1 = clwm + cbs - 512;
752         p1 = m1 * pclk_freq / mclk_freq;
753         p1 = p1 * bpp / 8;
754         if ((p1 < m1) && (m1 > 0))
755         {
756             fifo->valid = 0;
757             found = 0;
758             if (mclk_extra ==0)   found = 1;
759             mclk_extra--;
760         }
761         else if (video_enable)
762         {
763             if ((clwm > 511) || (vlwm > 255))
764             {
765                 fifo->valid = 0;
766                 found = 0;
767                 if (mclk_extra ==0)   found = 1;
768                 mclk_extra--;
769             }
770         }
771         else
772         {
773             if (clwm > 519)
774             {
775                 fifo->valid = 0;
776                 found = 0;
777                 if (mclk_extra ==0)   found = 1;
778                 mclk_extra--;
779             }
780         }
781         if (clwm < 384) clwm = 384;
782         if (vlwm < 128) vlwm = 128;
783         data = (int)(clwm);
784         fifo->graphics_lwm = data;
785         fifo->graphics_burst_size = 128;
786         data = (int)((vlwm+15));
787         fifo->video_lwm = data;
788         fifo->video_burst_size = vbs;
789     }
790 }
nv4UpdateArbitrationSettings(unsigned VClk,unsigned pixelDepth,unsigned * burst,unsigned * lwm,RIVA_HW_INST * chip)791 static void nv4UpdateArbitrationSettings
792 (
793     unsigned      VClk,
794     unsigned      pixelDepth,
795     unsigned     *burst,
796     unsigned     *lwm,
797     RIVA_HW_INST *chip
798 )
799 {
800     nv4_fifo_info fifo_data;
801     nv4_sim_state sim_data;
802     unsigned int M, N, P, pll, MClk, NVClk, cfg1;
803 
804     pll = NV_RD32(&chip->PRAMDAC0[0x00000504/4], 0);
805     M = (pll >> 0)  & 0xFF; N = (pll >> 8)  & 0xFF; P = (pll >> 16) & 0x0F;
806     MClk  = (N * chip->CrystalFreqKHz / M) >> P;
807     pll = NV_RD32(&chip->PRAMDAC0[0x00000500/4], 0);
808     M = (pll >> 0)  & 0xFF; N = (pll >> 8)  & 0xFF; P = (pll >> 16) & 0x0F;
809     NVClk  = (N * chip->CrystalFreqKHz / M) >> P;
810     cfg1 = NV_RD32(&chip->PFB[0x00000204/4], 0);
811     sim_data.pix_bpp        = (char)pixelDepth;
812     sim_data.enable_video   = 0;
813     sim_data.enable_mp      = 0;
814     sim_data.memory_width   = (NV_RD32(&chip->PEXTDEV[0x00000000/4], 0) & 0x10) ?
815 	128 : 64;
816     sim_data.mem_latency    = (char)cfg1 & 0x0F;
817     sim_data.mem_aligned    = 1;
818     sim_data.mem_page_miss  = (char)(((cfg1 >> 4) &0x0F) + ((cfg1 >> 31) & 0x01));
819     sim_data.gr_during_vid  = 0;
820     sim_data.pclk_khz       = VClk;
821     sim_data.mclk_khz       = MClk;
822     sim_data.nvclk_khz      = NVClk;
823     nv4CalcArbitration(&fifo_data, &sim_data);
824     if (fifo_data.valid)
825     {
826         int  b = fifo_data.graphics_burst_size >> 4;
827         *burst = 0;
828         while (b >>= 1)
829 	    (*burst)++;
830         *lwm   = fifo_data.graphics_lwm >> 3;
831     }
832 }
nv10CalcArbitration(nv10_fifo_info * fifo,nv10_sim_state * arb)833 static void nv10CalcArbitration
834 (
835     nv10_fifo_info *fifo,
836     nv10_sim_state *arb
837 )
838 {
839     int data, pagemiss, width, video_enable, bpp;
840     int nvclks, mclks, pclks, vpagemiss, crtpagemiss;
841     int nvclk_fill;
842     int found, mclk_extra, mclk_loop, cbs, m1;
843     int mclk_freq, pclk_freq, nvclk_freq, mp_enable;
844     int us_m, us_m_min, us_n, us_p, crtc_drain_rate;
845     int vus_m;
846     int vpm_us, us_video, cpm_us, us_crt,clwm;
847     int clwm_rnd_down;
848     int m2us, us_pipe_min, p1clk, p2;
849     int min_mclk_extra;
850     int us_min_mclk_extra;
851 
852     fifo->valid = 1;
853     pclk_freq = arb->pclk_khz; /* freq in KHz */
854     mclk_freq = arb->mclk_khz;
855     nvclk_freq = arb->nvclk_khz;
856     pagemiss = arb->mem_page_miss;
857     width = arb->memory_width/64;
858     video_enable = arb->enable_video;
859     bpp = arb->pix_bpp;
860     mp_enable = arb->enable_mp;
861     clwm = 0;
862 
863     cbs = 512;
864 
865     pclks = 4; /* lwm detect. */
866 
867     nvclks = 3; /* lwm -> sync. */
868     nvclks += 2; /* fbi bus cycles (1 req + 1 busy) */
869 
870     mclks  = 1;   /* 2 edge sync.  may be very close to edge so just put one. */
871 
872     mclks += 1;   /* arb_hp_req */
873     mclks += 5;   /* ap_hp_req   tiling pipeline */
874 
875     mclks += 2;    /* tc_req     latency fifo */
876     mclks += 2;    /* fb_cas_n_  memory request to fbio block */
877     mclks += 7;    /* sm_d_rdv   data returned from fbio block */
878 
879     /* fb.rd.d.Put_gc   need to accumulate 256 bits for read */
880     if (arb->memory_type == 0)
881       if (arb->memory_width == 64) /* 64 bit bus */
882         mclks += 4;
883       else
884         mclks += 2;
885     else
886       if (arb->memory_width == 64) /* 64 bit bus */
887         mclks += 2;
888       else
889         mclks += 1;
890 
891     if ((!video_enable) && (arb->memory_width == 128))
892     {
893       mclk_extra = (bpp == 32) ? 31 : 42; /* Margin of error */
894       min_mclk_extra = 17;
895     }
896     else
897     {
898       mclk_extra = (bpp == 32) ? 8 : 4; /* Margin of error */
899       /* mclk_extra = 4; */ /* Margin of error */
900       min_mclk_extra = 18;
901     }
902 
903     nvclks += 1; /* 2 edge sync.  may be very close to edge so just put one. */
904     nvclks += 1; /* fbi_d_rdv_n */
905     nvclks += 1; /* Fbi_d_rdata */
906     nvclks += 1; /* crtfifo load */
907 
908     if(mp_enable)
909       mclks+=4; /* Mp can get in with a burst of 8. */
910     /* Extra clocks determined by heuristics */
911 
912     nvclks += 0;
913     pclks += 0;
914     found = 0;
915     while(found != 1) {
916       fifo->valid = 1;
917       found = 1;
918       mclk_loop = mclks+mclk_extra;
919       us_m = mclk_loop *1000*1000 / mclk_freq; /* Mclk latency in us */
920       us_m_min = mclks * 1000*1000 / mclk_freq; /* Minimum Mclk latency in us */
921       us_min_mclk_extra = min_mclk_extra *1000*1000 / mclk_freq;
922       us_n = nvclks*1000*1000 / nvclk_freq;/* nvclk latency in us */
923       us_p = pclks*1000*1000 / pclk_freq;/* nvclk latency in us */
924       us_pipe_min = us_m_min + us_n + us_p;
925 
926       vus_m = mclk_loop *1000*1000 / mclk_freq; /* Mclk latency in us */
927 
928       if(video_enable) {
929         crtc_drain_rate = pclk_freq * bpp/8; /* MB/s */
930 
931         vpagemiss = 1; /* self generating page miss */
932         vpagemiss += 1; /* One higher priority before */
933 
934         crtpagemiss = 2; /* self generating page miss */
935         if(mp_enable)
936             crtpagemiss += 1; /* if MA0 conflict */
937 
938         vpm_us = (vpagemiss * pagemiss)*1000*1000/mclk_freq;
939 
940         us_video = vpm_us + vus_m; /* Video has separate read return path */
941 
942         cpm_us = crtpagemiss  * pagemiss *1000*1000/ mclk_freq;
943         us_crt =
944           us_video  /* Wait for video */
945           +cpm_us /* CRT Page miss */
946           +us_m + us_n +us_p /* other latency */
947           ;
948 
949         clwm = us_crt * crtc_drain_rate/(1000*1000);
950         clwm++; /* fixed point <= float_point - 1.  Fixes that */
951       } else {
952         crtc_drain_rate = pclk_freq * bpp/8; /* bpp * pclk/8 */
953 
954         crtpagemiss = 1; /* self generating page miss */
955         crtpagemiss += 1; /* MA0 page miss */
956         if(mp_enable)
957             crtpagemiss += 1; /* if MA0 conflict */
958         cpm_us = crtpagemiss  * pagemiss *1000*1000/ mclk_freq;
959         us_crt =  cpm_us + us_m + us_n + us_p ;
960         clwm = us_crt * crtc_drain_rate/(1000*1000);
961         clwm++; /* fixed point <= float_point - 1.  Fixes that */
962 
963   /*
964           //
965           // Another concern, only for high pclks so don't do this
966           // with video:
967           // What happens if the latency to fetch the cbs is so large that
968           // fifo empties.  In that case we need to have an alternate clwm value
969           // based off the total burst fetch
970           //
971           us_crt = (cbs * 1000 * 1000)/ (8*width)/mclk_freq ;
972           us_crt = us_crt + us_m + us_n + us_p + (4 * 1000 * 1000)/mclk_freq;
973           clwm_mt = us_crt * crtc_drain_rate/(1000*1000);
974           clwm_mt ++;
975           if(clwm_mt > clwm)
976               clwm = clwm_mt;
977   */
978           /* Finally, a heuristic check when width == 64 bits */
979           if(width == 1){
980               nvclk_fill = nvclk_freq * 8;
981               if(crtc_drain_rate * 100 >= nvclk_fill * 102)
982                       clwm = 0xfff; /*Large number to fail */
983 
984               else if(crtc_drain_rate * 100  >= nvclk_fill * 98) {
985                   clwm = 1024;
986                   cbs = 512;
987               }
988           }
989       }
990 
991 
992       /*
993         Overfill check:
994 
995         */
996 
997       clwm_rnd_down = ((int)clwm/8)*8;
998       if (clwm_rnd_down < clwm)
999           clwm += 8;
1000 
1001       m1 = clwm + cbs -  1024; /* Amount of overfill */
1002       m2us = us_pipe_min + us_min_mclk_extra;
1003 
1004       /* pclk cycles to drain */
1005       p1clk = m2us * pclk_freq/(1000*1000);
1006       p2 = p1clk * bpp / 8; /* bytes drained. */
1007 
1008       if((p2 < m1) && (m1 > 0)) {
1009           fifo->valid = 0;
1010           found = 0;
1011           if(min_mclk_extra == 0)   {
1012             if(cbs <= 32) {
1013               found = 1; /* Can't adjust anymore! */
1014             } else {
1015               cbs = cbs/2;  /* reduce the burst size */
1016             }
1017           } else {
1018             min_mclk_extra--;
1019           }
1020       } else {
1021         if (clwm > 1023){ /* Have some margin */
1022           fifo->valid = 0;
1023           found = 0;
1024           if(min_mclk_extra == 0)
1025               found = 1; /* Can't adjust anymore! */
1026           else
1027               min_mclk_extra--;
1028         }
1029       }
1030 
1031       if(clwm < (1024-cbs+8)) clwm = 1024-cbs+8;
1032       data = (int)(clwm);
1033       /*  printf("CRT LWM: %f bytes, prog: 0x%x, bs: 256\n", clwm, data ); */
1034       fifo->graphics_lwm = data;   fifo->graphics_burst_size = cbs;
1035 
1036       /*  printf("VID LWM: %f bytes, prog: 0x%x, bs: %d\n, ", vlwm, data, vbs ); */
1037       fifo->video_lwm = 1024;  fifo->video_burst_size = 512;
1038     }
1039 }
nv10UpdateArbitrationSettings(unsigned VClk,unsigned pixelDepth,unsigned * burst,unsigned * lwm,RIVA_HW_INST * chip)1040 static void nv10UpdateArbitrationSettings
1041 (
1042     unsigned      VClk,
1043     unsigned      pixelDepth,
1044     unsigned     *burst,
1045     unsigned     *lwm,
1046     RIVA_HW_INST *chip
1047 )
1048 {
1049     nv10_fifo_info fifo_data;
1050     nv10_sim_state sim_data;
1051     unsigned int M, N, P, pll, MClk, NVClk, cfg1;
1052 
1053     pll = NV_RD32(&chip->PRAMDAC0[0x00000504/4], 0);
1054     M = (pll >> 0)  & 0xFF; N = (pll >> 8)  & 0xFF; P = (pll >> 16) & 0x0F;
1055     MClk  = (N * chip->CrystalFreqKHz / M) >> P;
1056     pll = NV_RD32(&chip->PRAMDAC0[0x00000500/4], 0);
1057     M = (pll >> 0)  & 0xFF; N = (pll >> 8)  & 0xFF; P = (pll >> 16) & 0x0F;
1058     NVClk  = (N * chip->CrystalFreqKHz / M) >> P;
1059     cfg1 = NV_RD32(&chip->PFB[0x00000204/4], 0);
1060     sim_data.pix_bpp        = (char)pixelDepth;
1061     sim_data.enable_video   = 0;
1062     sim_data.enable_mp      = 0;
1063     sim_data.memory_type    = (NV_RD32(&chip->PFB[0x00000200/4], 0) & 0x01) ?
1064 	1 : 0;
1065     sim_data.memory_width   = (NV_RD32(&chip->PEXTDEV[0x00000000/4], 0) & 0x10) ?
1066 	128 : 64;
1067     sim_data.mem_latency    = (char)cfg1 & 0x0F;
1068     sim_data.mem_aligned    = 1;
1069     sim_data.mem_page_miss  = (char)(((cfg1 >> 4) &0x0F) + ((cfg1 >> 31) & 0x01));
1070     sim_data.gr_during_vid  = 0;
1071     sim_data.pclk_khz       = VClk;
1072     sim_data.mclk_khz       = MClk;
1073     sim_data.nvclk_khz      = NVClk;
1074     nv10CalcArbitration(&fifo_data, &sim_data);
1075     if (fifo_data.valid)
1076     {
1077         int  b = fifo_data.graphics_burst_size >> 4;
1078         *burst = 0;
1079         while (b >>= 1)
1080 	    (*burst)++;
1081         *lwm   = fifo_data.graphics_lwm >> 3;
1082     }
1083 }
1084 
nForceUpdateArbitrationSettings(unsigned VClk,unsigned pixelDepth,unsigned * burst,unsigned * lwm,RIVA_HW_INST * chip,struct pci_dev * pdev)1085 static void nForceUpdateArbitrationSettings
1086 (
1087     unsigned      VClk,
1088     unsigned      pixelDepth,
1089     unsigned     *burst,
1090     unsigned     *lwm,
1091     RIVA_HW_INST *chip,
1092     struct pci_dev *pdev
1093 )
1094 {
1095     nv10_fifo_info fifo_data;
1096     nv10_sim_state sim_data;
1097     unsigned int M, N, P, pll, MClk, NVClk;
1098     unsigned int uMClkPostDiv;
1099     struct pci_dev *dev;
1100     int domain = pci_domain_nr(pdev->bus);
1101 
1102     dev = pci_get_domain_bus_and_slot(domain, 0, 3);
1103     pci_read_config_dword(dev, 0x6C, &uMClkPostDiv);
1104     pci_dev_put(dev);
1105     uMClkPostDiv = (uMClkPostDiv >> 8) & 0xf;
1106 
1107     if(!uMClkPostDiv) uMClkPostDiv = 4;
1108     MClk = 400000 / uMClkPostDiv;
1109 
1110     pll = NV_RD32(&chip->PRAMDAC0[0x00000500/4], 0);
1111     M = (pll >> 0)  & 0xFF; N = (pll >> 8)  & 0xFF; P = (pll >> 16) & 0x0F;
1112     NVClk  = (N * chip->CrystalFreqKHz / M) >> P;
1113     sim_data.pix_bpp        = (char)pixelDepth;
1114     sim_data.enable_video   = 0;
1115     sim_data.enable_mp      = 0;
1116 
1117     dev = pci_get_domain_bus_and_slot(domain, 0, 1);
1118     pci_read_config_dword(dev, 0x7C, &sim_data.memory_type);
1119     pci_dev_put(dev);
1120     sim_data.memory_type    = (sim_data.memory_type >> 12) & 1;
1121 
1122     sim_data.memory_width   = 64;
1123     sim_data.mem_latency    = 3;
1124     sim_data.mem_aligned    = 1;
1125     sim_data.mem_page_miss  = 10;
1126     sim_data.gr_during_vid  = 0;
1127     sim_data.pclk_khz       = VClk;
1128     sim_data.mclk_khz       = MClk;
1129     sim_data.nvclk_khz      = NVClk;
1130     nv10CalcArbitration(&fifo_data, &sim_data);
1131     if (fifo_data.valid)
1132     {
1133         int  b = fifo_data.graphics_burst_size >> 4;
1134         *burst = 0;
1135         while (b >>= 1)
1136 	    (*burst)++;
1137         *lwm   = fifo_data.graphics_lwm >> 3;
1138     }
1139 }
1140 
1141 /****************************************************************************\
1142 *                                                                            *
1143 *                          RIVA Mode State Routines                          *
1144 *                                                                            *
1145 \****************************************************************************/
1146 
1147 /*
1148  * Calculate the Video Clock parameters for the PLL.
1149  */
CalcVClock(int clockIn,int * clockOut,int * mOut,int * nOut,int * pOut,RIVA_HW_INST * chip)1150 static int CalcVClock
1151 (
1152     int           clockIn,
1153     int          *clockOut,
1154     int          *mOut,
1155     int          *nOut,
1156     int          *pOut,
1157     RIVA_HW_INST *chip
1158 )
1159 {
1160     unsigned lowM, highM, highP;
1161     unsigned DeltaNew, DeltaOld;
1162     unsigned VClk, Freq;
1163     unsigned M, N, P;
1164 
1165     DeltaOld = 0xFFFFFFFF;
1166 
1167     VClk     = (unsigned)clockIn;
1168 
1169     if (chip->CrystalFreqKHz == 13500)
1170     {
1171         lowM  = 7;
1172         highM = 13 - (chip->Architecture == NV_ARCH_03);
1173     }
1174     else
1175     {
1176         lowM  = 8;
1177         highM = 14 - (chip->Architecture == NV_ARCH_03);
1178     }
1179 
1180     highP = 4 - (chip->Architecture == NV_ARCH_03);
1181     for (P = 0; P <= highP; P ++)
1182     {
1183         Freq = VClk << P;
1184         if ((Freq >= 128000) && (Freq <= chip->MaxVClockFreqKHz))
1185         {
1186             for (M = lowM; M <= highM; M++)
1187             {
1188                 N    = (VClk << P) * M / chip->CrystalFreqKHz;
1189                 if(N <= 255) {
1190                 Freq = (chip->CrystalFreqKHz * N / M) >> P;
1191                 if (Freq > VClk)
1192                     DeltaNew = Freq - VClk;
1193                 else
1194                     DeltaNew = VClk - Freq;
1195                 if (DeltaNew < DeltaOld)
1196                 {
1197                     *mOut     = M;
1198                     *nOut     = N;
1199                     *pOut     = P;
1200                     *clockOut = Freq;
1201                     DeltaOld  = DeltaNew;
1202                 }
1203             }
1204         }
1205     }
1206     }
1207 
1208     /* non-zero: M/N/P/clock values assigned.  zero: error (not set) */
1209     return (DeltaOld != 0xFFFFFFFF);
1210 }
1211 /*
1212  * Calculate extended mode parameters (SVGA) and save in a
1213  * mode state structure.
1214  */
CalcStateExt(RIVA_HW_INST * chip,RIVA_HW_STATE * state,struct pci_dev * pdev,int bpp,int width,int hDisplaySize,int height,int dotClock)1215 int CalcStateExt
1216 (
1217     RIVA_HW_INST  *chip,
1218     RIVA_HW_STATE *state,
1219     struct pci_dev *pdev,
1220     int            bpp,
1221     int            width,
1222     int            hDisplaySize,
1223     int            height,
1224     int            dotClock
1225 )
1226 {
1227     int pixelDepth;
1228     int VClk, m, n, p;
1229 
1230     /*
1231      * Save mode parameters.
1232      */
1233     state->bpp    = bpp;    /* this is not bitsPerPixel, it's 8,15,16,32 */
1234     state->width  = width;
1235     state->height = height;
1236     /*
1237      * Extended RIVA registers.
1238      */
1239     pixelDepth = (bpp + 1)/8;
1240     if (!CalcVClock(dotClock, &VClk, &m, &n, &p, chip))
1241     	return -EINVAL;
1242 
1243     switch (chip->Architecture)
1244     {
1245         case NV_ARCH_03:
1246             nv3UpdateArbitrationSettings(VClk,
1247                                          pixelDepth * 8,
1248                                         &(state->arbitration0),
1249                                         &(state->arbitration1),
1250                                          chip);
1251             state->cursor0  = 0x00;
1252             state->cursor1  = 0x78;
1253             state->cursor2  = 0x00000000;
1254             state->pllsel   = 0x10010100;
1255             state->config   = ((width + 31)/32)
1256                             | (((pixelDepth > 2) ? 3 : pixelDepth) << 8)
1257                             | 0x1000;
1258             state->general  = 0x00100100;
1259             state->repaint1 = hDisplaySize < 1280 ? 0x06 : 0x02;
1260             break;
1261         case NV_ARCH_04:
1262             nv4UpdateArbitrationSettings(VClk,
1263                                          pixelDepth * 8,
1264                                         &(state->arbitration0),
1265                                         &(state->arbitration1),
1266                                          chip);
1267             state->cursor0  = 0x00;
1268             state->cursor1  = 0xFC;
1269             state->cursor2  = 0x00000000;
1270             state->pllsel   = 0x10000700;
1271             state->config   = 0x00001114;
1272             state->general  = bpp == 16 ? 0x00101100 : 0x00100100;
1273             state->repaint1 = hDisplaySize < 1280 ? 0x04 : 0x00;
1274             break;
1275         case NV_ARCH_10:
1276         case NV_ARCH_20:
1277         case NV_ARCH_30:
1278             if((chip->Chipset == NV_CHIP_IGEFORCE2) ||
1279                (chip->Chipset == NV_CHIP_0x01F0))
1280             {
1281                 nForceUpdateArbitrationSettings(VClk,
1282                                           pixelDepth * 8,
1283                                          &(state->arbitration0),
1284                                          &(state->arbitration1),
1285                                           chip, pdev);
1286             } else {
1287                 nv10UpdateArbitrationSettings(VClk,
1288                                           pixelDepth * 8,
1289                                          &(state->arbitration0),
1290                                          &(state->arbitration1),
1291                                           chip);
1292             }
1293             state->cursor0  = 0x80 | (chip->CursorStart >> 17);
1294             state->cursor1  = (chip->CursorStart >> 11) << 2;
1295             state->cursor2  = chip->CursorStart >> 24;
1296             state->pllsel   = 0x10000700;
1297             state->config   = NV_RD32(&chip->PFB[0x00000200/4], 0);
1298             state->general  = bpp == 16 ? 0x00101100 : 0x00100100;
1299             state->repaint1 = hDisplaySize < 1280 ? 0x04 : 0x00;
1300             break;
1301     }
1302 
1303      /* Paul Richards: below if block borks things in kernel for some reason */
1304      /* Tony: Below is needed to set hardware in DirectColor */
1305     if((bpp != 8) && (chip->Architecture != NV_ARCH_03))
1306 	    state->general |= 0x00000030;
1307 
1308     state->vpll     = (p << 16) | (n << 8) | m;
1309     state->repaint0 = (((width/8)*pixelDepth) & 0x700) >> 3;
1310     state->pixel    = pixelDepth > 2   ? 3    : pixelDepth;
1311     state->offset0  =
1312     state->offset1  =
1313     state->offset2  =
1314     state->offset3  = 0;
1315     state->pitch0   =
1316     state->pitch1   =
1317     state->pitch2   =
1318     state->pitch3   = pixelDepth * width;
1319 
1320     return 0;
1321 }
1322 /*
1323  * Load fixed function state and pre-calculated/stored state.
1324  */
1325 #define LOAD_FIXED_STATE(tbl,dev)                                       \
1326     for (i = 0; i < sizeof(tbl##Table##dev)/8; i++)                 \
1327         NV_WR32(&chip->dev[tbl##Table##dev[i][0]], 0, tbl##Table##dev[i][1])
1328 #define LOAD_FIXED_STATE_8BPP(tbl,dev)                                  \
1329     for (i = 0; i < sizeof(tbl##Table##dev##_8BPP)/8; i++)            \
1330         NV_WR32(&chip->dev[tbl##Table##dev##_8BPP[i][0]], 0, tbl##Table##dev##_8BPP[i][1])
1331 #define LOAD_FIXED_STATE_15BPP(tbl,dev)                                 \
1332     for (i = 0; i < sizeof(tbl##Table##dev##_15BPP)/8; i++)           \
1333         NV_WR32(&chip->dev[tbl##Table##dev##_15BPP[i][0]], 0, tbl##Table##dev##_15BPP[i][1])
1334 #define LOAD_FIXED_STATE_16BPP(tbl,dev)                                 \
1335     for (i = 0; i < sizeof(tbl##Table##dev##_16BPP)/8; i++)           \
1336         NV_WR32(&chip->dev[tbl##Table##dev##_16BPP[i][0]], 0, tbl##Table##dev##_16BPP[i][1])
1337 #define LOAD_FIXED_STATE_32BPP(tbl,dev)                                 \
1338     for (i = 0; i < sizeof(tbl##Table##dev##_32BPP)/8; i++)           \
1339         NV_WR32(&chip->dev[tbl##Table##dev##_32BPP[i][0]], 0, tbl##Table##dev##_32BPP[i][1])
1340 
UpdateFifoState(RIVA_HW_INST * chip)1341 static void UpdateFifoState
1342 (
1343     RIVA_HW_INST  *chip
1344 )
1345 {
1346     int i;
1347 
1348     switch (chip->Architecture)
1349     {
1350         case NV_ARCH_04:
1351             LOAD_FIXED_STATE(nv4,FIFO);
1352             chip->Tri03 = NULL;
1353             chip->Tri05 = (RivaTexturedTriangle05 __iomem *)&(chip->FIFO[0x0000E000/4]);
1354             break;
1355         case NV_ARCH_10:
1356         case NV_ARCH_20:
1357         case NV_ARCH_30:
1358             /*
1359              * Initialize state for the RivaTriangle3D05 routines.
1360              */
1361             LOAD_FIXED_STATE(nv10tri05,PGRAPH);
1362             LOAD_FIXED_STATE(nv10,FIFO);
1363             chip->Tri03 = NULL;
1364             chip->Tri05 = (RivaTexturedTriangle05 __iomem *)&(chip->FIFO[0x0000E000/4]);
1365             break;
1366     }
1367 }
LoadStateExt(RIVA_HW_INST * chip,RIVA_HW_STATE * state)1368 static void LoadStateExt
1369 (
1370     RIVA_HW_INST  *chip,
1371     RIVA_HW_STATE *state
1372 )
1373 {
1374     int i;
1375 
1376     /*
1377      * Load HW fixed function state.
1378      */
1379     LOAD_FIXED_STATE(Riva,PMC);
1380     LOAD_FIXED_STATE(Riva,PTIMER);
1381     switch (chip->Architecture)
1382     {
1383         case NV_ARCH_03:
1384             /*
1385              * Make sure frame buffer config gets set before loading PRAMIN.
1386              */
1387             NV_WR32(chip->PFB, 0x00000200, state->config);
1388             LOAD_FIXED_STATE(nv3,PFIFO);
1389             LOAD_FIXED_STATE(nv3,PRAMIN);
1390             LOAD_FIXED_STATE(nv3,PGRAPH);
1391             switch (state->bpp)
1392             {
1393                 case 15:
1394                 case 16:
1395                     LOAD_FIXED_STATE_15BPP(nv3,PRAMIN);
1396                     LOAD_FIXED_STATE_15BPP(nv3,PGRAPH);
1397                     chip->Tri03 = (RivaTexturedTriangle03  __iomem *)&(chip->FIFO[0x0000E000/4]);
1398                     break;
1399                 case 24:
1400                 case 32:
1401                     LOAD_FIXED_STATE_32BPP(nv3,PRAMIN);
1402                     LOAD_FIXED_STATE_32BPP(nv3,PGRAPH);
1403                     chip->Tri03 = NULL;
1404                     break;
1405                 case 8:
1406                 default:
1407                     LOAD_FIXED_STATE_8BPP(nv3,PRAMIN);
1408                     LOAD_FIXED_STATE_8BPP(nv3,PGRAPH);
1409                     chip->Tri03 = NULL;
1410                     break;
1411             }
1412             for (i = 0x00000; i < 0x00800; i++)
1413                 NV_WR32(&chip->PRAMIN[0x00000502 + i], 0, (i << 12) | 0x03);
1414             NV_WR32(chip->PGRAPH, 0x00000630, state->offset0);
1415             NV_WR32(chip->PGRAPH, 0x00000634, state->offset1);
1416             NV_WR32(chip->PGRAPH, 0x00000638, state->offset2);
1417             NV_WR32(chip->PGRAPH, 0x0000063C, state->offset3);
1418             NV_WR32(chip->PGRAPH, 0x00000650, state->pitch0);
1419             NV_WR32(chip->PGRAPH, 0x00000654, state->pitch1);
1420             NV_WR32(chip->PGRAPH, 0x00000658, state->pitch2);
1421             NV_WR32(chip->PGRAPH, 0x0000065C, state->pitch3);
1422             break;
1423         case NV_ARCH_04:
1424             /*
1425              * Make sure frame buffer config gets set before loading PRAMIN.
1426              */
1427             NV_WR32(chip->PFB, 0x00000200, state->config);
1428             LOAD_FIXED_STATE(nv4,PFIFO);
1429             LOAD_FIXED_STATE(nv4,PRAMIN);
1430             LOAD_FIXED_STATE(nv4,PGRAPH);
1431             switch (state->bpp)
1432             {
1433                 case 15:
1434                     LOAD_FIXED_STATE_15BPP(nv4,PRAMIN);
1435                     LOAD_FIXED_STATE_15BPP(nv4,PGRAPH);
1436                     chip->Tri03 = (RivaTexturedTriangle03  __iomem *)&(chip->FIFO[0x0000E000/4]);
1437                     break;
1438                 case 16:
1439                     LOAD_FIXED_STATE_16BPP(nv4,PRAMIN);
1440                     LOAD_FIXED_STATE_16BPP(nv4,PGRAPH);
1441                     chip->Tri03 = (RivaTexturedTriangle03  __iomem *)&(chip->FIFO[0x0000E000/4]);
1442                     break;
1443                 case 24:
1444                 case 32:
1445                     LOAD_FIXED_STATE_32BPP(nv4,PRAMIN);
1446                     LOAD_FIXED_STATE_32BPP(nv4,PGRAPH);
1447                     chip->Tri03 = NULL;
1448                     break;
1449                 case 8:
1450                 default:
1451                     LOAD_FIXED_STATE_8BPP(nv4,PRAMIN);
1452                     LOAD_FIXED_STATE_8BPP(nv4,PGRAPH);
1453                     chip->Tri03 = NULL;
1454                     break;
1455             }
1456             NV_WR32(chip->PGRAPH, 0x00000640, state->offset0);
1457             NV_WR32(chip->PGRAPH, 0x00000644, state->offset1);
1458             NV_WR32(chip->PGRAPH, 0x00000648, state->offset2);
1459             NV_WR32(chip->PGRAPH, 0x0000064C, state->offset3);
1460             NV_WR32(chip->PGRAPH, 0x00000670, state->pitch0);
1461             NV_WR32(chip->PGRAPH, 0x00000674, state->pitch1);
1462             NV_WR32(chip->PGRAPH, 0x00000678, state->pitch2);
1463             NV_WR32(chip->PGRAPH, 0x0000067C, state->pitch3);
1464             break;
1465         case NV_ARCH_10:
1466         case NV_ARCH_20:
1467         case NV_ARCH_30:
1468             if(chip->twoHeads) {
1469                VGA_WR08(chip->PCIO, 0x03D4, 0x44);
1470                VGA_WR08(chip->PCIO, 0x03D5, state->crtcOwner);
1471                chip->LockUnlock(chip, 0);
1472             }
1473 
1474             LOAD_FIXED_STATE(nv10,PFIFO);
1475             LOAD_FIXED_STATE(nv10,PRAMIN);
1476             LOAD_FIXED_STATE(nv10,PGRAPH);
1477             switch (state->bpp)
1478             {
1479                 case 15:
1480                     LOAD_FIXED_STATE_15BPP(nv10,PRAMIN);
1481                     LOAD_FIXED_STATE_15BPP(nv10,PGRAPH);
1482                     chip->Tri03 = (RivaTexturedTriangle03  __iomem *)&(chip->FIFO[0x0000E000/4]);
1483                     break;
1484                 case 16:
1485                     LOAD_FIXED_STATE_16BPP(nv10,PRAMIN);
1486                     LOAD_FIXED_STATE_16BPP(nv10,PGRAPH);
1487                     chip->Tri03 = (RivaTexturedTriangle03  __iomem *)&(chip->FIFO[0x0000E000/4]);
1488                     break;
1489                 case 24:
1490                 case 32:
1491                     LOAD_FIXED_STATE_32BPP(nv10,PRAMIN);
1492                     LOAD_FIXED_STATE_32BPP(nv10,PGRAPH);
1493                     chip->Tri03 = NULL;
1494                     break;
1495                 case 8:
1496                 default:
1497                     LOAD_FIXED_STATE_8BPP(nv10,PRAMIN);
1498                     LOAD_FIXED_STATE_8BPP(nv10,PGRAPH);
1499                     chip->Tri03 = NULL;
1500                     break;
1501             }
1502 
1503             if(chip->Architecture == NV_ARCH_10) {
1504                 NV_WR32(chip->PGRAPH, 0x00000640, state->offset0);
1505                 NV_WR32(chip->PGRAPH, 0x00000644, state->offset1);
1506                 NV_WR32(chip->PGRAPH, 0x00000648, state->offset2);
1507                 NV_WR32(chip->PGRAPH, 0x0000064C, state->offset3);
1508                 NV_WR32(chip->PGRAPH, 0x00000670, state->pitch0);
1509                 NV_WR32(chip->PGRAPH, 0x00000674, state->pitch1);
1510                 NV_WR32(chip->PGRAPH, 0x00000678, state->pitch2);
1511                 NV_WR32(chip->PGRAPH, 0x0000067C, state->pitch3);
1512                 NV_WR32(chip->PGRAPH, 0x00000680, state->pitch3);
1513         } else {
1514         NV_WR32(chip->PGRAPH, 0x00000820, state->offset0);
1515         NV_WR32(chip->PGRAPH, 0x00000824, state->offset1);
1516         NV_WR32(chip->PGRAPH, 0x00000828, state->offset2);
1517         NV_WR32(chip->PGRAPH, 0x0000082C, state->offset3);
1518         NV_WR32(chip->PGRAPH, 0x00000850, state->pitch0);
1519         NV_WR32(chip->PGRAPH, 0x00000854, state->pitch1);
1520         NV_WR32(chip->PGRAPH, 0x00000858, state->pitch2);
1521         NV_WR32(chip->PGRAPH, 0x0000085C, state->pitch3);
1522         NV_WR32(chip->PGRAPH, 0x00000860, state->pitch3);
1523         NV_WR32(chip->PGRAPH, 0x00000864, state->pitch3);
1524         NV_WR32(chip->PGRAPH, 0x000009A4, NV_RD32(chip->PFB, 0x00000200));
1525         NV_WR32(chip->PGRAPH, 0x000009A8, NV_RD32(chip->PFB, 0x00000204));
1526         }
1527             if(chip->twoHeads) {
1528                NV_WR32(chip->PCRTC0, 0x00000860, state->head);
1529                NV_WR32(chip->PCRTC0, 0x00002860, state->head2);
1530             }
1531             NV_WR32(chip->PRAMDAC, 0x00000404, NV_RD32(chip->PRAMDAC, 0x00000404) | (1 << 25));
1532 
1533             NV_WR32(chip->PMC, 0x00008704, 1);
1534             NV_WR32(chip->PMC, 0x00008140, 0);
1535             NV_WR32(chip->PMC, 0x00008920, 0);
1536             NV_WR32(chip->PMC, 0x00008924, 0);
1537             NV_WR32(chip->PMC, 0x00008908, 0x01ffffff);
1538             NV_WR32(chip->PMC, 0x0000890C, 0x01ffffff);
1539             NV_WR32(chip->PMC, 0x00001588, 0);
1540 
1541             NV_WR32(chip->PFB, 0x00000240, 0);
1542             NV_WR32(chip->PFB, 0x00000250, 0);
1543             NV_WR32(chip->PFB, 0x00000260, 0);
1544             NV_WR32(chip->PFB, 0x00000270, 0);
1545             NV_WR32(chip->PFB, 0x00000280, 0);
1546             NV_WR32(chip->PFB, 0x00000290, 0);
1547             NV_WR32(chip->PFB, 0x000002A0, 0);
1548             NV_WR32(chip->PFB, 0x000002B0, 0);
1549 
1550             NV_WR32(chip->PGRAPH, 0x00000B00, NV_RD32(chip->PFB, 0x00000240));
1551             NV_WR32(chip->PGRAPH, 0x00000B04, NV_RD32(chip->PFB, 0x00000244));
1552             NV_WR32(chip->PGRAPH, 0x00000B08, NV_RD32(chip->PFB, 0x00000248));
1553             NV_WR32(chip->PGRAPH, 0x00000B0C, NV_RD32(chip->PFB, 0x0000024C));
1554             NV_WR32(chip->PGRAPH, 0x00000B10, NV_RD32(chip->PFB, 0x00000250));
1555             NV_WR32(chip->PGRAPH, 0x00000B14, NV_RD32(chip->PFB, 0x00000254));
1556             NV_WR32(chip->PGRAPH, 0x00000B18, NV_RD32(chip->PFB, 0x00000258));
1557             NV_WR32(chip->PGRAPH, 0x00000B1C, NV_RD32(chip->PFB, 0x0000025C));
1558             NV_WR32(chip->PGRAPH, 0x00000B20, NV_RD32(chip->PFB, 0x00000260));
1559             NV_WR32(chip->PGRAPH, 0x00000B24, NV_RD32(chip->PFB, 0x00000264));
1560             NV_WR32(chip->PGRAPH, 0x00000B28, NV_RD32(chip->PFB, 0x00000268));
1561             NV_WR32(chip->PGRAPH, 0x00000B2C, NV_RD32(chip->PFB, 0x0000026C));
1562             NV_WR32(chip->PGRAPH, 0x00000B30, NV_RD32(chip->PFB, 0x00000270));
1563             NV_WR32(chip->PGRAPH, 0x00000B34, NV_RD32(chip->PFB, 0x00000274));
1564             NV_WR32(chip->PGRAPH, 0x00000B38, NV_RD32(chip->PFB, 0x00000278));
1565             NV_WR32(chip->PGRAPH, 0x00000B3C, NV_RD32(chip->PFB, 0x0000027C));
1566             NV_WR32(chip->PGRAPH, 0x00000B40, NV_RD32(chip->PFB, 0x00000280));
1567             NV_WR32(chip->PGRAPH, 0x00000B44, NV_RD32(chip->PFB, 0x00000284));
1568             NV_WR32(chip->PGRAPH, 0x00000B48, NV_RD32(chip->PFB, 0x00000288));
1569             NV_WR32(chip->PGRAPH, 0x00000B4C, NV_RD32(chip->PFB, 0x0000028C));
1570             NV_WR32(chip->PGRAPH, 0x00000B50, NV_RD32(chip->PFB, 0x00000290));
1571             NV_WR32(chip->PGRAPH, 0x00000B54, NV_RD32(chip->PFB, 0x00000294));
1572             NV_WR32(chip->PGRAPH, 0x00000B58, NV_RD32(chip->PFB, 0x00000298));
1573             NV_WR32(chip->PGRAPH, 0x00000B5C, NV_RD32(chip->PFB, 0x0000029C));
1574             NV_WR32(chip->PGRAPH, 0x00000B60, NV_RD32(chip->PFB, 0x000002A0));
1575             NV_WR32(chip->PGRAPH, 0x00000B64, NV_RD32(chip->PFB, 0x000002A4));
1576             NV_WR32(chip->PGRAPH, 0x00000B68, NV_RD32(chip->PFB, 0x000002A8));
1577             NV_WR32(chip->PGRAPH, 0x00000B6C, NV_RD32(chip->PFB, 0x000002AC));
1578             NV_WR32(chip->PGRAPH, 0x00000B70, NV_RD32(chip->PFB, 0x000002B0));
1579             NV_WR32(chip->PGRAPH, 0x00000B74, NV_RD32(chip->PFB, 0x000002B4));
1580             NV_WR32(chip->PGRAPH, 0x00000B78, NV_RD32(chip->PFB, 0x000002B8));
1581             NV_WR32(chip->PGRAPH, 0x00000B7C, NV_RD32(chip->PFB, 0x000002BC));
1582             NV_WR32(chip->PGRAPH, 0x00000F40, 0x10000000);
1583             NV_WR32(chip->PGRAPH, 0x00000F44, 0x00000000);
1584             NV_WR32(chip->PGRAPH, 0x00000F50, 0x00000040);
1585             NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000008);
1586             NV_WR32(chip->PGRAPH, 0x00000F50, 0x00000200);
1587             for (i = 0; i < (3*16); i++)
1588                 NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
1589             NV_WR32(chip->PGRAPH, 0x00000F50, 0x00000040);
1590             NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
1591             NV_WR32(chip->PGRAPH, 0x00000F50, 0x00000800);
1592             for (i = 0; i < (16*16); i++)
1593                 NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
1594             NV_WR32(chip->PGRAPH, 0x00000F40, 0x30000000);
1595             NV_WR32(chip->PGRAPH, 0x00000F44, 0x00000004);
1596             NV_WR32(chip->PGRAPH, 0x00000F50, 0x00006400);
1597             for (i = 0; i < (59*4); i++)
1598                 NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
1599             NV_WR32(chip->PGRAPH, 0x00000F50, 0x00006800);
1600             for (i = 0; i < (47*4); i++)
1601                 NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
1602             NV_WR32(chip->PGRAPH, 0x00000F50, 0x00006C00);
1603             for (i = 0; i < (3*4); i++)
1604                 NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
1605             NV_WR32(chip->PGRAPH, 0x00000F50, 0x00007000);
1606             for (i = 0; i < (19*4); i++)
1607                 NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
1608             NV_WR32(chip->PGRAPH, 0x00000F50, 0x00007400);
1609             for (i = 0; i < (12*4); i++)
1610                 NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
1611             NV_WR32(chip->PGRAPH, 0x00000F50, 0x00007800);
1612             for (i = 0; i < (12*4); i++)
1613                 NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
1614             NV_WR32(chip->PGRAPH, 0x00000F50, 0x00004400);
1615             for (i = 0; i < (8*4); i++)
1616                 NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
1617             NV_WR32(chip->PGRAPH, 0x00000F50, 0x00000000);
1618             for (i = 0; i < 16; i++)
1619                 NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
1620             NV_WR32(chip->PGRAPH, 0x00000F50, 0x00000040);
1621             for (i = 0; i < 4; i++)
1622                 NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
1623 
1624             NV_WR32(chip->PCRTC, 0x00000810, state->cursorConfig);
1625 
1626             if(chip->flatPanel) {
1627                if((chip->Chipset & 0x0ff0) == 0x0110) {
1628                    NV_WR32(chip->PRAMDAC, 0x0528, state->dither);
1629                } else
1630                if((chip->Chipset & 0x0ff0) >= 0x0170) {
1631                    NV_WR32(chip->PRAMDAC, 0x083C, state->dither);
1632                }
1633 
1634                VGA_WR08(chip->PCIO, 0x03D4, 0x53);
1635                VGA_WR08(chip->PCIO, 0x03D5, 0);
1636                VGA_WR08(chip->PCIO, 0x03D4, 0x54);
1637                VGA_WR08(chip->PCIO, 0x03D5, 0);
1638                VGA_WR08(chip->PCIO, 0x03D4, 0x21);
1639                VGA_WR08(chip->PCIO, 0x03D5, 0xfa);
1640             }
1641 
1642             VGA_WR08(chip->PCIO, 0x03D4, 0x41);
1643             VGA_WR08(chip->PCIO, 0x03D5, state->extra);
1644     }
1645     LOAD_FIXED_STATE(Riva,FIFO);
1646     UpdateFifoState(chip);
1647     /*
1648      * Load HW mode state.
1649      */
1650     VGA_WR08(chip->PCIO, 0x03D4, 0x19);
1651     VGA_WR08(chip->PCIO, 0x03D5, state->repaint0);
1652     VGA_WR08(chip->PCIO, 0x03D4, 0x1A);
1653     VGA_WR08(chip->PCIO, 0x03D5, state->repaint1);
1654     VGA_WR08(chip->PCIO, 0x03D4, 0x25);
1655     VGA_WR08(chip->PCIO, 0x03D5, state->screen);
1656     VGA_WR08(chip->PCIO, 0x03D4, 0x28);
1657     VGA_WR08(chip->PCIO, 0x03D5, state->pixel);
1658     VGA_WR08(chip->PCIO, 0x03D4, 0x2D);
1659     VGA_WR08(chip->PCIO, 0x03D5, state->horiz);
1660     VGA_WR08(chip->PCIO, 0x03D4, 0x1B);
1661     VGA_WR08(chip->PCIO, 0x03D5, state->arbitration0);
1662     VGA_WR08(chip->PCIO, 0x03D4, 0x20);
1663     VGA_WR08(chip->PCIO, 0x03D5, state->arbitration1);
1664     VGA_WR08(chip->PCIO, 0x03D4, 0x30);
1665     VGA_WR08(chip->PCIO, 0x03D5, state->cursor0);
1666     VGA_WR08(chip->PCIO, 0x03D4, 0x31);
1667     VGA_WR08(chip->PCIO, 0x03D5, state->cursor1);
1668     VGA_WR08(chip->PCIO, 0x03D4, 0x2F);
1669     VGA_WR08(chip->PCIO, 0x03D5, state->cursor2);
1670     VGA_WR08(chip->PCIO, 0x03D4, 0x39);
1671     VGA_WR08(chip->PCIO, 0x03D5, state->interlace);
1672 
1673     if(!chip->flatPanel) {
1674        NV_WR32(chip->PRAMDAC0, 0x00000508, state->vpll);
1675        NV_WR32(chip->PRAMDAC0, 0x0000050C, state->pllsel);
1676        if(chip->twoHeads)
1677           NV_WR32(chip->PRAMDAC0, 0x00000520, state->vpll2);
1678     }  else {
1679        NV_WR32(chip->PRAMDAC, 0x00000848 , state->scale);
1680     }
1681     NV_WR32(chip->PRAMDAC, 0x00000600 , state->general);
1682 
1683     /*
1684      * Turn off VBlank enable and reset.
1685      */
1686     NV_WR32(chip->PCRTC, 0x00000140, 0);
1687     NV_WR32(chip->PCRTC, 0x00000100, chip->VBlankBit);
1688     /*
1689      * Set interrupt enable.
1690      */
1691     NV_WR32(chip->PMC, 0x00000140, chip->EnableIRQ & 0x01);
1692     /*
1693      * Set current state pointer.
1694      */
1695     chip->CurrentState = state;
1696     /*
1697      * Reset FIFO free and empty counts.
1698      */
1699     chip->FifoFreeCount  = 0;
1700     /* Free count from first subchannel */
1701     chip->FifoEmptyCount = NV_RD32(&chip->Rop->FifoFree, 0);
1702 }
UnloadStateExt(RIVA_HW_INST * chip,RIVA_HW_STATE * state)1703 static void UnloadStateExt
1704 (
1705     RIVA_HW_INST  *chip,
1706     RIVA_HW_STATE *state
1707 )
1708 {
1709     /*
1710      * Save current HW state.
1711      */
1712     VGA_WR08(chip->PCIO, 0x03D4, 0x19);
1713     state->repaint0     = VGA_RD08(chip->PCIO, 0x03D5);
1714     VGA_WR08(chip->PCIO, 0x03D4, 0x1A);
1715     state->repaint1     = VGA_RD08(chip->PCIO, 0x03D5);
1716     VGA_WR08(chip->PCIO, 0x03D4, 0x25);
1717     state->screen       = VGA_RD08(chip->PCIO, 0x03D5);
1718     VGA_WR08(chip->PCIO, 0x03D4, 0x28);
1719     state->pixel        = VGA_RD08(chip->PCIO, 0x03D5);
1720     VGA_WR08(chip->PCIO, 0x03D4, 0x2D);
1721     state->horiz        = VGA_RD08(chip->PCIO, 0x03D5);
1722     VGA_WR08(chip->PCIO, 0x03D4, 0x1B);
1723     state->arbitration0 = VGA_RD08(chip->PCIO, 0x03D5);
1724     VGA_WR08(chip->PCIO, 0x03D4, 0x20);
1725     state->arbitration1 = VGA_RD08(chip->PCIO, 0x03D5);
1726     VGA_WR08(chip->PCIO, 0x03D4, 0x30);
1727     state->cursor0      = VGA_RD08(chip->PCIO, 0x03D5);
1728     VGA_WR08(chip->PCIO, 0x03D4, 0x31);
1729     state->cursor1      = VGA_RD08(chip->PCIO, 0x03D5);
1730     VGA_WR08(chip->PCIO, 0x03D4, 0x2F);
1731     state->cursor2      = VGA_RD08(chip->PCIO, 0x03D5);
1732     VGA_WR08(chip->PCIO, 0x03D4, 0x39);
1733     state->interlace    = VGA_RD08(chip->PCIO, 0x03D5);
1734     state->vpll         = NV_RD32(chip->PRAMDAC0, 0x00000508);
1735     state->vpll2        = NV_RD32(chip->PRAMDAC0, 0x00000520);
1736     state->pllsel       = NV_RD32(chip->PRAMDAC0, 0x0000050C);
1737     state->general      = NV_RD32(chip->PRAMDAC, 0x00000600);
1738     state->scale        = NV_RD32(chip->PRAMDAC, 0x00000848);
1739     state->config       = NV_RD32(chip->PFB, 0x00000200);
1740     switch (chip->Architecture)
1741     {
1742         case NV_ARCH_03:
1743             state->offset0  = NV_RD32(chip->PGRAPH, 0x00000630);
1744             state->offset1  = NV_RD32(chip->PGRAPH, 0x00000634);
1745             state->offset2  = NV_RD32(chip->PGRAPH, 0x00000638);
1746             state->offset3  = NV_RD32(chip->PGRAPH, 0x0000063C);
1747             state->pitch0   = NV_RD32(chip->PGRAPH, 0x00000650);
1748             state->pitch1   = NV_RD32(chip->PGRAPH, 0x00000654);
1749             state->pitch2   = NV_RD32(chip->PGRAPH, 0x00000658);
1750             state->pitch3   = NV_RD32(chip->PGRAPH, 0x0000065C);
1751             break;
1752         case NV_ARCH_04:
1753             state->offset0  = NV_RD32(chip->PGRAPH, 0x00000640);
1754             state->offset1  = NV_RD32(chip->PGRAPH, 0x00000644);
1755             state->offset2  = NV_RD32(chip->PGRAPH, 0x00000648);
1756             state->offset3  = NV_RD32(chip->PGRAPH, 0x0000064C);
1757             state->pitch0   = NV_RD32(chip->PGRAPH, 0x00000670);
1758             state->pitch1   = NV_RD32(chip->PGRAPH, 0x00000674);
1759             state->pitch2   = NV_RD32(chip->PGRAPH, 0x00000678);
1760             state->pitch3   = NV_RD32(chip->PGRAPH, 0x0000067C);
1761             break;
1762         case NV_ARCH_10:
1763         case NV_ARCH_20:
1764         case NV_ARCH_30:
1765             state->offset0  = NV_RD32(chip->PGRAPH, 0x00000640);
1766             state->offset1  = NV_RD32(chip->PGRAPH, 0x00000644);
1767             state->offset2  = NV_RD32(chip->PGRAPH, 0x00000648);
1768             state->offset3  = NV_RD32(chip->PGRAPH, 0x0000064C);
1769             state->pitch0   = NV_RD32(chip->PGRAPH, 0x00000670);
1770             state->pitch1   = NV_RD32(chip->PGRAPH, 0x00000674);
1771             state->pitch2   = NV_RD32(chip->PGRAPH, 0x00000678);
1772             state->pitch3   = NV_RD32(chip->PGRAPH, 0x0000067C);
1773             if(chip->twoHeads) {
1774                state->head     = NV_RD32(chip->PCRTC0, 0x00000860);
1775                state->head2    = NV_RD32(chip->PCRTC0, 0x00002860);
1776                VGA_WR08(chip->PCIO, 0x03D4, 0x44);
1777                state->crtcOwner = VGA_RD08(chip->PCIO, 0x03D5);
1778             }
1779             VGA_WR08(chip->PCIO, 0x03D4, 0x41);
1780             state->extra = VGA_RD08(chip->PCIO, 0x03D5);
1781             state->cursorConfig = NV_RD32(chip->PCRTC, 0x00000810);
1782 
1783             if((chip->Chipset & 0x0ff0) == 0x0110) {
1784                 state->dither = NV_RD32(chip->PRAMDAC, 0x0528);
1785             } else
1786             if((chip->Chipset & 0x0ff0) >= 0x0170) {
1787                 state->dither = NV_RD32(chip->PRAMDAC, 0x083C);
1788             }
1789             break;
1790     }
1791 }
SetStartAddress(RIVA_HW_INST * chip,unsigned start)1792 static void SetStartAddress
1793 (
1794     RIVA_HW_INST *chip,
1795     unsigned      start
1796 )
1797 {
1798     NV_WR32(chip->PCRTC, 0x800, start);
1799 }
1800 
SetStartAddress3(RIVA_HW_INST * chip,unsigned start)1801 static void SetStartAddress3
1802 (
1803     RIVA_HW_INST *chip,
1804     unsigned      start
1805 )
1806 {
1807     int offset = start >> 2;
1808     int pan    = (start & 3) << 1;
1809     unsigned char tmp;
1810 
1811     /*
1812      * Unlock extended registers.
1813      */
1814     chip->LockUnlock(chip, 0);
1815     /*
1816      * Set start address.
1817      */
1818     VGA_WR08(chip->PCIO, 0x3D4, 0x0D); VGA_WR08(chip->PCIO, 0x3D5, offset);
1819     offset >>= 8;
1820     VGA_WR08(chip->PCIO, 0x3D4, 0x0C); VGA_WR08(chip->PCIO, 0x3D5, offset);
1821     offset >>= 8;
1822     VGA_WR08(chip->PCIO, 0x3D4, 0x19); tmp = VGA_RD08(chip->PCIO, 0x3D5);
1823     VGA_WR08(chip->PCIO, 0x3D5, (offset & 0x01F) | (tmp & ~0x1F));
1824     VGA_WR08(chip->PCIO, 0x3D4, 0x2D); tmp = VGA_RD08(chip->PCIO, 0x3D5);
1825     VGA_WR08(chip->PCIO, 0x3D5, (offset & 0x60) | (tmp & ~0x60));
1826     /*
1827      * 4 pixel pan register.
1828      */
1829     offset = VGA_RD08(chip->PCIO, chip->IO + 0x0A);
1830     VGA_WR08(chip->PCIO, 0x3C0, 0x13);
1831     VGA_WR08(chip->PCIO, 0x3C0, pan);
1832 }
nv3SetSurfaces2D(RIVA_HW_INST * chip,unsigned surf0,unsigned surf1)1833 static void nv3SetSurfaces2D
1834 (
1835     RIVA_HW_INST *chip,
1836     unsigned     surf0,
1837     unsigned     surf1
1838 )
1839 {
1840     RivaSurface __iomem *Surface =
1841 	(RivaSurface __iomem *)&(chip->FIFO[0x0000E000/4]);
1842 
1843     RIVA_FIFO_FREE(*chip,Tri03,5);
1844     NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000003);
1845     NV_WR32(&Surface->Offset, 0, surf0);
1846     NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000004);
1847     NV_WR32(&Surface->Offset, 0, surf1);
1848     NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000013);
1849 }
nv4SetSurfaces2D(RIVA_HW_INST * chip,unsigned surf0,unsigned surf1)1850 static void nv4SetSurfaces2D
1851 (
1852     RIVA_HW_INST *chip,
1853     unsigned     surf0,
1854     unsigned     surf1
1855 )
1856 {
1857     RivaSurface __iomem *Surface =
1858 	(RivaSurface __iomem *)&(chip->FIFO[0x0000E000/4]);
1859 
1860     NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000003);
1861     NV_WR32(&Surface->Offset, 0, surf0);
1862     NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000004);
1863     NV_WR32(&Surface->Offset, 0, surf1);
1864     NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000014);
1865 }
nv10SetSurfaces2D(RIVA_HW_INST * chip,unsigned surf0,unsigned surf1)1866 static void nv10SetSurfaces2D
1867 (
1868     RIVA_HW_INST *chip,
1869     unsigned     surf0,
1870     unsigned     surf1
1871 )
1872 {
1873     RivaSurface __iomem *Surface =
1874 	(RivaSurface __iomem *)&(chip->FIFO[0x0000E000/4]);
1875 
1876     NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000003);
1877     NV_WR32(&Surface->Offset, 0, surf0);
1878     NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000004);
1879     NV_WR32(&Surface->Offset, 0, surf1);
1880     NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000014);
1881 }
nv3SetSurfaces3D(RIVA_HW_INST * chip,unsigned surf0,unsigned surf1)1882 static void nv3SetSurfaces3D
1883 (
1884     RIVA_HW_INST *chip,
1885     unsigned     surf0,
1886     unsigned     surf1
1887 )
1888 {
1889     RivaSurface __iomem *Surface =
1890 	(RivaSurface __iomem *)&(chip->FIFO[0x0000E000/4]);
1891 
1892     RIVA_FIFO_FREE(*chip,Tri03,5);
1893     NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000005);
1894     NV_WR32(&Surface->Offset, 0, surf0);
1895     NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000006);
1896     NV_WR32(&Surface->Offset, 0, surf1);
1897     NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000013);
1898 }
nv4SetSurfaces3D(RIVA_HW_INST * chip,unsigned surf0,unsigned surf1)1899 static void nv4SetSurfaces3D
1900 (
1901     RIVA_HW_INST *chip,
1902     unsigned     surf0,
1903     unsigned     surf1
1904 )
1905 {
1906     RivaSurface __iomem *Surface =
1907 	(RivaSurface __iomem *)&(chip->FIFO[0x0000E000/4]);
1908 
1909     NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000005);
1910     NV_WR32(&Surface->Offset, 0, surf0);
1911     NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000006);
1912     NV_WR32(&Surface->Offset, 0, surf1);
1913     NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000014);
1914 }
nv10SetSurfaces3D(RIVA_HW_INST * chip,unsigned surf0,unsigned surf1)1915 static void nv10SetSurfaces3D
1916 (
1917     RIVA_HW_INST *chip,
1918     unsigned     surf0,
1919     unsigned     surf1
1920 )
1921 {
1922     RivaSurface3D __iomem *Surfaces3D =
1923 	(RivaSurface3D __iomem *)&(chip->FIFO[0x0000E000/4]);
1924 
1925     RIVA_FIFO_FREE(*chip,Tri03,4);
1926     NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000007);
1927     NV_WR32(&Surfaces3D->RenderBufferOffset, 0, surf0);
1928     NV_WR32(&Surfaces3D->ZBufferOffset, 0, surf1);
1929     NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000014);
1930 }
1931 
1932 /****************************************************************************\
1933 *                                                                            *
1934 *                      Probe RIVA Chip Configuration                         *
1935 *                                                                            *
1936 \****************************************************************************/
1937 
nv3GetConfig(RIVA_HW_INST * chip)1938 static void nv3GetConfig
1939 (
1940     RIVA_HW_INST *chip
1941 )
1942 {
1943     /*
1944      * Fill in chip configuration.
1945      */
1946     if (NV_RD32(&chip->PFB[0x00000000/4], 0) & 0x00000020)
1947     {
1948         if (((NV_RD32(chip->PMC, 0x00000000) & 0xF0) == 0x20)
1949          && ((NV_RD32(chip->PMC, 0x00000000) & 0x0F) >= 0x02))
1950         {
1951             /*
1952              * SDRAM 128 ZX.
1953              */
1954             chip->RamBandwidthKBytesPerSec = 800000;
1955             switch (NV_RD32(chip->PFB, 0x00000000) & 0x03)
1956             {
1957                 case 2:
1958                     chip->RamAmountKBytes = 1024 * 4;
1959                     break;
1960                 case 1:
1961                     chip->RamAmountKBytes = 1024 * 2;
1962                     break;
1963                 default:
1964                     chip->RamAmountKBytes = 1024 * 8;
1965                     break;
1966             }
1967         }
1968         else
1969         {
1970             chip->RamBandwidthKBytesPerSec = 1000000;
1971             chip->RamAmountKBytes          = 1024 * 8;
1972         }
1973     }
1974     else
1975     {
1976         /*
1977          * SGRAM 128.
1978          */
1979         chip->RamBandwidthKBytesPerSec = 1000000;
1980         switch (NV_RD32(chip->PFB, 0x00000000) & 0x00000003)
1981         {
1982             case 0:
1983                 chip->RamAmountKBytes = 1024 * 8;
1984                 break;
1985             case 2:
1986                 chip->RamAmountKBytes = 1024 * 4;
1987                 break;
1988             default:
1989                 chip->RamAmountKBytes = 1024 * 2;
1990                 break;
1991         }
1992     }
1993     chip->CrystalFreqKHz   = (NV_RD32(chip->PEXTDEV, 0x00000000) & 0x00000040) ? 14318 : 13500;
1994     chip->CURSOR           = &(chip->PRAMIN[0x00008000/4 - 0x0800/4]);
1995     chip->VBlankBit        = 0x00000100;
1996     chip->MaxVClockFreqKHz = 256000;
1997     /*
1998      * Set chip functions.
1999      */
2000     chip->Busy            = nv3Busy;
2001     chip->ShowHideCursor  = ShowHideCursor;
2002     chip->LoadStateExt    = LoadStateExt;
2003     chip->UnloadStateExt  = UnloadStateExt;
2004     chip->SetStartAddress = SetStartAddress3;
2005     chip->SetSurfaces2D   = nv3SetSurfaces2D;
2006     chip->SetSurfaces3D   = nv3SetSurfaces3D;
2007     chip->LockUnlock      = nv3LockUnlock;
2008 }
nv4GetConfig(RIVA_HW_INST * chip)2009 static void nv4GetConfig
2010 (
2011     RIVA_HW_INST *chip
2012 )
2013 {
2014     /*
2015      * Fill in chip configuration.
2016      */
2017     if (NV_RD32(chip->PFB, 0x00000000) & 0x00000100)
2018     {
2019         chip->RamAmountKBytes = ((NV_RD32(chip->PFB, 0x00000000) >> 12) & 0x0F) * 1024 * 2
2020                               + 1024 * 2;
2021     }
2022     else
2023     {
2024         switch (NV_RD32(chip->PFB, 0x00000000) & 0x00000003)
2025         {
2026             case 0:
2027                 chip->RamAmountKBytes = 1024 * 32;
2028                 break;
2029             case 1:
2030                 chip->RamAmountKBytes = 1024 * 4;
2031                 break;
2032             case 2:
2033                 chip->RamAmountKBytes = 1024 * 8;
2034                 break;
2035             case 3:
2036             default:
2037                 chip->RamAmountKBytes = 1024 * 16;
2038                 break;
2039         }
2040     }
2041     switch ((NV_RD32(chip->PFB, 0x00000000) >> 3) & 0x00000003)
2042     {
2043         case 3:
2044             chip->RamBandwidthKBytesPerSec = 800000;
2045             break;
2046         default:
2047             chip->RamBandwidthKBytesPerSec = 1000000;
2048             break;
2049     }
2050     chip->CrystalFreqKHz   = (NV_RD32(chip->PEXTDEV, 0x00000000) & 0x00000040) ? 14318 : 13500;
2051     chip->CURSOR           = &(chip->PRAMIN[0x00010000/4 - 0x0800/4]);
2052     chip->VBlankBit        = 0x00000001;
2053     chip->MaxVClockFreqKHz = 350000;
2054     /*
2055      * Set chip functions.
2056      */
2057     chip->Busy            = nv4Busy;
2058     chip->ShowHideCursor  = ShowHideCursor;
2059     chip->LoadStateExt    = LoadStateExt;
2060     chip->UnloadStateExt  = UnloadStateExt;
2061     chip->SetStartAddress = SetStartAddress;
2062     chip->SetSurfaces2D   = nv4SetSurfaces2D;
2063     chip->SetSurfaces3D   = nv4SetSurfaces3D;
2064     chip->LockUnlock      = nv4LockUnlock;
2065 }
nv10GetConfig(RIVA_HW_INST * chip,struct pci_dev * pdev,unsigned int chipset)2066 static void nv10GetConfig
2067 (
2068     RIVA_HW_INST *chip,
2069     struct pci_dev *pdev,
2070     unsigned int chipset
2071 )
2072 {
2073     struct pci_dev* dev;
2074     int domain = pci_domain_nr(pdev->bus);
2075     u32 amt;
2076 
2077 #ifdef __BIG_ENDIAN
2078     /* turn on big endian register access */
2079     if(!(NV_RD32(chip->PMC, 0x00000004) & 0x01000001))
2080     	NV_WR32(chip->PMC, 0x00000004, 0x01000001);
2081 #endif
2082 
2083     /*
2084      * Fill in chip configuration.
2085      */
2086     if(chipset == NV_CHIP_IGEFORCE2) {
2087         dev = pci_get_domain_bus_and_slot(domain, 0, 1);
2088         pci_read_config_dword(dev, 0x7C, &amt);
2089         pci_dev_put(dev);
2090         chip->RamAmountKBytes = (((amt >> 6) & 31) + 1) * 1024;
2091     } else if(chipset == NV_CHIP_0x01F0) {
2092         dev = pci_get_domain_bus_and_slot(domain, 0, 1);
2093         pci_read_config_dword(dev, 0x84, &amt);
2094         pci_dev_put(dev);
2095         chip->RamAmountKBytes = (((amt >> 4) & 127) + 1) * 1024;
2096     } else {
2097         switch ((NV_RD32(chip->PFB, 0x0000020C) >> 20) & 0x000000FF)
2098         {
2099             case 0x02:
2100                 chip->RamAmountKBytes = 1024 * 2;
2101                 break;
2102             case 0x04:
2103                 chip->RamAmountKBytes = 1024 * 4;
2104                 break;
2105             case 0x08:
2106                 chip->RamAmountKBytes = 1024 * 8;
2107                 break;
2108             case 0x10:
2109                 chip->RamAmountKBytes = 1024 * 16;
2110                 break;
2111             case 0x20:
2112                 chip->RamAmountKBytes = 1024 * 32;
2113                 break;
2114             case 0x40:
2115                 chip->RamAmountKBytes = 1024 * 64;
2116                 break;
2117             case 0x80:
2118                 chip->RamAmountKBytes = 1024 * 128;
2119                 break;
2120             default:
2121                 chip->RamAmountKBytes = 1024 * 16;
2122                 break;
2123         }
2124     }
2125     switch ((NV_RD32(chip->PFB, 0x00000000) >> 3) & 0x00000003)
2126     {
2127         case 3:
2128             chip->RamBandwidthKBytesPerSec = 800000;
2129             break;
2130         default:
2131             chip->RamBandwidthKBytesPerSec = 1000000;
2132             break;
2133     }
2134     chip->CrystalFreqKHz = (NV_RD32(chip->PEXTDEV, 0x0000) & (1 << 6)) ?
2135 	14318 : 13500;
2136 
2137     switch (chipset & 0x0ff0) {
2138     case 0x0170:
2139     case 0x0180:
2140     case 0x01F0:
2141     case 0x0250:
2142     case 0x0280:
2143     case 0x0300:
2144     case 0x0310:
2145     case 0x0320:
2146     case 0x0330:
2147     case 0x0340:
2148        if(NV_RD32(chip->PEXTDEV, 0x0000) & (1 << 22))
2149            chip->CrystalFreqKHz = 27000;
2150        break;
2151     default:
2152        break;
2153     }
2154 
2155     chip->CursorStart      = (chip->RamAmountKBytes - 128) * 1024;
2156     chip->CURSOR           = NULL;  /* can't set this here */
2157     chip->VBlankBit        = 0x00000001;
2158     chip->MaxVClockFreqKHz = 350000;
2159     /*
2160      * Set chip functions.
2161      */
2162     chip->Busy            = nv10Busy;
2163     chip->ShowHideCursor  = ShowHideCursor;
2164     chip->LoadStateExt    = LoadStateExt;
2165     chip->UnloadStateExt  = UnloadStateExt;
2166     chip->SetStartAddress = SetStartAddress;
2167     chip->SetSurfaces2D   = nv10SetSurfaces2D;
2168     chip->SetSurfaces3D   = nv10SetSurfaces3D;
2169     chip->LockUnlock      = nv4LockUnlock;
2170 
2171     switch(chipset & 0x0ff0) {
2172     case 0x0110:
2173     case 0x0170:
2174     case 0x0180:
2175     case 0x01F0:
2176     case 0x0250:
2177     case 0x0280:
2178     case 0x0300:
2179     case 0x0310:
2180     case 0x0320:
2181     case 0x0330:
2182     case 0x0340:
2183         chip->twoHeads = TRUE;
2184         break;
2185     default:
2186         chip->twoHeads = FALSE;
2187         break;
2188     }
2189 }
RivaGetConfig(RIVA_HW_INST * chip,struct pci_dev * pdev,unsigned int chipset)2190 int RivaGetConfig
2191 (
2192     RIVA_HW_INST *chip,
2193     struct pci_dev *pdev,
2194     unsigned int chipset
2195 )
2196 {
2197     /*
2198      * Save this so future SW know whats it's dealing with.
2199      */
2200     chip->Version = RIVA_SW_VERSION;
2201     /*
2202      * Chip specific configuration.
2203      */
2204     switch (chip->Architecture)
2205     {
2206         case NV_ARCH_03:
2207             nv3GetConfig(chip);
2208             break;
2209         case NV_ARCH_04:
2210             nv4GetConfig(chip);
2211             break;
2212         case NV_ARCH_10:
2213         case NV_ARCH_20:
2214         case NV_ARCH_30:
2215             nv10GetConfig(chip, pdev, chipset);
2216             break;
2217         default:
2218             return (-1);
2219     }
2220     chip->Chipset = chipset;
2221     /*
2222      * Fill in FIFO pointers.
2223      */
2224     chip->Rop    = (RivaRop __iomem         *)&(chip->FIFO[0x00000000/4]);
2225     chip->Clip   = (RivaClip __iomem        *)&(chip->FIFO[0x00002000/4]);
2226     chip->Patt   = (RivaPattern __iomem     *)&(chip->FIFO[0x00004000/4]);
2227     chip->Pixmap = (RivaPixmap __iomem      *)&(chip->FIFO[0x00006000/4]);
2228     chip->Blt    = (RivaScreenBlt __iomem   *)&(chip->FIFO[0x00008000/4]);
2229     chip->Bitmap = (RivaBitmap __iomem      *)&(chip->FIFO[0x0000A000/4]);
2230     chip->Line   = (RivaLine __iomem        *)&(chip->FIFO[0x0000C000/4]);
2231     chip->Tri03  = (RivaTexturedTriangle03 __iomem *)&(chip->FIFO[0x0000E000/4]);
2232     return (0);
2233 }
2234 
2235