cachepc-linux

Fork of AMDESE/linux with modifications for CachePC side-channel attack
git clone https://git.sinitax.com/sinitax/cachepc-linux
Log | Files | Refs | README | LICENSE | sfeed.txt

riva_hw.c (78165B)


      1 /***************************************************************************\
      2|*                                                                           *|
      3|*       Copyright 1993-1999 NVIDIA, Corporation.  All rights reserved.      *|
      4|*                                                                           *|
      5|*     NOTICE TO USER:   The source code  is copyrighted under  U.S. and     *|
      6|*     international laws.  Users and possessors of this source code are     *|
      7|*     hereby granted a nonexclusive,  royalty-free copyright license to     *|
      8|*     use this code in individual and commercial software.                  *|
      9|*                                                                           *|
     10|*     Any use of this source code must include,  in the user documenta-     *|
     11|*     tion and  internal comments to the code,  notices to the end user     *|
     12|*     as follows:                                                           *|
     13|*                                                                           *|
     14|*       Copyright 1993-1999 NVIDIA, Corporation.  All rights reserved.      *|
     15|*                                                                           *|
     16|*     NVIDIA, CORPORATION MAKES NO REPRESENTATION ABOUT THE SUITABILITY     *|
     17|*     OF  THIS SOURCE  CODE  FOR ANY PURPOSE.  IT IS  PROVIDED  "AS IS"     *|
     18|*     WITHOUT EXPRESS OR IMPLIED WARRANTY OF ANY KIND.  NVIDIA, CORPOR-     *|
     19|*     ATION DISCLAIMS ALL WARRANTIES  WITH REGARD  TO THIS SOURCE CODE,     *|
     20|*     INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY, NONINFRINGE-     *|
     21|*     MENT,  AND FITNESS  FOR A PARTICULAR PURPOSE.   IN NO EVENT SHALL     *|
     22|*     NVIDIA, CORPORATION  BE LIABLE FOR ANY SPECIAL,  INDIRECT,  INCI-     *|
     23|*     DENTAL, OR CONSEQUENTIAL DAMAGES,  OR ANY DAMAGES  WHATSOEVER RE-     *|
     24|*     SULTING FROM LOSS OF USE,  DATA OR PROFITS,  WHETHER IN AN ACTION     *|
     25|*     OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION,  ARISING OUT OF     *|
     26|*     OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOURCE CODE.     *|
     27|*                                                                           *|
     28|*     U.S. Government  End  Users.   This source code  is a "commercial     *|
     29|*     item,"  as that  term is  defined at  48 C.F.R. 2.101 (OCT 1995),     *|
     30|*     consisting  of "commercial  computer  software"  and  "commercial     *|
     31|*     computer  software  documentation,"  as such  terms  are  used in     *|
     32|*     48 C.F.R. 12.212 (SEPT 1995)  and is provided to the U.S. Govern-     *|
     33|*     ment only as  a commercial end item.   Consistent with  48 C.F.R.     *|
     34|*     12.212 and  48 C.F.R. 227.7202-1 through  227.7202-4 (JUNE 1995),     *|
     35|*     all U.S. Government End Users  acquire the source code  with only     *|
     36|*     those rights set forth herein.                                        *|
     37|*                                                                           *|
     38 \***************************************************************************/
     39
     40/*
     41 * GPL licensing note -- nVidia is allowing a liberal interpretation of
     42 * the documentation restriction above, to merely say that this nVidia's
     43 * copyright and disclaimer should be included with all code derived
     44 * from this source.  -- Jeff Garzik <jgarzik@pobox.com>, 01/Nov/99 
     45 */
     46
     47/* $XFree86: xc/programs/Xserver/hw/xfree86/drivers/nv/riva_hw.c,v 1.33 2002/08/05 20:47:06 mvojkovi Exp $ */
     48
     49#include <linux/kernel.h>
     50#include <linux/pci.h>
     51#include <linux/pci_ids.h>
     52#include "riva_hw.h"
     53#include "riva_tbl.h"
     54#include "nv_type.h"
     55
     56/*
     57 * This file is an OS-agnostic file used to make RIVA 128 and RIVA TNT
     58 * operate identically (except TNT has more memory and better 3D quality.
     59 */
     60static int nv3Busy
     61(
     62    RIVA_HW_INST *chip
     63)
     64{
     65    return ((NV_RD32(&chip->Rop->FifoFree, 0) < chip->FifoEmptyCount) ||
     66	    NV_RD32(&chip->PGRAPH[0x000006B0/4], 0) & 0x01);
     67}
     68static int nv4Busy
     69(
     70    RIVA_HW_INST *chip
     71)
     72{
     73    return ((NV_RD32(&chip->Rop->FifoFree, 0) < chip->FifoEmptyCount) ||
     74	    NV_RD32(&chip->PGRAPH[0x00000700/4], 0) & 0x01);
     75}
     76static int nv10Busy
     77(
     78    RIVA_HW_INST *chip
     79)
     80{
     81    return ((NV_RD32(&chip->Rop->FifoFree, 0) < chip->FifoEmptyCount) ||
     82	    NV_RD32(&chip->PGRAPH[0x00000700/4], 0) & 0x01);
     83}
     84
     85static void vgaLockUnlock
     86(
     87    RIVA_HW_INST *chip,
     88    int           Lock
     89)
     90{
     91    U008 cr11;
     92    VGA_WR08(chip->PCIO, 0x3D4, 0x11);
     93    cr11 = VGA_RD08(chip->PCIO, 0x3D5);
     94    if(Lock) cr11 |= 0x80;
     95    else cr11 &= ~0x80;
     96    VGA_WR08(chip->PCIO, 0x3D5, cr11);
     97}
     98static void nv3LockUnlock
     99(
    100    RIVA_HW_INST *chip,
    101    int           Lock
    102)
    103{
    104    VGA_WR08(chip->PVIO, 0x3C4, 0x06);
    105    VGA_WR08(chip->PVIO, 0x3C5, Lock ? 0x99 : 0x57);
    106    vgaLockUnlock(chip, Lock);
    107}
    108static void nv4LockUnlock
    109(
    110    RIVA_HW_INST *chip,
    111    int           Lock
    112)
    113{
    114    VGA_WR08(chip->PCIO, 0x3D4, 0x1F);
    115    VGA_WR08(chip->PCIO, 0x3D5, Lock ? 0x99 : 0x57);
    116    vgaLockUnlock(chip, Lock);
    117}
    118
    119static int ShowHideCursor
    120(
    121    RIVA_HW_INST *chip,
    122    int           ShowHide
    123)
    124{
    125    int cursor;
    126    cursor                      =  chip->CurrentState->cursor1;
    127    chip->CurrentState->cursor1 = (chip->CurrentState->cursor1 & 0xFE) |
    128                                  (ShowHide & 0x01);
    129    VGA_WR08(chip->PCIO, 0x3D4, 0x31);
    130    VGA_WR08(chip->PCIO, 0x3D5, chip->CurrentState->cursor1);
    131    return (cursor & 0x01);
    132}
    133
    134/****************************************************************************\
    135*                                                                            *
    136* The video arbitration routines calculate some "magic" numbers.  Fixes      *
    137* the snow seen when accessing the framebuffer without it.                   *
    138* It just works (I hope).                                                    *
    139*                                                                            *
    140\****************************************************************************/
    141
    142#define DEFAULT_GR_LWM 100
    143#define DEFAULT_VID_LWM 100
    144#define DEFAULT_GR_BURST_SIZE 256
    145#define DEFAULT_VID_BURST_SIZE 128
    146#define VIDEO		0
    147#define GRAPHICS	1
    148#define MPORT		2
    149#define ENGINE		3
    150#define GFIFO_SIZE	320
    151#define GFIFO_SIZE_128	256
    152#define MFIFO_SIZE	120
    153#define VFIFO_SIZE	256
    154
    155typedef struct {
    156  int gdrain_rate;
    157  int vdrain_rate;
    158  int mdrain_rate;
    159  int gburst_size;
    160  int vburst_size;
    161  char vid_en;
    162  char gr_en;
    163  int wcmocc, wcgocc, wcvocc, wcvlwm, wcglwm;
    164  int by_gfacc;
    165  char vid_only_once;
    166  char gr_only_once;
    167  char first_vacc;
    168  char first_gacc;
    169  char first_macc;
    170  int vocc;
    171  int gocc;
    172  int mocc;
    173  char cur;
    174  char engine_en;
    175  char converged;
    176  int priority;
    177} nv3_arb_info;
    178typedef struct {
    179  int graphics_lwm;
    180  int video_lwm;
    181  int graphics_burst_size;
    182  int video_burst_size;
    183  int graphics_hi_priority;
    184  int media_hi_priority;
    185  int rtl_values;
    186  int valid;
    187} nv3_fifo_info;
    188typedef struct {
    189  char pix_bpp;
    190  char enable_video;
    191  char gr_during_vid;
    192  char enable_mp;
    193  int memory_width;
    194  int video_scale;
    195  int pclk_khz;
    196  int mclk_khz;
    197  int mem_page_miss;
    198  int mem_latency;
    199  char mem_aligned;
    200} nv3_sim_state;
    201typedef struct {
    202  int graphics_lwm;
    203  int video_lwm;
    204  int graphics_burst_size;
    205  int video_burst_size;
    206  int valid;
    207} nv4_fifo_info;
    208typedef struct {
    209  int pclk_khz;
    210  int mclk_khz;
    211  int nvclk_khz;
    212  char mem_page_miss;
    213  char mem_latency;
    214  int memory_width;
    215  char enable_video;
    216  char gr_during_vid;
    217  char pix_bpp;
    218  char mem_aligned;
    219  char enable_mp;
    220} nv4_sim_state;
    221typedef struct {
    222  int graphics_lwm;
    223  int video_lwm;
    224  int graphics_burst_size;
    225  int video_burst_size;
    226  int valid;
    227} nv10_fifo_info;
    228typedef struct {
    229  int pclk_khz;
    230  int mclk_khz;
    231  int nvclk_khz;
    232  char mem_page_miss;
    233  char mem_latency;
    234  u32 memory_type;
    235  int memory_width;
    236  char enable_video;
    237  char gr_during_vid;
    238  char pix_bpp;
    239  char mem_aligned;
    240  char enable_mp;
    241} nv10_sim_state;
    242static int nv3_iterate(nv3_fifo_info *res_info, nv3_sim_state * state, nv3_arb_info *ainfo)
    243{
    244    int iter = 0;
    245    int tmp;
    246    int vfsize, mfsize, gfsize;
    247    int mburst_size = 32;
    248    int mmisses, gmisses, vmisses;
    249    int misses;
    250    int vlwm, glwm;
    251    int last, next, cur;
    252    int max_gfsize ;
    253    long ns;
    254
    255    vlwm = 0;
    256    glwm = 0;
    257    vfsize = 0;
    258    gfsize = 0;
    259    cur = ainfo->cur;
    260    mmisses = 2;
    261    gmisses = 2;
    262    vmisses = 2;
    263    if (ainfo->gburst_size == 128) max_gfsize = GFIFO_SIZE_128;
    264    else  max_gfsize = GFIFO_SIZE;
    265    max_gfsize = GFIFO_SIZE;
    266    while (1)
    267    {
    268        if (ainfo->vid_en)
    269        {
    270            if (ainfo->wcvocc > ainfo->vocc) ainfo->wcvocc = ainfo->vocc;
    271            if (ainfo->wcvlwm > vlwm) ainfo->wcvlwm = vlwm ;
    272            ns = 1000000 * ainfo->vburst_size/(state->memory_width/8)/state->mclk_khz;
    273            vfsize = ns * ainfo->vdrain_rate / 1000000;
    274            vfsize =  ainfo->wcvlwm - ainfo->vburst_size + vfsize;
    275        }
    276        if (state->enable_mp)
    277        {
    278            if (ainfo->wcmocc > ainfo->mocc) ainfo->wcmocc = ainfo->mocc;
    279        }
    280        if (ainfo->gr_en)
    281        {
    282            if (ainfo->wcglwm > glwm) ainfo->wcglwm = glwm ;
    283            if (ainfo->wcgocc > ainfo->gocc) ainfo->wcgocc = ainfo->gocc;
    284            ns = 1000000 * (ainfo->gburst_size/(state->memory_width/8))/state->mclk_khz;
    285            gfsize = (ns * (long) ainfo->gdrain_rate)/1000000;
    286            gfsize = ainfo->wcglwm - ainfo->gburst_size + gfsize;
    287        }
    288        mfsize = 0;
    289        if (!state->gr_during_vid && ainfo->vid_en)
    290            if (ainfo->vid_en && (ainfo->vocc < 0) && !ainfo->vid_only_once)
    291                next = VIDEO;
    292            else if (ainfo->mocc < 0)
    293                next = MPORT;
    294            else if (ainfo->gocc< ainfo->by_gfacc)
    295                next = GRAPHICS;
    296            else return (0);
    297        else switch (ainfo->priority)
    298            {
    299                case VIDEO:
    300                    if (ainfo->vid_en && ainfo->vocc<0 && !ainfo->vid_only_once)
    301                        next = VIDEO;
    302                    else if (ainfo->gr_en && ainfo->gocc<0 && !ainfo->gr_only_once)
    303                        next = GRAPHICS;
    304                    else if (ainfo->mocc<0)
    305                        next = MPORT;
    306                    else    return (0);
    307                    break;
    308                case GRAPHICS:
    309                    if (ainfo->gr_en && ainfo->gocc<0 && !ainfo->gr_only_once)
    310                        next = GRAPHICS;
    311                    else if (ainfo->vid_en && ainfo->vocc<0 && !ainfo->vid_only_once)
    312                        next = VIDEO;
    313                    else if (ainfo->mocc<0)
    314                        next = MPORT;
    315                    else    return (0);
    316                    break;
    317                default:
    318                    if (ainfo->mocc<0)
    319                        next = MPORT;
    320                    else if (ainfo->gr_en && ainfo->gocc<0 && !ainfo->gr_only_once)
    321                        next = GRAPHICS;
    322                    else if (ainfo->vid_en && ainfo->vocc<0 && !ainfo->vid_only_once)
    323                        next = VIDEO;
    324                    else    return (0);
    325                    break;
    326            }
    327        last = cur;
    328        cur = next;
    329        iter++;
    330        switch (cur)
    331        {
    332            case VIDEO:
    333                if (last==cur)    misses = 0;
    334                else if (ainfo->first_vacc)   misses = vmisses;
    335                else    misses = 1;
    336                ainfo->first_vacc = 0;
    337                if (last!=cur)
    338                {
    339                    ns =  1000000 * (vmisses*state->mem_page_miss + state->mem_latency)/state->mclk_khz; 
    340                    vlwm = ns * ainfo->vdrain_rate/ 1000000;
    341                    vlwm = ainfo->vocc - vlwm;
    342                }
    343                ns = 1000000*(misses*state->mem_page_miss + ainfo->vburst_size)/(state->memory_width/8)/state->mclk_khz;
    344                ainfo->vocc = ainfo->vocc + ainfo->vburst_size - ns*ainfo->vdrain_rate/1000000;
    345                ainfo->gocc = ainfo->gocc - ns*ainfo->gdrain_rate/1000000;
    346                ainfo->mocc = ainfo->mocc - ns*ainfo->mdrain_rate/1000000;
    347                break;
    348            case GRAPHICS:
    349                if (last==cur)    misses = 0;
    350                else if (ainfo->first_gacc)   misses = gmisses;
    351                else    misses = 1;
    352                ainfo->first_gacc = 0;
    353                if (last!=cur)
    354                {
    355                    ns = 1000000*(gmisses*state->mem_page_miss + state->mem_latency)/state->mclk_khz ;
    356                    glwm = ns * ainfo->gdrain_rate/1000000;
    357                    glwm = ainfo->gocc - glwm;
    358                }
    359                ns = 1000000*(misses*state->mem_page_miss + ainfo->gburst_size/(state->memory_width/8))/state->mclk_khz;
    360                ainfo->vocc = ainfo->vocc + 0 - ns*ainfo->vdrain_rate/1000000;
    361                ainfo->gocc = ainfo->gocc + ainfo->gburst_size - ns*ainfo->gdrain_rate/1000000;
    362                ainfo->mocc = ainfo->mocc + 0 - ns*ainfo->mdrain_rate/1000000;
    363                break;
    364            default:
    365                if (last==cur)    misses = 0;
    366                else if (ainfo->first_macc)   misses = mmisses;
    367                else    misses = 1;
    368                ainfo->first_macc = 0;
    369                ns = 1000000*(misses*state->mem_page_miss + mburst_size/(state->memory_width/8))/state->mclk_khz;
    370                ainfo->vocc = ainfo->vocc + 0 - ns*ainfo->vdrain_rate/1000000;
    371                ainfo->gocc = ainfo->gocc + 0 - ns*ainfo->gdrain_rate/1000000;
    372                ainfo->mocc = ainfo->mocc + mburst_size - ns*ainfo->mdrain_rate/1000000;
    373                break;
    374        }
    375        if (iter>100)
    376        {
    377            ainfo->converged = 0;
    378            return (1);
    379        }
    380        ns = 1000000*ainfo->gburst_size/(state->memory_width/8)/state->mclk_khz;
    381        tmp = ns * ainfo->gdrain_rate/1000000;
    382        if (abs(ainfo->gburst_size) + ((abs(ainfo->wcglwm) + 16 ) & ~0x7) - tmp > max_gfsize)
    383        {
    384            ainfo->converged = 0;
    385            return (1);
    386        }
    387        ns = 1000000*ainfo->vburst_size/(state->memory_width/8)/state->mclk_khz;
    388        tmp = ns * ainfo->vdrain_rate/1000000;
    389        if (abs(ainfo->vburst_size) + (abs(ainfo->wcvlwm + 32) & ~0xf)  - tmp> VFIFO_SIZE)
    390        {
    391            ainfo->converged = 0;
    392            return (1);
    393        }
    394        if (abs(ainfo->gocc) > max_gfsize)
    395        {
    396            ainfo->converged = 0;
    397            return (1);
    398        }
    399        if (abs(ainfo->vocc) > VFIFO_SIZE)
    400        {
    401            ainfo->converged = 0;
    402            return (1);
    403        }
    404        if (abs(ainfo->mocc) > MFIFO_SIZE)
    405        {
    406            ainfo->converged = 0;
    407            return (1);
    408        }
    409        if (abs(vfsize) > VFIFO_SIZE)
    410        {
    411            ainfo->converged = 0;
    412            return (1);
    413        }
    414        if (abs(gfsize) > max_gfsize)
    415        {
    416            ainfo->converged = 0;
    417            return (1);
    418        }
    419        if (abs(mfsize) > MFIFO_SIZE)
    420        {
    421            ainfo->converged = 0;
    422            return (1);
    423        }
    424    }
    425}
    426static char nv3_arb(nv3_fifo_info * res_info, nv3_sim_state * state,  nv3_arb_info *ainfo) 
    427{
    428    long ens, vns, mns, gns;
    429    int mmisses, gmisses, vmisses, eburst_size, mburst_size;
    430    int refresh_cycle;
    431
    432    refresh_cycle = 2*(state->mclk_khz/state->pclk_khz) + 5;
    433    mmisses = 2;
    434    if (state->mem_aligned) gmisses = 2;
    435    else    gmisses = 3;
    436    vmisses = 2;
    437    eburst_size = state->memory_width * 1;
    438    mburst_size = 32;
    439    gns = 1000000 * (gmisses*state->mem_page_miss + state->mem_latency)/state->mclk_khz;
    440    ainfo->by_gfacc = gns*ainfo->gdrain_rate/1000000;
    441    ainfo->wcmocc = 0;
    442    ainfo->wcgocc = 0;
    443    ainfo->wcvocc = 0;
    444    ainfo->wcvlwm = 0;
    445    ainfo->wcglwm = 0;
    446    ainfo->engine_en = 1;
    447    ainfo->converged = 1;
    448    if (ainfo->engine_en)
    449    {
    450        ens =  1000000*(state->mem_page_miss + eburst_size/(state->memory_width/8) +refresh_cycle)/state->mclk_khz;
    451        ainfo->mocc = state->enable_mp ? 0-ens*ainfo->mdrain_rate/1000000 : 0;
    452        ainfo->vocc = ainfo->vid_en ? 0-ens*ainfo->vdrain_rate/1000000 : 0;
    453        ainfo->gocc = ainfo->gr_en ? 0-ens*ainfo->gdrain_rate/1000000 : 0;
    454        ainfo->cur = ENGINE;
    455        ainfo->first_vacc = 1;
    456        ainfo->first_gacc = 1;
    457        ainfo->first_macc = 1;
    458        nv3_iterate(res_info, state,ainfo);
    459    }
    460    if (state->enable_mp)
    461    {
    462        mns = 1000000 * (mmisses*state->mem_page_miss + mburst_size/(state->memory_width/8) + refresh_cycle)/state->mclk_khz;
    463        ainfo->mocc = state->enable_mp ? 0 : mburst_size - mns*ainfo->mdrain_rate/1000000;
    464        ainfo->vocc = ainfo->vid_en ? 0 : 0- mns*ainfo->vdrain_rate/1000000;
    465        ainfo->gocc = ainfo->gr_en ? 0: 0- mns*ainfo->gdrain_rate/1000000;
    466        ainfo->cur = MPORT;
    467        ainfo->first_vacc = 1;
    468        ainfo->first_gacc = 1;
    469        ainfo->first_macc = 0;
    470        nv3_iterate(res_info, state,ainfo);
    471    }
    472    if (ainfo->gr_en)
    473    {
    474        ainfo->first_vacc = 1;
    475        ainfo->first_gacc = 0;
    476        ainfo->first_macc = 1;
    477        gns = 1000000*(gmisses*state->mem_page_miss + ainfo->gburst_size/(state->memory_width/8) + refresh_cycle)/state->mclk_khz;
    478        ainfo->gocc = ainfo->gburst_size - gns*ainfo->gdrain_rate/1000000;
    479        ainfo->vocc = ainfo->vid_en? 0-gns*ainfo->vdrain_rate/1000000 : 0;
    480        ainfo->mocc = state->enable_mp ?  0-gns*ainfo->mdrain_rate/1000000: 0;
    481        ainfo->cur = GRAPHICS;
    482        nv3_iterate(res_info, state,ainfo);
    483    }
    484    if (ainfo->vid_en)
    485    {
    486        ainfo->first_vacc = 0;
    487        ainfo->first_gacc = 1;
    488        ainfo->first_macc = 1;
    489        vns = 1000000*(vmisses*state->mem_page_miss + ainfo->vburst_size/(state->memory_width/8) + refresh_cycle)/state->mclk_khz;
    490        ainfo->vocc = ainfo->vburst_size - vns*ainfo->vdrain_rate/1000000;
    491        ainfo->gocc = ainfo->gr_en? (0-vns*ainfo->gdrain_rate/1000000) : 0;
    492        ainfo->mocc = state->enable_mp? 0-vns*ainfo->mdrain_rate/1000000 :0 ;
    493        ainfo->cur = VIDEO;
    494        nv3_iterate(res_info, state, ainfo);
    495    }
    496    if (ainfo->converged)
    497    {
    498        res_info->graphics_lwm = (int)abs(ainfo->wcglwm) + 16;
    499        res_info->video_lwm = (int)abs(ainfo->wcvlwm) + 32;
    500        res_info->graphics_burst_size = ainfo->gburst_size;
    501        res_info->video_burst_size = ainfo->vburst_size;
    502        res_info->graphics_hi_priority = (ainfo->priority == GRAPHICS);
    503        res_info->media_hi_priority = (ainfo->priority == MPORT);
    504        if (res_info->video_lwm > 160)
    505        {
    506            res_info->graphics_lwm = 256;
    507            res_info->video_lwm = 128;
    508            res_info->graphics_burst_size = 64;
    509            res_info->video_burst_size = 64;
    510            res_info->graphics_hi_priority = 0;
    511            res_info->media_hi_priority = 0;
    512            ainfo->converged = 0;
    513            return (0);
    514        }
    515        if (res_info->video_lwm > 128)
    516        {
    517            res_info->video_lwm = 128;
    518        }
    519        return (1);
    520    }
    521    else
    522    {
    523        res_info->graphics_lwm = 256;
    524        res_info->video_lwm = 128;
    525        res_info->graphics_burst_size = 64;
    526        res_info->video_burst_size = 64;
    527        res_info->graphics_hi_priority = 0;
    528        res_info->media_hi_priority = 0;
    529        return (0);
    530    }
    531}
    532static char nv3_get_param(nv3_fifo_info *res_info, nv3_sim_state * state, nv3_arb_info *ainfo)
    533{
    534    int done, g,v, p;
    535    
    536    done = 0;
    537    for (p=0; p < 2; p++)
    538    {
    539        for (g=128 ; g > 32; g= g>> 1)
    540        {
    541            for (v=128; v >=32; v = v>> 1)
    542            {
    543                ainfo->priority = p;
    544                ainfo->gburst_size = g;     
    545                ainfo->vburst_size = v;
    546                done = nv3_arb(res_info, state,ainfo);
    547                if (done && (g==128))
    548                    if ((res_info->graphics_lwm + g) > 256)
    549                        done = 0;
    550                if (done)
    551                    goto Done;
    552            }
    553        }
    554    }
    555
    556 Done:
    557    return done;
    558}
    559static void nv3CalcArbitration 
    560(
    561    nv3_fifo_info * res_info,
    562    nv3_sim_state * state
    563)
    564{
    565    nv3_fifo_info save_info;
    566    nv3_arb_info ainfo;
    567    char   res_gr, res_vid;
    568
    569    ainfo.gr_en = 1;
    570    ainfo.vid_en = state->enable_video;
    571    ainfo.vid_only_once = 0;
    572    ainfo.gr_only_once = 0;
    573    ainfo.gdrain_rate = (int) state->pclk_khz * (state->pix_bpp/8);
    574    ainfo.vdrain_rate = (int) state->pclk_khz * 2;
    575    if (state->video_scale != 0)
    576        ainfo.vdrain_rate = ainfo.vdrain_rate/state->video_scale;
    577    ainfo.mdrain_rate = 33000;
    578    res_info->rtl_values = 0;
    579    if (!state->gr_during_vid && state->enable_video)
    580    {
    581        ainfo.gr_only_once = 1;
    582        ainfo.gr_en = 1;
    583        ainfo.gdrain_rate = 0;
    584        res_vid = nv3_get_param(res_info, state,  &ainfo);
    585        res_vid = ainfo.converged;
    586        save_info.video_lwm = res_info->video_lwm;
    587        save_info.video_burst_size = res_info->video_burst_size;
    588        ainfo.vid_en = 1;
    589        ainfo.vid_only_once = 1;
    590        ainfo.gr_en = 1;
    591        ainfo.gdrain_rate = (int) state->pclk_khz * (state->pix_bpp/8);
    592        ainfo.vdrain_rate = 0;
    593        res_gr = nv3_get_param(res_info, state,  &ainfo);
    594        res_gr = ainfo.converged;
    595        res_info->video_lwm = save_info.video_lwm;
    596        res_info->video_burst_size = save_info.video_burst_size;
    597        res_info->valid = res_gr & res_vid;
    598    }
    599    else
    600    {
    601        if (!ainfo.gr_en) ainfo.gdrain_rate = 0;
    602        if (!ainfo.vid_en) ainfo.vdrain_rate = 0;
    603        res_gr = nv3_get_param(res_info, state,  &ainfo);
    604        res_info->valid = ainfo.converged;
    605    }
    606}
    607static void nv3UpdateArbitrationSettings
    608(
    609    unsigned      VClk, 
    610    unsigned      pixelDepth, 
    611    unsigned     *burst,
    612    unsigned     *lwm,
    613    RIVA_HW_INST *chip
    614)
    615{
    616    nv3_fifo_info fifo_data;
    617    nv3_sim_state sim_data;
    618    unsigned int M, N, P, pll, MClk;
    619    
    620    pll = NV_RD32(&chip->PRAMDAC0[0x00000504/4], 0);
    621    M = (pll >> 0) & 0xFF; N = (pll >> 8) & 0xFF; P = (pll >> 16) & 0x0F;
    622    MClk = (N * chip->CrystalFreqKHz / M) >> P;
    623    sim_data.pix_bpp        = (char)pixelDepth;
    624    sim_data.enable_video   = 0;
    625    sim_data.enable_mp      = 0;
    626    sim_data.video_scale    = 1;
    627    sim_data.memory_width   = (NV_RD32(&chip->PEXTDEV[0x00000000/4], 0) & 0x10) ?
    628	128 : 64;
    629    sim_data.memory_width   = 128;
    630
    631    sim_data.mem_latency    = 9;
    632    sim_data.mem_aligned    = 1;
    633    sim_data.mem_page_miss  = 11;
    634    sim_data.gr_during_vid  = 0;
    635    sim_data.pclk_khz       = VClk;
    636    sim_data.mclk_khz       = MClk;
    637    nv3CalcArbitration(&fifo_data, &sim_data);
    638    if (fifo_data.valid)
    639    {
    640        int  b = fifo_data.graphics_burst_size >> 4;
    641        *burst = 0;
    642        while (b >>= 1)
    643	    (*burst)++;
    644        *lwm   = fifo_data.graphics_lwm >> 3;
    645    }
    646    else
    647    {
    648        *lwm   = 0x24;
    649        *burst = 0x2;
    650    }
    651}
    652static void nv4CalcArbitration 
    653(
    654    nv4_fifo_info *fifo,
    655    nv4_sim_state *arb
    656)
    657{
    658    int data, pagemiss, cas,width, video_enable, bpp;
    659    int nvclks, mclks, pclks, vpagemiss, crtpagemiss, vbs;
    660    int found, mclk_extra, mclk_loop, cbs, m1, p1;
    661    int mclk_freq, pclk_freq, nvclk_freq, mp_enable;
    662    int us_m, us_n, us_p, video_drain_rate, crtc_drain_rate;
    663    int vpm_us, us_video, vlwm, video_fill_us, cpm_us, us_crt,clwm;
    664
    665    fifo->valid = 1;
    666    pclk_freq = arb->pclk_khz;
    667    mclk_freq = arb->mclk_khz;
    668    nvclk_freq = arb->nvclk_khz;
    669    pagemiss = arb->mem_page_miss;
    670    cas = arb->mem_latency;
    671    width = arb->memory_width >> 6;
    672    video_enable = arb->enable_video;
    673    bpp = arb->pix_bpp;
    674    mp_enable = arb->enable_mp;
    675    clwm = 0;
    676    vlwm = 0;
    677    cbs = 128;
    678    pclks = 2;
    679    nvclks = 2;
    680    nvclks += 2;
    681    nvclks += 1;
    682    mclks = 5;
    683    mclks += 3;
    684    mclks += 1;
    685    mclks += cas;
    686    mclks += 1;
    687    mclks += 1;
    688    mclks += 1;
    689    mclks += 1;
    690    mclk_extra = 3;
    691    nvclks += 2;
    692    nvclks += 1;
    693    nvclks += 1;
    694    nvclks += 1;
    695    if (mp_enable)
    696        mclks+=4;
    697    nvclks += 0;
    698    pclks += 0;
    699    found = 0;
    700    vbs = 0;
    701    while (found != 1)
    702    {
    703        fifo->valid = 1;
    704        found = 1;
    705        mclk_loop = mclks+mclk_extra;
    706        us_m = mclk_loop *1000*1000 / mclk_freq;
    707        us_n = nvclks*1000*1000 / nvclk_freq;
    708        us_p = nvclks*1000*1000 / pclk_freq;
    709        if (video_enable)
    710        {
    711            video_drain_rate = pclk_freq * 2;
    712            crtc_drain_rate = pclk_freq * bpp/8;
    713            vpagemiss = 2;
    714            vpagemiss += 1;
    715            crtpagemiss = 2;
    716            vpm_us = (vpagemiss * pagemiss)*1000*1000/mclk_freq;
    717            if (nvclk_freq * 2 > mclk_freq * width)
    718                video_fill_us = cbs*1000*1000 / 16 / nvclk_freq ;
    719            else
    720                video_fill_us = cbs*1000*1000 / (8 * width) / mclk_freq;
    721            us_video = vpm_us + us_m + us_n + us_p + video_fill_us;
    722            vlwm = us_video * video_drain_rate/(1000*1000);
    723            vlwm++;
    724            vbs = 128;
    725            if (vlwm > 128) vbs = 64;
    726            if (vlwm > (256-64)) vbs = 32;
    727            if (nvclk_freq * 2 > mclk_freq * width)
    728                video_fill_us = vbs *1000*1000/ 16 / nvclk_freq ;
    729            else
    730                video_fill_us = vbs*1000*1000 / (8 * width) / mclk_freq;
    731            cpm_us = crtpagemiss  * pagemiss *1000*1000/ mclk_freq;
    732            us_crt =
    733            us_video
    734            +video_fill_us
    735            +cpm_us
    736            +us_m + us_n +us_p
    737            ;
    738            clwm = us_crt * crtc_drain_rate/(1000*1000);
    739            clwm++;
    740        }
    741        else
    742        {
    743            crtc_drain_rate = pclk_freq * bpp/8;
    744            crtpagemiss = 2;
    745            crtpagemiss += 1;
    746            cpm_us = crtpagemiss  * pagemiss *1000*1000/ mclk_freq;
    747            us_crt =  cpm_us + us_m + us_n + us_p ;
    748            clwm = us_crt * crtc_drain_rate/(1000*1000);
    749            clwm++;
    750        }
    751        m1 = clwm + cbs - 512;
    752        p1 = m1 * pclk_freq / mclk_freq;
    753        p1 = p1 * bpp / 8;
    754        if ((p1 < m1) && (m1 > 0))
    755        {
    756            fifo->valid = 0;
    757            found = 0;
    758            if (mclk_extra ==0)   found = 1;
    759            mclk_extra--;
    760        }
    761        else if (video_enable)
    762        {
    763            if ((clwm > 511) || (vlwm > 255))
    764            {
    765                fifo->valid = 0;
    766                found = 0;
    767                if (mclk_extra ==0)   found = 1;
    768                mclk_extra--;
    769            }
    770        }
    771        else
    772        {
    773            if (clwm > 519)
    774            {
    775                fifo->valid = 0;
    776                found = 0;
    777                if (mclk_extra ==0)   found = 1;
    778                mclk_extra--;
    779            }
    780        }
    781        if (clwm < 384) clwm = 384;
    782        if (vlwm < 128) vlwm = 128;
    783        data = (int)(clwm);
    784        fifo->graphics_lwm = data;
    785        fifo->graphics_burst_size = 128;
    786        data = (int)((vlwm+15));
    787        fifo->video_lwm = data;
    788        fifo->video_burst_size = vbs;
    789    }
    790}
    791static void nv4UpdateArbitrationSettings
    792(
    793    unsigned      VClk, 
    794    unsigned      pixelDepth, 
    795    unsigned     *burst,
    796    unsigned     *lwm,
    797    RIVA_HW_INST *chip
    798)
    799{
    800    nv4_fifo_info fifo_data;
    801    nv4_sim_state sim_data;
    802    unsigned int M, N, P, pll, MClk, NVClk, cfg1;
    803
    804    pll = NV_RD32(&chip->PRAMDAC0[0x00000504/4], 0);
    805    M = (pll >> 0)  & 0xFF; N = (pll >> 8)  & 0xFF; P = (pll >> 16) & 0x0F;
    806    MClk  = (N * chip->CrystalFreqKHz / M) >> P;
    807    pll = NV_RD32(&chip->PRAMDAC0[0x00000500/4], 0);
    808    M = (pll >> 0)  & 0xFF; N = (pll >> 8)  & 0xFF; P = (pll >> 16) & 0x0F;
    809    NVClk  = (N * chip->CrystalFreqKHz / M) >> P;
    810    cfg1 = NV_RD32(&chip->PFB[0x00000204/4], 0);
    811    sim_data.pix_bpp        = (char)pixelDepth;
    812    sim_data.enable_video   = 0;
    813    sim_data.enable_mp      = 0;
    814    sim_data.memory_width   = (NV_RD32(&chip->PEXTDEV[0x00000000/4], 0) & 0x10) ?
    815	128 : 64;
    816    sim_data.mem_latency    = (char)cfg1 & 0x0F;
    817    sim_data.mem_aligned    = 1;
    818    sim_data.mem_page_miss  = (char)(((cfg1 >> 4) &0x0F) + ((cfg1 >> 31) & 0x01));
    819    sim_data.gr_during_vid  = 0;
    820    sim_data.pclk_khz       = VClk;
    821    sim_data.mclk_khz       = MClk;
    822    sim_data.nvclk_khz      = NVClk;
    823    nv4CalcArbitration(&fifo_data, &sim_data);
    824    if (fifo_data.valid)
    825    {
    826        int  b = fifo_data.graphics_burst_size >> 4;
    827        *burst = 0;
    828        while (b >>= 1)
    829	    (*burst)++;
    830        *lwm   = fifo_data.graphics_lwm >> 3;
    831    }
    832}
    833static void nv10CalcArbitration 
    834(
    835    nv10_fifo_info *fifo,
    836    nv10_sim_state *arb
    837)
    838{
    839    int data, pagemiss, width, video_enable, bpp;
    840    int nvclks, mclks, pclks, vpagemiss, crtpagemiss;
    841    int nvclk_fill;
    842    int found, mclk_extra, mclk_loop, cbs, m1;
    843    int mclk_freq, pclk_freq, nvclk_freq, mp_enable;
    844    int us_m, us_m_min, us_n, us_p, crtc_drain_rate;
    845    int vus_m;
    846    int vpm_us, us_video, cpm_us, us_crt,clwm;
    847    int clwm_rnd_down;
    848    int m2us, us_pipe_min, p1clk, p2;
    849    int min_mclk_extra;
    850    int us_min_mclk_extra;
    851
    852    fifo->valid = 1;
    853    pclk_freq = arb->pclk_khz; /* freq in KHz */
    854    mclk_freq = arb->mclk_khz;
    855    nvclk_freq = arb->nvclk_khz;
    856    pagemiss = arb->mem_page_miss;
    857    width = arb->memory_width/64;
    858    video_enable = arb->enable_video;
    859    bpp = arb->pix_bpp;
    860    mp_enable = arb->enable_mp;
    861    clwm = 0;
    862
    863    cbs = 512;
    864
    865    pclks = 4; /* lwm detect. */
    866
    867    nvclks = 3; /* lwm -> sync. */
    868    nvclks += 2; /* fbi bus cycles (1 req + 1 busy) */
    869
    870    mclks  = 1;   /* 2 edge sync.  may be very close to edge so just put one. */
    871
    872    mclks += 1;   /* arb_hp_req */
    873    mclks += 5;   /* ap_hp_req   tiling pipeline */
    874
    875    mclks += 2;    /* tc_req     latency fifo */
    876    mclks += 2;    /* fb_cas_n_  memory request to fbio block */
    877    mclks += 7;    /* sm_d_rdv   data returned from fbio block */
    878
    879    /* fb.rd.d.Put_gc   need to accumulate 256 bits for read */
    880    if (arb->memory_type == 0)
    881      if (arb->memory_width == 64) /* 64 bit bus */
    882        mclks += 4;
    883      else
    884        mclks += 2;
    885    else
    886      if (arb->memory_width == 64) /* 64 bit bus */
    887        mclks += 2;
    888      else
    889        mclks += 1;
    890
    891    if ((!video_enable) && (arb->memory_width == 128))
    892    {  
    893      mclk_extra = (bpp == 32) ? 31 : 42; /* Margin of error */
    894      min_mclk_extra = 17;
    895    }
    896    else
    897    {
    898      mclk_extra = (bpp == 32) ? 8 : 4; /* Margin of error */
    899      /* mclk_extra = 4; */ /* Margin of error */
    900      min_mclk_extra = 18;
    901    }
    902
    903    nvclks += 1; /* 2 edge sync.  may be very close to edge so just put one. */
    904    nvclks += 1; /* fbi_d_rdv_n */
    905    nvclks += 1; /* Fbi_d_rdata */
    906    nvclks += 1; /* crtfifo load */
    907
    908    if(mp_enable)
    909      mclks+=4; /* Mp can get in with a burst of 8. */
    910    /* Extra clocks determined by heuristics */
    911
    912    nvclks += 0;
    913    pclks += 0;
    914    found = 0;
    915    while(found != 1) {
    916      fifo->valid = 1;
    917      found = 1;
    918      mclk_loop = mclks+mclk_extra;
    919      us_m = mclk_loop *1000*1000 / mclk_freq; /* Mclk latency in us */
    920      us_m_min = mclks * 1000*1000 / mclk_freq; /* Minimum Mclk latency in us */
    921      us_min_mclk_extra = min_mclk_extra *1000*1000 / mclk_freq;
    922      us_n = nvclks*1000*1000 / nvclk_freq;/* nvclk latency in us */
    923      us_p = pclks*1000*1000 / pclk_freq;/* nvclk latency in us */
    924      us_pipe_min = us_m_min + us_n + us_p;
    925
    926      vus_m = mclk_loop *1000*1000 / mclk_freq; /* Mclk latency in us */
    927
    928      if(video_enable) {
    929        crtc_drain_rate = pclk_freq * bpp/8; /* MB/s */
    930
    931        vpagemiss = 1; /* self generating page miss */
    932        vpagemiss += 1; /* One higher priority before */
    933
    934        crtpagemiss = 2; /* self generating page miss */
    935        if(mp_enable)
    936            crtpagemiss += 1; /* if MA0 conflict */
    937
    938        vpm_us = (vpagemiss * pagemiss)*1000*1000/mclk_freq;
    939
    940        us_video = vpm_us + vus_m; /* Video has separate read return path */
    941
    942        cpm_us = crtpagemiss  * pagemiss *1000*1000/ mclk_freq;
    943        us_crt =
    944          us_video  /* Wait for video */
    945          +cpm_us /* CRT Page miss */
    946          +us_m + us_n +us_p /* other latency */
    947          ;
    948
    949        clwm = us_crt * crtc_drain_rate/(1000*1000);
    950        clwm++; /* fixed point <= float_point - 1.  Fixes that */
    951      } else {
    952        crtc_drain_rate = pclk_freq * bpp/8; /* bpp * pclk/8 */
    953
    954        crtpagemiss = 1; /* self generating page miss */
    955        crtpagemiss += 1; /* MA0 page miss */
    956        if(mp_enable)
    957            crtpagemiss += 1; /* if MA0 conflict */
    958        cpm_us = crtpagemiss  * pagemiss *1000*1000/ mclk_freq;
    959        us_crt =  cpm_us + us_m + us_n + us_p ;
    960        clwm = us_crt * crtc_drain_rate/(1000*1000);
    961        clwm++; /* fixed point <= float_point - 1.  Fixes that */
    962
    963  /*
    964          //
    965          // Another concern, only for high pclks so don't do this
    966          // with video:
    967          // What happens if the latency to fetch the cbs is so large that
    968          // fifo empties.  In that case we need to have an alternate clwm value
    969          // based off the total burst fetch
    970          //
    971          us_crt = (cbs * 1000 * 1000)/ (8*width)/mclk_freq ;
    972          us_crt = us_crt + us_m + us_n + us_p + (4 * 1000 * 1000)/mclk_freq;
    973          clwm_mt = us_crt * crtc_drain_rate/(1000*1000);
    974          clwm_mt ++;
    975          if(clwm_mt > clwm)
    976              clwm = clwm_mt;
    977  */
    978          /* Finally, a heuristic check when width == 64 bits */
    979          if(width == 1){
    980              nvclk_fill = nvclk_freq * 8;
    981              if(crtc_drain_rate * 100 >= nvclk_fill * 102)
    982                      clwm = 0xfff; /*Large number to fail */
    983
    984              else if(crtc_drain_rate * 100  >= nvclk_fill * 98) {
    985                  clwm = 1024;
    986                  cbs = 512;
    987              }
    988          }
    989      }
    990
    991
    992      /*
    993        Overfill check:
    994
    995        */
    996
    997      clwm_rnd_down = ((int)clwm/8)*8;
    998      if (clwm_rnd_down < clwm)
    999          clwm += 8;
   1000
   1001      m1 = clwm + cbs -  1024; /* Amount of overfill */
   1002      m2us = us_pipe_min + us_min_mclk_extra;
   1003
   1004      /* pclk cycles to drain */
   1005      p1clk = m2us * pclk_freq/(1000*1000); 
   1006      p2 = p1clk * bpp / 8; /* bytes drained. */
   1007
   1008      if((p2 < m1) && (m1 > 0)) {
   1009          fifo->valid = 0;
   1010          found = 0;
   1011          if(min_mclk_extra == 0)   {
   1012            if(cbs <= 32) {
   1013              found = 1; /* Can't adjust anymore! */
   1014            } else {
   1015              cbs = cbs/2;  /* reduce the burst size */
   1016            }
   1017          } else {
   1018            min_mclk_extra--;
   1019          }
   1020      } else {
   1021        if (clwm > 1023){ /* Have some margin */
   1022          fifo->valid = 0;
   1023          found = 0;
   1024          if(min_mclk_extra == 0)   
   1025              found = 1; /* Can't adjust anymore! */
   1026          else 
   1027              min_mclk_extra--;
   1028        }
   1029      }
   1030
   1031      if(clwm < (1024-cbs+8)) clwm = 1024-cbs+8;
   1032      data = (int)(clwm);
   1033      /*  printf("CRT LWM: %f bytes, prog: 0x%x, bs: 256\n", clwm, data ); */
   1034      fifo->graphics_lwm = data;   fifo->graphics_burst_size = cbs;
   1035
   1036      /*  printf("VID LWM: %f bytes, prog: 0x%x, bs: %d\n, ", vlwm, data, vbs ); */
   1037      fifo->video_lwm = 1024;  fifo->video_burst_size = 512;
   1038    }
   1039}
   1040static void nv10UpdateArbitrationSettings
   1041(
   1042    unsigned      VClk, 
   1043    unsigned      pixelDepth, 
   1044    unsigned     *burst,
   1045    unsigned     *lwm,
   1046    RIVA_HW_INST *chip
   1047)
   1048{
   1049    nv10_fifo_info fifo_data;
   1050    nv10_sim_state sim_data;
   1051    unsigned int M, N, P, pll, MClk, NVClk, cfg1;
   1052
   1053    pll = NV_RD32(&chip->PRAMDAC0[0x00000504/4], 0);
   1054    M = (pll >> 0)  & 0xFF; N = (pll >> 8)  & 0xFF; P = (pll >> 16) & 0x0F;
   1055    MClk  = (N * chip->CrystalFreqKHz / M) >> P;
   1056    pll = NV_RD32(&chip->PRAMDAC0[0x00000500/4], 0);
   1057    M = (pll >> 0)  & 0xFF; N = (pll >> 8)  & 0xFF; P = (pll >> 16) & 0x0F;
   1058    NVClk  = (N * chip->CrystalFreqKHz / M) >> P;
   1059    cfg1 = NV_RD32(&chip->PFB[0x00000204/4], 0);
   1060    sim_data.pix_bpp        = (char)pixelDepth;
   1061    sim_data.enable_video   = 0;
   1062    sim_data.enable_mp      = 0;
   1063    sim_data.memory_type    = (NV_RD32(&chip->PFB[0x00000200/4], 0) & 0x01) ?
   1064	1 : 0;
   1065    sim_data.memory_width   = (NV_RD32(&chip->PEXTDEV[0x00000000/4], 0) & 0x10) ?
   1066	128 : 64;
   1067    sim_data.mem_latency    = (char)cfg1 & 0x0F;
   1068    sim_data.mem_aligned    = 1;
   1069    sim_data.mem_page_miss  = (char)(((cfg1 >> 4) &0x0F) + ((cfg1 >> 31) & 0x01));
   1070    sim_data.gr_during_vid  = 0;
   1071    sim_data.pclk_khz       = VClk;
   1072    sim_data.mclk_khz       = MClk;
   1073    sim_data.nvclk_khz      = NVClk;
   1074    nv10CalcArbitration(&fifo_data, &sim_data);
   1075    if (fifo_data.valid)
   1076    {
   1077        int  b = fifo_data.graphics_burst_size >> 4;
   1078        *burst = 0;
   1079        while (b >>= 1)
   1080	    (*burst)++;
   1081        *lwm   = fifo_data.graphics_lwm >> 3;
   1082    }
   1083}
   1084
   1085static void nForceUpdateArbitrationSettings
   1086(
   1087    unsigned      VClk,
   1088    unsigned      pixelDepth,
   1089    unsigned     *burst,
   1090    unsigned     *lwm,
   1091    RIVA_HW_INST *chip,
   1092    struct pci_dev *pdev
   1093)
   1094{
   1095    nv10_fifo_info fifo_data;
   1096    nv10_sim_state sim_data;
   1097    unsigned int M, N, P, pll, MClk, NVClk;
   1098    unsigned int uMClkPostDiv;
   1099    struct pci_dev *dev;
   1100    int domain = pci_domain_nr(pdev->bus);
   1101
   1102    dev = pci_get_domain_bus_and_slot(domain, 0, 3);
   1103    pci_read_config_dword(dev, 0x6C, &uMClkPostDiv);
   1104    pci_dev_put(dev);
   1105    uMClkPostDiv = (uMClkPostDiv >> 8) & 0xf;
   1106
   1107    if(!uMClkPostDiv) uMClkPostDiv = 4;
   1108    MClk = 400000 / uMClkPostDiv;
   1109
   1110    pll = NV_RD32(&chip->PRAMDAC0[0x00000500/4], 0);
   1111    M = (pll >> 0)  & 0xFF; N = (pll >> 8)  & 0xFF; P = (pll >> 16) & 0x0F;
   1112    NVClk  = (N * chip->CrystalFreqKHz / M) >> P;
   1113    sim_data.pix_bpp        = (char)pixelDepth;
   1114    sim_data.enable_video   = 0;
   1115    sim_data.enable_mp      = 0;
   1116
   1117    dev = pci_get_domain_bus_and_slot(domain, 0, 1);
   1118    pci_read_config_dword(dev, 0x7C, &sim_data.memory_type);
   1119    pci_dev_put(dev);
   1120    sim_data.memory_type    = (sim_data.memory_type >> 12) & 1;
   1121
   1122    sim_data.memory_width   = 64;
   1123    sim_data.mem_latency    = 3;
   1124    sim_data.mem_aligned    = 1;
   1125    sim_data.mem_page_miss  = 10;
   1126    sim_data.gr_during_vid  = 0;
   1127    sim_data.pclk_khz       = VClk;
   1128    sim_data.mclk_khz       = MClk;
   1129    sim_data.nvclk_khz      = NVClk;
   1130    nv10CalcArbitration(&fifo_data, &sim_data);
   1131    if (fifo_data.valid)
   1132    {
   1133        int  b = fifo_data.graphics_burst_size >> 4;
   1134        *burst = 0;
   1135        while (b >>= 1)
   1136	    (*burst)++;
   1137        *lwm   = fifo_data.graphics_lwm >> 3;
   1138    }
   1139}
   1140
   1141/****************************************************************************\
   1142*                                                                            *
   1143*                          RIVA Mode State Routines                          *
   1144*                                                                            *
   1145\****************************************************************************/
   1146
   1147/*
   1148 * Calculate the Video Clock parameters for the PLL.
   1149 */
   1150static int CalcVClock
   1151(
   1152    int           clockIn,
   1153    int          *clockOut,
   1154    int          *mOut,
   1155    int          *nOut,
   1156    int          *pOut,
   1157    RIVA_HW_INST *chip
   1158)
   1159{
   1160    unsigned lowM, highM, highP;
   1161    unsigned DeltaNew, DeltaOld;
   1162    unsigned VClk, Freq;
   1163    unsigned M, N, P;
   1164    
   1165    DeltaOld = 0xFFFFFFFF;
   1166
   1167    VClk     = (unsigned)clockIn;
   1168    
   1169    if (chip->CrystalFreqKHz == 13500)
   1170    {
   1171        lowM  = 7;
   1172        highM = 13 - (chip->Architecture == NV_ARCH_03);
   1173    }
   1174    else
   1175    {
   1176        lowM  = 8;
   1177        highM = 14 - (chip->Architecture == NV_ARCH_03);
   1178    }                      
   1179
   1180    highP = 4 - (chip->Architecture == NV_ARCH_03);
   1181    for (P = 0; P <= highP; P ++)
   1182    {
   1183        Freq = VClk << P;
   1184        if ((Freq >= 128000) && (Freq <= chip->MaxVClockFreqKHz))
   1185        {
   1186            for (M = lowM; M <= highM; M++)
   1187            {
   1188                N    = (VClk << P) * M / chip->CrystalFreqKHz;
   1189                if(N <= 255) {
   1190                Freq = (chip->CrystalFreqKHz * N / M) >> P;
   1191                if (Freq > VClk)
   1192                    DeltaNew = Freq - VClk;
   1193                else
   1194                    DeltaNew = VClk - Freq;
   1195                if (DeltaNew < DeltaOld)
   1196                {
   1197                    *mOut     = M;
   1198                    *nOut     = N;
   1199                    *pOut     = P;
   1200                    *clockOut = Freq;
   1201                    DeltaOld  = DeltaNew;
   1202                }
   1203            }
   1204        }
   1205    }
   1206    }
   1207
   1208    /* non-zero: M/N/P/clock values assigned.  zero: error (not set) */
   1209    return (DeltaOld != 0xFFFFFFFF);
   1210}
   1211/*
   1212 * Calculate extended mode parameters (SVGA) and save in a 
   1213 * mode state structure.
   1214 */
   1215int CalcStateExt
   1216(
   1217    RIVA_HW_INST  *chip,
   1218    RIVA_HW_STATE *state,
   1219    struct pci_dev *pdev,
   1220    int            bpp,
   1221    int            width,
   1222    int            hDisplaySize,
   1223    int            height,
   1224    int            dotClock
   1225)
   1226{
   1227    int pixelDepth;
   1228    int VClk, m, n, p;
   1229
   1230    /*
   1231     * Save mode parameters.
   1232     */
   1233    state->bpp    = bpp;    /* this is not bitsPerPixel, it's 8,15,16,32 */
   1234    state->width  = width;
   1235    state->height = height;
   1236    /*
   1237     * Extended RIVA registers.
   1238     */
   1239    pixelDepth = (bpp + 1)/8;
   1240    if (!CalcVClock(dotClock, &VClk, &m, &n, &p, chip))
   1241    	return -EINVAL;
   1242
   1243    switch (chip->Architecture)
   1244    {
   1245        case NV_ARCH_03:
   1246            nv3UpdateArbitrationSettings(VClk, 
   1247                                         pixelDepth * 8, 
   1248                                        &(state->arbitration0),
   1249                                        &(state->arbitration1),
   1250                                         chip);
   1251            state->cursor0  = 0x00;
   1252            state->cursor1  = 0x78;
   1253            state->cursor2  = 0x00000000;
   1254            state->pllsel   = 0x10010100;
   1255            state->config   = ((width + 31)/32)
   1256                            | (((pixelDepth > 2) ? 3 : pixelDepth) << 8)
   1257                            | 0x1000;
   1258            state->general  = 0x00100100;
   1259            state->repaint1 = hDisplaySize < 1280 ? 0x06 : 0x02;
   1260            break;
   1261        case NV_ARCH_04:
   1262            nv4UpdateArbitrationSettings(VClk, 
   1263                                         pixelDepth * 8, 
   1264                                        &(state->arbitration0),
   1265                                        &(state->arbitration1),
   1266                                         chip);
   1267            state->cursor0  = 0x00;
   1268            state->cursor1  = 0xFC;
   1269            state->cursor2  = 0x00000000;
   1270            state->pllsel   = 0x10000700;
   1271            state->config   = 0x00001114;
   1272            state->general  = bpp == 16 ? 0x00101100 : 0x00100100;
   1273            state->repaint1 = hDisplaySize < 1280 ? 0x04 : 0x00;
   1274            break;
   1275        case NV_ARCH_10:
   1276        case NV_ARCH_20:
   1277        case NV_ARCH_30:
   1278            if((chip->Chipset == NV_CHIP_IGEFORCE2) ||
   1279               (chip->Chipset == NV_CHIP_0x01F0))
   1280            {
   1281                nForceUpdateArbitrationSettings(VClk,
   1282                                          pixelDepth * 8,
   1283                                         &(state->arbitration0),
   1284                                         &(state->arbitration1),
   1285                                          chip, pdev);
   1286            } else {
   1287                nv10UpdateArbitrationSettings(VClk, 
   1288                                          pixelDepth * 8, 
   1289                                         &(state->arbitration0),
   1290                                         &(state->arbitration1),
   1291                                          chip);
   1292            }
   1293            state->cursor0  = 0x80 | (chip->CursorStart >> 17);
   1294            state->cursor1  = (chip->CursorStart >> 11) << 2;
   1295            state->cursor2  = chip->CursorStart >> 24;
   1296            state->pllsel   = 0x10000700;
   1297            state->config   = NV_RD32(&chip->PFB[0x00000200/4], 0);
   1298            state->general  = bpp == 16 ? 0x00101100 : 0x00100100;
   1299            state->repaint1 = hDisplaySize < 1280 ? 0x04 : 0x00;
   1300            break;
   1301    }
   1302
   1303     /* Paul Richards: below if block borks things in kernel for some reason */
   1304     /* Tony: Below is needed to set hardware in DirectColor */
   1305    if((bpp != 8) && (chip->Architecture != NV_ARCH_03))
   1306	    state->general |= 0x00000030;
   1307
   1308    state->vpll     = (p << 16) | (n << 8) | m;
   1309    state->repaint0 = (((width/8)*pixelDepth) & 0x700) >> 3;
   1310    state->pixel    = pixelDepth > 2   ? 3    : pixelDepth;
   1311    state->offset0  =
   1312    state->offset1  =
   1313    state->offset2  =
   1314    state->offset3  = 0;
   1315    state->pitch0   =
   1316    state->pitch1   =
   1317    state->pitch2   =
   1318    state->pitch3   = pixelDepth * width;
   1319
   1320    return 0;
   1321}
   1322/*
   1323 * Load fixed function state and pre-calculated/stored state.
   1324 */
   1325#define LOAD_FIXED_STATE(tbl,dev)                                       \
   1326    for (i = 0; i < sizeof(tbl##Table##dev)/8; i++)                 \
   1327        NV_WR32(&chip->dev[tbl##Table##dev[i][0]], 0, tbl##Table##dev[i][1])
   1328#define LOAD_FIXED_STATE_8BPP(tbl,dev)                                  \
   1329    for (i = 0; i < sizeof(tbl##Table##dev##_8BPP)/8; i++)            \
   1330        NV_WR32(&chip->dev[tbl##Table##dev##_8BPP[i][0]], 0, tbl##Table##dev##_8BPP[i][1])
   1331#define LOAD_FIXED_STATE_15BPP(tbl,dev)                                 \
   1332    for (i = 0; i < sizeof(tbl##Table##dev##_15BPP)/8; i++)           \
   1333        NV_WR32(&chip->dev[tbl##Table##dev##_15BPP[i][0]], 0, tbl##Table##dev##_15BPP[i][1])
   1334#define LOAD_FIXED_STATE_16BPP(tbl,dev)                                 \
   1335    for (i = 0; i < sizeof(tbl##Table##dev##_16BPP)/8; i++)           \
   1336        NV_WR32(&chip->dev[tbl##Table##dev##_16BPP[i][0]], 0, tbl##Table##dev##_16BPP[i][1])
   1337#define LOAD_FIXED_STATE_32BPP(tbl,dev)                                 \
   1338    for (i = 0; i < sizeof(tbl##Table##dev##_32BPP)/8; i++)           \
   1339        NV_WR32(&chip->dev[tbl##Table##dev##_32BPP[i][0]], 0, tbl##Table##dev##_32BPP[i][1])
   1340
   1341static void UpdateFifoState
   1342(
   1343    RIVA_HW_INST  *chip
   1344)
   1345{
   1346    int i;
   1347
   1348    switch (chip->Architecture)
   1349    {
   1350        case NV_ARCH_04:
   1351            LOAD_FIXED_STATE(nv4,FIFO);
   1352            chip->Tri03 = NULL;
   1353            chip->Tri05 = (RivaTexturedTriangle05 __iomem *)&(chip->FIFO[0x0000E000/4]);
   1354            break;
   1355        case NV_ARCH_10:
   1356        case NV_ARCH_20:
   1357        case NV_ARCH_30:
   1358            /*
   1359             * Initialize state for the RivaTriangle3D05 routines.
   1360             */
   1361            LOAD_FIXED_STATE(nv10tri05,PGRAPH);
   1362            LOAD_FIXED_STATE(nv10,FIFO);
   1363            chip->Tri03 = NULL;
   1364            chip->Tri05 = (RivaTexturedTriangle05 __iomem *)&(chip->FIFO[0x0000E000/4]);
   1365            break;
   1366    }
   1367}
   1368static void LoadStateExt
   1369(
   1370    RIVA_HW_INST  *chip,
   1371    RIVA_HW_STATE *state
   1372)
   1373{
   1374    int i;
   1375
   1376    /*
   1377     * Load HW fixed function state.
   1378     */
   1379    LOAD_FIXED_STATE(Riva,PMC);
   1380    LOAD_FIXED_STATE(Riva,PTIMER);
   1381    switch (chip->Architecture)
   1382    {
   1383        case NV_ARCH_03:
   1384            /*
   1385             * Make sure frame buffer config gets set before loading PRAMIN.
   1386             */
   1387            NV_WR32(chip->PFB, 0x00000200, state->config);
   1388            LOAD_FIXED_STATE(nv3,PFIFO);
   1389            LOAD_FIXED_STATE(nv3,PRAMIN);
   1390            LOAD_FIXED_STATE(nv3,PGRAPH);
   1391            switch (state->bpp)
   1392            {
   1393                case 15:
   1394                case 16:
   1395                    LOAD_FIXED_STATE_15BPP(nv3,PRAMIN);
   1396                    LOAD_FIXED_STATE_15BPP(nv3,PGRAPH);
   1397                    chip->Tri03 = (RivaTexturedTriangle03  __iomem *)&(chip->FIFO[0x0000E000/4]);
   1398                    break;
   1399                case 24:
   1400                case 32:
   1401                    LOAD_FIXED_STATE_32BPP(nv3,PRAMIN);
   1402                    LOAD_FIXED_STATE_32BPP(nv3,PGRAPH);
   1403                    chip->Tri03 = NULL;
   1404                    break;
   1405                case 8:
   1406                default:
   1407                    LOAD_FIXED_STATE_8BPP(nv3,PRAMIN);
   1408                    LOAD_FIXED_STATE_8BPP(nv3,PGRAPH);
   1409                    chip->Tri03 = NULL;
   1410                    break;
   1411            }
   1412            for (i = 0x00000; i < 0x00800; i++)
   1413                NV_WR32(&chip->PRAMIN[0x00000502 + i], 0, (i << 12) | 0x03);
   1414            NV_WR32(chip->PGRAPH, 0x00000630, state->offset0);
   1415            NV_WR32(chip->PGRAPH, 0x00000634, state->offset1);
   1416            NV_WR32(chip->PGRAPH, 0x00000638, state->offset2);
   1417            NV_WR32(chip->PGRAPH, 0x0000063C, state->offset3);
   1418            NV_WR32(chip->PGRAPH, 0x00000650, state->pitch0);
   1419            NV_WR32(chip->PGRAPH, 0x00000654, state->pitch1);
   1420            NV_WR32(chip->PGRAPH, 0x00000658, state->pitch2);
   1421            NV_WR32(chip->PGRAPH, 0x0000065C, state->pitch3);
   1422            break;
   1423        case NV_ARCH_04:
   1424            /*
   1425             * Make sure frame buffer config gets set before loading PRAMIN.
   1426             */
   1427            NV_WR32(chip->PFB, 0x00000200, state->config);
   1428            LOAD_FIXED_STATE(nv4,PFIFO);
   1429            LOAD_FIXED_STATE(nv4,PRAMIN);
   1430            LOAD_FIXED_STATE(nv4,PGRAPH);
   1431            switch (state->bpp)
   1432            {
   1433                case 15:
   1434                    LOAD_FIXED_STATE_15BPP(nv4,PRAMIN);
   1435                    LOAD_FIXED_STATE_15BPP(nv4,PGRAPH);
   1436                    chip->Tri03 = (RivaTexturedTriangle03  __iomem *)&(chip->FIFO[0x0000E000/4]);
   1437                    break;
   1438                case 16:
   1439                    LOAD_FIXED_STATE_16BPP(nv4,PRAMIN);
   1440                    LOAD_FIXED_STATE_16BPP(nv4,PGRAPH);
   1441                    chip->Tri03 = (RivaTexturedTriangle03  __iomem *)&(chip->FIFO[0x0000E000/4]);
   1442                    break;
   1443                case 24:
   1444                case 32:
   1445                    LOAD_FIXED_STATE_32BPP(nv4,PRAMIN);
   1446                    LOAD_FIXED_STATE_32BPP(nv4,PGRAPH);
   1447                    chip->Tri03 = NULL;
   1448                    break;
   1449                case 8:
   1450                default:
   1451                    LOAD_FIXED_STATE_8BPP(nv4,PRAMIN);
   1452                    LOAD_FIXED_STATE_8BPP(nv4,PGRAPH);
   1453                    chip->Tri03 = NULL;
   1454                    break;
   1455            }
   1456            NV_WR32(chip->PGRAPH, 0x00000640, state->offset0);
   1457            NV_WR32(chip->PGRAPH, 0x00000644, state->offset1);
   1458            NV_WR32(chip->PGRAPH, 0x00000648, state->offset2);
   1459            NV_WR32(chip->PGRAPH, 0x0000064C, state->offset3);
   1460            NV_WR32(chip->PGRAPH, 0x00000670, state->pitch0);
   1461            NV_WR32(chip->PGRAPH, 0x00000674, state->pitch1);
   1462            NV_WR32(chip->PGRAPH, 0x00000678, state->pitch2);
   1463            NV_WR32(chip->PGRAPH, 0x0000067C, state->pitch3);
   1464            break;
   1465        case NV_ARCH_10:
   1466        case NV_ARCH_20:
   1467        case NV_ARCH_30:
   1468            if(chip->twoHeads) {
   1469               VGA_WR08(chip->PCIO, 0x03D4, 0x44);
   1470               VGA_WR08(chip->PCIO, 0x03D5, state->crtcOwner);
   1471               chip->LockUnlock(chip, 0);
   1472            }
   1473
   1474            LOAD_FIXED_STATE(nv10,PFIFO);
   1475            LOAD_FIXED_STATE(nv10,PRAMIN);
   1476            LOAD_FIXED_STATE(nv10,PGRAPH);
   1477            switch (state->bpp)
   1478            {
   1479                case 15:
   1480                    LOAD_FIXED_STATE_15BPP(nv10,PRAMIN);
   1481                    LOAD_FIXED_STATE_15BPP(nv10,PGRAPH);
   1482                    chip->Tri03 = (RivaTexturedTriangle03  __iomem *)&(chip->FIFO[0x0000E000/4]);
   1483                    break;
   1484                case 16:
   1485                    LOAD_FIXED_STATE_16BPP(nv10,PRAMIN);
   1486                    LOAD_FIXED_STATE_16BPP(nv10,PGRAPH);
   1487                    chip->Tri03 = (RivaTexturedTriangle03  __iomem *)&(chip->FIFO[0x0000E000/4]);
   1488                    break;
   1489                case 24:
   1490                case 32:
   1491                    LOAD_FIXED_STATE_32BPP(nv10,PRAMIN);
   1492                    LOAD_FIXED_STATE_32BPP(nv10,PGRAPH);
   1493                    chip->Tri03 = NULL;
   1494                    break;
   1495                case 8:
   1496                default:
   1497                    LOAD_FIXED_STATE_8BPP(nv10,PRAMIN);
   1498                    LOAD_FIXED_STATE_8BPP(nv10,PGRAPH);
   1499                    chip->Tri03 = NULL;
   1500                    break;
   1501            }
   1502
   1503            if(chip->Architecture == NV_ARCH_10) {
   1504                NV_WR32(chip->PGRAPH, 0x00000640, state->offset0);
   1505                NV_WR32(chip->PGRAPH, 0x00000644, state->offset1);
   1506                NV_WR32(chip->PGRAPH, 0x00000648, state->offset2);
   1507                NV_WR32(chip->PGRAPH, 0x0000064C, state->offset3);
   1508                NV_WR32(chip->PGRAPH, 0x00000670, state->pitch0);
   1509                NV_WR32(chip->PGRAPH, 0x00000674, state->pitch1);
   1510                NV_WR32(chip->PGRAPH, 0x00000678, state->pitch2);
   1511                NV_WR32(chip->PGRAPH, 0x0000067C, state->pitch3);
   1512                NV_WR32(chip->PGRAPH, 0x00000680, state->pitch3);
   1513        } else {
   1514        NV_WR32(chip->PGRAPH, 0x00000820, state->offset0);
   1515        NV_WR32(chip->PGRAPH, 0x00000824, state->offset1);
   1516        NV_WR32(chip->PGRAPH, 0x00000828, state->offset2);
   1517        NV_WR32(chip->PGRAPH, 0x0000082C, state->offset3);
   1518        NV_WR32(chip->PGRAPH, 0x00000850, state->pitch0);
   1519        NV_WR32(chip->PGRAPH, 0x00000854, state->pitch1);
   1520        NV_WR32(chip->PGRAPH, 0x00000858, state->pitch2);
   1521        NV_WR32(chip->PGRAPH, 0x0000085C, state->pitch3);
   1522        NV_WR32(chip->PGRAPH, 0x00000860, state->pitch3);
   1523        NV_WR32(chip->PGRAPH, 0x00000864, state->pitch3);
   1524        NV_WR32(chip->PGRAPH, 0x000009A4, NV_RD32(chip->PFB, 0x00000200));
   1525        NV_WR32(chip->PGRAPH, 0x000009A8, NV_RD32(chip->PFB, 0x00000204));
   1526        }
   1527            if(chip->twoHeads) {
   1528               NV_WR32(chip->PCRTC0, 0x00000860, state->head);
   1529               NV_WR32(chip->PCRTC0, 0x00002860, state->head2);
   1530            }
   1531            NV_WR32(chip->PRAMDAC, 0x00000404, NV_RD32(chip->PRAMDAC, 0x00000404) | (1 << 25));
   1532
   1533            NV_WR32(chip->PMC, 0x00008704, 1);
   1534            NV_WR32(chip->PMC, 0x00008140, 0);
   1535            NV_WR32(chip->PMC, 0x00008920, 0);
   1536            NV_WR32(chip->PMC, 0x00008924, 0);
   1537            NV_WR32(chip->PMC, 0x00008908, 0x01ffffff);
   1538            NV_WR32(chip->PMC, 0x0000890C, 0x01ffffff);
   1539            NV_WR32(chip->PMC, 0x00001588, 0);
   1540
   1541            NV_WR32(chip->PFB, 0x00000240, 0);
   1542            NV_WR32(chip->PFB, 0x00000250, 0);
   1543            NV_WR32(chip->PFB, 0x00000260, 0);
   1544            NV_WR32(chip->PFB, 0x00000270, 0);
   1545            NV_WR32(chip->PFB, 0x00000280, 0);
   1546            NV_WR32(chip->PFB, 0x00000290, 0);
   1547            NV_WR32(chip->PFB, 0x000002A0, 0);
   1548            NV_WR32(chip->PFB, 0x000002B0, 0);
   1549
   1550            NV_WR32(chip->PGRAPH, 0x00000B00, NV_RD32(chip->PFB, 0x00000240));
   1551            NV_WR32(chip->PGRAPH, 0x00000B04, NV_RD32(chip->PFB, 0x00000244));
   1552            NV_WR32(chip->PGRAPH, 0x00000B08, NV_RD32(chip->PFB, 0x00000248));
   1553            NV_WR32(chip->PGRAPH, 0x00000B0C, NV_RD32(chip->PFB, 0x0000024C));
   1554            NV_WR32(chip->PGRAPH, 0x00000B10, NV_RD32(chip->PFB, 0x00000250));
   1555            NV_WR32(chip->PGRAPH, 0x00000B14, NV_RD32(chip->PFB, 0x00000254));
   1556            NV_WR32(chip->PGRAPH, 0x00000B18, NV_RD32(chip->PFB, 0x00000258));
   1557            NV_WR32(chip->PGRAPH, 0x00000B1C, NV_RD32(chip->PFB, 0x0000025C));
   1558            NV_WR32(chip->PGRAPH, 0x00000B20, NV_RD32(chip->PFB, 0x00000260));
   1559            NV_WR32(chip->PGRAPH, 0x00000B24, NV_RD32(chip->PFB, 0x00000264));
   1560            NV_WR32(chip->PGRAPH, 0x00000B28, NV_RD32(chip->PFB, 0x00000268));
   1561            NV_WR32(chip->PGRAPH, 0x00000B2C, NV_RD32(chip->PFB, 0x0000026C));
   1562            NV_WR32(chip->PGRAPH, 0x00000B30, NV_RD32(chip->PFB, 0x00000270));
   1563            NV_WR32(chip->PGRAPH, 0x00000B34, NV_RD32(chip->PFB, 0x00000274));
   1564            NV_WR32(chip->PGRAPH, 0x00000B38, NV_RD32(chip->PFB, 0x00000278));
   1565            NV_WR32(chip->PGRAPH, 0x00000B3C, NV_RD32(chip->PFB, 0x0000027C));
   1566            NV_WR32(chip->PGRAPH, 0x00000B40, NV_RD32(chip->PFB, 0x00000280));
   1567            NV_WR32(chip->PGRAPH, 0x00000B44, NV_RD32(chip->PFB, 0x00000284));
   1568            NV_WR32(chip->PGRAPH, 0x00000B48, NV_RD32(chip->PFB, 0x00000288));
   1569            NV_WR32(chip->PGRAPH, 0x00000B4C, NV_RD32(chip->PFB, 0x0000028C));
   1570            NV_WR32(chip->PGRAPH, 0x00000B50, NV_RD32(chip->PFB, 0x00000290));
   1571            NV_WR32(chip->PGRAPH, 0x00000B54, NV_RD32(chip->PFB, 0x00000294));
   1572            NV_WR32(chip->PGRAPH, 0x00000B58, NV_RD32(chip->PFB, 0x00000298));
   1573            NV_WR32(chip->PGRAPH, 0x00000B5C, NV_RD32(chip->PFB, 0x0000029C));
   1574            NV_WR32(chip->PGRAPH, 0x00000B60, NV_RD32(chip->PFB, 0x000002A0));
   1575            NV_WR32(chip->PGRAPH, 0x00000B64, NV_RD32(chip->PFB, 0x000002A4));
   1576            NV_WR32(chip->PGRAPH, 0x00000B68, NV_RD32(chip->PFB, 0x000002A8));
   1577            NV_WR32(chip->PGRAPH, 0x00000B6C, NV_RD32(chip->PFB, 0x000002AC));
   1578            NV_WR32(chip->PGRAPH, 0x00000B70, NV_RD32(chip->PFB, 0x000002B0));
   1579            NV_WR32(chip->PGRAPH, 0x00000B74, NV_RD32(chip->PFB, 0x000002B4));
   1580            NV_WR32(chip->PGRAPH, 0x00000B78, NV_RD32(chip->PFB, 0x000002B8));
   1581            NV_WR32(chip->PGRAPH, 0x00000B7C, NV_RD32(chip->PFB, 0x000002BC));
   1582            NV_WR32(chip->PGRAPH, 0x00000F40, 0x10000000);
   1583            NV_WR32(chip->PGRAPH, 0x00000F44, 0x00000000);
   1584            NV_WR32(chip->PGRAPH, 0x00000F50, 0x00000040);
   1585            NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000008);
   1586            NV_WR32(chip->PGRAPH, 0x00000F50, 0x00000200);
   1587            for (i = 0; i < (3*16); i++)
   1588                NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
   1589            NV_WR32(chip->PGRAPH, 0x00000F50, 0x00000040);
   1590            NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
   1591            NV_WR32(chip->PGRAPH, 0x00000F50, 0x00000800);
   1592            for (i = 0; i < (16*16); i++)
   1593                NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
   1594            NV_WR32(chip->PGRAPH, 0x00000F40, 0x30000000);
   1595            NV_WR32(chip->PGRAPH, 0x00000F44, 0x00000004);
   1596            NV_WR32(chip->PGRAPH, 0x00000F50, 0x00006400);
   1597            for (i = 0; i < (59*4); i++)
   1598                NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
   1599            NV_WR32(chip->PGRAPH, 0x00000F50, 0x00006800);
   1600            for (i = 0; i < (47*4); i++)
   1601                NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
   1602            NV_WR32(chip->PGRAPH, 0x00000F50, 0x00006C00);
   1603            for (i = 0; i < (3*4); i++)
   1604                NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
   1605            NV_WR32(chip->PGRAPH, 0x00000F50, 0x00007000);
   1606            for (i = 0; i < (19*4); i++)
   1607                NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
   1608            NV_WR32(chip->PGRAPH, 0x00000F50, 0x00007400);
   1609            for (i = 0; i < (12*4); i++)
   1610                NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
   1611            NV_WR32(chip->PGRAPH, 0x00000F50, 0x00007800);
   1612            for (i = 0; i < (12*4); i++)
   1613                NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
   1614            NV_WR32(chip->PGRAPH, 0x00000F50, 0x00004400);
   1615            for (i = 0; i < (8*4); i++)
   1616                NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
   1617            NV_WR32(chip->PGRAPH, 0x00000F50, 0x00000000);
   1618            for (i = 0; i < 16; i++)
   1619                NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
   1620            NV_WR32(chip->PGRAPH, 0x00000F50, 0x00000040);
   1621            for (i = 0; i < 4; i++)
   1622                NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
   1623
   1624            NV_WR32(chip->PCRTC, 0x00000810, state->cursorConfig);
   1625
   1626            if(chip->flatPanel) {
   1627               if((chip->Chipset & 0x0ff0) == 0x0110) {
   1628                   NV_WR32(chip->PRAMDAC, 0x0528, state->dither);
   1629               } else 
   1630               if((chip->Chipset & 0x0ff0) >= 0x0170) {
   1631                   NV_WR32(chip->PRAMDAC, 0x083C, state->dither);
   1632               }
   1633            
   1634               VGA_WR08(chip->PCIO, 0x03D4, 0x53);
   1635               VGA_WR08(chip->PCIO, 0x03D5, 0);
   1636               VGA_WR08(chip->PCIO, 0x03D4, 0x54);
   1637               VGA_WR08(chip->PCIO, 0x03D5, 0);
   1638               VGA_WR08(chip->PCIO, 0x03D4, 0x21);
   1639               VGA_WR08(chip->PCIO, 0x03D5, 0xfa);
   1640            }
   1641
   1642            VGA_WR08(chip->PCIO, 0x03D4, 0x41);
   1643            VGA_WR08(chip->PCIO, 0x03D5, state->extra);
   1644    }
   1645    LOAD_FIXED_STATE(Riva,FIFO);
   1646    UpdateFifoState(chip);
   1647    /*
   1648     * Load HW mode state.
   1649     */
   1650    VGA_WR08(chip->PCIO, 0x03D4, 0x19);
   1651    VGA_WR08(chip->PCIO, 0x03D5, state->repaint0);
   1652    VGA_WR08(chip->PCIO, 0x03D4, 0x1A);
   1653    VGA_WR08(chip->PCIO, 0x03D5, state->repaint1);
   1654    VGA_WR08(chip->PCIO, 0x03D4, 0x25);
   1655    VGA_WR08(chip->PCIO, 0x03D5, state->screen);
   1656    VGA_WR08(chip->PCIO, 0x03D4, 0x28);
   1657    VGA_WR08(chip->PCIO, 0x03D5, state->pixel);
   1658    VGA_WR08(chip->PCIO, 0x03D4, 0x2D);
   1659    VGA_WR08(chip->PCIO, 0x03D5, state->horiz);
   1660    VGA_WR08(chip->PCIO, 0x03D4, 0x1B);
   1661    VGA_WR08(chip->PCIO, 0x03D5, state->arbitration0);
   1662    VGA_WR08(chip->PCIO, 0x03D4, 0x20);
   1663    VGA_WR08(chip->PCIO, 0x03D5, state->arbitration1);
   1664    VGA_WR08(chip->PCIO, 0x03D4, 0x30);
   1665    VGA_WR08(chip->PCIO, 0x03D5, state->cursor0);
   1666    VGA_WR08(chip->PCIO, 0x03D4, 0x31);
   1667    VGA_WR08(chip->PCIO, 0x03D5, state->cursor1);
   1668    VGA_WR08(chip->PCIO, 0x03D4, 0x2F);
   1669    VGA_WR08(chip->PCIO, 0x03D5, state->cursor2);
   1670    VGA_WR08(chip->PCIO, 0x03D4, 0x39);
   1671    VGA_WR08(chip->PCIO, 0x03D5, state->interlace);
   1672
   1673    if(!chip->flatPanel) {
   1674       NV_WR32(chip->PRAMDAC0, 0x00000508, state->vpll);
   1675       NV_WR32(chip->PRAMDAC0, 0x0000050C, state->pllsel);
   1676       if(chip->twoHeads)
   1677          NV_WR32(chip->PRAMDAC0, 0x00000520, state->vpll2);
   1678    }  else {
   1679       NV_WR32(chip->PRAMDAC, 0x00000848 , state->scale);
   1680    }  
   1681    NV_WR32(chip->PRAMDAC, 0x00000600 , state->general);
   1682
   1683    /*
   1684     * Turn off VBlank enable and reset.
   1685     */
   1686    NV_WR32(chip->PCRTC, 0x00000140, 0);
   1687    NV_WR32(chip->PCRTC, 0x00000100, chip->VBlankBit);
   1688    /*
   1689     * Set interrupt enable.
   1690     */    
   1691    NV_WR32(chip->PMC, 0x00000140, chip->EnableIRQ & 0x01);
   1692    /*
   1693     * Set current state pointer.
   1694     */
   1695    chip->CurrentState = state;
   1696    /*
   1697     * Reset FIFO free and empty counts.
   1698     */
   1699    chip->FifoFreeCount  = 0;
   1700    /* Free count from first subchannel */
   1701    chip->FifoEmptyCount = NV_RD32(&chip->Rop->FifoFree, 0);
   1702}
   1703static void UnloadStateExt
   1704(
   1705    RIVA_HW_INST  *chip,
   1706    RIVA_HW_STATE *state
   1707)
   1708{
   1709    /*
   1710     * Save current HW state.
   1711     */
   1712    VGA_WR08(chip->PCIO, 0x03D4, 0x19);
   1713    state->repaint0     = VGA_RD08(chip->PCIO, 0x03D5);
   1714    VGA_WR08(chip->PCIO, 0x03D4, 0x1A);
   1715    state->repaint1     = VGA_RD08(chip->PCIO, 0x03D5);
   1716    VGA_WR08(chip->PCIO, 0x03D4, 0x25);
   1717    state->screen       = VGA_RD08(chip->PCIO, 0x03D5);
   1718    VGA_WR08(chip->PCIO, 0x03D4, 0x28);
   1719    state->pixel        = VGA_RD08(chip->PCIO, 0x03D5);
   1720    VGA_WR08(chip->PCIO, 0x03D4, 0x2D);
   1721    state->horiz        = VGA_RD08(chip->PCIO, 0x03D5);
   1722    VGA_WR08(chip->PCIO, 0x03D4, 0x1B);
   1723    state->arbitration0 = VGA_RD08(chip->PCIO, 0x03D5);
   1724    VGA_WR08(chip->PCIO, 0x03D4, 0x20);
   1725    state->arbitration1 = VGA_RD08(chip->PCIO, 0x03D5);
   1726    VGA_WR08(chip->PCIO, 0x03D4, 0x30);
   1727    state->cursor0      = VGA_RD08(chip->PCIO, 0x03D5);
   1728    VGA_WR08(chip->PCIO, 0x03D4, 0x31);
   1729    state->cursor1      = VGA_RD08(chip->PCIO, 0x03D5);
   1730    VGA_WR08(chip->PCIO, 0x03D4, 0x2F);
   1731    state->cursor2      = VGA_RD08(chip->PCIO, 0x03D5);
   1732    VGA_WR08(chip->PCIO, 0x03D4, 0x39);
   1733    state->interlace    = VGA_RD08(chip->PCIO, 0x03D5);
   1734    state->vpll         = NV_RD32(chip->PRAMDAC0, 0x00000508);
   1735    state->vpll2        = NV_RD32(chip->PRAMDAC0, 0x00000520);
   1736    state->pllsel       = NV_RD32(chip->PRAMDAC0, 0x0000050C);
   1737    state->general      = NV_RD32(chip->PRAMDAC, 0x00000600);
   1738    state->scale        = NV_RD32(chip->PRAMDAC, 0x00000848);
   1739    state->config       = NV_RD32(chip->PFB, 0x00000200);
   1740    switch (chip->Architecture)
   1741    {
   1742        case NV_ARCH_03:
   1743            state->offset0  = NV_RD32(chip->PGRAPH, 0x00000630);
   1744            state->offset1  = NV_RD32(chip->PGRAPH, 0x00000634);
   1745            state->offset2  = NV_RD32(chip->PGRAPH, 0x00000638);
   1746            state->offset3  = NV_RD32(chip->PGRAPH, 0x0000063C);
   1747            state->pitch0   = NV_RD32(chip->PGRAPH, 0x00000650);
   1748            state->pitch1   = NV_RD32(chip->PGRAPH, 0x00000654);
   1749            state->pitch2   = NV_RD32(chip->PGRAPH, 0x00000658);
   1750            state->pitch3   = NV_RD32(chip->PGRAPH, 0x0000065C);
   1751            break;
   1752        case NV_ARCH_04:
   1753            state->offset0  = NV_RD32(chip->PGRAPH, 0x00000640);
   1754            state->offset1  = NV_RD32(chip->PGRAPH, 0x00000644);
   1755            state->offset2  = NV_RD32(chip->PGRAPH, 0x00000648);
   1756            state->offset3  = NV_RD32(chip->PGRAPH, 0x0000064C);
   1757            state->pitch0   = NV_RD32(chip->PGRAPH, 0x00000670);
   1758            state->pitch1   = NV_RD32(chip->PGRAPH, 0x00000674);
   1759            state->pitch2   = NV_RD32(chip->PGRAPH, 0x00000678);
   1760            state->pitch3   = NV_RD32(chip->PGRAPH, 0x0000067C);
   1761            break;
   1762        case NV_ARCH_10:
   1763        case NV_ARCH_20:
   1764        case NV_ARCH_30:
   1765            state->offset0  = NV_RD32(chip->PGRAPH, 0x00000640);
   1766            state->offset1  = NV_RD32(chip->PGRAPH, 0x00000644);
   1767            state->offset2  = NV_RD32(chip->PGRAPH, 0x00000648);
   1768            state->offset3  = NV_RD32(chip->PGRAPH, 0x0000064C);
   1769            state->pitch0   = NV_RD32(chip->PGRAPH, 0x00000670);
   1770            state->pitch1   = NV_RD32(chip->PGRAPH, 0x00000674);
   1771            state->pitch2   = NV_RD32(chip->PGRAPH, 0x00000678);
   1772            state->pitch3   = NV_RD32(chip->PGRAPH, 0x0000067C);
   1773            if(chip->twoHeads) {
   1774               state->head     = NV_RD32(chip->PCRTC0, 0x00000860);
   1775               state->head2    = NV_RD32(chip->PCRTC0, 0x00002860);
   1776               VGA_WR08(chip->PCIO, 0x03D4, 0x44);
   1777               state->crtcOwner = VGA_RD08(chip->PCIO, 0x03D5);
   1778            }
   1779            VGA_WR08(chip->PCIO, 0x03D4, 0x41);
   1780            state->extra = VGA_RD08(chip->PCIO, 0x03D5);
   1781            state->cursorConfig = NV_RD32(chip->PCRTC, 0x00000810);
   1782
   1783            if((chip->Chipset & 0x0ff0) == 0x0110) {
   1784                state->dither = NV_RD32(chip->PRAMDAC, 0x0528);
   1785            } else 
   1786            if((chip->Chipset & 0x0ff0) >= 0x0170) {
   1787                state->dither = NV_RD32(chip->PRAMDAC, 0x083C);
   1788            }
   1789            break;
   1790    }
   1791}
   1792static void SetStartAddress
   1793(
   1794    RIVA_HW_INST *chip,
   1795    unsigned      start
   1796)
   1797{
   1798    NV_WR32(chip->PCRTC, 0x800, start);
   1799}
   1800
   1801static void SetStartAddress3
   1802(
   1803    RIVA_HW_INST *chip,
   1804    unsigned      start
   1805)
   1806{
   1807    int offset = start >> 2;
   1808    int pan    = (start & 3) << 1;
   1809    unsigned char tmp;
   1810
   1811    /*
   1812     * Unlock extended registers.
   1813     */
   1814    chip->LockUnlock(chip, 0);
   1815    /*
   1816     * Set start address.
   1817     */
   1818    VGA_WR08(chip->PCIO, 0x3D4, 0x0D); VGA_WR08(chip->PCIO, 0x3D5, offset);
   1819    offset >>= 8;
   1820    VGA_WR08(chip->PCIO, 0x3D4, 0x0C); VGA_WR08(chip->PCIO, 0x3D5, offset);
   1821    offset >>= 8;
   1822    VGA_WR08(chip->PCIO, 0x3D4, 0x19); tmp = VGA_RD08(chip->PCIO, 0x3D5);
   1823    VGA_WR08(chip->PCIO, 0x3D5, (offset & 0x01F) | (tmp & ~0x1F));
   1824    VGA_WR08(chip->PCIO, 0x3D4, 0x2D); tmp = VGA_RD08(chip->PCIO, 0x3D5);
   1825    VGA_WR08(chip->PCIO, 0x3D5, (offset & 0x60) | (tmp & ~0x60));
   1826    /*
   1827     * 4 pixel pan register.
   1828     */
   1829    offset = VGA_RD08(chip->PCIO, chip->IO + 0x0A);
   1830    VGA_WR08(chip->PCIO, 0x3C0, 0x13);
   1831    VGA_WR08(chip->PCIO, 0x3C0, pan);
   1832}
   1833static void nv3SetSurfaces2D
   1834(
   1835    RIVA_HW_INST *chip,
   1836    unsigned     surf0,
   1837    unsigned     surf1
   1838)
   1839{
   1840    RivaSurface __iomem *Surface =
   1841	(RivaSurface __iomem *)&(chip->FIFO[0x0000E000/4]);
   1842
   1843    RIVA_FIFO_FREE(*chip,Tri03,5);
   1844    NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000003);
   1845    NV_WR32(&Surface->Offset, 0, surf0);
   1846    NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000004);
   1847    NV_WR32(&Surface->Offset, 0, surf1);
   1848    NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000013);
   1849}
   1850static void nv4SetSurfaces2D
   1851(
   1852    RIVA_HW_INST *chip,
   1853    unsigned     surf0,
   1854    unsigned     surf1
   1855)
   1856{
   1857    RivaSurface __iomem *Surface =
   1858	(RivaSurface __iomem *)&(chip->FIFO[0x0000E000/4]);
   1859
   1860    NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000003);
   1861    NV_WR32(&Surface->Offset, 0, surf0);
   1862    NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000004);
   1863    NV_WR32(&Surface->Offset, 0, surf1);
   1864    NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000014);
   1865}
   1866static void nv10SetSurfaces2D
   1867(
   1868    RIVA_HW_INST *chip,
   1869    unsigned     surf0,
   1870    unsigned     surf1
   1871)
   1872{
   1873    RivaSurface __iomem *Surface =
   1874	(RivaSurface __iomem *)&(chip->FIFO[0x0000E000/4]);
   1875
   1876    NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000003);
   1877    NV_WR32(&Surface->Offset, 0, surf0);
   1878    NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000004);
   1879    NV_WR32(&Surface->Offset, 0, surf1);
   1880    NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000014);
   1881}
   1882static void nv3SetSurfaces3D
   1883(
   1884    RIVA_HW_INST *chip,
   1885    unsigned     surf0,
   1886    unsigned     surf1
   1887)
   1888{
   1889    RivaSurface __iomem *Surface =
   1890	(RivaSurface __iomem *)&(chip->FIFO[0x0000E000/4]);
   1891
   1892    RIVA_FIFO_FREE(*chip,Tri03,5);
   1893    NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000005);
   1894    NV_WR32(&Surface->Offset, 0, surf0);
   1895    NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000006);
   1896    NV_WR32(&Surface->Offset, 0, surf1);
   1897    NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000013);
   1898}
   1899static void nv4SetSurfaces3D
   1900(
   1901    RIVA_HW_INST *chip,
   1902    unsigned     surf0,
   1903    unsigned     surf1
   1904)
   1905{
   1906    RivaSurface __iomem *Surface =
   1907	(RivaSurface __iomem *)&(chip->FIFO[0x0000E000/4]);
   1908
   1909    NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000005);
   1910    NV_WR32(&Surface->Offset, 0, surf0);
   1911    NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000006);
   1912    NV_WR32(&Surface->Offset, 0, surf1);
   1913    NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000014);
   1914}
   1915static void nv10SetSurfaces3D
   1916(
   1917    RIVA_HW_INST *chip,
   1918    unsigned     surf0,
   1919    unsigned     surf1
   1920)
   1921{
   1922    RivaSurface3D __iomem *Surfaces3D =
   1923	(RivaSurface3D __iomem *)&(chip->FIFO[0x0000E000/4]);
   1924
   1925    RIVA_FIFO_FREE(*chip,Tri03,4);
   1926    NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000007);
   1927    NV_WR32(&Surfaces3D->RenderBufferOffset, 0, surf0);
   1928    NV_WR32(&Surfaces3D->ZBufferOffset, 0, surf1);
   1929    NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000014);
   1930}
   1931
   1932/****************************************************************************\
   1933*                                                                            *
   1934*                      Probe RIVA Chip Configuration                         *
   1935*                                                                            *
   1936\****************************************************************************/
   1937
   1938static void nv3GetConfig
   1939(
   1940    RIVA_HW_INST *chip
   1941)
   1942{
   1943    /*
   1944     * Fill in chip configuration.
   1945     */
   1946    if (NV_RD32(&chip->PFB[0x00000000/4], 0) & 0x00000020)
   1947    {
   1948        if (((NV_RD32(chip->PMC, 0x00000000) & 0xF0) == 0x20)
   1949         && ((NV_RD32(chip->PMC, 0x00000000) & 0x0F) >= 0x02))
   1950        {        
   1951            /*
   1952             * SDRAM 128 ZX.
   1953             */
   1954            chip->RamBandwidthKBytesPerSec = 800000;
   1955            switch (NV_RD32(chip->PFB, 0x00000000) & 0x03)
   1956            {
   1957                case 2:
   1958                    chip->RamAmountKBytes = 1024 * 4;
   1959                    break;
   1960                case 1:
   1961                    chip->RamAmountKBytes = 1024 * 2;
   1962                    break;
   1963                default:
   1964                    chip->RamAmountKBytes = 1024 * 8;
   1965                    break;
   1966            }
   1967        }            
   1968        else            
   1969        {
   1970            chip->RamBandwidthKBytesPerSec = 1000000;
   1971            chip->RamAmountKBytes          = 1024 * 8;
   1972        }            
   1973    }
   1974    else
   1975    {
   1976        /*
   1977         * SGRAM 128.
   1978         */
   1979        chip->RamBandwidthKBytesPerSec = 1000000;
   1980        switch (NV_RD32(chip->PFB, 0x00000000) & 0x00000003)
   1981        {
   1982            case 0:
   1983                chip->RamAmountKBytes = 1024 * 8;
   1984                break;
   1985            case 2:
   1986                chip->RamAmountKBytes = 1024 * 4;
   1987                break;
   1988            default:
   1989                chip->RamAmountKBytes = 1024 * 2;
   1990                break;
   1991        }
   1992    }        
   1993    chip->CrystalFreqKHz   = (NV_RD32(chip->PEXTDEV, 0x00000000) & 0x00000040) ? 14318 : 13500;
   1994    chip->CURSOR           = &(chip->PRAMIN[0x00008000/4 - 0x0800/4]);
   1995    chip->VBlankBit        = 0x00000100;
   1996    chip->MaxVClockFreqKHz = 256000;
   1997    /*
   1998     * Set chip functions.
   1999     */
   2000    chip->Busy            = nv3Busy;
   2001    chip->ShowHideCursor  = ShowHideCursor;
   2002    chip->LoadStateExt    = LoadStateExt;
   2003    chip->UnloadStateExt  = UnloadStateExt;
   2004    chip->SetStartAddress = SetStartAddress3;
   2005    chip->SetSurfaces2D   = nv3SetSurfaces2D;
   2006    chip->SetSurfaces3D   = nv3SetSurfaces3D;
   2007    chip->LockUnlock      = nv3LockUnlock;
   2008}
   2009static void nv4GetConfig
   2010(
   2011    RIVA_HW_INST *chip
   2012)
   2013{
   2014    /*
   2015     * Fill in chip configuration.
   2016     */
   2017    if (NV_RD32(chip->PFB, 0x00000000) & 0x00000100)
   2018    {
   2019        chip->RamAmountKBytes = ((NV_RD32(chip->PFB, 0x00000000) >> 12) & 0x0F) * 1024 * 2
   2020                              + 1024 * 2;
   2021    }
   2022    else
   2023    {
   2024        switch (NV_RD32(chip->PFB, 0x00000000) & 0x00000003)
   2025        {
   2026            case 0:
   2027                chip->RamAmountKBytes = 1024 * 32;
   2028                break;
   2029            case 1:
   2030                chip->RamAmountKBytes = 1024 * 4;
   2031                break;
   2032            case 2:
   2033                chip->RamAmountKBytes = 1024 * 8;
   2034                break;
   2035            case 3:
   2036            default:
   2037                chip->RamAmountKBytes = 1024 * 16;
   2038                break;
   2039        }
   2040    }
   2041    switch ((NV_RD32(chip->PFB, 0x00000000) >> 3) & 0x00000003)
   2042    {
   2043        case 3:
   2044            chip->RamBandwidthKBytesPerSec = 800000;
   2045            break;
   2046        default:
   2047            chip->RamBandwidthKBytesPerSec = 1000000;
   2048            break;
   2049    }
   2050    chip->CrystalFreqKHz   = (NV_RD32(chip->PEXTDEV, 0x00000000) & 0x00000040) ? 14318 : 13500;
   2051    chip->CURSOR           = &(chip->PRAMIN[0x00010000/4 - 0x0800/4]);
   2052    chip->VBlankBit        = 0x00000001;
   2053    chip->MaxVClockFreqKHz = 350000;
   2054    /*
   2055     * Set chip functions.
   2056     */
   2057    chip->Busy            = nv4Busy;
   2058    chip->ShowHideCursor  = ShowHideCursor;
   2059    chip->LoadStateExt    = LoadStateExt;
   2060    chip->UnloadStateExt  = UnloadStateExt;
   2061    chip->SetStartAddress = SetStartAddress;
   2062    chip->SetSurfaces2D   = nv4SetSurfaces2D;
   2063    chip->SetSurfaces3D   = nv4SetSurfaces3D;
   2064    chip->LockUnlock      = nv4LockUnlock;
   2065}
   2066static void nv10GetConfig
   2067(
   2068    RIVA_HW_INST *chip,
   2069    struct pci_dev *pdev,
   2070    unsigned int chipset
   2071)
   2072{
   2073    struct pci_dev* dev;
   2074    int domain = pci_domain_nr(pdev->bus);
   2075    u32 amt;
   2076
   2077#ifdef __BIG_ENDIAN
   2078    /* turn on big endian register access */
   2079    if(!(NV_RD32(chip->PMC, 0x00000004) & 0x01000001))
   2080    	NV_WR32(chip->PMC, 0x00000004, 0x01000001);
   2081#endif
   2082
   2083    /*
   2084     * Fill in chip configuration.
   2085     */
   2086    if(chipset == NV_CHIP_IGEFORCE2) {
   2087        dev = pci_get_domain_bus_and_slot(domain, 0, 1);
   2088        pci_read_config_dword(dev, 0x7C, &amt);
   2089        pci_dev_put(dev);
   2090        chip->RamAmountKBytes = (((amt >> 6) & 31) + 1) * 1024;
   2091    } else if(chipset == NV_CHIP_0x01F0) {
   2092        dev = pci_get_domain_bus_and_slot(domain, 0, 1);
   2093        pci_read_config_dword(dev, 0x84, &amt);
   2094        pci_dev_put(dev);
   2095        chip->RamAmountKBytes = (((amt >> 4) & 127) + 1) * 1024;
   2096    } else {
   2097        switch ((NV_RD32(chip->PFB, 0x0000020C) >> 20) & 0x000000FF)
   2098        {
   2099            case 0x02:
   2100                chip->RamAmountKBytes = 1024 * 2;
   2101                break;
   2102            case 0x04:
   2103                chip->RamAmountKBytes = 1024 * 4;
   2104                break;
   2105            case 0x08:
   2106                chip->RamAmountKBytes = 1024 * 8;
   2107                break;
   2108            case 0x10:
   2109                chip->RamAmountKBytes = 1024 * 16;
   2110                break;
   2111            case 0x20:
   2112                chip->RamAmountKBytes = 1024 * 32;
   2113                break;
   2114            case 0x40:
   2115                chip->RamAmountKBytes = 1024 * 64;
   2116                break;
   2117            case 0x80:
   2118                chip->RamAmountKBytes = 1024 * 128;
   2119                break;
   2120            default:
   2121                chip->RamAmountKBytes = 1024 * 16;
   2122                break;
   2123        }
   2124    }
   2125    switch ((NV_RD32(chip->PFB, 0x00000000) >> 3) & 0x00000003)
   2126    {
   2127        case 3:
   2128            chip->RamBandwidthKBytesPerSec = 800000;
   2129            break;
   2130        default:
   2131            chip->RamBandwidthKBytesPerSec = 1000000;
   2132            break;
   2133    }
   2134    chip->CrystalFreqKHz = (NV_RD32(chip->PEXTDEV, 0x0000) & (1 << 6)) ?
   2135	14318 : 13500;
   2136
   2137    switch (chipset & 0x0ff0) {
   2138    case 0x0170:
   2139    case 0x0180:
   2140    case 0x01F0:
   2141    case 0x0250:
   2142    case 0x0280:
   2143    case 0x0300:
   2144    case 0x0310:
   2145    case 0x0320:
   2146    case 0x0330:
   2147    case 0x0340:
   2148       if(NV_RD32(chip->PEXTDEV, 0x0000) & (1 << 22))
   2149           chip->CrystalFreqKHz = 27000;
   2150       break;
   2151    default:
   2152       break;
   2153    }
   2154
   2155    chip->CursorStart      = (chip->RamAmountKBytes - 128) * 1024;
   2156    chip->CURSOR           = NULL;  /* can't set this here */
   2157    chip->VBlankBit        = 0x00000001;
   2158    chip->MaxVClockFreqKHz = 350000;
   2159    /*
   2160     * Set chip functions.
   2161     */
   2162    chip->Busy            = nv10Busy;
   2163    chip->ShowHideCursor  = ShowHideCursor;
   2164    chip->LoadStateExt    = LoadStateExt;
   2165    chip->UnloadStateExt  = UnloadStateExt;
   2166    chip->SetStartAddress = SetStartAddress;
   2167    chip->SetSurfaces2D   = nv10SetSurfaces2D;
   2168    chip->SetSurfaces3D   = nv10SetSurfaces3D;
   2169    chip->LockUnlock      = nv4LockUnlock;
   2170
   2171    switch(chipset & 0x0ff0) {
   2172    case 0x0110:
   2173    case 0x0170:
   2174    case 0x0180:
   2175    case 0x01F0:
   2176    case 0x0250:
   2177    case 0x0280:
   2178    case 0x0300:
   2179    case 0x0310:
   2180    case 0x0320:
   2181    case 0x0330:
   2182    case 0x0340:
   2183        chip->twoHeads = TRUE;
   2184        break;
   2185    default:
   2186        chip->twoHeads = FALSE;
   2187        break;
   2188    }
   2189}
   2190int RivaGetConfig
   2191(
   2192    RIVA_HW_INST *chip,
   2193    struct pci_dev *pdev,
   2194    unsigned int chipset
   2195)
   2196{
   2197    /*
   2198     * Save this so future SW know whats it's dealing with.
   2199     */
   2200    chip->Version = RIVA_SW_VERSION;
   2201    /*
   2202     * Chip specific configuration.
   2203     */
   2204    switch (chip->Architecture)
   2205    {
   2206        case NV_ARCH_03:
   2207            nv3GetConfig(chip);
   2208            break;
   2209        case NV_ARCH_04:
   2210            nv4GetConfig(chip);
   2211            break;
   2212        case NV_ARCH_10:
   2213        case NV_ARCH_20:
   2214        case NV_ARCH_30:
   2215            nv10GetConfig(chip, pdev, chipset);
   2216            break;
   2217        default:
   2218            return (-1);
   2219    }
   2220    chip->Chipset = chipset;
   2221    /*
   2222     * Fill in FIFO pointers.
   2223     */
   2224    chip->Rop    = (RivaRop __iomem         *)&(chip->FIFO[0x00000000/4]);
   2225    chip->Clip   = (RivaClip __iomem        *)&(chip->FIFO[0x00002000/4]);
   2226    chip->Patt   = (RivaPattern __iomem     *)&(chip->FIFO[0x00004000/4]);
   2227    chip->Pixmap = (RivaPixmap __iomem      *)&(chip->FIFO[0x00006000/4]);
   2228    chip->Blt    = (RivaScreenBlt __iomem   *)&(chip->FIFO[0x00008000/4]);
   2229    chip->Bitmap = (RivaBitmap __iomem      *)&(chip->FIFO[0x0000A000/4]);
   2230    chip->Line   = (RivaLine __iomem        *)&(chip->FIFO[0x0000C000/4]);
   2231    chip->Tri03  = (RivaTexturedTriangle03 __iomem *)&(chip->FIFO[0x0000E000/4]);
   2232    return (0);
   2233}
   2234