vserver 2.0 rc7
[linux-2.6.git] / drivers / char / agp / amd-k7-agp.c
index b1b5324..3a41672 100644 (file)
 #define AMD_TLBFLUSH   0x0c    /* In mmio region (32-bit register) */
 #define AMD_CACHEENTRY 0x10    /* In mmio region (32-bit register) */
 
+static struct pci_device_id agp_amdk7_pci_table[];
+
 struct amd_page_map {
        unsigned long *real;
-       unsigned long *remapped;
+       unsigned long __iomem *remapped;
 };
 
 static struct _amd_irongate_private {
-       volatile u8 *registers;
+       volatile u8 __iomem *registers;
        struct amd_page_map **gatt_pages;
        int num_tables;
 } amd_irongate_private;
@@ -41,7 +43,7 @@ static int amd_create_page_map(struct amd_page_map *page_map)
 
        SetPageReserved(virt_to_page(page_map->real));
        global_cache_flush();
-       page_map->remapped = ioremap_nocache(virt_to_phys(page_map->real), 
+       page_map->remapped = ioremap_nocache(virt_to_gart(page_map->real),
                                            PAGE_SIZE);
        if (page_map->remapped == NULL) {
                ClearPageReserved(virt_to_page(page_map->real));
@@ -51,8 +53,10 @@ static int amd_create_page_map(struct amd_page_map *page_map)
        }
        global_cache_flush();
 
-       for (i = 0; i < PAGE_SIZE / sizeof(unsigned long); i++)
-               page_map->remapped[i] = agp_bridge->scratch_page;
+       for (i = 0; i < PAGE_SIZE / sizeof(unsigned long); i++) {
+               writel(agp_bridge->scratch_page, page_map->remapped+i);
+               readl(page_map->remapped+i);    /* PCI Posting. */
+       }
 
        return 0;
 }
@@ -90,7 +94,7 @@ static int amd_create_gatt_pages(int nr_tables)
        int retval = 0;
        int i;
 
-       tables = kmalloc((nr_tables + 1) * sizeof(struct amd_page_map *), 
+       tables = kmalloc((nr_tables + 1) * sizeof(struct amd_page_map *),
                         GFP_KERNEL);
        if (tables == NULL)
                return -ENOMEM;
@@ -124,11 +128,11 @@ static int amd_create_gatt_pages(int nr_tables)
 #define GET_PAGE_DIR_OFF(addr) (addr >> 22)
 #define GET_PAGE_DIR_IDX(addr) (GET_PAGE_DIR_OFF(addr) - \
        GET_PAGE_DIR_OFF(agp_bridge->gart_bus_addr))
-#define GET_GATT_OFF(addr) ((addr & 0x003ff000) >> 12) 
+#define GET_GATT_OFF(addr) ((addr & 0x003ff000) >> 12)
 #define GET_GATT(addr) (amd_irongate_private.gatt_pages[\
        GET_PAGE_DIR_IDX(addr)]->remapped)
 
-static int amd_create_gatt_table(void)
+static int amd_create_gatt_table(struct agp_bridge_data *bridge)
 {
        struct aper_size_info_lvl2 *value;
        struct amd_page_map page_dir;
@@ -149,8 +153,8 @@ static int amd_create_gatt_table(void)
        }
 
        agp_bridge->gatt_table_real = (u32 *)page_dir.real;
-       agp_bridge->gatt_table = (u32 *)page_dir.remapped;
-       agp_bridge->gatt_bus_addr = virt_to_phys(page_dir.real);
+       agp_bridge->gatt_table = (u32 __iomem *)page_dir.remapped;
+       agp_bridge->gatt_bus_addr = virt_to_gart(page_dir.real);
 
        /* Get the address for the gart region.
         * This is a bus address even on the alpha, b/c its
@@ -163,20 +167,20 @@ static int amd_create_gatt_table(void)
 
        /* Calculate the agp offset */
        for (i = 0; i < value->num_entries / 1024; i++, addr += 0x00400000) {
-               page_dir.remapped[GET_PAGE_DIR_OFF(addr)] =
-                       virt_to_phys(amd_irongate_private.gatt_pages[i]->real);
-               page_dir.remapped[GET_PAGE_DIR_OFF(addr)] |= 0x00000001;
+               writel(virt_to_gart(amd_irongate_private.gatt_pages[i]->real) | 1,
+                       page_dir.remapped+GET_PAGE_DIR_OFF(addr));
+               readl(page_dir.remapped+GET_PAGE_DIR_OFF(addr));        /* PCI Posting. */
        }
 
        return 0;
 }
 
-static int amd_free_gatt_table(void)
+static int amd_free_gatt_table(struct agp_bridge_data *bridge)
 {
        struct amd_page_map page_dir;
-   
+
        page_dir.real = (unsigned long *)agp_bridge->gatt_table_real;
-       page_dir.remapped = (unsigned long *)agp_bridge->gatt_table;
+       page_dir.remapped = (unsigned long __iomem *)agp_bridge->gatt_table;
 
        amd_free_gatt_pages();
        amd_free_page_map(&page_dir);
@@ -216,32 +220,32 @@ static int amd_irongate_configure(void)
        /* Get the memory mapped registers */
        pci_read_config_dword(agp_bridge->dev, AMD_MMBASE, &temp);
        temp = (temp & PCI_BASE_ADDRESS_MEM_MASK);
-       amd_irongate_private.registers = (volatile u8 *) ioremap(temp, 4096);
+       amd_irongate_private.registers = (volatile u8 __iomem *) ioremap(temp, 4096);
 
        /* Write out the address of the gatt table */
-       OUTREG32(amd_irongate_private.registers, AMD_ATTBASE,
-                agp_bridge->gatt_bus_addr);
+       writel(agp_bridge->gatt_bus_addr, amd_irongate_private.registers+AMD_ATTBASE);
+       readl(amd_irongate_private.registers+AMD_ATTBASE);      /* PCI Posting. */
 
        /* Write the Sync register */
        pci_write_config_byte(agp_bridge->dev, AMD_MODECNTL, 0x80);
-   
-       /* Set indexing mode */
-       pci_write_config_byte(agp_bridge->dev, AMD_MODECNTL2, 0x00);
+
+       /* Set indexing mode */
+       pci_write_config_byte(agp_bridge->dev, AMD_MODECNTL2, 0x00);
 
        /* Write the enable register */
-       enable_reg = INREG16(amd_irongate_private.registers, AMD_GARTENABLE);
+       enable_reg = readw(amd_irongate_private.registers+AMD_GARTENABLE);
        enable_reg = (enable_reg | 0x0004);
-       OUTREG16(amd_irongate_private.registers, AMD_GARTENABLE, enable_reg);
+       writew(enable_reg, amd_irongate_private.registers+AMD_GARTENABLE);
+       readw(amd_irongate_private.registers+AMD_GARTENABLE);   /* PCI Posting. */
 
        /* Write out the size register */
        pci_read_config_dword(agp_bridge->dev, AMD_APSIZE, &temp);
-       temp = (((temp & ~(0x0000000e)) | current_size->size_value)
-               | 0x00000001);
+       temp = (((temp & ~(0x0000000e)) | current_size->size_value) | 1);
        pci_write_config_dword(agp_bridge->dev, AMD_APSIZE, temp);
 
        /* Flush the tlb */
-       OUTREG32(amd_irongate_private.registers, AMD_TLBFLUSH, 0x00000001);
-
+       writel(1, amd_irongate_private.registers+AMD_TLBFLUSH);
+       readl(amd_irongate_private.registers+AMD_TLBFLUSH);     /* PCI Posting.*/
        return 0;
 }
 
@@ -253,15 +257,16 @@ static void amd_irongate_cleanup(void)
 
        previous_size = A_SIZE_LVL2(agp_bridge->previous_size);
 
-       enable_reg = INREG16(amd_irongate_private.registers, AMD_GARTENABLE);
+       enable_reg = readw(amd_irongate_private.registers+AMD_GARTENABLE);
        enable_reg = (enable_reg & ~(0x0004));
-       OUTREG16(amd_irongate_private.registers, AMD_GARTENABLE, enable_reg);
+       writew(enable_reg, amd_irongate_private.registers+AMD_GARTENABLE);
+       readw(amd_irongate_private.registers+AMD_GARTENABLE);   /* PCI Posting. */
 
        /* Write back the previous size and disable gart translation */
        pci_read_config_dword(agp_bridge->dev, AMD_APSIZE, &temp);
        temp = ((temp & ~(0x0000000f)) | previous_size->size_value);
        pci_write_config_dword(agp_bridge->dev, AMD_APSIZE, temp);
-       iounmap((void *) amd_irongate_private.registers);
+       iounmap((void __iomem *) amd_irongate_private.registers);
 }
 
 /*
@@ -274,13 +279,14 @@ static void amd_irongate_cleanup(void)
 
 static void amd_irongate_tlbflush(struct agp_memory *temp)
 {
-       OUTREG32(amd_irongate_private.registers, AMD_TLBFLUSH, 0x00000001);
+       writel(1, amd_irongate_private.registers+AMD_TLBFLUSH);
+       readl(amd_irongate_private.registers+AMD_TLBFLUSH);     /* PCI Posting. */
 }
 
 static int amd_insert_memory(struct agp_memory *mem, off_t pg_start, int type)
 {
        int i, j, num_entries;
-       unsigned long *cur_gatt;
+       unsigned long __iomem *cur_gatt;
        unsigned long addr;
 
        num_entries = A_SIZE_LVL2(agp_bridge->current_size)->num_entries;
@@ -295,7 +301,7 @@ static int amd_insert_memory(struct agp_memory *mem, off_t pg_start, int type)
        while (j < (pg_start + mem->page_count)) {
                addr = (j * PAGE_SIZE) + agp_bridge->gart_bus_addr;
                cur_gatt = GET_GATT(addr);
-               if (!PGE_EMPTY(agp_bridge, cur_gatt[GET_GATT_OFF(addr)]))
+               if (!PGE_EMPTY(agp_bridge, readl(cur_gatt+GET_GATT_OFF(addr))))
                        return -EBUSY;
                j++;
        }
@@ -308,8 +314,9 @@ static int amd_insert_memory(struct agp_memory *mem, off_t pg_start, int type)
        for (i = 0, j = pg_start; i < mem->page_count; i++, j++) {
                addr = (j * PAGE_SIZE) + agp_bridge->gart_bus_addr;
                cur_gatt = GET_GATT(addr);
-               cur_gatt[GET_GATT_OFF(addr)] =
-                       agp_generic_mask_memory(mem->memory[i], mem->type);
+               writel(agp_generic_mask_memory(agp_bridge,
+                       mem->memory[i], mem->type), cur_gatt+GET_GATT_OFF(addr));
+               readl(cur_gatt+GET_GATT_OFF(addr));     /* PCI Posting. */
        }
        amd_irongate_tlbflush(mem);
        return 0;
@@ -318,7 +325,7 @@ static int amd_insert_memory(struct agp_memory *mem, off_t pg_start, int type)
 static int amd_remove_memory(struct agp_memory *mem, off_t pg_start, int type)
 {
        int i;
-       unsigned long *cur_gatt;
+       unsigned long __iomem *cur_gatt;
        unsigned long addr;
 
        if (type != 0 || mem->type != 0)
@@ -327,8 +334,8 @@ static int amd_remove_memory(struct agp_memory *mem, off_t pg_start, int type)
        for (i = pg_start; i < (mem->page_count + pg_start); i++) {
                addr = (i * PAGE_SIZE) + agp_bridge->gart_bus_addr;
                cur_gatt = GET_GATT(addr);
-               cur_gatt[GET_GATT_OFF(addr)] = 
-                       (unsigned long) agp_bridge->scratch_page;
+               writel(agp_bridge->scratch_page, cur_gatt+GET_GATT_OFF(addr));
+               readl(cur_gatt+GET_GATT_OFF(addr));     /* PCI Posting. */
        }
 
        amd_irongate_tlbflush(mem);
@@ -351,7 +358,7 @@ static struct gatt_mask amd_irongate_masks[] =
        {.mask = 1, .type = 0}
 };
 
-struct agp_bridge_driver amd_irongate_driver = {
+static struct agp_bridge_driver amd_irongate_driver = {
        .owner                  = THIS_MODULE,
        .aperture_sizes         = amd_irongate_sizes,
        .size_type              = LVL2_APER_SIZE,
@@ -394,7 +401,6 @@ static struct agp_device_ids amd_agp_device_ids[] __devinitdata =
 static int __devinit agp_amdk7_probe(struct pci_dev *pdev,
                                     const struct pci_device_id *ent)
 {
-       struct agp_device_ids *devs = amd_agp_device_ids;
        struct agp_bridge_data *bridge;
        u8 cap_ptr;
        int j;
@@ -403,19 +409,10 @@ static int __devinit agp_amdk7_probe(struct pci_dev *pdev,
        if (!cap_ptr)
                return -ENODEV;
 
-       for (j = 0; devs[j].chipset_name; j++) {
-               if (pdev->device == devs[j].device_id) {
-                       printk (KERN_INFO PFX "Detected AMD %s chipset\n",
-                                       devs[j].chipset_name);
-                       goto found;
-               }
-       }
-
-       printk(KERN_ERR PFX "Unsupported AMD chipset (device id: %04x)\n",
-                   pdev->device);
-       return -ENODEV;
+       j = ent - agp_amdk7_pci_table;
+       printk(KERN_INFO PFX "Detected AMD %s chipset\n",
+              amd_agp_device_ids[j].chipset_name);
 
-found:
        bridge = agp_alloc_bridge();
        if (!bridge)
                return -ENOMEM;
@@ -425,6 +422,53 @@ found:
        bridge->dev = pdev;
        bridge->capndx = cap_ptr;
 
+       /* 751 Errata (22564_B-1.PDF)
+          erratum 20: strobe glitch with Nvidia NV10 GeForce cards.
+          system controller may experience noise due to strong drive strengths
+        */
+       if (agp_bridge->dev->device == PCI_DEVICE_ID_AMD_FE_GATE_7006) {
+               u8 cap_ptr=0;
+               struct pci_dev *gfxcard=NULL;
+               while (!cap_ptr) {
+                       gfxcard = pci_get_class(PCI_CLASS_DISPLAY_VGA<<8, gfxcard);
+                       if (!gfxcard) {
+                               printk (KERN_INFO PFX "Couldn't find an AGP VGA controller.\n");
+                               return -ENODEV;
+                       }
+                       cap_ptr = pci_find_capability(gfxcard, PCI_CAP_ID_AGP);
+                       if (!cap_ptr) {
+                               pci_dev_put(gfxcard);
+                               continue;
+                       }
+               }
+
+               /* With so many variants of NVidia cards, it's simpler just
+                  to blacklist them all, and then whitelist them as needed
+                  (if necessary at all). */
+               if (gfxcard->vendor == PCI_VENDOR_ID_NVIDIA) {
+                       agp_bridge->flags |= AGP_ERRATA_1X;
+                       printk (KERN_INFO PFX "AMD 751 chipset with NVidia GeForce detected. Forcing to 1X due to errata.\n");
+               }
+               pci_dev_put(gfxcard);
+       }
+
+       /* 761 Errata (23613_F.pdf)
+        * Revisions B0/B1 were a disaster.
+        * erratum 44: SYSCLK/AGPCLK skew causes 2X failures -- Force mode to 1X
+        * erratum 45: Timing problem prevents fast writes -- Disable fast write.
+        * erratum 46: Setup violation on AGP SBA pins - Disable side band addressing.
+        * With this lot disabled, we should prevent lockups. */
+       if (agp_bridge->dev->device == PCI_DEVICE_ID_AMD_FE_GATE_700E) {
+               u8 revision=0;
+               pci_read_config_byte(pdev, PCI_REVISION_ID, &revision);
+               if (revision == 0x10 || revision == 0x11) {
+                       agp_bridge->flags = AGP_ERRATA_FASTWRITES;
+                       agp_bridge->flags |= AGP_ERRATA_SBA;
+                       agp_bridge->flags |= AGP_ERRATA_1X;
+                       printk (KERN_INFO PFX "AMD 761 chipset with errata detected - disabling AGP fast writes & SBA and forcing to 1X.\n");
+               }
+       }
+
        /* Fill in the mode register */
        pci_read_config_dword(pdev,
                        bridge->capndx+PCI_AGP_STATUS,
@@ -442,12 +486,29 @@ static void __devexit agp_amdk7_remove(struct pci_dev *pdev)
        agp_put_bridge(bridge);
 }
 
+/* must be the same order as name table above */
 static struct pci_device_id agp_amdk7_pci_table[] = {
        {
        .class          = (PCI_CLASS_BRIDGE_HOST << 8),
        .class_mask     = ~0,
        .vendor         = PCI_VENDOR_ID_AMD,
-       .device         = PCI_ANY_ID,
+       .device         = PCI_DEVICE_ID_AMD_FE_GATE_7006,
+       .subvendor      = PCI_ANY_ID,
+       .subdevice      = PCI_ANY_ID,
+       },
+       {
+       .class          = (PCI_CLASS_BRIDGE_HOST << 8),
+       .class_mask     = ~0,
+       .vendor         = PCI_VENDOR_ID_AMD,
+       .device         = PCI_DEVICE_ID_AMD_FE_GATE_700E,
+       .subvendor      = PCI_ANY_ID,
+       .subdevice      = PCI_ANY_ID,
+       },
+       {
+       .class          = (PCI_CLASS_BRIDGE_HOST << 8),
+       .class_mask     = ~0,
+       .vendor         = PCI_VENDOR_ID_AMD,
+       .device         = PCI_DEVICE_ID_AMD_FE_GATE_700C,
        .subvendor      = PCI_ANY_ID,
        .subdevice      = PCI_ANY_ID,
        },
@@ -465,7 +526,9 @@ static struct pci_driver agp_amdk7_pci_driver = {
 
 static int __init agp_amdk7_init(void)
 {
-       return pci_module_init(&agp_amdk7_pci_driver);
+       if (agp_off)
+               return -EINVAL;
+       return pci_register_driver(&agp_amdk7_pci_driver);
 }
 
 static void __exit agp_amdk7_cleanup(void)