| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1 | /* | 
|  | 2 | * Copyright 2001-2003 SuSE Labs. | 
|  | 3 | * Distributed under the GNU public license, v2. | 
|  | 4 | * | 
|  | 5 | * This is a GART driver for the AMD Opteron/Athlon64 on-CPU northbridge. | 
|  | 6 | * It also includes support for the AMD 8151 AGP bridge, | 
|  | 7 | * although it doesn't actually do much, as all the real | 
|  | 8 | * work is done in the northbridge(s). | 
|  | 9 | */ | 
|  | 10 |  | 
|  | 11 | #include <linux/config.h> | 
|  | 12 | #include <linux/module.h> | 
|  | 13 | #include <linux/pci.h> | 
|  | 14 | #include <linux/init.h> | 
|  | 15 | #include <linux/agp_backend.h> | 
| Tim Schmielau | 8c65b4a | 2005-11-07 00:59:43 -0800 | [diff] [blame] | 16 | #include <linux/mmzone.h> | 
| Tim Schmielau | 4e57b68 | 2005-10-30 15:03:48 -0800 | [diff] [blame] | 17 | #include <asm/page.h>		/* PAGE_SIZE */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 18 | #include "agp.h" | 
|  | 19 |  | 
|  | 20 | /* Will need to be increased if AMD64 ever goes >8-way. */ | 
|  | 21 | #define MAX_HAMMER_GARTS   8 | 
|  | 22 |  | 
|  | 23 | /* PTE bits. */ | 
|  | 24 | #define GPTE_VALID	1 | 
|  | 25 | #define GPTE_COHERENT	2 | 
|  | 26 |  | 
|  | 27 | /* Aperture control register bits. */ | 
|  | 28 | #define GARTEN		(1<<0) | 
|  | 29 | #define DISGARTCPU	(1<<4) | 
|  | 30 | #define DISGARTIO	(1<<5) | 
|  | 31 |  | 
|  | 32 | /* GART cache control register bits. */ | 
|  | 33 | #define INVGART		(1<<0) | 
|  | 34 | #define GARTPTEERR	(1<<1) | 
|  | 35 |  | 
|  | 36 | /* K8 On-cpu GART registers */ | 
|  | 37 | #define AMD64_GARTAPERTURECTL	0x90 | 
|  | 38 | #define AMD64_GARTAPERTUREBASE	0x94 | 
|  | 39 | #define AMD64_GARTTABLEBASE	0x98 | 
|  | 40 | #define AMD64_GARTCACHECTL	0x9c | 
|  | 41 | #define AMD64_GARTEN		(1<<0) | 
|  | 42 |  | 
|  | 43 | /* NVIDIA K8 registers */ | 
|  | 44 | #define NVIDIA_X86_64_0_APBASE		0x10 | 
|  | 45 | #define NVIDIA_X86_64_1_APBASE1		0x50 | 
|  | 46 | #define NVIDIA_X86_64_1_APLIMIT1	0x54 | 
|  | 47 | #define NVIDIA_X86_64_1_APSIZE		0xa8 | 
|  | 48 | #define NVIDIA_X86_64_1_APBASE2		0xd8 | 
|  | 49 | #define NVIDIA_X86_64_1_APLIMIT2	0xdc | 
|  | 50 |  | 
|  | 51 | /* ULi K8 registers */ | 
|  | 52 | #define ULI_X86_64_BASE_ADDR		0x10 | 
|  | 53 | #define ULI_X86_64_HTT_FEA_REG		0x50 | 
|  | 54 | #define ULI_X86_64_ENU_SCR_REG		0x54 | 
|  | 55 |  | 
|  | 56 | static int nr_garts; | 
|  | 57 | static struct pci_dev * hammers[MAX_HAMMER_GARTS]; | 
|  | 58 |  | 
|  | 59 | static struct resource *aperture_resource; | 
| Andi Kleen | 172efbb | 2005-11-05 17:25:54 +0100 | [diff] [blame] | 60 | static int __initdata agp_try_unsupported = 1; | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 61 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 62 | #define for_each_nb() for(gart_iterator=0;gart_iterator<nr_garts;gart_iterator++) | 
|  | 63 |  | 
|  | 64 | static void flush_amd64_tlb(struct pci_dev *dev) | 
|  | 65 | { | 
|  | 66 | u32 tmp; | 
|  | 67 |  | 
|  | 68 | pci_read_config_dword (dev, AMD64_GARTCACHECTL, &tmp); | 
|  | 69 | tmp |= INVGART; | 
|  | 70 | pci_write_config_dword (dev, AMD64_GARTCACHECTL, tmp); | 
|  | 71 | } | 
|  | 72 |  | 
|  | 73 | static void amd64_tlbflush(struct agp_memory *temp) | 
|  | 74 | { | 
| Andi Kleen | 1d2e6bd | 2005-11-05 17:25:54 +0100 | [diff] [blame] | 75 | int gart_iterator; | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 76 | for_each_nb() | 
|  | 77 | flush_amd64_tlb(hammers[gart_iterator]); | 
|  | 78 | } | 
|  | 79 |  | 
|  | 80 | static int amd64_insert_memory(struct agp_memory *mem, off_t pg_start, int type) | 
|  | 81 | { | 
|  | 82 | int i, j, num_entries; | 
|  | 83 | long long tmp; | 
|  | 84 | u32 pte; | 
|  | 85 |  | 
|  | 86 | num_entries = agp_num_entries(); | 
|  | 87 |  | 
|  | 88 | if (type != 0 || mem->type != 0) | 
|  | 89 | return -EINVAL; | 
|  | 90 |  | 
|  | 91 | /* Make sure we can fit the range in the gatt table. */ | 
|  | 92 | /* FIXME: could wrap */ | 
|  | 93 | if (((unsigned long)pg_start + mem->page_count) > num_entries) | 
|  | 94 | return -EINVAL; | 
|  | 95 |  | 
|  | 96 | j = pg_start; | 
|  | 97 |  | 
|  | 98 | /* gatt table should be empty. */ | 
|  | 99 | while (j < (pg_start + mem->page_count)) { | 
|  | 100 | if (!PGE_EMPTY(agp_bridge, readl(agp_bridge->gatt_table+j))) | 
|  | 101 | return -EBUSY; | 
|  | 102 | j++; | 
|  | 103 | } | 
|  | 104 |  | 
|  | 105 | if (mem->is_flushed == FALSE) { | 
|  | 106 | global_cache_flush(); | 
|  | 107 | mem->is_flushed = TRUE; | 
|  | 108 | } | 
|  | 109 |  | 
|  | 110 | for (i = 0, j = pg_start; i < mem->page_count; i++, j++) { | 
|  | 111 | tmp = agp_bridge->driver->mask_memory(agp_bridge, | 
|  | 112 | mem->memory[i], mem->type); | 
|  | 113 |  | 
|  | 114 | BUG_ON(tmp & 0xffffff0000000ffcULL); | 
|  | 115 | pte = (tmp & 0x000000ff00000000ULL) >> 28; | 
|  | 116 | pte |=(tmp & 0x00000000fffff000ULL); | 
|  | 117 | pte |= GPTE_VALID | GPTE_COHERENT; | 
|  | 118 |  | 
|  | 119 | writel(pte, agp_bridge->gatt_table+j); | 
|  | 120 | readl(agp_bridge->gatt_table+j);	/* PCI Posting. */ | 
|  | 121 | } | 
|  | 122 | amd64_tlbflush(mem); | 
|  | 123 | return 0; | 
|  | 124 | } | 
|  | 125 |  | 
|  | 126 | /* | 
|  | 127 | * This hack alters the order element according | 
|  | 128 | * to the size of a long. It sucks. I totally disown this, even | 
|  | 129 | * though it does appear to work for the most part. | 
|  | 130 | */ | 
|  | 131 | static struct aper_size_info_32 amd64_aperture_sizes[7] = | 
|  | 132 | { | 
|  | 133 | {32,   8192,   3+(sizeof(long)/8), 0 }, | 
|  | 134 | {64,   16384,  4+(sizeof(long)/8), 1<<1 }, | 
|  | 135 | {128,  32768,  5+(sizeof(long)/8), 1<<2 }, | 
|  | 136 | {256,  65536,  6+(sizeof(long)/8), 1<<1 | 1<<2 }, | 
|  | 137 | {512,  131072, 7+(sizeof(long)/8), 1<<3 }, | 
|  | 138 | {1024, 262144, 8+(sizeof(long)/8), 1<<1 | 1<<3}, | 
|  | 139 | {2048, 524288, 9+(sizeof(long)/8), 1<<2 | 1<<3} | 
|  | 140 | }; | 
|  | 141 |  | 
|  | 142 |  | 
|  | 143 | /* | 
|  | 144 | * Get the current Aperture size from the x86-64. | 
|  | 145 | * Note, that there may be multiple x86-64's, but we just return | 
|  | 146 | * the value from the first one we find. The set_size functions | 
|  | 147 | * keep the rest coherent anyway. Or at least should do. | 
|  | 148 | */ | 
|  | 149 | static int amd64_fetch_size(void) | 
|  | 150 | { | 
|  | 151 | struct pci_dev *dev; | 
|  | 152 | int i; | 
|  | 153 | u32 temp; | 
|  | 154 | struct aper_size_info_32 *values; | 
|  | 155 |  | 
|  | 156 | dev = hammers[0]; | 
|  | 157 | if (dev==NULL) | 
|  | 158 | return 0; | 
|  | 159 |  | 
|  | 160 | pci_read_config_dword(dev, AMD64_GARTAPERTURECTL, &temp); | 
|  | 161 | temp = (temp & 0xe); | 
|  | 162 | values = A_SIZE_32(amd64_aperture_sizes); | 
|  | 163 |  | 
|  | 164 | for (i = 0; i < agp_bridge->driver->num_aperture_sizes; i++) { | 
|  | 165 | if (temp == values[i].size_value) { | 
|  | 166 | agp_bridge->previous_size = | 
|  | 167 | agp_bridge->current_size = (void *) (values + i); | 
|  | 168 |  | 
|  | 169 | agp_bridge->aperture_size_idx = i; | 
|  | 170 | return values[i].size; | 
|  | 171 | } | 
|  | 172 | } | 
|  | 173 | return 0; | 
|  | 174 | } | 
|  | 175 |  | 
|  | 176 | /* | 
|  | 177 | * In a multiprocessor x86-64 system, this function gets | 
|  | 178 | * called once for each CPU. | 
|  | 179 | */ | 
|  | 180 | static u64 amd64_configure (struct pci_dev *hammer, u64 gatt_table) | 
|  | 181 | { | 
|  | 182 | u64 aperturebase; | 
|  | 183 | u32 tmp; | 
|  | 184 | u64 addr, aper_base; | 
|  | 185 |  | 
|  | 186 | /* Address to map to */ | 
|  | 187 | pci_read_config_dword (hammer, AMD64_GARTAPERTUREBASE, &tmp); | 
|  | 188 | aperturebase = tmp << 25; | 
|  | 189 | aper_base = (aperturebase & PCI_BASE_ADDRESS_MEM_MASK); | 
|  | 190 |  | 
|  | 191 | /* address of the mappings table */ | 
|  | 192 | addr = (u64) gatt_table; | 
|  | 193 | addr >>= 12; | 
|  | 194 | tmp = (u32) addr<<4; | 
|  | 195 | tmp &= ~0xf; | 
|  | 196 | pci_write_config_dword (hammer, AMD64_GARTTABLEBASE, tmp); | 
|  | 197 |  | 
|  | 198 | /* Enable GART translation for this hammer. */ | 
|  | 199 | pci_read_config_dword(hammer, AMD64_GARTAPERTURECTL, &tmp); | 
|  | 200 | tmp |= GARTEN; | 
|  | 201 | tmp &= ~(DISGARTCPU | DISGARTIO); | 
|  | 202 | pci_write_config_dword(hammer, AMD64_GARTAPERTURECTL, tmp); | 
|  | 203 |  | 
|  | 204 | /* keep CPU's coherent. */ | 
|  | 205 | flush_amd64_tlb (hammer); | 
|  | 206 |  | 
|  | 207 | return aper_base; | 
|  | 208 | } | 
|  | 209 |  | 
|  | 210 |  | 
|  | 211 | static struct aper_size_info_32 amd_8151_sizes[7] = | 
|  | 212 | { | 
|  | 213 | {2048, 524288, 9, 0x00000000 },	/* 0 0 0 0 0 0 */ | 
|  | 214 | {1024, 262144, 8, 0x00000400 },	/* 1 0 0 0 0 0 */ | 
|  | 215 | {512,  131072, 7, 0x00000600 },	/* 1 1 0 0 0 0 */ | 
|  | 216 | {256,  65536,  6, 0x00000700 },	/* 1 1 1 0 0 0 */ | 
|  | 217 | {128,  32768,  5, 0x00000720 },	/* 1 1 1 1 0 0 */ | 
|  | 218 | {64,   16384,  4, 0x00000730 },	/* 1 1 1 1 1 0 */ | 
|  | 219 | {32,   8192,   3, 0x00000738 } 	/* 1 1 1 1 1 1 */ | 
|  | 220 | }; | 
|  | 221 |  | 
|  | 222 | static int amd_8151_configure(void) | 
|  | 223 | { | 
| Keir Fraser | 07eee78 | 2005-03-30 13:17:04 -0800 | [diff] [blame] | 224 | unsigned long gatt_bus = virt_to_gart(agp_bridge->gatt_table_real); | 
| Andi Kleen | 1d2e6bd | 2005-11-05 17:25:54 +0100 | [diff] [blame] | 225 | int gart_iterator; | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 226 |  | 
|  | 227 | /* Configure AGP regs in each x86-64 host bridge. */ | 
|  | 228 | for_each_nb() { | 
|  | 229 | agp_bridge->gart_bus_addr = | 
|  | 230 | amd64_configure(hammers[gart_iterator],gatt_bus); | 
|  | 231 | } | 
|  | 232 | return 0; | 
|  | 233 | } | 
|  | 234 |  | 
|  | 235 |  | 
|  | 236 | static void amd64_cleanup(void) | 
|  | 237 | { | 
|  | 238 | u32 tmp; | 
| Andi Kleen | 1d2e6bd | 2005-11-05 17:25:54 +0100 | [diff] [blame] | 239 | int gart_iterator; | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 240 | for_each_nb() { | 
|  | 241 | /* disable gart translation */ | 
|  | 242 | pci_read_config_dword (hammers[gart_iterator], AMD64_GARTAPERTURECTL, &tmp); | 
|  | 243 | tmp &= ~AMD64_GARTEN; | 
|  | 244 | pci_write_config_dword (hammers[gart_iterator], AMD64_GARTAPERTURECTL, tmp); | 
|  | 245 | } | 
|  | 246 | } | 
|  | 247 |  | 
|  | 248 |  | 
| Adrian Bunk | 408b664 | 2005-05-01 08:59:29 -0700 | [diff] [blame] | 249 | static struct agp_bridge_driver amd_8151_driver = { | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 250 | .owner			= THIS_MODULE, | 
|  | 251 | .aperture_sizes		= amd_8151_sizes, | 
|  | 252 | .size_type		= U32_APER_SIZE, | 
|  | 253 | .num_aperture_sizes	= 7, | 
|  | 254 | .configure		= amd_8151_configure, | 
|  | 255 | .fetch_size		= amd64_fetch_size, | 
|  | 256 | .cleanup		= amd64_cleanup, | 
|  | 257 | .tlb_flush		= amd64_tlbflush, | 
|  | 258 | .mask_memory		= agp_generic_mask_memory, | 
|  | 259 | .masks			= NULL, | 
|  | 260 | .agp_enable		= agp_generic_enable, | 
|  | 261 | .cache_flush		= global_cache_flush, | 
|  | 262 | .create_gatt_table	= agp_generic_create_gatt_table, | 
|  | 263 | .free_gatt_table	= agp_generic_free_gatt_table, | 
|  | 264 | .insert_memory		= amd64_insert_memory, | 
|  | 265 | .remove_memory		= agp_generic_remove_memory, | 
|  | 266 | .alloc_by_type		= agp_generic_alloc_by_type, | 
|  | 267 | .free_by_type		= agp_generic_free_by_type, | 
|  | 268 | .agp_alloc_page		= agp_generic_alloc_page, | 
|  | 269 | .agp_destroy_page	= agp_generic_destroy_page, | 
|  | 270 | }; | 
|  | 271 |  | 
|  | 272 | /* Some basic sanity checks for the aperture. */ | 
|  | 273 | static int __devinit aperture_valid(u64 aper, u32 size) | 
|  | 274 | { | 
|  | 275 | u32 pfn, c; | 
|  | 276 | if (aper == 0) { | 
|  | 277 | printk(KERN_ERR PFX "No aperture\n"); | 
|  | 278 | return 0; | 
|  | 279 | } | 
|  | 280 | if (size < 32*1024*1024) { | 
|  | 281 | printk(KERN_ERR PFX "Aperture too small (%d MB)\n", size>>20); | 
|  | 282 | return 0; | 
|  | 283 | } | 
|  | 284 | if (aper + size > 0xffffffff) { | 
|  | 285 | printk(KERN_ERR PFX "Aperture out of bounds\n"); | 
|  | 286 | return 0; | 
|  | 287 | } | 
|  | 288 | pfn = aper >> PAGE_SHIFT; | 
|  | 289 | for (c = 0; c < size/PAGE_SIZE; c++) { | 
|  | 290 | if (!pfn_valid(pfn + c)) | 
|  | 291 | break; | 
|  | 292 | if (!PageReserved(pfn_to_page(pfn + c))) { | 
|  | 293 | printk(KERN_ERR PFX "Aperture pointing to RAM\n"); | 
|  | 294 | return 0; | 
|  | 295 | } | 
|  | 296 | } | 
|  | 297 |  | 
|  | 298 | /* Request the Aperture. This catches cases when someone else | 
|  | 299 | already put a mapping in there - happens with some very broken BIOS | 
|  | 300 |  | 
|  | 301 | Maybe better to use pci_assign_resource/pci_enable_device instead | 
|  | 302 | trusting the bridges? */ | 
|  | 303 | if (!aperture_resource && | 
|  | 304 | !(aperture_resource = request_mem_region(aper, size, "aperture"))) { | 
|  | 305 | printk(KERN_ERR PFX "Aperture conflicts with PCI mapping.\n"); | 
|  | 306 | return 0; | 
|  | 307 | } | 
|  | 308 | return 1; | 
|  | 309 | } | 
|  | 310 |  | 
|  | 311 | /* | 
|  | 312 | * W*s centric BIOS sometimes only set up the aperture in the AGP | 
|  | 313 | * bridge, not the northbridge. On AMD64 this is handled early | 
|  | 314 | * in aperture.c, but when GART_IOMMU is not enabled or we run | 
|  | 315 | * on a 32bit kernel this needs to be redone. | 
|  | 316 | * Unfortunately it is impossible to fix the aperture here because it's too late | 
|  | 317 | * to allocate that much memory. But at least error out cleanly instead of | 
|  | 318 | * crashing. | 
|  | 319 | */ | 
|  | 320 | static __devinit int fix_northbridge(struct pci_dev *nb, struct pci_dev *agp, | 
|  | 321 | u16 cap) | 
|  | 322 | { | 
|  | 323 | u32 aper_low, aper_hi; | 
|  | 324 | u64 aper, nb_aper; | 
|  | 325 | int order = 0; | 
|  | 326 | u32 nb_order, nb_base; | 
|  | 327 | u16 apsize; | 
|  | 328 |  | 
|  | 329 | pci_read_config_dword(nb, 0x90, &nb_order); | 
|  | 330 | nb_order = (nb_order >> 1) & 7; | 
|  | 331 | pci_read_config_dword(nb, 0x94, &nb_base); | 
|  | 332 | nb_aper = nb_base << 25; | 
|  | 333 | if (aperture_valid(nb_aper, (32*1024*1024)<<nb_order)) { | 
|  | 334 | return 0; | 
|  | 335 | } | 
|  | 336 |  | 
|  | 337 | /* Northbridge seems to contain crap. Try the AGP bridge. */ | 
|  | 338 |  | 
|  | 339 | pci_read_config_word(agp, cap+0x14, &apsize); | 
|  | 340 | if (apsize == 0xffff) | 
|  | 341 | return -1; | 
|  | 342 |  | 
|  | 343 | apsize &= 0xfff; | 
|  | 344 | /* Some BIOS use weird encodings not in the AGPv3 table. */ | 
|  | 345 | if (apsize & 0xff) | 
|  | 346 | apsize |= 0xf00; | 
|  | 347 | order = 7 - hweight16(apsize); | 
|  | 348 |  | 
|  | 349 | pci_read_config_dword(agp, 0x10, &aper_low); | 
|  | 350 | pci_read_config_dword(agp, 0x14, &aper_hi); | 
|  | 351 | aper = (aper_low & ~((1<<22)-1)) | ((u64)aper_hi << 32); | 
|  | 352 | printk(KERN_INFO PFX "Aperture from AGP @ %Lx size %u MB\n", aper, 32 << order); | 
|  | 353 | if (order < 0 || !aperture_valid(aper, (32*1024*1024)<<order)) | 
|  | 354 | return -1; | 
|  | 355 |  | 
|  | 356 | pci_write_config_dword(nb, 0x90, order << 1); | 
|  | 357 | pci_write_config_dword(nb, 0x94, aper >> 25); | 
|  | 358 |  | 
|  | 359 | return 0; | 
|  | 360 | } | 
|  | 361 |  | 
|  | 362 | static __devinit int cache_nbs (struct pci_dev *pdev, u32 cap_ptr) | 
|  | 363 | { | 
|  | 364 | struct pci_dev *loop_dev = NULL; | 
|  | 365 | int i = 0; | 
|  | 366 |  | 
|  | 367 | /* cache pci_devs of northbridges. */ | 
|  | 368 | while ((loop_dev = pci_get_device(PCI_VENDOR_ID_AMD, 0x1103, loop_dev)) | 
|  | 369 | != NULL) { | 
|  | 370 | if (i == MAX_HAMMER_GARTS) { | 
|  | 371 | printk(KERN_ERR PFX "Too many northbridges for AGP\n"); | 
|  | 372 | return -1; | 
|  | 373 | } | 
|  | 374 | if (fix_northbridge(loop_dev, pdev, cap_ptr) < 0) { | 
|  | 375 | printk(KERN_ERR PFX "No usable aperture found.\n"); | 
|  | 376 | #ifdef __x86_64__ | 
|  | 377 | /* should port this to i386 */ | 
|  | 378 | printk(KERN_ERR PFX "Consider rebooting with iommu=memaper=2 to get a good aperture.\n"); | 
|  | 379 | #endif | 
|  | 380 | return -1; | 
|  | 381 | } | 
|  | 382 | hammers[i++] = loop_dev; | 
|  | 383 | } | 
|  | 384 | nr_garts = i; | 
|  | 385 | return i == 0 ? -1 : 0; | 
|  | 386 | } | 
|  | 387 |  | 
|  | 388 | /* Handle AMD 8151 quirks */ | 
|  | 389 | static void __devinit amd8151_init(struct pci_dev *pdev, struct agp_bridge_data *bridge) | 
|  | 390 | { | 
|  | 391 | char *revstring; | 
|  | 392 | u8 rev_id; | 
|  | 393 |  | 
|  | 394 | pci_read_config_byte(pdev, PCI_REVISION_ID, &rev_id); | 
|  | 395 | switch (rev_id) { | 
|  | 396 | case 0x01: revstring="A0"; break; | 
|  | 397 | case 0x02: revstring="A1"; break; | 
|  | 398 | case 0x11: revstring="B0"; break; | 
|  | 399 | case 0x12: revstring="B1"; break; | 
|  | 400 | case 0x13: revstring="B2"; break; | 
|  | 401 | case 0x14: revstring="B3"; break; | 
|  | 402 | default:   revstring="??"; break; | 
|  | 403 | } | 
|  | 404 |  | 
|  | 405 | printk (KERN_INFO PFX "Detected AMD 8151 AGP Bridge rev %s\n", revstring); | 
|  | 406 |  | 
|  | 407 | /* | 
|  | 408 | * Work around errata. | 
|  | 409 | * Chips before B2 stepping incorrectly reporting v3.5 | 
|  | 410 | */ | 
|  | 411 | if (rev_id < 0x13) { | 
|  | 412 | printk (KERN_INFO PFX "Correcting AGP revision (reports 3.5, is really 3.0)\n"); | 
|  | 413 | bridge->major_version = 3; | 
|  | 414 | bridge->minor_version = 0; | 
|  | 415 | } | 
|  | 416 | } | 
|  | 417 |  | 
|  | 418 |  | 
| Dave Jones | a42ab7f | 2005-11-16 16:07:02 -0800 | [diff] [blame] | 419 | static const struct aper_size_info_32 uli_sizes[7] = | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 420 | { | 
|  | 421 | {256, 65536, 6, 10}, | 
|  | 422 | {128, 32768, 5, 9}, | 
|  | 423 | {64, 16384, 4, 8}, | 
|  | 424 | {32, 8192, 3, 7}, | 
|  | 425 | {16, 4096, 2, 6}, | 
|  | 426 | {8, 2048, 1, 4}, | 
|  | 427 | {4, 1024, 0, 3} | 
|  | 428 | }; | 
|  | 429 | static int __devinit uli_agp_init(struct pci_dev *pdev) | 
|  | 430 | { | 
|  | 431 | u32 httfea,baseaddr,enuscr; | 
|  | 432 | struct pci_dev *dev1; | 
|  | 433 | int i; | 
|  | 434 | unsigned size = amd64_fetch_size(); | 
| Dave Jones | 29db35e | 2005-09-01 10:50:13 -0700 | [diff] [blame] | 435 | printk(KERN_INFO "Setting up ULi AGP.\n"); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 436 | dev1 = pci_find_slot ((unsigned int)pdev->bus->number,PCI_DEVFN(0,0)); | 
|  | 437 | if (dev1 == NULL) { | 
|  | 438 | printk(KERN_INFO PFX "Detected a ULi chipset, " | 
|  | 439 | "but could not fine the secondary device.\n"); | 
|  | 440 | return -ENODEV; | 
|  | 441 | } | 
|  | 442 |  | 
|  | 443 | for (i = 0; i < ARRAY_SIZE(uli_sizes); i++) | 
|  | 444 | if (uli_sizes[i].size == size) | 
|  | 445 | break; | 
|  | 446 |  | 
|  | 447 | if (i == ARRAY_SIZE(uli_sizes)) { | 
|  | 448 | printk(KERN_INFO PFX "No ULi size found for %d\n", size); | 
|  | 449 | return -ENODEV; | 
|  | 450 | } | 
|  | 451 |  | 
|  | 452 | /* shadow x86-64 registers into ULi registers */ | 
|  | 453 | pci_read_config_dword (hammers[0], AMD64_GARTAPERTUREBASE, &httfea); | 
|  | 454 |  | 
|  | 455 | /* if x86-64 aperture base is beyond 4G, exit here */ | 
|  | 456 | if ((httfea & 0x7fff) >> (32 - 25)) | 
|  | 457 | return -ENODEV; | 
|  | 458 |  | 
|  | 459 | httfea = (httfea& 0x7fff) << 25; | 
|  | 460 |  | 
|  | 461 | pci_read_config_dword(pdev, ULI_X86_64_BASE_ADDR, &baseaddr); | 
|  | 462 | baseaddr&= ~PCI_BASE_ADDRESS_MEM_MASK; | 
|  | 463 | baseaddr|= httfea; | 
|  | 464 | pci_write_config_dword(pdev, ULI_X86_64_BASE_ADDR, baseaddr); | 
|  | 465 |  | 
|  | 466 | enuscr= httfea+ (size * 1024 * 1024) - 1; | 
|  | 467 | pci_write_config_dword(dev1, ULI_X86_64_HTT_FEA_REG, httfea); | 
|  | 468 | pci_write_config_dword(dev1, ULI_X86_64_ENU_SCR_REG, enuscr); | 
|  | 469 | return 0; | 
|  | 470 | } | 
|  | 471 |  | 
|  | 472 |  | 
| Dave Jones | a42ab7f | 2005-11-16 16:07:02 -0800 | [diff] [blame] | 473 | static const struct aper_size_info_32 nforce3_sizes[5] = | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 474 | { | 
|  | 475 | {512,  131072, 7, 0x00000000 }, | 
|  | 476 | {256,  65536,  6, 0x00000008 }, | 
|  | 477 | {128,  32768,  5, 0x0000000C }, | 
|  | 478 | {64,   16384,  4, 0x0000000E }, | 
|  | 479 | {32,   8192,   3, 0x0000000F } | 
|  | 480 | }; | 
|  | 481 |  | 
|  | 482 | /* Handle shadow device of the Nvidia NForce3 */ | 
|  | 483 | /* CHECK-ME original 2.4 version set up some IORRs. Check if that is needed. */ | 
|  | 484 | static int __devinit nforce3_agp_init(struct pci_dev *pdev) | 
|  | 485 | { | 
|  | 486 | u32 tmp, apbase, apbar, aplimit; | 
|  | 487 | struct pci_dev *dev1; | 
|  | 488 | int i; | 
|  | 489 | unsigned size = amd64_fetch_size(); | 
|  | 490 |  | 
|  | 491 | printk(KERN_INFO PFX "Setting up Nforce3 AGP.\n"); | 
|  | 492 |  | 
|  | 493 | dev1 = pci_find_slot((unsigned int)pdev->bus->number, PCI_DEVFN(11, 0)); | 
|  | 494 | if (dev1 == NULL) { | 
|  | 495 | printk(KERN_INFO PFX "agpgart: Detected an NVIDIA " | 
|  | 496 | "nForce3 chipset, but could not find " | 
|  | 497 | "the secondary device.\n"); | 
|  | 498 | return -ENODEV; | 
|  | 499 | } | 
|  | 500 |  | 
|  | 501 | for (i = 0; i < ARRAY_SIZE(nforce3_sizes); i++) | 
|  | 502 | if (nforce3_sizes[i].size == size) | 
|  | 503 | break; | 
|  | 504 |  | 
|  | 505 | if (i == ARRAY_SIZE(nforce3_sizes)) { | 
|  | 506 | printk(KERN_INFO PFX "No NForce3 size found for %d\n", size); | 
|  | 507 | return -ENODEV; | 
|  | 508 | } | 
|  | 509 |  | 
|  | 510 | pci_read_config_dword(dev1, NVIDIA_X86_64_1_APSIZE, &tmp); | 
|  | 511 | tmp &= ~(0xf); | 
|  | 512 | tmp |= nforce3_sizes[i].size_value; | 
|  | 513 | pci_write_config_dword(dev1, NVIDIA_X86_64_1_APSIZE, tmp); | 
|  | 514 |  | 
|  | 515 | /* shadow x86-64 registers into NVIDIA registers */ | 
|  | 516 | pci_read_config_dword (hammers[0], AMD64_GARTAPERTUREBASE, &apbase); | 
|  | 517 |  | 
|  | 518 | /* if x86-64 aperture base is beyond 4G, exit here */ | 
|  | 519 | if ( (apbase & 0x7fff) >> (32 - 25) ) | 
|  | 520 | return -ENODEV; | 
|  | 521 |  | 
|  | 522 | apbase = (apbase & 0x7fff) << 25; | 
|  | 523 |  | 
|  | 524 | pci_read_config_dword(pdev, NVIDIA_X86_64_0_APBASE, &apbar); | 
|  | 525 | apbar &= ~PCI_BASE_ADDRESS_MEM_MASK; | 
|  | 526 | apbar |= apbase; | 
|  | 527 | pci_write_config_dword(pdev, NVIDIA_X86_64_0_APBASE, apbar); | 
|  | 528 |  | 
|  | 529 | aplimit = apbase + (size * 1024 * 1024) - 1; | 
|  | 530 | pci_write_config_dword(dev1, NVIDIA_X86_64_1_APBASE1, apbase); | 
|  | 531 | pci_write_config_dword(dev1, NVIDIA_X86_64_1_APLIMIT1, aplimit); | 
|  | 532 | pci_write_config_dword(dev1, NVIDIA_X86_64_1_APBASE2, apbase); | 
|  | 533 | pci_write_config_dword(dev1, NVIDIA_X86_64_1_APLIMIT2, aplimit); | 
|  | 534 |  | 
|  | 535 | return 0; | 
|  | 536 | } | 
|  | 537 |  | 
|  | 538 | static int __devinit agp_amd64_probe(struct pci_dev *pdev, | 
|  | 539 | const struct pci_device_id *ent) | 
|  | 540 | { | 
|  | 541 | struct agp_bridge_data *bridge; | 
|  | 542 | u8 cap_ptr; | 
|  | 543 |  | 
|  | 544 | cap_ptr = pci_find_capability(pdev, PCI_CAP_ID_AGP); | 
|  | 545 | if (!cap_ptr) | 
|  | 546 | return -ENODEV; | 
|  | 547 |  | 
|  | 548 | /* Could check for AGPv3 here */ | 
|  | 549 |  | 
|  | 550 | bridge = agp_alloc_bridge(); | 
|  | 551 | if (!bridge) | 
|  | 552 | return -ENOMEM; | 
|  | 553 |  | 
|  | 554 | if (pdev->vendor == PCI_VENDOR_ID_AMD && | 
|  | 555 | pdev->device == PCI_DEVICE_ID_AMD_8151_0) { | 
|  | 556 | amd8151_init(pdev, bridge); | 
|  | 557 | } else { | 
|  | 558 | printk(KERN_INFO PFX "Detected AGP bridge %x\n", pdev->devfn); | 
|  | 559 | } | 
|  | 560 |  | 
|  | 561 | bridge->driver = &amd_8151_driver; | 
|  | 562 | bridge->dev = pdev; | 
|  | 563 | bridge->capndx = cap_ptr; | 
|  | 564 |  | 
|  | 565 | /* Fill in the mode register */ | 
|  | 566 | pci_read_config_dword(pdev, bridge->capndx+PCI_AGP_STATUS, &bridge->mode); | 
|  | 567 |  | 
|  | 568 | if (cache_nbs(pdev, cap_ptr) == -1) { | 
|  | 569 | agp_put_bridge(bridge); | 
|  | 570 | return -ENODEV; | 
|  | 571 | } | 
|  | 572 |  | 
|  | 573 | if (pdev->vendor == PCI_VENDOR_ID_NVIDIA) { | 
|  | 574 | int ret = nforce3_agp_init(pdev); | 
|  | 575 | if (ret) { | 
|  | 576 | agp_put_bridge(bridge); | 
|  | 577 | return ret; | 
|  | 578 | } | 
|  | 579 | } | 
|  | 580 |  | 
|  | 581 | if (pdev->vendor == PCI_VENDOR_ID_AL) { | 
|  | 582 | int ret = uli_agp_init(pdev); | 
|  | 583 | if (ret) { | 
|  | 584 | agp_put_bridge(bridge); | 
|  | 585 | return ret; | 
|  | 586 | } | 
|  | 587 | } | 
|  | 588 |  | 
|  | 589 | pci_set_drvdata(pdev, bridge); | 
|  | 590 | return agp_add_bridge(bridge); | 
|  | 591 | } | 
|  | 592 |  | 
|  | 593 | static void __devexit agp_amd64_remove(struct pci_dev *pdev) | 
|  | 594 | { | 
|  | 595 | struct agp_bridge_data *bridge = pci_get_drvdata(pdev); | 
|  | 596 |  | 
| Keir Fraser | 07eee78 | 2005-03-30 13:17:04 -0800 | [diff] [blame] | 597 | release_mem_region(virt_to_gart(bridge->gatt_table_real), | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 598 | amd64_aperture_sizes[bridge->aperture_size_idx].size); | 
|  | 599 | agp_remove_bridge(bridge); | 
|  | 600 | agp_put_bridge(bridge); | 
|  | 601 | } | 
|  | 602 |  | 
|  | 603 | static struct pci_device_id agp_amd64_pci_table[] = { | 
|  | 604 | { | 
|  | 605 | .class		= (PCI_CLASS_BRIDGE_HOST << 8), | 
|  | 606 | .class_mask	= ~0, | 
|  | 607 | .vendor		= PCI_VENDOR_ID_AMD, | 
|  | 608 | .device		= PCI_DEVICE_ID_AMD_8151_0, | 
|  | 609 | .subvendor	= PCI_ANY_ID, | 
|  | 610 | .subdevice	= PCI_ANY_ID, | 
|  | 611 | }, | 
|  | 612 | /* ULi M1689 */ | 
|  | 613 | { | 
|  | 614 | .class		= (PCI_CLASS_BRIDGE_HOST << 8), | 
|  | 615 | .class_mask	= ~0, | 
|  | 616 | .vendor		= PCI_VENDOR_ID_AL, | 
|  | 617 | .device		= PCI_DEVICE_ID_AL_M1689, | 
|  | 618 | .subvendor	= PCI_ANY_ID, | 
|  | 619 | .subdevice	= PCI_ANY_ID, | 
|  | 620 | }, | 
|  | 621 | /* VIA K8T800Pro */ | 
|  | 622 | { | 
|  | 623 | .class		= (PCI_CLASS_BRIDGE_HOST << 8), | 
|  | 624 | .class_mask	= ~0, | 
|  | 625 | .vendor		= PCI_VENDOR_ID_VIA, | 
|  | 626 | .device		= PCI_DEVICE_ID_VIA_K8T800PRO_0, | 
|  | 627 | .subvendor	= PCI_ANY_ID, | 
|  | 628 | .subdevice	= PCI_ANY_ID, | 
|  | 629 | }, | 
|  | 630 | /* VIA K8T800 */ | 
|  | 631 | { | 
|  | 632 | .class		= (PCI_CLASS_BRIDGE_HOST << 8), | 
|  | 633 | .class_mask	= ~0, | 
|  | 634 | .vendor		= PCI_VENDOR_ID_VIA, | 
|  | 635 | .device		= PCI_DEVICE_ID_VIA_8385_0, | 
|  | 636 | .subvendor	= PCI_ANY_ID, | 
|  | 637 | .subdevice	= PCI_ANY_ID, | 
|  | 638 | }, | 
|  | 639 | /* VIA K8M800 / K8N800 */ | 
|  | 640 | { | 
|  | 641 | .class		= (PCI_CLASS_BRIDGE_HOST << 8), | 
|  | 642 | .class_mask	= ~0, | 
|  | 643 | .vendor		= PCI_VENDOR_ID_VIA, | 
|  | 644 | .device		= PCI_DEVICE_ID_VIA_8380_0, | 
|  | 645 | .subvendor	= PCI_ANY_ID, | 
|  | 646 | .subdevice	= PCI_ANY_ID, | 
|  | 647 | }, | 
|  | 648 | /* VIA K8T890 */ | 
|  | 649 | { | 
|  | 650 | .class		= (PCI_CLASS_BRIDGE_HOST << 8), | 
|  | 651 | .class_mask	= ~0, | 
|  | 652 | .vendor		= PCI_VENDOR_ID_VIA, | 
|  | 653 | .device		= PCI_DEVICE_ID_VIA_3238_0, | 
|  | 654 | .subvendor	= PCI_ANY_ID, | 
|  | 655 | .subdevice	= PCI_ANY_ID, | 
|  | 656 | }, | 
|  | 657 | /* VIA K8T800/K8M800/K8N800 */ | 
|  | 658 | { | 
|  | 659 | .class		= (PCI_CLASS_BRIDGE_HOST << 8), | 
|  | 660 | .class_mask	= ~0, | 
|  | 661 | .vendor		= PCI_VENDOR_ID_VIA, | 
|  | 662 | .device		= PCI_DEVICE_ID_VIA_838X_1, | 
|  | 663 | .subvendor	= PCI_ANY_ID, | 
|  | 664 | .subdevice	= PCI_ANY_ID, | 
|  | 665 | }, | 
|  | 666 | /* NForce3 */ | 
|  | 667 | { | 
|  | 668 | .class		= (PCI_CLASS_BRIDGE_HOST << 8), | 
|  | 669 | .class_mask	= ~0, | 
|  | 670 | .vendor		= PCI_VENDOR_ID_NVIDIA, | 
|  | 671 | .device		= PCI_DEVICE_ID_NVIDIA_NFORCE3, | 
|  | 672 | .subvendor	= PCI_ANY_ID, | 
|  | 673 | .subdevice	= PCI_ANY_ID, | 
|  | 674 | }, | 
|  | 675 | { | 
|  | 676 | .class		= (PCI_CLASS_BRIDGE_HOST << 8), | 
|  | 677 | .class_mask	= ~0, | 
|  | 678 | .vendor		= PCI_VENDOR_ID_NVIDIA, | 
|  | 679 | .device		= PCI_DEVICE_ID_NVIDIA_NFORCE3S, | 
|  | 680 | .subvendor	= PCI_ANY_ID, | 
|  | 681 | .subdevice	= PCI_ANY_ID, | 
|  | 682 | }, | 
|  | 683 | /* SIS 755 */ | 
|  | 684 | { | 
|  | 685 | .class		= (PCI_CLASS_BRIDGE_HOST << 8), | 
|  | 686 | .class_mask	= ~0, | 
|  | 687 | .vendor		= PCI_VENDOR_ID_SI, | 
|  | 688 | .device		= PCI_DEVICE_ID_SI_755, | 
|  | 689 | .subvendor	= PCI_ANY_ID, | 
|  | 690 | .subdevice	= PCI_ANY_ID, | 
|  | 691 | }, | 
| Dave Jones | 2fa938b | 2005-06-28 20:08:29 -0400 | [diff] [blame] | 692 | /* SIS 760 */ | 
|  | 693 | { | 
|  | 694 | .class		= (PCI_CLASS_BRIDGE_HOST << 8), | 
|  | 695 | .class_mask	= ~0, | 
|  | 696 | .vendor		= PCI_VENDOR_ID_SI, | 
|  | 697 | .device		= PCI_DEVICE_ID_SI_760, | 
|  | 698 | .subvendor	= PCI_ANY_ID, | 
|  | 699 | .subdevice	= PCI_ANY_ID, | 
|  | 700 | }, | 
| Andi Kleen | 870b768 | 2005-11-05 17:25:54 +0100 | [diff] [blame] | 701 | /* ALI/ULI M1695 */ | 
|  | 702 | { | 
|  | 703 | .class		= (PCI_CLASS_BRIDGE_HOST << 8), | 
|  | 704 | .class_mask	= ~0, | 
|  | 705 | .vendor		= PCI_VENDOR_ID_AL, | 
|  | 706 | .device		= 0x1689, | 
|  | 707 | .subvendor	= PCI_ANY_ID, | 
|  | 708 | .subdevice	= PCI_ANY_ID, | 
|  | 709 | }, | 
|  | 710 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 711 | { } | 
|  | 712 | }; | 
|  | 713 |  | 
|  | 714 | MODULE_DEVICE_TABLE(pci, agp_amd64_pci_table); | 
|  | 715 |  | 
|  | 716 | static struct pci_driver agp_amd64_pci_driver = { | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 717 | .name		= "agpgart-amd64", | 
|  | 718 | .id_table	= agp_amd64_pci_table, | 
|  | 719 | .probe		= agp_amd64_probe, | 
|  | 720 | .remove		= agp_amd64_remove, | 
|  | 721 | }; | 
|  | 722 |  | 
|  | 723 |  | 
|  | 724 | /* Not static due to IOMMU code calling it early. */ | 
|  | 725 | int __init agp_amd64_init(void) | 
|  | 726 | { | 
|  | 727 | int err = 0; | 
|  | 728 | static struct pci_device_id amd64nb[] = { | 
|  | 729 | { PCI_DEVICE(PCI_VENDOR_ID_AMD, 0x1103) }, | 
|  | 730 | { }, | 
|  | 731 | }; | 
|  | 732 |  | 
|  | 733 | if (agp_off) | 
|  | 734 | return -EINVAL; | 
|  | 735 | if (pci_register_driver(&agp_amd64_pci_driver) > 0) { | 
|  | 736 | struct pci_dev *dev; | 
|  | 737 | if (!agp_try_unsupported && !agp_try_unsupported_boot) { | 
|  | 738 | printk(KERN_INFO PFX "No supported AGP bridge found.\n"); | 
|  | 739 | #ifdef MODULE | 
|  | 740 | printk(KERN_INFO PFX "You can try agp_try_unsupported=1\n"); | 
|  | 741 | #else | 
|  | 742 | printk(KERN_INFO PFX "You can boot with agp=try_unsupported\n"); | 
|  | 743 | #endif | 
|  | 744 | return -ENODEV; | 
|  | 745 | } | 
|  | 746 |  | 
|  | 747 | /* First check that we have at least one AMD64 NB */ | 
|  | 748 | if (!pci_dev_present(amd64nb)) | 
|  | 749 | return -ENODEV; | 
|  | 750 |  | 
|  | 751 | /* Look for any AGP bridge */ | 
|  | 752 | dev = NULL; | 
|  | 753 | err = -ENODEV; | 
|  | 754 | for_each_pci_dev(dev) { | 
|  | 755 | if (!pci_find_capability(dev, PCI_CAP_ID_AGP)) | 
|  | 756 | continue; | 
|  | 757 | /* Only one bridge supported right now */ | 
|  | 758 | if (agp_amd64_probe(dev, NULL) == 0) { | 
|  | 759 | err = 0; | 
|  | 760 | break; | 
|  | 761 | } | 
|  | 762 | } | 
|  | 763 | } | 
|  | 764 | return err; | 
|  | 765 | } | 
|  | 766 |  | 
|  | 767 | static void __exit agp_amd64_cleanup(void) | 
|  | 768 | { | 
|  | 769 | if (aperture_resource) | 
|  | 770 | release_resource(aperture_resource); | 
|  | 771 | pci_unregister_driver(&agp_amd64_pci_driver); | 
|  | 772 | } | 
|  | 773 |  | 
|  | 774 | /* On AMD64 the PCI driver needs to initialize this driver early | 
|  | 775 | for the IOMMU, so it has to be called via a backdoor. */ | 
|  | 776 | #ifndef CONFIG_GART_IOMMU | 
|  | 777 | module_init(agp_amd64_init); | 
|  | 778 | module_exit(agp_amd64_cleanup); | 
|  | 779 | #endif | 
|  | 780 |  | 
|  | 781 | MODULE_AUTHOR("Dave Jones <davej@codemonkey.org.uk>, Andi Kleen"); | 
|  | 782 | module_param(agp_try_unsupported, bool, 0); | 
|  | 783 | MODULE_LICENSE("GPL"); |