11da177e4SLinus Torvalds /*
21da177e4SLinus Torvalds * For documentation on the i460 AGP interface, see Chapter 7 (AGP Subsystem) of
31da177e4SLinus Torvalds * the "Intel 460GTX Chipset Software Developer's Manual":
4631dd1a8SJustin P. Mattock * http://www.intel.com/design/archives/itanium/downloads/248704.htm
51da177e4SLinus Torvalds */
61da177e4SLinus Torvalds /*
71da177e4SLinus Torvalds * 460GX support by Chris Ahna <christopher.j.ahna@intel.com>
81da177e4SLinus Torvalds * Clean up & simplification by David Mosberger-Tang <davidm@hpl.hp.com>
91da177e4SLinus Torvalds */
101da177e4SLinus Torvalds #include <linux/module.h>
111da177e4SLinus Torvalds #include <linux/pci.h>
121da177e4SLinus Torvalds #include <linux/init.h>
134e57b681STim Schmielau #include <linux/string.h>
144e57b681STim Schmielau #include <linux/slab.h>
151da177e4SLinus Torvalds #include <linux/agp_backend.h>
16e57aa839SFengguang Wu #include <linux/log2.h>
171da177e4SLinus Torvalds
181da177e4SLinus Torvalds #include "agp.h"
191da177e4SLinus Torvalds
201da177e4SLinus Torvalds #define INTEL_I460_BAPBASE 0x98
211da177e4SLinus Torvalds #define INTEL_I460_GXBCTL 0xa0
221da177e4SLinus Torvalds #define INTEL_I460_AGPSIZ 0xa2
231da177e4SLinus Torvalds #define INTEL_I460_ATTBASE 0xfe200000
241da177e4SLinus Torvalds #define INTEL_I460_GATT_VALID (1UL << 24)
251da177e4SLinus Torvalds #define INTEL_I460_GATT_COHERENT (1UL << 25)
261da177e4SLinus Torvalds
271da177e4SLinus Torvalds /*
281da177e4SLinus Torvalds * The i460 can operate with large (4MB) pages, but there is no sane way to support this
291da177e4SLinus Torvalds * within the current kernel/DRM environment, so we disable the relevant code for now.
301da177e4SLinus Torvalds * See also comments in ia64_alloc_page()...
311da177e4SLinus Torvalds */
321da177e4SLinus Torvalds #define I460_LARGE_IO_PAGES 0
331da177e4SLinus Torvalds
341da177e4SLinus Torvalds #if I460_LARGE_IO_PAGES
351da177e4SLinus Torvalds # define I460_IO_PAGE_SHIFT i460.io_page_shift
361da177e4SLinus Torvalds #else
371da177e4SLinus Torvalds # define I460_IO_PAGE_SHIFT 12
381da177e4SLinus Torvalds #endif
391da177e4SLinus Torvalds
401da177e4SLinus Torvalds #define I460_IOPAGES_PER_KPAGE (PAGE_SIZE >> I460_IO_PAGE_SHIFT)
411da177e4SLinus Torvalds #define I460_KPAGES_PER_IOPAGE (1 << (I460_IO_PAGE_SHIFT - PAGE_SHIFT))
421da177e4SLinus Torvalds #define I460_SRAM_IO_DISABLE (1 << 4)
431da177e4SLinus Torvalds #define I460_BAPBASE_ENABLE (1 << 3)
441da177e4SLinus Torvalds #define I460_AGPSIZ_MASK 0x7
451da177e4SLinus Torvalds #define I460_4M_PS (1 << 1)
461da177e4SLinus Torvalds
471da177e4SLinus Torvalds /* Control bits for Out-Of-GART coherency and Burst Write Combining */
481da177e4SLinus Torvalds #define I460_GXBCTL_OOG (1UL << 0)
491da177e4SLinus Torvalds #define I460_GXBCTL_BWC (1UL << 2)
501da177e4SLinus Torvalds
511da177e4SLinus Torvalds /*
521da177e4SLinus Torvalds * gatt_table entries are 32-bits wide on the i460; the generic code ought to declare the
531da177e4SLinus Torvalds * gatt_table and gatt_table_real pointers a "void *"...
541da177e4SLinus Torvalds */
551da177e4SLinus Torvalds #define RD_GATT(index) readl((u32 *) i460.gatt + (index))
561da177e4SLinus Torvalds #define WR_GATT(index, val) writel((val), (u32 *) i460.gatt + (index))
571da177e4SLinus Torvalds /*
581da177e4SLinus Torvalds * The 460 spec says we have to read the last location written to make sure that all
591da177e4SLinus Torvalds * writes have taken effect
601da177e4SLinus Torvalds */
611da177e4SLinus Torvalds #define WR_FLUSH_GATT(index) RD_GATT(index)
621da177e4SLinus Torvalds
6307613ba2SDave Airlie static unsigned long i460_mask_memory (struct agp_bridge_data *bridge,
642a4ceb6dSDavid Woodhouse dma_addr_t addr, int type);
6507613ba2SDave Airlie
661da177e4SLinus Torvalds static struct {
671da177e4SLinus Torvalds void *gatt; /* ioremap'd GATT area */
681da177e4SLinus Torvalds
691da177e4SLinus Torvalds /* i460 supports multiple GART page sizes, so GART pageshift is dynamic: */
701da177e4SLinus Torvalds u8 io_page_shift;
711da177e4SLinus Torvalds
721da177e4SLinus Torvalds /* BIOS configures chipset to one of 2 possible apbase values: */
731da177e4SLinus Torvalds u8 dynamic_apbase;
741da177e4SLinus Torvalds
751da177e4SLinus Torvalds /* structure for tracking partial use of 4MB GART pages: */
761da177e4SLinus Torvalds struct lp_desc {
771da177e4SLinus Torvalds unsigned long *alloced_map; /* bitmap of kernel-pages in use */
781da177e4SLinus Torvalds int refcount; /* number of kernel pages using the large page */
791da177e4SLinus Torvalds u64 paddr; /* physical address of large page */
8007613ba2SDave Airlie struct page *page; /* page pointer */
811da177e4SLinus Torvalds } *lp_desc;
821da177e4SLinus Torvalds } i460;
831da177e4SLinus Torvalds
84e5524f35SDave Jones static const struct aper_size_info_8 i460_sizes[3] =
851da177e4SLinus Torvalds {
861da177e4SLinus Torvalds /*
871da177e4SLinus Torvalds * The 32GB aperture is only available with a 4M GART page size. Due to the
881da177e4SLinus Torvalds * dynamic GART page size, we can't figure out page_order or num_entries until
891da177e4SLinus Torvalds * runtime.
901da177e4SLinus Torvalds */
911da177e4SLinus Torvalds {32768, 0, 0, 4},
921da177e4SLinus Torvalds {1024, 0, 0, 2},
931da177e4SLinus Torvalds {256, 0, 0, 1}
941da177e4SLinus Torvalds };
951da177e4SLinus Torvalds
961da177e4SLinus Torvalds static struct gatt_mask i460_masks[] =
971da177e4SLinus Torvalds {
981da177e4SLinus Torvalds {
991da177e4SLinus Torvalds .mask = INTEL_I460_GATT_VALID | INTEL_I460_GATT_COHERENT,
1001da177e4SLinus Torvalds .type = 0
1011da177e4SLinus Torvalds }
1021da177e4SLinus Torvalds };
1031da177e4SLinus Torvalds
i460_fetch_size(void)1041da177e4SLinus Torvalds static int i460_fetch_size (void)
1051da177e4SLinus Torvalds {
1061da177e4SLinus Torvalds int i;
1071da177e4SLinus Torvalds u8 temp;
1081da177e4SLinus Torvalds struct aper_size_info_8 *values;
1091da177e4SLinus Torvalds
1101da177e4SLinus Torvalds /* Determine the GART page size */
1111da177e4SLinus Torvalds pci_read_config_byte(agp_bridge->dev, INTEL_I460_GXBCTL, &temp);
1121da177e4SLinus Torvalds i460.io_page_shift = (temp & I460_4M_PS) ? 22 : 12;
1131da177e4SLinus Torvalds pr_debug("i460_fetch_size: io_page_shift=%d\n", i460.io_page_shift);
1141da177e4SLinus Torvalds
1151da177e4SLinus Torvalds if (i460.io_page_shift != I460_IO_PAGE_SHIFT) {
1161da177e4SLinus Torvalds printk(KERN_ERR PFX
11749ebd7c6SAndrew Morton "I/O (GART) page-size %luKB doesn't match expected "
11849ebd7c6SAndrew Morton "size %luKB\n",
11949ebd7c6SAndrew Morton 1UL << (i460.io_page_shift - 10),
12049ebd7c6SAndrew Morton 1UL << (I460_IO_PAGE_SHIFT));
1211da177e4SLinus Torvalds return 0;
1221da177e4SLinus Torvalds }
1231da177e4SLinus Torvalds
1241da177e4SLinus Torvalds values = A_SIZE_8(agp_bridge->driver->aperture_sizes);
1251da177e4SLinus Torvalds
1261da177e4SLinus Torvalds pci_read_config_byte(agp_bridge->dev, INTEL_I460_AGPSIZ, &temp);
1271da177e4SLinus Torvalds
1281da177e4SLinus Torvalds /* Exit now if the IO drivers for the GART SRAMS are turned off */
1291da177e4SLinus Torvalds if (temp & I460_SRAM_IO_DISABLE) {
1301da177e4SLinus Torvalds printk(KERN_ERR PFX "GART SRAMS disabled on 460GX chipset\n");
1311da177e4SLinus Torvalds printk(KERN_ERR PFX "AGPGART operation not possible\n");
1321da177e4SLinus Torvalds return 0;
1331da177e4SLinus Torvalds }
1341da177e4SLinus Torvalds
1351da177e4SLinus Torvalds /* Make sure we don't try to create an 2 ^ 23 entry GATT */
1361da177e4SLinus Torvalds if ((i460.io_page_shift == 0) && ((temp & I460_AGPSIZ_MASK) == 4)) {
1371da177e4SLinus Torvalds printk(KERN_ERR PFX "We can't have a 32GB aperture with 4KB GART pages\n");
1381da177e4SLinus Torvalds return 0;
1391da177e4SLinus Torvalds }
1401da177e4SLinus Torvalds
1411da177e4SLinus Torvalds /* Determine the proper APBASE register */
1421da177e4SLinus Torvalds if (temp & I460_BAPBASE_ENABLE)
1431da177e4SLinus Torvalds i460.dynamic_apbase = INTEL_I460_BAPBASE;
1441da177e4SLinus Torvalds else
1451da177e4SLinus Torvalds i460.dynamic_apbase = AGP_APBASE;
1461da177e4SLinus Torvalds
1471da177e4SLinus Torvalds for (i = 0; i < agp_bridge->driver->num_aperture_sizes; i++) {
1481da177e4SLinus Torvalds /*
1491da177e4SLinus Torvalds * Dynamically calculate the proper num_entries and page_order values for
1501da177e4SLinus Torvalds * the define aperture sizes. Take care not to shift off the end of
1511da177e4SLinus Torvalds * values[i].size.
1521da177e4SLinus Torvalds */
1531da177e4SLinus Torvalds values[i].num_entries = (values[i].size << 8) >> (I460_IO_PAGE_SHIFT - 12);
154e57aa839SFengguang Wu values[i].page_order = ilog2((sizeof(u32)*values[i].num_entries) >> PAGE_SHIFT);
1551da177e4SLinus Torvalds }
1561da177e4SLinus Torvalds
1571da177e4SLinus Torvalds for (i = 0; i < agp_bridge->driver->num_aperture_sizes; i++) {
1581da177e4SLinus Torvalds /* Neglect control bits when matching up size_value */
1591da177e4SLinus Torvalds if ((temp & I460_AGPSIZ_MASK) == values[i].size_value) {
1601da177e4SLinus Torvalds agp_bridge->previous_size = agp_bridge->current_size = (void *) (values + i);
1611da177e4SLinus Torvalds agp_bridge->aperture_size_idx = i;
1621da177e4SLinus Torvalds return values[i].size;
1631da177e4SLinus Torvalds }
1641da177e4SLinus Torvalds }
1651da177e4SLinus Torvalds
1661da177e4SLinus Torvalds return 0;
1671da177e4SLinus Torvalds }
1681da177e4SLinus Torvalds
1691da177e4SLinus Torvalds /* There isn't anything to do here since 460 has no GART TLB. */
i460_tlb_flush(struct agp_memory * mem)1701da177e4SLinus Torvalds static void i460_tlb_flush (struct agp_memory *mem)
1711da177e4SLinus Torvalds {
1721da177e4SLinus Torvalds return;
1731da177e4SLinus Torvalds }
1741da177e4SLinus Torvalds
1751da177e4SLinus Torvalds /*
1761da177e4SLinus Torvalds * This utility function is needed to prevent corruption of the control bits
1771da177e4SLinus Torvalds * which are stored along with the aperture size in 460's AGPSIZ register
1781da177e4SLinus Torvalds */
i460_write_agpsiz(u8 size_value)1791da177e4SLinus Torvalds static void i460_write_agpsiz (u8 size_value)
1801da177e4SLinus Torvalds {
1811da177e4SLinus Torvalds u8 temp;
1821da177e4SLinus Torvalds
1831da177e4SLinus Torvalds pci_read_config_byte(agp_bridge->dev, INTEL_I460_AGPSIZ, &temp);
1841da177e4SLinus Torvalds pci_write_config_byte(agp_bridge->dev, INTEL_I460_AGPSIZ,
1851da177e4SLinus Torvalds ((temp & ~I460_AGPSIZ_MASK) | size_value));
1861da177e4SLinus Torvalds }
1871da177e4SLinus Torvalds
i460_cleanup(void)1881da177e4SLinus Torvalds static void i460_cleanup (void)
1891da177e4SLinus Torvalds {
1901da177e4SLinus Torvalds struct aper_size_info_8 *previous_size;
1911da177e4SLinus Torvalds
1921da177e4SLinus Torvalds previous_size = A_SIZE_8(agp_bridge->previous_size);
1931da177e4SLinus Torvalds i460_write_agpsiz(previous_size->size_value);
1941da177e4SLinus Torvalds
1951da177e4SLinus Torvalds if (I460_IO_PAGE_SHIFT > PAGE_SHIFT)
1961da177e4SLinus Torvalds kfree(i460.lp_desc);
1971da177e4SLinus Torvalds }
1981da177e4SLinus Torvalds
i460_configure(void)1991da177e4SLinus Torvalds static int i460_configure (void)
2001da177e4SLinus Torvalds {
2011da177e4SLinus Torvalds union {
2021da177e4SLinus Torvalds u32 small[2];
2031da177e4SLinus Torvalds u64 large;
2041da177e4SLinus Torvalds } temp;
2051da177e4SLinus Torvalds size_t size;
2061da177e4SLinus Torvalds u8 scratch;
2071da177e4SLinus Torvalds struct aper_size_info_8 *current_size;
2081da177e4SLinus Torvalds
2091da177e4SLinus Torvalds temp.large = 0;
2101da177e4SLinus Torvalds
2111da177e4SLinus Torvalds current_size = A_SIZE_8(agp_bridge->current_size);
2121da177e4SLinus Torvalds i460_write_agpsiz(current_size->size_value);
2131da177e4SLinus Torvalds
2141da177e4SLinus Torvalds /*
2151da177e4SLinus Torvalds * Do the necessary rigmarole to read all eight bytes of APBASE.
2161da177e4SLinus Torvalds * This has to be done since the AGP aperture can be above 4GB on
2171da177e4SLinus Torvalds * 460 based systems.
2181da177e4SLinus Torvalds */
2191da177e4SLinus Torvalds pci_read_config_dword(agp_bridge->dev, i460.dynamic_apbase, &(temp.small[0]));
2201da177e4SLinus Torvalds pci_read_config_dword(agp_bridge->dev, i460.dynamic_apbase + 4, &(temp.small[1]));
2211da177e4SLinus Torvalds
2221da177e4SLinus Torvalds /* Clear BAR control bits */
2231da177e4SLinus Torvalds agp_bridge->gart_bus_addr = temp.large & ~((1UL << 3) - 1);
2241da177e4SLinus Torvalds
2251da177e4SLinus Torvalds pci_read_config_byte(agp_bridge->dev, INTEL_I460_GXBCTL, &scratch);
2261da177e4SLinus Torvalds pci_write_config_byte(agp_bridge->dev, INTEL_I460_GXBCTL,
2271da177e4SLinus Torvalds (scratch & 0x02) | I460_GXBCTL_OOG | I460_GXBCTL_BWC);
2281da177e4SLinus Torvalds
2291da177e4SLinus Torvalds /*
2301da177e4SLinus Torvalds * Initialize partial allocation trackers if a GART page is bigger than a kernel
2311da177e4SLinus Torvalds * page.
2321da177e4SLinus Torvalds */
2331da177e4SLinus Torvalds if (I460_IO_PAGE_SHIFT > PAGE_SHIFT) {
2341da177e4SLinus Torvalds size = current_size->num_entries * sizeof(i460.lp_desc[0]);
2350ea27d9fSDave Jones i460.lp_desc = kzalloc(size, GFP_KERNEL);
2361da177e4SLinus Torvalds if (!i460.lp_desc)
2371da177e4SLinus Torvalds return -ENOMEM;
2381da177e4SLinus Torvalds }
2391da177e4SLinus Torvalds return 0;
2401da177e4SLinus Torvalds }
2411da177e4SLinus Torvalds
i460_create_gatt_table(struct agp_bridge_data * bridge)2421da177e4SLinus Torvalds static int i460_create_gatt_table (struct agp_bridge_data *bridge)
2431da177e4SLinus Torvalds {
2441da177e4SLinus Torvalds int page_order, num_entries, i;
2451da177e4SLinus Torvalds void *temp;
2461da177e4SLinus Torvalds
2471da177e4SLinus Torvalds /*
2481da177e4SLinus Torvalds * Load up the fixed address of the GART SRAMS which hold our GATT table.
2491da177e4SLinus Torvalds */
2501da177e4SLinus Torvalds temp = agp_bridge->current_size;
2511da177e4SLinus Torvalds page_order = A_SIZE_8(temp)->page_order;
2521da177e4SLinus Torvalds num_entries = A_SIZE_8(temp)->num_entries;
2531da177e4SLinus Torvalds
2541da177e4SLinus Torvalds i460.gatt = ioremap(INTEL_I460_ATTBASE, PAGE_SIZE << page_order);
2555bdbc7dcSScott Thompson if (!i460.gatt) {
2565bdbc7dcSScott Thompson printk(KERN_ERR PFX "ioremap failed\n");
2575bdbc7dcSScott Thompson return -ENOMEM;
2585bdbc7dcSScott Thompson }
2591da177e4SLinus Torvalds
2601da177e4SLinus Torvalds /* These are no good, the should be removed from the agp_bridge strucure... */
2611da177e4SLinus Torvalds agp_bridge->gatt_table_real = NULL;
2621da177e4SLinus Torvalds agp_bridge->gatt_table = NULL;
2631da177e4SLinus Torvalds agp_bridge->gatt_bus_addr = 0;
2641da177e4SLinus Torvalds
2651da177e4SLinus Torvalds for (i = 0; i < num_entries; ++i)
2661da177e4SLinus Torvalds WR_GATT(i, 0);
2671da177e4SLinus Torvalds WR_FLUSH_GATT(i - 1);
2681da177e4SLinus Torvalds return 0;
2691da177e4SLinus Torvalds }
2701da177e4SLinus Torvalds
i460_free_gatt_table(struct agp_bridge_data * bridge)2711da177e4SLinus Torvalds static int i460_free_gatt_table (struct agp_bridge_data *bridge)
2721da177e4SLinus Torvalds {
2731da177e4SLinus Torvalds int num_entries, i;
2741da177e4SLinus Torvalds void *temp;
2751da177e4SLinus Torvalds
2761da177e4SLinus Torvalds temp = agp_bridge->current_size;
2771da177e4SLinus Torvalds
2781da177e4SLinus Torvalds num_entries = A_SIZE_8(temp)->num_entries;
2791da177e4SLinus Torvalds
2801da177e4SLinus Torvalds for (i = 0; i < num_entries; ++i)
2811da177e4SLinus Torvalds WR_GATT(i, 0);
2821da177e4SLinus Torvalds WR_FLUSH_GATT(num_entries - 1);
2831da177e4SLinus Torvalds
2841da177e4SLinus Torvalds iounmap(i460.gatt);
2851da177e4SLinus Torvalds return 0;
2861da177e4SLinus Torvalds }
2871da177e4SLinus Torvalds
2881da177e4SLinus Torvalds /*
2891da177e4SLinus Torvalds * The following functions are called when the I/O (GART) page size is smaller than
2901da177e4SLinus Torvalds * PAGE_SIZE.
2911da177e4SLinus Torvalds */
2921da177e4SLinus Torvalds
i460_insert_memory_small_io_page(struct agp_memory * mem,off_t pg_start,int type)2931da177e4SLinus Torvalds static int i460_insert_memory_small_io_page (struct agp_memory *mem,
2941da177e4SLinus Torvalds off_t pg_start, int type)
2951da177e4SLinus Torvalds {
2961da177e4SLinus Torvalds unsigned long paddr, io_pg_start, io_page_size;
2971da177e4SLinus Torvalds int i, j, k, num_entries;
2981da177e4SLinus Torvalds void *temp;
2991da177e4SLinus Torvalds
3001da177e4SLinus Torvalds pr_debug("i460_insert_memory_small_io_page(mem=%p, pg_start=%ld, type=%d, paddr0=0x%lx)\n",
30107613ba2SDave Airlie mem, pg_start, type, page_to_phys(mem->pages[0]));
3021da177e4SLinus Torvalds
303a030ce44SThomas Hellstrom if (type >= AGP_USER_TYPES || mem->type >= AGP_USER_TYPES)
304a030ce44SThomas Hellstrom return -EINVAL;
305a030ce44SThomas Hellstrom
3061da177e4SLinus Torvalds io_pg_start = I460_IOPAGES_PER_KPAGE * pg_start;
3071da177e4SLinus Torvalds
3081da177e4SLinus Torvalds temp = agp_bridge->current_size;
3091da177e4SLinus Torvalds num_entries = A_SIZE_8(temp)->num_entries;
3101da177e4SLinus Torvalds
3111da177e4SLinus Torvalds if ((io_pg_start + I460_IOPAGES_PER_KPAGE * mem->page_count) > num_entries) {
3121da177e4SLinus Torvalds printk(KERN_ERR PFX "Looks like we're out of AGP memory\n");
3131da177e4SLinus Torvalds return -EINVAL;
3141da177e4SLinus Torvalds }
3151da177e4SLinus Torvalds
3161da177e4SLinus Torvalds j = io_pg_start;
3171da177e4SLinus Torvalds while (j < (io_pg_start + I460_IOPAGES_PER_KPAGE * mem->page_count)) {
3181da177e4SLinus Torvalds if (!PGE_EMPTY(agp_bridge, RD_GATT(j))) {
3191da177e4SLinus Torvalds pr_debug("i460_insert_memory_small_io_page: GATT[%d]=0x%x is busy\n",
3201da177e4SLinus Torvalds j, RD_GATT(j));
3211da177e4SLinus Torvalds return -EBUSY;
3221da177e4SLinus Torvalds }
3231da177e4SLinus Torvalds j++;
3241da177e4SLinus Torvalds }
3251da177e4SLinus Torvalds
3261da177e4SLinus Torvalds io_page_size = 1UL << I460_IO_PAGE_SHIFT;
3271da177e4SLinus Torvalds for (i = 0, j = io_pg_start; i < mem->page_count; i++) {
3286a12235cSDavid Woodhouse paddr = page_to_phys(mem->pages[i]);
3291da177e4SLinus Torvalds for (k = 0; k < I460_IOPAGES_PER_KPAGE; k++, j++, paddr += io_page_size)
33007613ba2SDave Airlie WR_GATT(j, i460_mask_memory(agp_bridge, paddr, mem->type));
3311da177e4SLinus Torvalds }
3321da177e4SLinus Torvalds WR_FLUSH_GATT(j - 1);
3331da177e4SLinus Torvalds return 0;
3341da177e4SLinus Torvalds }
3351da177e4SLinus Torvalds
i460_remove_memory_small_io_page(struct agp_memory * mem,off_t pg_start,int type)3361da177e4SLinus Torvalds static int i460_remove_memory_small_io_page(struct agp_memory *mem,
3371da177e4SLinus Torvalds off_t pg_start, int type)
3381da177e4SLinus Torvalds {
3391da177e4SLinus Torvalds int i;
3401da177e4SLinus Torvalds
3411da177e4SLinus Torvalds pr_debug("i460_remove_memory_small_io_page(mem=%p, pg_start=%ld, type=%d)\n",
3421da177e4SLinus Torvalds mem, pg_start, type);
3431da177e4SLinus Torvalds
3441da177e4SLinus Torvalds pg_start = I460_IOPAGES_PER_KPAGE * pg_start;
3451da177e4SLinus Torvalds
3461da177e4SLinus Torvalds for (i = pg_start; i < (pg_start + I460_IOPAGES_PER_KPAGE * mem->page_count); i++)
3471da177e4SLinus Torvalds WR_GATT(i, 0);
3481da177e4SLinus Torvalds WR_FLUSH_GATT(i - 1);
3491da177e4SLinus Torvalds return 0;
3501da177e4SLinus Torvalds }
3511da177e4SLinus Torvalds
3521da177e4SLinus Torvalds #if I460_LARGE_IO_PAGES
3531da177e4SLinus Torvalds
3541da177e4SLinus Torvalds /*
3551da177e4SLinus Torvalds * These functions are called when the I/O (GART) page size exceeds PAGE_SIZE.
3561da177e4SLinus Torvalds *
3571da177e4SLinus Torvalds * This situation is interesting since AGP memory allocations that are smaller than a
3581da177e4SLinus Torvalds * single GART page are possible. The i460.lp_desc array tracks partial allocation of the
3591da177e4SLinus Torvalds * large GART pages to work around this issue.
3601da177e4SLinus Torvalds *
3611da177e4SLinus Torvalds * i460.lp_desc[pg_num].refcount tracks the number of kernel pages in use within GART page
3621da177e4SLinus Torvalds * pg_num. i460.lp_desc[pg_num].paddr is the physical address of the large page and
3631da177e4SLinus Torvalds * i460.lp_desc[pg_num].alloced_map is a bitmap of kernel pages that are in use (allocated).
3641da177e4SLinus Torvalds */
3651da177e4SLinus Torvalds
i460_alloc_large_page(struct lp_desc * lp)3661da177e4SLinus Torvalds static int i460_alloc_large_page (struct lp_desc *lp)
3671da177e4SLinus Torvalds {
3681da177e4SLinus Torvalds unsigned long order = I460_IO_PAGE_SHIFT - PAGE_SHIFT;
3691da177e4SLinus Torvalds size_t map_size;
3701da177e4SLinus Torvalds
37107613ba2SDave Airlie lp->page = alloc_pages(GFP_KERNEL, order);
37207613ba2SDave Airlie if (!lp->page) {
3731da177e4SLinus Torvalds printk(KERN_ERR PFX "Couldn't alloc 4M GART page...\n");
3741da177e4SLinus Torvalds return -ENOMEM;
3751da177e4SLinus Torvalds }
3761da177e4SLinus Torvalds
3771da177e4SLinus Torvalds map_size = ((I460_KPAGES_PER_IOPAGE + BITS_PER_LONG - 1) & -BITS_PER_LONG)/8;
3780ea27d9fSDave Jones lp->alloced_map = kzalloc(map_size, GFP_KERNEL);
3791da177e4SLinus Torvalds if (!lp->alloced_map) {
38007613ba2SDave Airlie __free_pages(lp->page, order);
3811da177e4SLinus Torvalds printk(KERN_ERR PFX "Out of memory, we're in trouble...\n");
3821da177e4SLinus Torvalds return -ENOMEM;
3831da177e4SLinus Torvalds }
3841da177e4SLinus Torvalds
3856a12235cSDavid Woodhouse lp->paddr = page_to_phys(lp->page);
3861da177e4SLinus Torvalds lp->refcount = 0;
3871da177e4SLinus Torvalds atomic_add(I460_KPAGES_PER_IOPAGE, &agp_bridge->current_memory_agp);
3881da177e4SLinus Torvalds return 0;
3891da177e4SLinus Torvalds }
3901da177e4SLinus Torvalds
i460_free_large_page(struct lp_desc * lp)3911da177e4SLinus Torvalds static void i460_free_large_page (struct lp_desc *lp)
3921da177e4SLinus Torvalds {
3931da177e4SLinus Torvalds kfree(lp->alloced_map);
3941da177e4SLinus Torvalds lp->alloced_map = NULL;
3951da177e4SLinus Torvalds
39607613ba2SDave Airlie __free_pages(lp->page, I460_IO_PAGE_SHIFT - PAGE_SHIFT);
3971da177e4SLinus Torvalds atomic_sub(I460_KPAGES_PER_IOPAGE, &agp_bridge->current_memory_agp);
3981da177e4SLinus Torvalds }
3991da177e4SLinus Torvalds
i460_insert_memory_large_io_page(struct agp_memory * mem,off_t pg_start,int type)4001da177e4SLinus Torvalds static int i460_insert_memory_large_io_page (struct agp_memory *mem,
4011da177e4SLinus Torvalds off_t pg_start, int type)
4021da177e4SLinus Torvalds {
4031da177e4SLinus Torvalds int i, start_offset, end_offset, idx, pg, num_entries;
4041da177e4SLinus Torvalds struct lp_desc *start, *end, *lp;
4051da177e4SLinus Torvalds void *temp;
4061da177e4SLinus Torvalds
407a030ce44SThomas Hellstrom if (type >= AGP_USER_TYPES || mem->type >= AGP_USER_TYPES)
408a030ce44SThomas Hellstrom return -EINVAL;
409a030ce44SThomas Hellstrom
4101da177e4SLinus Torvalds temp = agp_bridge->current_size;
4111da177e4SLinus Torvalds num_entries = A_SIZE_8(temp)->num_entries;
4121da177e4SLinus Torvalds
4131da177e4SLinus Torvalds /* Figure out what pg_start means in terms of our large GART pages */
4141da177e4SLinus Torvalds start = &i460.lp_desc[pg_start / I460_KPAGES_PER_IOPAGE];
4151da177e4SLinus Torvalds end = &i460.lp_desc[(pg_start + mem->page_count - 1) / I460_KPAGES_PER_IOPAGE];
4161da177e4SLinus Torvalds start_offset = pg_start % I460_KPAGES_PER_IOPAGE;
4171da177e4SLinus Torvalds end_offset = (pg_start + mem->page_count - 1) % I460_KPAGES_PER_IOPAGE;
4181da177e4SLinus Torvalds
4191da177e4SLinus Torvalds if (end > i460.lp_desc + num_entries) {
4201da177e4SLinus Torvalds printk(KERN_ERR PFX "Looks like we're out of AGP memory\n");
4211da177e4SLinus Torvalds return -EINVAL;
4221da177e4SLinus Torvalds }
4231da177e4SLinus Torvalds
4241da177e4SLinus Torvalds /* Check if the requested region of the aperture is free */
4251da177e4SLinus Torvalds for (lp = start; lp <= end; ++lp) {
4261da177e4SLinus Torvalds if (!lp->alloced_map)
4271da177e4SLinus Torvalds continue; /* OK, the entire large page is available... */
4281da177e4SLinus Torvalds
4291da177e4SLinus Torvalds for (idx = ((lp == start) ? start_offset : 0);
4301da177e4SLinus Torvalds idx < ((lp == end) ? (end_offset + 1) : I460_KPAGES_PER_IOPAGE);
4311da177e4SLinus Torvalds idx++)
4321da177e4SLinus Torvalds {
4331da177e4SLinus Torvalds if (test_bit(idx, lp->alloced_map))
4341da177e4SLinus Torvalds return -EBUSY;
4351da177e4SLinus Torvalds }
4361da177e4SLinus Torvalds }
4371da177e4SLinus Torvalds
4381da177e4SLinus Torvalds for (lp = start, i = 0; lp <= end; ++lp) {
4391da177e4SLinus Torvalds if (!lp->alloced_map) {
4401da177e4SLinus Torvalds /* Allocate new GART pages... */
4411da177e4SLinus Torvalds if (i460_alloc_large_page(lp) < 0)
4421da177e4SLinus Torvalds return -ENOMEM;
4431da177e4SLinus Torvalds pg = lp - i460.lp_desc;
44407613ba2SDave Airlie WR_GATT(pg, i460_mask_memory(agp_bridge,
4451da177e4SLinus Torvalds lp->paddr, 0));
4461da177e4SLinus Torvalds WR_FLUSH_GATT(pg);
4471da177e4SLinus Torvalds }
4481da177e4SLinus Torvalds
4491da177e4SLinus Torvalds for (idx = ((lp == start) ? start_offset : 0);
4501da177e4SLinus Torvalds idx < ((lp == end) ? (end_offset + 1) : I460_KPAGES_PER_IOPAGE);
4511da177e4SLinus Torvalds idx++, i++)
4521da177e4SLinus Torvalds {
45307613ba2SDave Airlie mem->pages[i] = lp->page;
4541da177e4SLinus Torvalds __set_bit(idx, lp->alloced_map);
4551da177e4SLinus Torvalds ++lp->refcount;
4561da177e4SLinus Torvalds }
4571da177e4SLinus Torvalds }
4581da177e4SLinus Torvalds return 0;
4591da177e4SLinus Torvalds }
4601da177e4SLinus Torvalds
i460_remove_memory_large_io_page(struct agp_memory * mem,off_t pg_start,int type)4611da177e4SLinus Torvalds static int i460_remove_memory_large_io_page (struct agp_memory *mem,
4621da177e4SLinus Torvalds off_t pg_start, int type)
4631da177e4SLinus Torvalds {
4641da177e4SLinus Torvalds int i, pg, start_offset, end_offset, idx, num_entries;
4651da177e4SLinus Torvalds struct lp_desc *start, *end, *lp;
4661da177e4SLinus Torvalds void *temp;
4671da177e4SLinus Torvalds
46807613ba2SDave Airlie temp = agp_bridge->current_size;
4691da177e4SLinus Torvalds num_entries = A_SIZE_8(temp)->num_entries;
4701da177e4SLinus Torvalds
4711da177e4SLinus Torvalds /* Figure out what pg_start means in terms of our large GART pages */
4721da177e4SLinus Torvalds start = &i460.lp_desc[pg_start / I460_KPAGES_PER_IOPAGE];
4731da177e4SLinus Torvalds end = &i460.lp_desc[(pg_start + mem->page_count - 1) / I460_KPAGES_PER_IOPAGE];
4741da177e4SLinus Torvalds start_offset = pg_start % I460_KPAGES_PER_IOPAGE;
4751da177e4SLinus Torvalds end_offset = (pg_start + mem->page_count - 1) % I460_KPAGES_PER_IOPAGE;
4761da177e4SLinus Torvalds
4771da177e4SLinus Torvalds for (i = 0, lp = start; lp <= end; ++lp) {
4781da177e4SLinus Torvalds for (idx = ((lp == start) ? start_offset : 0);
4791da177e4SLinus Torvalds idx < ((lp == end) ? (end_offset + 1) : I460_KPAGES_PER_IOPAGE);
4801da177e4SLinus Torvalds idx++, i++)
4811da177e4SLinus Torvalds {
48207613ba2SDave Airlie mem->pages[i] = NULL;
4831da177e4SLinus Torvalds __clear_bit(idx, lp->alloced_map);
4841da177e4SLinus Torvalds --lp->refcount;
4851da177e4SLinus Torvalds }
4861da177e4SLinus Torvalds
4871da177e4SLinus Torvalds /* Free GART pages if they are unused */
4881da177e4SLinus Torvalds if (lp->refcount == 0) {
4891da177e4SLinus Torvalds pg = lp - i460.lp_desc;
4901da177e4SLinus Torvalds WR_GATT(pg, 0);
4911da177e4SLinus Torvalds WR_FLUSH_GATT(pg);
4921da177e4SLinus Torvalds i460_free_large_page(lp);
4931da177e4SLinus Torvalds }
4941da177e4SLinus Torvalds }
4951da177e4SLinus Torvalds return 0;
4961da177e4SLinus Torvalds }
4971da177e4SLinus Torvalds
4981da177e4SLinus Torvalds /* Wrapper routines to call the approriate {small_io_page,large_io_page} function */
4991da177e4SLinus Torvalds
i460_insert_memory(struct agp_memory * mem,off_t pg_start,int type)5001da177e4SLinus Torvalds static int i460_insert_memory (struct agp_memory *mem,
5011da177e4SLinus Torvalds off_t pg_start, int type)
5021da177e4SLinus Torvalds {
5031da177e4SLinus Torvalds if (I460_IO_PAGE_SHIFT <= PAGE_SHIFT)
5041da177e4SLinus Torvalds return i460_insert_memory_small_io_page(mem, pg_start, type);
5051da177e4SLinus Torvalds else
5061da177e4SLinus Torvalds return i460_insert_memory_large_io_page(mem, pg_start, type);
5071da177e4SLinus Torvalds }
5081da177e4SLinus Torvalds
i460_remove_memory(struct agp_memory * mem,off_t pg_start,int type)5091da177e4SLinus Torvalds static int i460_remove_memory (struct agp_memory *mem,
5101da177e4SLinus Torvalds off_t pg_start, int type)
5111da177e4SLinus Torvalds {
5121da177e4SLinus Torvalds if (I460_IO_PAGE_SHIFT <= PAGE_SHIFT)
5131da177e4SLinus Torvalds return i460_remove_memory_small_io_page(mem, pg_start, type);
5141da177e4SLinus Torvalds else
5151da177e4SLinus Torvalds return i460_remove_memory_large_io_page(mem, pg_start, type);
5161da177e4SLinus Torvalds }
5171da177e4SLinus Torvalds
5181da177e4SLinus Torvalds /*
5191da177e4SLinus Torvalds * If the I/O (GART) page size is bigger than the kernel page size, we don't want to
5201da177e4SLinus Torvalds * allocate memory until we know where it is to be bound in the aperture (a
5211da177e4SLinus Torvalds * multi-kernel-page alloc might fit inside of an already allocated GART page).
5221da177e4SLinus Torvalds *
5231da177e4SLinus Torvalds * Let's just hope nobody counts on the allocated AGP memory being there before bind time
5241da177e4SLinus Torvalds * (I don't think current drivers do)...
5251da177e4SLinus Torvalds */
i460_alloc_page(struct agp_bridge_data * bridge)52607613ba2SDave Airlie static struct page *i460_alloc_page (struct agp_bridge_data *bridge)
5271da177e4SLinus Torvalds {
5281da177e4SLinus Torvalds void *page;
5291da177e4SLinus Torvalds
53088d51967SAlan Hourihane if (I460_IO_PAGE_SHIFT <= PAGE_SHIFT) {
5311da177e4SLinus Torvalds page = agp_generic_alloc_page(agp_bridge);
53288d51967SAlan Hourihane } else
5331da177e4SLinus Torvalds /* Returning NULL would cause problems */
5341da177e4SLinus Torvalds /* AK: really dubious code. */
5351da177e4SLinus Torvalds page = (void *)~0UL;
5361da177e4SLinus Torvalds return page;
5371da177e4SLinus Torvalds }
5381da177e4SLinus Torvalds
i460_destroy_page(struct page * page,int flags)53907613ba2SDave Airlie static void i460_destroy_page (struct page *page, int flags)
5401da177e4SLinus Torvalds {
54188d51967SAlan Hourihane if (I460_IO_PAGE_SHIFT <= PAGE_SHIFT) {
542a2721e99SDave Airlie agp_generic_destroy_page(page, flags);
54388d51967SAlan Hourihane }
5441da177e4SLinus Torvalds }
5451da177e4SLinus Torvalds
5461da177e4SLinus Torvalds #endif /* I460_LARGE_IO_PAGES */
5471da177e4SLinus Torvalds
i460_mask_memory(struct agp_bridge_data * bridge,dma_addr_t addr,int type)5481da177e4SLinus Torvalds static unsigned long i460_mask_memory (struct agp_bridge_data *bridge,
5492a4ceb6dSDavid Woodhouse dma_addr_t addr, int type)
5501da177e4SLinus Torvalds {
5511da177e4SLinus Torvalds /* Make sure the returned address is a valid GATT entry */
5521da177e4SLinus Torvalds return bridge->driver->masks[0].mask
55349ebd7c6SAndrew Morton | (((addr & ~((1 << I460_IO_PAGE_SHIFT) - 1)) & 0xfffff000) >> 12);
5541da177e4SLinus Torvalds }
5551da177e4SLinus Torvalds
556e047d1cfSRyusuke Konishi const struct agp_bridge_driver intel_i460_driver = {
5571da177e4SLinus Torvalds .owner = THIS_MODULE,
5581da177e4SLinus Torvalds .aperture_sizes = i460_sizes,
5591da177e4SLinus Torvalds .size_type = U8_APER_SIZE,
5601da177e4SLinus Torvalds .num_aperture_sizes = 3,
5611da177e4SLinus Torvalds .configure = i460_configure,
5621da177e4SLinus Torvalds .fetch_size = i460_fetch_size,
5631da177e4SLinus Torvalds .cleanup = i460_cleanup,
5641da177e4SLinus Torvalds .tlb_flush = i460_tlb_flush,
5652a4ceb6dSDavid Woodhouse .mask_memory = i460_mask_memory,
5661da177e4SLinus Torvalds .masks = i460_masks,
5671da177e4SLinus Torvalds .agp_enable = agp_generic_enable,
5681da177e4SLinus Torvalds .cache_flush = global_cache_flush,
5691da177e4SLinus Torvalds .create_gatt_table = i460_create_gatt_table,
5701da177e4SLinus Torvalds .free_gatt_table = i460_free_gatt_table,
5711da177e4SLinus Torvalds #if I460_LARGE_IO_PAGES
5721da177e4SLinus Torvalds .insert_memory = i460_insert_memory,
5731da177e4SLinus Torvalds .remove_memory = i460_remove_memory,
5741da177e4SLinus Torvalds .agp_alloc_page = i460_alloc_page,
5751da177e4SLinus Torvalds .agp_destroy_page = i460_destroy_page,
5761da177e4SLinus Torvalds #else
5771da177e4SLinus Torvalds .insert_memory = i460_insert_memory_small_io_page,
5781da177e4SLinus Torvalds .remove_memory = i460_remove_memory_small_io_page,
5791da177e4SLinus Torvalds .agp_alloc_page = agp_generic_alloc_page,
5805f310b63SRene Herman .agp_alloc_pages = agp_generic_alloc_pages,
5811da177e4SLinus Torvalds .agp_destroy_page = agp_generic_destroy_page,
5825f310b63SRene Herman .agp_destroy_pages = agp_generic_destroy_pages,
5831da177e4SLinus Torvalds #endif
5841da177e4SLinus Torvalds .alloc_by_type = agp_generic_alloc_by_type,
5851da177e4SLinus Torvalds .free_by_type = agp_generic_free_by_type,
586a030ce44SThomas Hellstrom .agp_type_to_mask_type = agp_generic_type_to_mask_type,
587c7258012SJoe Perches .cant_use_aperture = true,
5881da177e4SLinus Torvalds };
5891da177e4SLinus Torvalds
agp_intel_i460_probe(struct pci_dev * pdev,const struct pci_device_id * ent)590bcd2982aSGreg Kroah-Hartman static int agp_intel_i460_probe(struct pci_dev *pdev,
5911da177e4SLinus Torvalds const struct pci_device_id *ent)
5921da177e4SLinus Torvalds {
5931da177e4SLinus Torvalds struct agp_bridge_data *bridge;
5941da177e4SLinus Torvalds u8 cap_ptr;
5951da177e4SLinus Torvalds
5961da177e4SLinus Torvalds cap_ptr = pci_find_capability(pdev, PCI_CAP_ID_AGP);
5971da177e4SLinus Torvalds if (!cap_ptr)
5981da177e4SLinus Torvalds return -ENODEV;
5991da177e4SLinus Torvalds
6001da177e4SLinus Torvalds bridge = agp_alloc_bridge();
6011da177e4SLinus Torvalds if (!bridge)
6021da177e4SLinus Torvalds return -ENOMEM;
6031da177e4SLinus Torvalds
6041da177e4SLinus Torvalds bridge->driver = &intel_i460_driver;
6051da177e4SLinus Torvalds bridge->dev = pdev;
6061da177e4SLinus Torvalds bridge->capndx = cap_ptr;
6071da177e4SLinus Torvalds
6081da177e4SLinus Torvalds printk(KERN_INFO PFX "Detected Intel 460GX chipset\n");
6091da177e4SLinus Torvalds
6101da177e4SLinus Torvalds pci_set_drvdata(pdev, bridge);
6111da177e4SLinus Torvalds return agp_add_bridge(bridge);
6121da177e4SLinus Torvalds }
6131da177e4SLinus Torvalds
agp_intel_i460_remove(struct pci_dev * pdev)61439af33fcSBill Pemberton static void agp_intel_i460_remove(struct pci_dev *pdev)
6151da177e4SLinus Torvalds {
6161da177e4SLinus Torvalds struct agp_bridge_data *bridge = pci_get_drvdata(pdev);
6171da177e4SLinus Torvalds
6181da177e4SLinus Torvalds agp_remove_bridge(bridge);
6191da177e4SLinus Torvalds agp_put_bridge(bridge);
6201da177e4SLinus Torvalds }
6211da177e4SLinus Torvalds
6221da177e4SLinus Torvalds static struct pci_device_id agp_intel_i460_pci_table[] = {
6231da177e4SLinus Torvalds {
6241da177e4SLinus Torvalds .class = (PCI_CLASS_BRIDGE_HOST << 8),
6251da177e4SLinus Torvalds .class_mask = ~0,
6261da177e4SLinus Torvalds .vendor = PCI_VENDOR_ID_INTEL,
6271da177e4SLinus Torvalds .device = PCI_DEVICE_ID_INTEL_84460GX,
6281da177e4SLinus Torvalds .subvendor = PCI_ANY_ID,
6291da177e4SLinus Torvalds .subdevice = PCI_ANY_ID,
6301da177e4SLinus Torvalds },
6311da177e4SLinus Torvalds { }
6321da177e4SLinus Torvalds };
6331da177e4SLinus Torvalds
6341da177e4SLinus Torvalds MODULE_DEVICE_TABLE(pci, agp_intel_i460_pci_table);
6351da177e4SLinus Torvalds
6361da177e4SLinus Torvalds static struct pci_driver agp_intel_i460_pci_driver = {
6371da177e4SLinus Torvalds .name = "agpgart-intel-i460",
6381da177e4SLinus Torvalds .id_table = agp_intel_i460_pci_table,
6391da177e4SLinus Torvalds .probe = agp_intel_i460_probe,
640bcd2982aSGreg Kroah-Hartman .remove = agp_intel_i460_remove,
6411da177e4SLinus Torvalds };
6421da177e4SLinus Torvalds
agp_intel_i460_init(void)6431da177e4SLinus Torvalds static int __init agp_intel_i460_init(void)
6441da177e4SLinus Torvalds {
6451da177e4SLinus Torvalds if (agp_off)
6461da177e4SLinus Torvalds return -EINVAL;
6471da177e4SLinus Torvalds return pci_register_driver(&agp_intel_i460_pci_driver);
6481da177e4SLinus Torvalds }
6491da177e4SLinus Torvalds
agp_intel_i460_cleanup(void)6501da177e4SLinus Torvalds static void __exit agp_intel_i460_cleanup(void)
6511da177e4SLinus Torvalds {
6521da177e4SLinus Torvalds pci_unregister_driver(&agp_intel_i460_pci_driver);
6531da177e4SLinus Torvalds }
6541da177e4SLinus Torvalds
6551da177e4SLinus Torvalds module_init(agp_intel_i460_init);
6561da177e4SLinus Torvalds module_exit(agp_intel_i460_cleanup);
6571da177e4SLinus Torvalds
6581da177e4SLinus Torvalds MODULE_AUTHOR("Chris Ahna <Christopher.J.Ahna@intel.com>");
6591da177e4SLinus Torvalds MODULE_LICENSE("GPL and additional rights");
660