/*
 * Intel GTT (Graphics Translation Table) routines
 *
 * Caveat: This driver implements the linux agp interface, but this is far from
 * an agp driver! GTT support ended up here for purely historical reasons: The
 * old userspace intel graphics drivers needed an interface to map memory into
 * the GTT. And the drm provides a default interface for graphic devices sitting
 * on an agp port. So it made sense to fake the GTT support as an agp port to
 * avoid having to create a new api.
 *
 * With gem this does not make much sense anymore, it just needlessly complicates
 * the code. But as long as the old graphics stack is still supported, it's stuck
 * here.
 *
 * /fairy-tale-mode off
 */
18 #include <linux/module.h>
19 #include <linux/pci.h>
20 #include <linux/init.h>
21 #include <linux/kernel.h>
22 #include <linux/pagemap.h>
23 #include <linux/agp_backend.h>
24 #include <linux/delay.h>
27 #include "intel-agp.h"
28 #include <drm/intel-gtt.h>
31 * If we have Intel graphics, we're not going to have anything other than
32 * an Intel IOMMU. So make the correct use of the PCI DMA API contingent
33 * on the Intel IOMMU support (CONFIG_INTEL_IOMMU).
34 * Only newer chipsets need to bother with this, of course.
36 #ifdef CONFIG_INTEL_IOMMU
37 #define USE_PCI_DMA_API 1
39 #define USE_PCI_DMA_API 0
42 struct intel_gtt_driver {
44 unsigned int is_g33 : 1;
45 unsigned int is_pineview : 1;
46 unsigned int is_ironlake : 1;
47 unsigned int has_pgtbl_enable : 1;
48 unsigned int dma_mask_size : 8;
49 /* Chipset specific GTT setup */
51 /* This should undo anything done in ->setup() save the unmapping
52 * of the mmio register file, that's done in the generic code. */
53 void (*cleanup)(void);
54 void (*write_entry)(dma_addr_t addr, unsigned int entry, unsigned int flags);
55 /* Flags is a more or less chipset specific opaque value.
56 * For chipsets that need to support old ums (non-gem) code, this
57 * needs to be identical to the various supported agp memory types! */
58 bool (*check_flags)(unsigned int flags);
59 void (*chipset_flush)(void);
62 static struct _intel_private {
63 struct intel_gtt base;
64 const struct intel_gtt_driver *driver;
65 struct pci_dev *pcidev; /* device one */
66 struct pci_dev *bridge_dev;
67 u8 __iomem *registers;
68 phys_addr_t gtt_bus_addr;
69 phys_addr_t gma_bus_addr;
71 u32 __iomem *gtt; /* I915G */
72 bool clear_fake_agp; /* on first access via agp, fill with scratch */
73 int num_dcache_entries;
74 void __iomem *i9xx_flush_page;
76 struct resource ifp_resource;
78 struct page *scratch_page;
81 #define INTEL_GTT_GEN intel_private.driver->gen
82 #define IS_G33 intel_private.driver->is_g33
83 #define IS_PINEVIEW intel_private.driver->is_pineview
84 #define IS_IRONLAKE intel_private.driver->is_ironlake
85 #define HAS_PGTBL_EN intel_private.driver->has_pgtbl_enable
87 int intel_gtt_map_memory(struct page **pages, unsigned int num_entries,
88 struct scatterlist **sg_list, int *num_sg)
91 struct scatterlist *sg;
95 return 0; /* already mapped (for e.g. resume */
97 DBG("try mapping %lu pages\n", (unsigned long)num_entries);
99 if (sg_alloc_table(&st, num_entries, GFP_KERNEL))
102 *sg_list = sg = st.sgl;
104 for (i = 0 ; i < num_entries; i++, sg = sg_next(sg))
105 sg_set_page(sg, pages[i], PAGE_SIZE, 0);
107 *num_sg = pci_map_sg(intel_private.pcidev, *sg_list,
108 num_entries, PCI_DMA_BIDIRECTIONAL);
109 if (unlikely(!*num_sg))
118 EXPORT_SYMBOL(intel_gtt_map_memory);
120 void intel_gtt_unmap_memory(struct scatterlist *sg_list, int num_sg)
123 DBG("try unmapping %lu pages\n", (unsigned long)mem->page_count);
125 pci_unmap_sg(intel_private.pcidev, sg_list,
126 num_sg, PCI_DMA_BIDIRECTIONAL);
129 st.orig_nents = st.nents = num_sg;
133 EXPORT_SYMBOL(intel_gtt_unmap_memory);
135 static void intel_fake_agp_enable(struct agp_bridge_data *bridge, u32 mode)
140 /* Exists to support ARGB cursors */
141 static struct page *i8xx_alloc_pages(void)
145 page = alloc_pages(GFP_KERNEL | GFP_DMA32, 2);
150 if (xen_create_contiguous_region((unsigned long)page_address(page), 2, 32)) {
151 __free_pages(page, 2);
156 if (set_pages_uc(page, 4) < 0) {
157 set_pages_wb(page, 4);
159 xen_destroy_contiguous_region((unsigned long)page_address(page),
162 __free_pages(page, 2);
166 atomic_inc(&agp_bridge->current_memory_agp);
170 static void i8xx_destroy_pages(struct page *page)
175 set_pages_wb(page, 4);
177 xen_destroy_contiguous_region((unsigned long)page_address(page), 2);
180 __free_pages(page, 2);
181 atomic_dec(&agp_bridge->current_memory_agp);
184 #define I810_GTT_ORDER 4
185 static int i810_setup(void)
190 /* i81x does not preallocate the gtt. It's always 64kb in size. */
191 gtt_table = alloc_gatt_pages(I810_GTT_ORDER);
192 if (gtt_table == NULL)
194 intel_private.i81x_gtt_table = gtt_table;
196 pci_read_config_dword(intel_private.pcidev, I810_MMADDR, ®_addr);
197 reg_addr &= 0xfff80000;
199 intel_private.registers = ioremap(reg_addr, KB(64));
200 if (!intel_private.registers)
203 writel(virt_to_phys(gtt_table) | I810_PGETBL_ENABLED,
204 intel_private.registers+I810_PGETBL_CTL);
206 intel_private.gtt_bus_addr = reg_addr + I810_PTE_BASE;
208 if ((readl(intel_private.registers+I810_DRAM_CTL)
209 & I810_DRAM_ROW_0) == I810_DRAM_ROW_0_SDRAM) {
210 dev_info(&intel_private.pcidev->dev,
211 "detected 4MB dedicated video ram\n");
212 intel_private.num_dcache_entries = 1024;
218 static void i810_cleanup(void)
220 writel(0, intel_private.registers+I810_PGETBL_CTL);
221 free_gatt_pages(intel_private.i81x_gtt_table, I810_GTT_ORDER);
224 static int i810_insert_dcache_entries(struct agp_memory *mem, off_t pg_start,
229 if ((pg_start + mem->page_count)
230 > intel_private.num_dcache_entries)
233 if (!mem->is_flushed)
234 global_cache_flush();
236 for (i = pg_start; i < (pg_start + mem->page_count); i++) {
237 dma_addr_t addr = i << PAGE_SHIFT;
238 intel_private.driver->write_entry(addr,
241 readl(intel_private.gtt+i-1);
247 * The i810/i830 requires a physical address to program its mouse
248 * pointer into hardware.
249 * However the Xserver still writes to it through the agp aperture.
251 static struct agp_memory *alloc_agpphysmem_i8xx(size_t pg_count, int type)
253 struct agp_memory *new;
257 case 1: page = agp_bridge->driver->agp_alloc_page(agp_bridge);
260 /* kludge to get 4 physical pages for ARGB cursor */
261 page = i8xx_alloc_pages();
270 new = agp_create_memory(pg_count);
274 new->pages[0] = page;
276 /* kludge to get 4 physical pages for ARGB cursor */
277 new->pages[1] = new->pages[0] + 1;
278 new->pages[2] = new->pages[1] + 1;
279 new->pages[3] = new->pages[2] + 1;
281 new->page_count = pg_count;
282 new->num_scratch_pages = pg_count;
283 new->type = AGP_PHYS_MEMORY;
285 new->physical = page_to_phys(new->pages[0]);
287 new->physical = page_to_pseudophys(new->pages[0]);
292 static void intel_i810_free_by_type(struct agp_memory *curr)
294 agp_free_key(curr->key);
295 if (curr->type == AGP_PHYS_MEMORY) {
296 if (curr->page_count == 4)
297 i8xx_destroy_pages(curr->pages[0]);
299 agp_bridge->driver->agp_destroy_page(curr->pages[0],
300 AGP_PAGE_DESTROY_UNMAP);
301 agp_bridge->driver->agp_destroy_page(curr->pages[0],
302 AGP_PAGE_DESTROY_FREE);
304 agp_free_page_array(curr);
309 static int intel_gtt_setup_scratch_page(void)
314 page = alloc_page(GFP_KERNEL | GFP_DMA32 | __GFP_ZERO);
318 set_pages_uc(page, 1);
320 if (intel_private.base.needs_dmar) {
321 dma_addr = pci_map_page(intel_private.pcidev, page, 0,
322 PAGE_SIZE, PCI_DMA_BIDIRECTIONAL);
323 if (pci_dma_mapping_error(intel_private.pcidev, dma_addr))
326 intel_private.base.scratch_page_dma = dma_addr;
328 intel_private.base.scratch_page_dma = page_to_phys(page);
330 intel_private.scratch_page = page;
335 static void i810_write_entry(dma_addr_t addr, unsigned int entry,
338 u32 pte_flags = I810_PTE_VALID;
341 case AGP_DCACHE_MEMORY:
342 pte_flags |= I810_PTE_LOCAL;
344 case AGP_USER_CACHED_MEMORY:
345 pte_flags |= I830_PTE_SYSTEM_CACHED;
349 writel(addr | pte_flags, intel_private.gtt + entry);
352 static const struct aper_size_info_fixed intel_fake_agp_sizes[] = {
360 static unsigned int intel_gtt_stolen_size(void)
365 static const int ddt[4] = { 0, 16, 32, 64 };
366 unsigned int stolen_size = 0;
368 if (INTEL_GTT_GEN == 1)
369 return 0; /* no stolen mem on i81x */
371 pci_read_config_word(intel_private.bridge_dev,
372 I830_GMCH_CTRL, &gmch_ctrl);
374 if (intel_private.bridge_dev->device == PCI_DEVICE_ID_INTEL_82830_HB ||
375 intel_private.bridge_dev->device == PCI_DEVICE_ID_INTEL_82845G_HB) {
376 switch (gmch_ctrl & I830_GMCH_GMS_MASK) {
377 case I830_GMCH_GMS_STOLEN_512:
378 stolen_size = KB(512);
380 case I830_GMCH_GMS_STOLEN_1024:
383 case I830_GMCH_GMS_STOLEN_8192:
386 case I830_GMCH_GMS_LOCAL:
387 rdct = readb(intel_private.registers+I830_RDRAM_CHANNEL_TYPE);
388 stolen_size = (I830_RDRAM_ND(rdct) + 1) *
389 MB(ddt[I830_RDRAM_DDT(rdct)]);
396 } else if (INTEL_GTT_GEN == 6) {
398 * SandyBridge has new memory control reg at 0x50.w
401 pci_read_config_word(intel_private.pcidev, SNB_GMCH_CTRL, &snb_gmch_ctl);
402 switch (snb_gmch_ctl & SNB_GMCH_GMS_STOLEN_MASK) {
403 case SNB_GMCH_GMS_STOLEN_32M:
404 stolen_size = MB(32);
406 case SNB_GMCH_GMS_STOLEN_64M:
407 stolen_size = MB(64);
409 case SNB_GMCH_GMS_STOLEN_96M:
410 stolen_size = MB(96);
412 case SNB_GMCH_GMS_STOLEN_128M:
413 stolen_size = MB(128);
415 case SNB_GMCH_GMS_STOLEN_160M:
416 stolen_size = MB(160);
418 case SNB_GMCH_GMS_STOLEN_192M:
419 stolen_size = MB(192);
421 case SNB_GMCH_GMS_STOLEN_224M:
422 stolen_size = MB(224);
424 case SNB_GMCH_GMS_STOLEN_256M:
425 stolen_size = MB(256);
427 case SNB_GMCH_GMS_STOLEN_288M:
428 stolen_size = MB(288);
430 case SNB_GMCH_GMS_STOLEN_320M:
431 stolen_size = MB(320);
433 case SNB_GMCH_GMS_STOLEN_352M:
434 stolen_size = MB(352);
436 case SNB_GMCH_GMS_STOLEN_384M:
437 stolen_size = MB(384);
439 case SNB_GMCH_GMS_STOLEN_416M:
440 stolen_size = MB(416);
442 case SNB_GMCH_GMS_STOLEN_448M:
443 stolen_size = MB(448);
445 case SNB_GMCH_GMS_STOLEN_480M:
446 stolen_size = MB(480);
448 case SNB_GMCH_GMS_STOLEN_512M:
449 stolen_size = MB(512);
453 switch (gmch_ctrl & I855_GMCH_GMS_MASK) {
454 case I855_GMCH_GMS_STOLEN_1M:
457 case I855_GMCH_GMS_STOLEN_4M:
460 case I855_GMCH_GMS_STOLEN_8M:
463 case I855_GMCH_GMS_STOLEN_16M:
464 stolen_size = MB(16);
466 case I855_GMCH_GMS_STOLEN_32M:
467 stolen_size = MB(32);
469 case I915_GMCH_GMS_STOLEN_48M:
470 stolen_size = MB(48);
472 case I915_GMCH_GMS_STOLEN_64M:
473 stolen_size = MB(64);
475 case G33_GMCH_GMS_STOLEN_128M:
476 stolen_size = MB(128);
478 case G33_GMCH_GMS_STOLEN_256M:
479 stolen_size = MB(256);
481 case INTEL_GMCH_GMS_STOLEN_96M:
482 stolen_size = MB(96);
484 case INTEL_GMCH_GMS_STOLEN_160M:
485 stolen_size = MB(160);
487 case INTEL_GMCH_GMS_STOLEN_224M:
488 stolen_size = MB(224);
490 case INTEL_GMCH_GMS_STOLEN_352M:
491 stolen_size = MB(352);
499 if (stolen_size > 0) {
500 dev_info(&intel_private.bridge_dev->dev, "detected %dK %s memory\n",
501 stolen_size / KB(1), local ? "local" : "stolen");
503 dev_info(&intel_private.bridge_dev->dev,
504 "no pre-allocated video memory detected\n");
511 static void i965_adjust_pgetbl_size(unsigned int size_flag)
513 u32 pgetbl_ctl, pgetbl_ctl2;
515 /* ensure that ppgtt is disabled */
516 pgetbl_ctl2 = readl(intel_private.registers+I965_PGETBL_CTL2);
517 pgetbl_ctl2 &= ~I810_PGETBL_ENABLED;
518 writel(pgetbl_ctl2, intel_private.registers+I965_PGETBL_CTL2);
520 /* write the new ggtt size */
521 pgetbl_ctl = readl(intel_private.registers+I810_PGETBL_CTL);
522 pgetbl_ctl &= ~I965_PGETBL_SIZE_MASK;
523 pgetbl_ctl |= size_flag;
524 writel(pgetbl_ctl, intel_private.registers+I810_PGETBL_CTL);
527 static unsigned int i965_gtt_total_entries(void)
533 pci_read_config_word(intel_private.bridge_dev,
534 I830_GMCH_CTRL, &gmch_ctl);
536 if (INTEL_GTT_GEN == 5) {
537 switch (gmch_ctl & G4x_GMCH_SIZE_MASK) {
538 case G4x_GMCH_SIZE_1M:
539 case G4x_GMCH_SIZE_VT_1M:
540 i965_adjust_pgetbl_size(I965_PGETBL_SIZE_1MB);
542 case G4x_GMCH_SIZE_VT_1_5M:
543 i965_adjust_pgetbl_size(I965_PGETBL_SIZE_1_5MB);
545 case G4x_GMCH_SIZE_2M:
546 case G4x_GMCH_SIZE_VT_2M:
547 i965_adjust_pgetbl_size(I965_PGETBL_SIZE_2MB);
552 pgetbl_ctl = readl(intel_private.registers+I810_PGETBL_CTL);
554 switch (pgetbl_ctl & I965_PGETBL_SIZE_MASK) {
555 case I965_PGETBL_SIZE_128KB:
558 case I965_PGETBL_SIZE_256KB:
561 case I965_PGETBL_SIZE_512KB:
564 /* GTT pagetable sizes bigger than 512KB are not possible on G33! */
565 case I965_PGETBL_SIZE_1MB:
568 case I965_PGETBL_SIZE_2MB:
571 case I965_PGETBL_SIZE_1_5MB:
572 size = KB(1024 + 512);
575 dev_info(&intel_private.pcidev->dev,
576 "unknown page table size, assuming 512KB\n");
583 static unsigned int intel_gtt_total_entries(void)
587 if (IS_G33 || INTEL_GTT_GEN == 4 || INTEL_GTT_GEN == 5)
588 return i965_gtt_total_entries();
589 else if (INTEL_GTT_GEN == 6) {
592 pci_read_config_word(intel_private.pcidev, SNB_GMCH_CTRL, &snb_gmch_ctl);
593 switch (snb_gmch_ctl & SNB_GTT_SIZE_MASK) {
595 case SNB_GTT_SIZE_0M:
596 printk(KERN_ERR "Bad GTT size mask: 0x%04x.\n", snb_gmch_ctl);
599 case SNB_GTT_SIZE_1M:
602 case SNB_GTT_SIZE_2M:
608 /* On previous hardware, the GTT size was just what was
609 * required to map the aperture.
611 return intel_private.base.gtt_mappable_entries;
615 static unsigned int intel_gtt_mappable_entries(void)
617 unsigned int aperture_size;
619 if (INTEL_GTT_GEN == 1) {
622 pci_read_config_dword(intel_private.bridge_dev,
623 I810_SMRAM_MISCC, &smram_miscc);
625 if ((smram_miscc & I810_GFX_MEM_WIN_SIZE)
626 == I810_GFX_MEM_WIN_32M)
627 aperture_size = MB(32);
629 aperture_size = MB(64);
630 } else if (INTEL_GTT_GEN == 2) {
633 pci_read_config_word(intel_private.bridge_dev,
634 I830_GMCH_CTRL, &gmch_ctrl);
636 if ((gmch_ctrl & I830_GMCH_MEM_MASK) == I830_GMCH_MEM_64M)
637 aperture_size = MB(64);
639 aperture_size = MB(128);
641 /* 9xx supports large sizes, just look at the length */
642 aperture_size = pci_resource_len(intel_private.pcidev, 2);
645 return aperture_size >> PAGE_SHIFT;
648 static void intel_gtt_teardown_scratch_page(void)
650 set_pages_wb(intel_private.scratch_page, 1);
651 pci_unmap_page(intel_private.pcidev, intel_private.base.scratch_page_dma,
652 PAGE_SIZE, PCI_DMA_BIDIRECTIONAL);
653 put_page(intel_private.scratch_page);
654 __free_page(intel_private.scratch_page);
657 static void intel_gtt_cleanup(void)
659 intel_private.driver->cleanup();
661 iounmap(intel_private.gtt);
662 iounmap(intel_private.registers);
664 intel_gtt_teardown_scratch_page();
667 static int intel_gtt_init(void)
672 ret = intel_private.driver->setup();
676 intel_private.base.gtt_mappable_entries = intel_gtt_mappable_entries();
677 intel_private.base.gtt_total_entries = intel_gtt_total_entries();
679 /* save the PGETBL reg for resume */
680 intel_private.PGETBL_save =
681 readl(intel_private.registers+I810_PGETBL_CTL)
682 & ~I810_PGETBL_ENABLED;
683 /* we only ever restore the register when enabling the PGTBL... */
685 intel_private.PGETBL_save |= I810_PGETBL_ENABLED;
687 dev_info(&intel_private.bridge_dev->dev,
688 "detected gtt size: %dK total, %dK mappable\n",
689 intel_private.base.gtt_total_entries * 4,
690 intel_private.base.gtt_mappable_entries * 4);
692 gtt_map_size = intel_private.base.gtt_total_entries * 4;
694 intel_private.gtt = ioremap(intel_private.gtt_bus_addr,
696 if (!intel_private.gtt) {
697 intel_private.driver->cleanup();
698 iounmap(intel_private.registers);
701 intel_private.base.gtt = intel_private.gtt;
703 global_cache_flush(); /* FIXME: ? */
705 intel_private.base.stolen_size = intel_gtt_stolen_size();
707 intel_private.base.needs_dmar = USE_PCI_DMA_API && INTEL_GTT_GEN > 2;
709 ret = intel_gtt_setup_scratch_page();
718 static int intel_fake_agp_fetch_size(void)
720 int num_sizes = ARRAY_SIZE(intel_fake_agp_sizes);
721 unsigned int aper_size;
724 aper_size = (intel_private.base.gtt_mappable_entries << PAGE_SHIFT)
727 for (i = 0; i < num_sizes; i++) {
728 if (aper_size == intel_fake_agp_sizes[i].size) {
729 agp_bridge->current_size =
730 (void *) (intel_fake_agp_sizes + i);
738 static void i830_cleanup(void)
742 /* The chipset_flush interface needs to get data that has already been
743 * flushed out of the CPU all the way out to main memory, because the GPU
744 * doesn't snoop those buffers.
746 * The 8xx series doesn't have the same lovely interface for flushing the
747 * chipset write buffers that the later chips do. According to the 865
748 * specs, it's 64 octwords, or 1KB. So, to get those previous things in
749 * that buffer out, we just fill 1KB and clflush it out, on the assumption
750 * that it'll push whatever was in there out. It appears to work.
752 static void i830_chipset_flush(void)
754 unsigned long timeout = jiffies + msecs_to_jiffies(1000);
756 /* Forcibly evict everything from the CPU write buffers.
757 * clflush appears to be insufficient.
759 wbinvd_on_all_cpus();
761 /* Now we've only seen documents for this magic bit on 855GM,
762 * we hope it exists for the other gen2 chipsets...
764 * Also works as advertised on my 845G.
766 writel(readl(intel_private.registers+I830_HIC) | (1<<31),
767 intel_private.registers+I830_HIC);
769 while (readl(intel_private.registers+I830_HIC) & (1<<31)) {
770 if (time_after(jiffies, timeout))
777 static void i830_write_entry(dma_addr_t addr, unsigned int entry,
780 u32 pte_flags = I810_PTE_VALID;
782 if (flags == AGP_USER_CACHED_MEMORY)
783 pte_flags |= I830_PTE_SYSTEM_CACHED;
785 writel(addr | pte_flags, intel_private.gtt + entry);
788 static bool intel_enable_gtt(void)
793 if (INTEL_GTT_GEN <= 2)
794 pci_read_config_dword(intel_private.pcidev, I810_GMADDR,
797 pci_read_config_dword(intel_private.pcidev, I915_GMADDR,
800 intel_private.gma_bus_addr = (gma_addr & PCI_BASE_ADDRESS_MEM_MASK);
802 if (INTEL_GTT_GEN >= 6)
805 if (INTEL_GTT_GEN == 2) {
808 pci_read_config_word(intel_private.bridge_dev,
809 I830_GMCH_CTRL, &gmch_ctrl);
810 gmch_ctrl |= I830_GMCH_ENABLED;
811 pci_write_config_word(intel_private.bridge_dev,
812 I830_GMCH_CTRL, gmch_ctrl);
814 pci_read_config_word(intel_private.bridge_dev,
815 I830_GMCH_CTRL, &gmch_ctrl);
816 if ((gmch_ctrl & I830_GMCH_ENABLED) == 0) {
817 dev_err(&intel_private.pcidev->dev,
818 "failed to enable the GTT: GMCH_CTRL=%x\n",
824 /* On the resume path we may be adjusting the PGTBL value, so
825 * be paranoid and flush all chipset write buffers...
827 if (INTEL_GTT_GEN >= 3)
828 writel(0, intel_private.registers+GFX_FLSH_CNTL);
830 reg = intel_private.registers+I810_PGETBL_CTL;
831 writel(intel_private.PGETBL_save, reg);
832 if (HAS_PGTBL_EN && (readl(reg) & I810_PGETBL_ENABLED) == 0) {
833 dev_err(&intel_private.pcidev->dev,
834 "failed to enable the GTT: PGETBL=%x [expected %x]\n",
835 readl(reg), intel_private.PGETBL_save);
839 if (INTEL_GTT_GEN >= 3)
840 writel(0, intel_private.registers+GFX_FLSH_CNTL);
845 static int i830_setup(void)
849 pci_read_config_dword(intel_private.pcidev, I810_MMADDR, ®_addr);
850 reg_addr &= 0xfff80000;
852 intel_private.registers = ioremap(reg_addr, KB(64));
853 if (!intel_private.registers)
856 intel_private.gtt_bus_addr = reg_addr + I810_PTE_BASE;
861 static int intel_fake_agp_create_gatt_table(struct agp_bridge_data *bridge)
863 agp_bridge->gatt_table_real = NULL;
864 agp_bridge->gatt_table = NULL;
865 agp_bridge->gatt_bus_addr = 0;
870 static int intel_fake_agp_free_gatt_table(struct agp_bridge_data *bridge)
875 static int intel_fake_agp_configure(void)
877 if (!intel_enable_gtt())
880 intel_private.clear_fake_agp = true;
881 agp_bridge->gart_bus_addr = intel_private.gma_bus_addr;
886 static bool i830_check_flags(unsigned int flags)
890 case AGP_PHYS_MEMORY:
891 case AGP_USER_CACHED_MEMORY:
892 case AGP_USER_MEMORY:
899 void intel_gtt_insert_sg_entries(struct scatterlist *sg_list,
901 unsigned int pg_start,
904 struct scatterlist *sg;
910 /* sg may merge pages, but we have to separate
911 * per-page addr for GTT */
912 for_each_sg(sg_list, sg, sg_len, i) {
913 len = sg_dma_len(sg) >> PAGE_SHIFT;
914 for (m = 0; m < len; m++) {
915 dma_addr_t addr = sg_dma_address(sg) + (m << PAGE_SHIFT);
916 intel_private.driver->write_entry(addr,
921 readl(intel_private.gtt+j-1);
923 EXPORT_SYMBOL(intel_gtt_insert_sg_entries);
925 void intel_gtt_insert_pages(unsigned int first_entry, unsigned int num_entries,
926 struct page **pages, unsigned int flags)
930 for (i = 0, j = first_entry; i < num_entries; i++, j++) {
931 dma_addr_t addr = page_to_phys(pages[i]);
932 intel_private.driver->write_entry(addr,
935 readl(intel_private.gtt+j-1);
937 EXPORT_SYMBOL(intel_gtt_insert_pages);
939 static int intel_fake_agp_insert_entries(struct agp_memory *mem,
940 off_t pg_start, int type)
944 if (intel_private.base.do_idle_maps)
947 if (intel_private.clear_fake_agp) {
948 int start = intel_private.base.stolen_size / PAGE_SIZE;
949 int end = intel_private.base.gtt_mappable_entries;
950 intel_gtt_clear_range(start, end - start);
951 intel_private.clear_fake_agp = false;
954 if (INTEL_GTT_GEN == 1 && type == AGP_DCACHE_MEMORY)
955 return i810_insert_dcache_entries(mem, pg_start, type);
957 if (mem->page_count == 0)
960 if (pg_start + mem->page_count > intel_private.base.gtt_total_entries)
963 if (type != mem->type)
966 if (!intel_private.driver->check_flags(type))
969 if (!mem->is_flushed)
970 global_cache_flush();
972 if (intel_private.base.needs_dmar) {
973 ret = intel_gtt_map_memory(mem->pages, mem->page_count,
974 &mem->sg_list, &mem->num_sg);
978 intel_gtt_insert_sg_entries(mem->sg_list, mem->num_sg,
981 intel_gtt_insert_pages(pg_start, mem->page_count, mem->pages,
987 mem->is_flushed = true;
991 void intel_gtt_clear_range(unsigned int first_entry, unsigned int num_entries)
995 for (i = first_entry; i < (first_entry + num_entries); i++) {
996 intel_private.driver->write_entry(intel_private.base.scratch_page_dma,
999 readl(intel_private.gtt+i-1);
1001 EXPORT_SYMBOL(intel_gtt_clear_range);
1003 static int intel_fake_agp_remove_entries(struct agp_memory *mem,
1004 off_t pg_start, int type)
1006 if (mem->page_count == 0)
1009 if (intel_private.base.do_idle_maps)
1012 intel_gtt_clear_range(pg_start, mem->page_count);
1014 if (intel_private.base.needs_dmar) {
1015 intel_gtt_unmap_memory(mem->sg_list, mem->num_sg);
1016 mem->sg_list = NULL;
1023 static struct agp_memory *intel_fake_agp_alloc_by_type(size_t pg_count,
1026 struct agp_memory *new;
1028 if (type == AGP_DCACHE_MEMORY && INTEL_GTT_GEN == 1) {
1029 if (pg_count != intel_private.num_dcache_entries)
1032 new = agp_create_memory(1);
1036 new->type = AGP_DCACHE_MEMORY;
1037 new->page_count = pg_count;
1038 new->num_scratch_pages = 0;
1039 agp_free_page_array(new);
1042 if (type == AGP_PHYS_MEMORY)
1043 return alloc_agpphysmem_i8xx(pg_count, type);
1044 /* always return NULL for other allocation types for now */
1048 static int intel_alloc_chipset_flush_resource(void)
1051 ret = pci_bus_alloc_resource(intel_private.bridge_dev->bus, &intel_private.ifp_resource, PAGE_SIZE,
1052 PAGE_SIZE, PCIBIOS_MIN_MEM, 0,
1053 pcibios_align_resource, intel_private.bridge_dev);
1058 static void intel_i915_setup_chipset_flush(void)
1063 pci_read_config_dword(intel_private.bridge_dev, I915_IFPADDR, &temp);
1064 if (!(temp & 0x1)) {
1065 intel_alloc_chipset_flush_resource();
1066 intel_private.resource_valid = 1;
1067 pci_write_config_dword(intel_private.bridge_dev, I915_IFPADDR, (intel_private.ifp_resource.start & 0xffffffff) | 0x1);
1071 intel_private.resource_valid = 1;
1072 intel_private.ifp_resource.start = temp;
1073 intel_private.ifp_resource.end = temp + PAGE_SIZE;
1074 ret = request_resource(&iomem_resource, &intel_private.ifp_resource);
1075 /* some BIOSes reserve this area in a pnp some don't */
1077 intel_private.resource_valid = 0;
1081 static void intel_i965_g33_setup_chipset_flush(void)
1083 u32 temp_hi, temp_lo;
1086 pci_read_config_dword(intel_private.bridge_dev, I965_IFPADDR + 4, &temp_hi);
1087 pci_read_config_dword(intel_private.bridge_dev, I965_IFPADDR, &temp_lo);
1089 if (!(temp_lo & 0x1)) {
1091 intel_alloc_chipset_flush_resource();
1093 intel_private.resource_valid = 1;
1094 pci_write_config_dword(intel_private.bridge_dev, I965_IFPADDR + 4,
1095 upper_32_bits(intel_private.ifp_resource.start));
1096 pci_write_config_dword(intel_private.bridge_dev, I965_IFPADDR, (intel_private.ifp_resource.start & 0xffffffff) | 0x1);
1101 l64 = ((u64)temp_hi << 32) | temp_lo;
1103 intel_private.resource_valid = 1;
1104 intel_private.ifp_resource.start = l64;
1105 intel_private.ifp_resource.end = l64 + PAGE_SIZE;
1106 ret = request_resource(&iomem_resource, &intel_private.ifp_resource);
1107 /* some BIOSes reserve this area in a pnp some don't */
1109 intel_private.resource_valid = 0;
1113 static void intel_i9xx_setup_flush(void)
1115 /* return if already configured */
1116 if (intel_private.ifp_resource.start)
1119 if (INTEL_GTT_GEN == 6)
1122 /* setup a resource for this object */
1123 intel_private.ifp_resource.name = "Intel Flush Page";
1124 intel_private.ifp_resource.flags = IORESOURCE_MEM;
1126 /* Setup chipset flush for 915 */
1127 if (IS_G33 || INTEL_GTT_GEN >= 4) {
1128 intel_i965_g33_setup_chipset_flush();
1130 intel_i915_setup_chipset_flush();
1133 if (intel_private.ifp_resource.start)
1134 intel_private.i9xx_flush_page = ioremap_nocache(intel_private.ifp_resource.start, PAGE_SIZE);
1135 if (!intel_private.i9xx_flush_page)
1136 dev_err(&intel_private.pcidev->dev,
1137 "can't ioremap flush page - no chipset flushing\n");
1140 static void i9xx_cleanup(void)
1142 if (intel_private.i9xx_flush_page)
1143 iounmap(intel_private.i9xx_flush_page);
1144 if (intel_private.resource_valid)
1145 release_resource(&intel_private.ifp_resource);
1146 intel_private.ifp_resource.start = 0;
1147 intel_private.resource_valid = 0;
1150 static void i9xx_chipset_flush(void)
1152 if (intel_private.i9xx_flush_page)
1153 writel(1, intel_private.i9xx_flush_page);
1156 static void i965_write_entry(dma_addr_t addr,
1162 pte_flags = I810_PTE_VALID;
1163 if (flags == AGP_USER_CACHED_MEMORY)
1164 pte_flags |= I830_PTE_SYSTEM_CACHED;
1166 /* Shift high bits down */
1167 addr |= (addr >> 28) & 0xf0;
1168 writel(addr | pte_flags, intel_private.gtt + entry);
1171 static bool gen6_check_flags(unsigned int flags)
1176 static void gen6_write_entry(dma_addr_t addr, unsigned int entry,
1179 unsigned int type_mask = flags & ~AGP_USER_CACHED_MEMORY_GFDT;
1180 unsigned int gfdt = flags & AGP_USER_CACHED_MEMORY_GFDT;
1183 if (type_mask == AGP_USER_MEMORY)
1184 pte_flags = GEN6_PTE_UNCACHED | I810_PTE_VALID;
1185 else if (type_mask == AGP_USER_CACHED_MEMORY_LLC_MLC) {
1186 pte_flags = GEN6_PTE_LLC_MLC | I810_PTE_VALID;
1188 pte_flags |= GEN6_PTE_GFDT;
1189 } else { /* set 'normal'/'cached' to LLC by default */
1190 pte_flags = GEN6_PTE_LLC | I810_PTE_VALID;
1192 pte_flags |= GEN6_PTE_GFDT;
1195 /* gen6 has bit11-4 for physical addr bit39-32 */
1196 addr |= (addr >> 28) & 0xff0;
1197 writel(addr | pte_flags, intel_private.gtt + entry);
1200 static void gen6_cleanup(void)
/* Certain Gen5 chipsets require idling the GPU before
 * unmapping anything from the GTT when VT-d is enabled.
 */
/*
 * Return 1 when the device is one of the mobile Ironlake IDs checked below
 * and intel_iommu_gfx_mapped is set, 0 otherwise (always 0 without
 * CONFIG_INTEL_IOMMU).
 */
static inline int needs_idle_maps(void)
{
#ifdef CONFIG_INTEL_IOMMU
	const unsigned short devid = intel_private.pcidev->device;
	const int is_ironlake_m = devid == PCI_DEVICE_ID_INTEL_IRONLAKE_M_HB ||
				  devid == PCI_DEVICE_ID_INTEL_IRONLAKE_M_IG;

	/* Query intel_iommu to see if we need the workaround. */
	if (is_ironlake_m && intel_iommu_gfx_mapped)
		return 1;
#endif
	return 0;
}
1223 static int i9xx_setup(void)
1227 pci_read_config_dword(intel_private.pcidev, I915_MMADDR, ®_addr);
1229 reg_addr &= 0xfff80000;
1231 intel_private.registers = ioremap(reg_addr, 128 * 4096);
1232 if (!intel_private.registers)
1235 if (INTEL_GTT_GEN == 3) {
1238 pci_read_config_dword(intel_private.pcidev,
1239 I915_PTEADDR, >t_addr);
1240 intel_private.gtt_bus_addr = gtt_addr;
1244 switch (INTEL_GTT_GEN) {
1251 gtt_offset = KB(512);
1254 intel_private.gtt_bus_addr = reg_addr + gtt_offset;
1257 if (needs_idle_maps())
1258 intel_private.base.do_idle_maps = 1;
1260 intel_i9xx_setup_flush();
1265 static const struct agp_bridge_driver intel_fake_agp_driver = {
1266 .owner = THIS_MODULE,
1267 .size_type = FIXED_APER_SIZE,
1268 .aperture_sizes = intel_fake_agp_sizes,
1269 .num_aperture_sizes = ARRAY_SIZE(intel_fake_agp_sizes),
1270 .configure = intel_fake_agp_configure,
1271 .fetch_size = intel_fake_agp_fetch_size,
1272 .cleanup = intel_gtt_cleanup,
1273 .agp_enable = intel_fake_agp_enable,
1274 .cache_flush = global_cache_flush,
1275 .create_gatt_table = intel_fake_agp_create_gatt_table,
1276 .free_gatt_table = intel_fake_agp_free_gatt_table,
1277 .insert_memory = intel_fake_agp_insert_entries,
1278 .remove_memory = intel_fake_agp_remove_entries,
1279 .alloc_by_type = intel_fake_agp_alloc_by_type,
1280 .free_by_type = intel_i810_free_by_type,
1281 .agp_alloc_page = agp_generic_alloc_page,
1282 .agp_alloc_pages = agp_generic_alloc_pages,
1283 .agp_destroy_page = agp_generic_destroy_page,
1284 .agp_destroy_pages = agp_generic_destroy_pages,
1287 static const struct intel_gtt_driver i81x_gtt_driver = {
1289 .has_pgtbl_enable = 1,
1290 .dma_mask_size = 32,
1291 .setup = i810_setup,
1292 .cleanup = i810_cleanup,
1293 .check_flags = i830_check_flags,
1294 .write_entry = i810_write_entry,
1296 static const struct intel_gtt_driver i8xx_gtt_driver = {
1298 .has_pgtbl_enable = 1,
1299 .setup = i830_setup,
1300 .cleanup = i830_cleanup,
1301 .write_entry = i830_write_entry,
1302 .dma_mask_size = 32,
1303 .check_flags = i830_check_flags,
1304 .chipset_flush = i830_chipset_flush,
1306 static const struct intel_gtt_driver i915_gtt_driver = {
1308 .has_pgtbl_enable = 1,
1309 .setup = i9xx_setup,
1310 .cleanup = i9xx_cleanup,
1311 /* i945 is the last gpu to need phys mem (for overlay and cursors). */
1312 .write_entry = i830_write_entry,
1313 .dma_mask_size = 32,
1314 .check_flags = i830_check_flags,
1315 .chipset_flush = i9xx_chipset_flush,
1317 static const struct intel_gtt_driver g33_gtt_driver = {
1320 .setup = i9xx_setup,
1321 .cleanup = i9xx_cleanup,
1322 .write_entry = i965_write_entry,
1323 .dma_mask_size = 36,
1324 .check_flags = i830_check_flags,
1325 .chipset_flush = i9xx_chipset_flush,
1327 static const struct intel_gtt_driver pineview_gtt_driver = {
1329 .is_pineview = 1, .is_g33 = 1,
1330 .setup = i9xx_setup,
1331 .cleanup = i9xx_cleanup,
1332 .write_entry = i965_write_entry,
1333 .dma_mask_size = 36,
1334 .check_flags = i830_check_flags,
1335 .chipset_flush = i9xx_chipset_flush,
1337 static const struct intel_gtt_driver i965_gtt_driver = {
1339 .has_pgtbl_enable = 1,
1340 .setup = i9xx_setup,
1341 .cleanup = i9xx_cleanup,
1342 .write_entry = i965_write_entry,
1343 .dma_mask_size = 36,
1344 .check_flags = i830_check_flags,
1345 .chipset_flush = i9xx_chipset_flush,
1347 static const struct intel_gtt_driver g4x_gtt_driver = {
1349 .setup = i9xx_setup,
1350 .cleanup = i9xx_cleanup,
1351 .write_entry = i965_write_entry,
1352 .dma_mask_size = 36,
1353 .check_flags = i830_check_flags,
1354 .chipset_flush = i9xx_chipset_flush,
1356 static const struct intel_gtt_driver ironlake_gtt_driver = {
1359 .setup = i9xx_setup,
1360 .cleanup = i9xx_cleanup,
1361 .write_entry = i965_write_entry,
1362 .dma_mask_size = 36,
1363 .check_flags = i830_check_flags,
1364 .chipset_flush = i9xx_chipset_flush,
1366 static const struct intel_gtt_driver sandybridge_gtt_driver = {
1368 .setup = i9xx_setup,
1369 .cleanup = gen6_cleanup,
1370 .write_entry = gen6_write_entry,
1371 .dma_mask_size = 40,
1372 .check_flags = gen6_check_flags,
1373 .chipset_flush = i9xx_chipset_flush,
1376 /* Table to describe Intel GMCH and AGP/PCIE GART drivers. At least one of
1377 * driver and gmch_driver must be non-null, and find_gmch will determine
1378 * which one should be used if a gmch_chip_id is present.
1380 static const struct intel_gtt_driver_description {
1381 unsigned int gmch_chip_id; /* PCI device id handed to find_gmch() */
1383 const struct intel_gtt_driver *gtt_driver; /* copied to intel_private.driver on a match */
1384 } intel_gtt_chipsets[] = {
1385 { PCI_DEVICE_ID_INTEL_82810_IG1, "i810",
1387 { PCI_DEVICE_ID_INTEL_82810_IG3, "i810",
1389 { PCI_DEVICE_ID_INTEL_82810E_IG, "i810",
1391 { PCI_DEVICE_ID_INTEL_82815_CGC, "i815",
1393 { PCI_DEVICE_ID_INTEL_82830_CGC, "830M",
1395 { PCI_DEVICE_ID_INTEL_82845G_IG, "845G",
1397 { PCI_DEVICE_ID_INTEL_82854_IG, "854",
1399 { PCI_DEVICE_ID_INTEL_82855GM_IG, "855GM",
1401 { PCI_DEVICE_ID_INTEL_82865_IG, "865",
1403 { PCI_DEVICE_ID_INTEL_E7221_IG, "E7221 (i915)",
1405 { PCI_DEVICE_ID_INTEL_82915G_IG, "915G",
1407 { PCI_DEVICE_ID_INTEL_82915GM_IG, "915GM",
1409 { PCI_DEVICE_ID_INTEL_82945G_IG, "945G",
1411 { PCI_DEVICE_ID_INTEL_82945GM_IG, "945GM",
1413 { PCI_DEVICE_ID_INTEL_82945GME_IG, "945GME",
1415 { PCI_DEVICE_ID_INTEL_82946GZ_IG, "946GZ",
1417 { PCI_DEVICE_ID_INTEL_82G35_IG, "G35",
1419 { PCI_DEVICE_ID_INTEL_82965Q_IG, "965Q",
1421 { PCI_DEVICE_ID_INTEL_82965G_IG, "965G",
1423 { PCI_DEVICE_ID_INTEL_82965GM_IG, "965GM",
1425 { PCI_DEVICE_ID_INTEL_82965GME_IG, "965GME/GLE",
1427 { PCI_DEVICE_ID_INTEL_G33_IG, "G33",
1429 { PCI_DEVICE_ID_INTEL_Q35_IG, "Q35",
1431 { PCI_DEVICE_ID_INTEL_Q33_IG, "Q33",
1433 { PCI_DEVICE_ID_INTEL_PINEVIEW_M_IG, "GMA3150",
1434 &pineview_gtt_driver },
1435 { PCI_DEVICE_ID_INTEL_PINEVIEW_IG, "GMA3150",
1436 &pineview_gtt_driver },
1437 { PCI_DEVICE_ID_INTEL_GM45_IG, "GM45",
1439 { PCI_DEVICE_ID_INTEL_EAGLELAKE_IG, "Eaglelake",
1441 { PCI_DEVICE_ID_INTEL_Q45_IG, "Q45/Q43",
1443 { PCI_DEVICE_ID_INTEL_G45_IG, "G45/G43",
1445 { PCI_DEVICE_ID_INTEL_B43_IG, "B43",
1447 { PCI_DEVICE_ID_INTEL_B43_1_IG, "B43",
1449 { PCI_DEVICE_ID_INTEL_G41_IG, "G41",
1451 { PCI_DEVICE_ID_INTEL_IRONLAKE_D_IG,
1452 "HD Graphics", &ironlake_gtt_driver },
1453 { PCI_DEVICE_ID_INTEL_IRONLAKE_M_IG,
1454 "HD Graphics", &ironlake_gtt_driver },
/* All Sandybridge variants share sandybridge_gtt_driver. */
1455 { PCI_DEVICE_ID_INTEL_SANDYBRIDGE_GT1_IG,
1456 "Sandybridge", &sandybridge_gtt_driver },
1457 { PCI_DEVICE_ID_INTEL_SANDYBRIDGE_GT2_IG,
1458 "Sandybridge", &sandybridge_gtt_driver },
1459 { PCI_DEVICE_ID_INTEL_SANDYBRIDGE_GT2_PLUS_IG,
1460 "Sandybridge", &sandybridge_gtt_driver },
1461 { PCI_DEVICE_ID_INTEL_SANDYBRIDGE_M_GT1_IG,
1462 "Sandybridge", &sandybridge_gtt_driver },
1463 { PCI_DEVICE_ID_INTEL_SANDYBRIDGE_M_GT2_IG,
1464 "Sandybridge", &sandybridge_gtt_driver },
1465 { PCI_DEVICE_ID_INTEL_SANDYBRIDGE_M_GT2_PLUS_IG,
1466 "Sandybridge", &sandybridge_gtt_driver },
1467 { PCI_DEVICE_ID_INTEL_SANDYBRIDGE_S_IG,
1468 "Sandybridge", &sandybridge_gtt_driver },
/* Ivybridge has no description of its own here; it reuses sandybridge_gtt_driver. */
1469 { PCI_DEVICE_ID_INTEL_IVYBRIDGE_GT1_IG,
1470 "Ivybridge", &sandybridge_gtt_driver },
1471 { PCI_DEVICE_ID_INTEL_IVYBRIDGE_GT2_IG,
1472 "Ivybridge", &sandybridge_gtt_driver },
1473 { PCI_DEVICE_ID_INTEL_IVYBRIDGE_M_GT1_IG,
1474 "Ivybridge", &sandybridge_gtt_driver },
1475 { PCI_DEVICE_ID_INTEL_IVYBRIDGE_M_GT2_IG,
1476 "Ivybridge", &sandybridge_gtt_driver },
1477 { PCI_DEVICE_ID_INTEL_IVYBRIDGE_S_GT1_IG,
1478 "Ivybridge", &sandybridge_gtt_driver },
1479 { PCI_DEVICE_ID_INTEL_IVYBRIDGE_S_GT2_IG,
1480 "Ivybridge", &sandybridge_gtt_driver },
/*
 * find_gmch - look up the Intel graphics device with PCI device id @device.
 *
 * If the first device found is not PCI function 0, the search is continued
 * from that device for another one with the same id. The result is stored in
 * intel_private.pcidev; intel_gmch_remove() later calls pci_dev_put() on it.
 *
 * NOTE(review): the return statements are not visible here; the caller in
 * intel_gmch_probe() treats a non-zero result as "device present".
 */
1484 static int find_gmch(u16 device)
1486 struct pci_dev *gmch_device;
1488 gmch_device = pci_get_device(PCI_VENDOR_ID_INTEL, device, NULL);
1489 if (gmch_device && PCI_FUNC(gmch_device->devfn) != 0) {
1490 gmch_device = pci_get_device(PCI_VENDOR_ID_INTEL,
1491 device, gmch_device);
1497 intel_private.pcidev = gmch_device;
/*
 * intel_gmch_probe - detect a supported Intel GMCH and set up the fake AGP
 * bridge for it. Exported with EXPORT_SYMBOL.
 *
 * @pdev:   bridge PCI device; a reference is taken with pci_dev_get() and
 *          kept in intel_private.bridge_dev.
 * @bridge: AGP bridge data whose driver and dev_private_data are filled in.
 *
 * Walks intel_gtt_chipsets, asking find_gmch() whether each entry's device is
 * present, and records the matching GTT driver in intel_private.driver. It
 * then programs the graphics device's DMA mask from the driver's
 * dma_mask_size and calls intel_gtt_init().
 *
 * NOTE(review): the references held in intel_private.pcidev and
 * intel_private.bridge_dev look like they stay held if intel_gtt_init()
 * fails - confirm against the failure path, which is not visible here.
 */
1501 int intel_gmch_probe(struct pci_dev *pdev,
1502 struct agp_bridge_data *bridge)
1505 intel_private.driver = NULL;
/* The chipset table is terminated by an entry whose name is NULL. */
1507 for (i = 0; intel_gtt_chipsets[i].name != NULL; i++) {
1508 if (find_gmch(intel_gtt_chipsets[i].gmch_chip_id)) {
1509 intel_private.driver =
1510 intel_gtt_chipsets[i].gtt_driver;
1515 if (!intel_private.driver)
1518 bridge->driver = &intel_fake_agp_driver;
1519 bridge->dev_private_data = &intel_private;
/* Keep the bridge device alive; intel_gmch_remove() drops this reference. */
1522 intel_private.bridge_dev = pci_dev_get(pdev);
1524 dev_info(&pdev->dev, "Intel %s Chipset\n", intel_gtt_chipsets[i].name);
/* Limit DMA addressing of the graphics device to the width the driver declares. */
1526 mask = intel_private.driver->dma_mask_size;
1527 if (pci_set_dma_mask(intel_private.pcidev, DMA_BIT_MASK(mask)))
1528 dev_err(&intel_private.pcidev->dev,
1529 "set gfx device dma mask %d-bit failed!\n", mask);
1531 pci_set_consistent_dma_mask(intel_private.pcidev,
1532 DMA_BIT_MASK(mask));
1534 /*if (bridge->driver == &intel_810_driver)
1537 if (intel_gtt_init() != 0)
1542 EXPORT_SYMBOL(intel_gmch_probe);
/*
 * intel_gtt_get - return a read-only pointer to the intel_gtt description
 * stored in intel_private.base. Exported with EXPORT_SYMBOL.
 */
1544 const struct intel_gtt *intel_gtt_get(void)
1546 return &intel_private.base;
1548 EXPORT_SYMBOL(intel_gtt_get);
/*
 * intel_gtt_chipset_flush - call the active GTT driver's chipset_flush hook,
 * if the driver provides one. Exported with EXPORT_SYMBOL.
 *
 * NOTE(review): intel_private.driver is dereferenced without a NULL check,
 * and intel_gmch_probe() resets it to NULL before scanning; presumably
 * callers only use this after a successful probe - confirm.
 */
1550 void intel_gtt_chipset_flush(void)
1552 if (intel_private.driver->chipset_flush)
1553 intel_private.driver->chipset_flush();
1555 EXPORT_SYMBOL(intel_gtt_chipset_flush);
/*
 * intel_gmch_remove - drop the PCI device references kept in intel_private.
 * Exported with EXPORT_SYMBOL.
 *
 * Releases intel_private.pcidev (stored by find_gmch()) and
 * intel_private.bridge_dev (taken with pci_dev_get() in intel_gmch_probe()),
 * each only if it is non-NULL. @pdev is not referenced in the lines shown.
 */
1557 void intel_gmch_remove(struct pci_dev *pdev)
1559 if (intel_private.pcidev)
1560 pci_dev_put(intel_private.pcidev);
1561 if (intel_private.bridge_dev)
1562 pci_dev_put(intel_private.bridge_dev);
1564 EXPORT_SYMBOL(intel_gmch_remove);
1566 MODULE_AUTHOR("Dave Jones <davej@redhat.com>");
1567 MODULE_LICENSE("GPL and additional rights");