/*
 * Intel GTT (Graphics Translation Table) routines
 *
 * Caveat: This driver implements the linux agp interface, but this is far from
 * an agp driver! GTT support ended up here for purely historical reasons: The
 * old userspace intel graphics drivers needed an interface to map memory into
 * the GTT. And the drm provides a default interface for graphics devices sitting
 * on an agp port. So it made sense to fake the GTT support as an agp port to
 * avoid having to create a new api.
 *
 * With gem this does not make much sense anymore, just needlessly complicates
 * the code. But as long as the old graphics stack is still supported, it's stuck
 * here.
 *
 * /fairy-tale-mode off
 */
#include <linux/module.h>
#include <linux/pci.h>
#include <linux/init.h>
#include <linux/kernel.h>
#include <linux/pagemap.h>
#include <linux/agp_backend.h>
#include <linux/delay.h>
#include "intel-agp.h"
#include <drm/intel-gtt.h>
/*
 * If we have Intel graphics, we're not going to have anything other than
 * an Intel IOMMU. So make the correct use of the PCI DMA API contingent
 * on the Intel IOMMU support (CONFIG_INTEL_IOMMU).
 * Only newer chipsets need to bother with this, of course.
 */
#ifdef CONFIG_INTEL_IOMMU
#define USE_PCI_DMA_API 1
#else
#define USE_PCI_DMA_API 0
#endif
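
/*
 * Illustrative note (not in the original source): this flag feeds the
 * needs_dmar logic in intel_gtt_init() below, roughly
 *
 *	intel_private.base.needs_dmar = USE_PCI_DMA_API && INTEL_GTT_GEN > 2;
 *
 * so without CONFIG_INTEL_IOMMU the driver writes bus addresses taken
 * straight from page_to_phys() and never goes through pci_map_sg().
 */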
struct intel_gtt_driver {
	unsigned int gen : 8;
	unsigned int is_g33 : 1;
	unsigned int is_pineview : 1;
	unsigned int is_ironlake : 1;
	unsigned int has_pgtbl_enable : 1;
	unsigned int dma_mask_size : 8;
	/* Chipset specific GTT setup */
	int (*setup)(void);
	/* This should undo anything done in ->setup() save the unmapping
	 * of the mmio register file, that's done in the generic code. */
	void (*cleanup)(void);
	void (*write_entry)(dma_addr_t addr, unsigned int entry, unsigned int flags);
	/* Flags is a more or less chipset specific opaque value.
	 * For chipsets that need to support old ums (non-gem) code, this
	 * needs to be identical to the various supported agp memory types! */
	bool (*check_flags)(unsigned int flags);
	void (*chipset_flush)(void);
};
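
/*
 * Sketch of how the hooks above are driven by the generic code further
 * down (illustrative only; error handling omitted):
 *
 *	if (intel_private.driver->setup() == 0) {
 *		intel_private.driver->write_entry(addr, entry, flags);
 *		if (intel_private.driver->chipset_flush)
 *			intel_private.driver->chipset_flush();
 *		intel_private.driver->cleanup();
 *	}
 */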
static struct _intel_private {
	struct intel_gtt base;
	const struct intel_gtt_driver *driver;
	struct pci_dev *pcidev;	/* device one */
	struct pci_dev *bridge_dev;
	u8 __iomem *registers;
	phys_addr_t gtt_bus_addr;
	phys_addr_t gma_bus_addr;
	u32 PGETBL_save;
	u32 __iomem *gtt;	/* I915G */
	bool clear_fake_agp; /* on first access via agp, fill with scratch */
	int num_dcache_entries;
	void __iomem *i9xx_flush_page;
	char *i81x_gtt_table;
	struct resource ifp_resource;
	int resource_valid;
	struct page *scratch_page;
	dma_addr_t scratch_page_dma;
} intel_private;
#define INTEL_GTT_GEN	intel_private.driver->gen
#define IS_G33		intel_private.driver->is_g33
#define IS_PINEVIEW	intel_private.driver->is_pineview
#define IS_IRONLAKE	intel_private.driver->is_ironlake
#define HAS_PGTBL_EN	intel_private.driver->has_pgtbl_enable
int intel_gtt_map_memory(struct page **pages, unsigned int num_entries,
			 struct scatterlist **sg_list, int *num_sg)
{
	struct sg_table st;
	struct scatterlist *sg;
	int i;

	if (*sg_list)
		return 0; /* already mapped (e.g. for resume) */

	DBG("try mapping %lu pages\n", (unsigned long)num_entries);

	if (sg_alloc_table(&st, num_entries, GFP_KERNEL))
		goto err;

	*sg_list = sg = st.sgl;

	for (i = 0 ; i < num_entries; i++, sg = sg_next(sg))
		sg_set_page(sg, pages[i], PAGE_SIZE, 0);

	*num_sg = pci_map_sg(intel_private.pcidev, *sg_list,
			     num_entries, PCI_DMA_BIDIRECTIONAL);
	if (unlikely(!*num_sg))
		goto err;

	return 0;

err:
	sg_free_table(&st);
	return -ENOMEM;
}
EXPORT_SYMBOL(intel_gtt_map_memory);
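
/*
 * Typical caller flow, mirroring intel_fake_agp_insert_entries() and
 * intel_fake_agp_remove_entries() below (illustrative; error handling
 * omitted):
 *
 *	intel_gtt_map_memory(mem->pages, mem->page_count,
 *			     &mem->sg_list, &mem->num_sg);
 *	intel_gtt_insert_sg_entries(mem->sg_list, mem->num_sg,
 *				    pg_start, type);
 *	...
 *	intel_gtt_clear_range(pg_start, mem->page_count);
 *	intel_gtt_unmap_memory(mem->sg_list, mem->num_sg);
 */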
void intel_gtt_unmap_memory(struct scatterlist *sg_list, int num_sg)
{
	struct sg_table st;

	DBG("try unmapping %lu pages\n", (unsigned long)num_sg);

	pci_unmap_sg(intel_private.pcidev, sg_list,
		     num_sg, PCI_DMA_BIDIRECTIONAL);

	st.sgl = sg_list;
	st.orig_nents = st.nents = num_sg;

	sg_free_table(&st);
}
EXPORT_SYMBOL(intel_gtt_unmap_memory);
static void intel_fake_agp_enable(struct agp_bridge_data *bridge, u32 mode)
{
}
/* Exists to support ARGB cursors */
static struct page *i8xx_alloc_pages(void)
{
	struct page *page;

	page = alloc_pages(GFP_KERNEL | GFP_DMA32, 2);
	if (page == NULL)
		return NULL;

#ifdef CONFIG_XEN
	if (xen_create_contiguous_region((unsigned long)page_address(page), 2, 32)) {
		__free_pages(page, 2);
		return NULL;
	}
#endif

	if (set_pages_uc(page, 4) < 0) {
		set_pages_wb(page, 4);
#ifdef CONFIG_XEN
		xen_destroy_contiguous_region((unsigned long)page_address(page),
					      2);
#endif
		__free_pages(page, 2);
		return NULL;
	}
	get_page(page);
	atomic_inc(&agp_bridge->current_memory_agp);
	return page;
}

static void i8xx_destroy_pages(struct page *page)
{
	if (page == NULL)
		return;

	set_pages_wb(page, 4);
#ifdef CONFIG_XEN
	xen_destroy_contiguous_region((unsigned long)page_address(page), 2);
#endif
	put_page(page);
	__free_pages(page, 2);
	atomic_dec(&agp_bridge->current_memory_agp);
}
#define I810_GTT_ORDER 4
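/* An I810_GTT_ORDER of 4 means 1 << 4 = 16 contiguous pages, i.e.
 * 16 * 4KB = the fixed 64KB table noted below. */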
static int i810_setup(void)
{
	u32 reg_addr;
	char *gtt_table;

	/* i81x does not preallocate the gtt. It's always 64kb in size. */
	gtt_table = alloc_gatt_pages(I810_GTT_ORDER);
	if (gtt_table == NULL)
		return -ENOMEM;
	intel_private.i81x_gtt_table = gtt_table;

	pci_read_config_dword(intel_private.pcidev, I810_MMADDR, &reg_addr);
	reg_addr &= 0xfff80000;

	intel_private.registers = ioremap(reg_addr, KB(64));
	if (!intel_private.registers)
		return -ENOMEM;

	writel(virt_to_phys(gtt_table) | I810_PGETBL_ENABLED,
	       intel_private.registers+I810_PGETBL_CTL);

	intel_private.gtt_bus_addr = reg_addr + I810_PTE_BASE;

	if ((readl(intel_private.registers+I810_DRAM_CTL)
	    & I810_DRAM_ROW_0) == I810_DRAM_ROW_0_SDRAM) {
		dev_info(&intel_private.pcidev->dev,
			 "detected 4MB dedicated video ram\n");
		intel_private.num_dcache_entries = 1024;
	}

	return 0;
}
static void i810_cleanup(void)
{
	writel(0, intel_private.registers+I810_PGETBL_CTL);
	free_gatt_pages(intel_private.i81x_gtt_table, I810_GTT_ORDER);
}
static int i810_insert_dcache_entries(struct agp_memory *mem, off_t pg_start,
				      int type)
{
	int i;

	if ((pg_start + mem->page_count)
			> intel_private.num_dcache_entries)
		return -EINVAL;

	if (!mem->is_flushed)
		global_cache_flush();

	for (i = pg_start; i < (pg_start + mem->page_count); i++) {
		dma_addr_t addr = i << PAGE_SHIFT;
		intel_private.driver->write_entry(addr,
						  i, type);
	}
	readl(intel_private.gtt+i-1);

	return 0;
}
/* The i810/i830 requires a physical address to program its mouse
 * pointer into hardware.
 * However the Xserver still writes to it through the agp aperture.
 */
static struct agp_memory *alloc_agpphysmem_i8xx(size_t pg_count, int type)
{
	struct agp_memory *new;
	struct page *page;

	switch (pg_count) {
	case 1: page = agp_bridge->driver->agp_alloc_page(agp_bridge);
		break;
	case 4:
		/* kludge to get 4 physical pages for ARGB cursor */
		page = i8xx_alloc_pages();
		break;
	default:
		return NULL;
	}

	if (page == NULL)
		return NULL;

	new = agp_create_memory(pg_count);
	if (new == NULL)
		return NULL;

	new->pages[0] = page;
	if (pg_count == 4) {
		/* kludge to get 4 physical pages for ARGB cursor */
		new->pages[1] = new->pages[0] + 1;
		new->pages[2] = new->pages[1] + 1;
		new->pages[3] = new->pages[2] + 1;
	}
	new->page_count = pg_count;
	new->num_scratch_pages = pg_count;
	new->type = AGP_PHYS_MEMORY;
#ifndef CONFIG_XEN
	new->physical = page_to_phys(new->pages[0]);
#else
	new->physical = page_to_pseudophys(new->pages[0]);
#endif
	return new;
}
static void intel_i810_free_by_type(struct agp_memory *curr)
{
	agp_free_key(curr->key);
	if (curr->type == AGP_PHYS_MEMORY) {
		if (curr->page_count == 4)
			i8xx_destroy_pages(curr->pages[0]);
		else {
			agp_bridge->driver->agp_destroy_page(curr->pages[0],
							     AGP_PAGE_DESTROY_UNMAP);
			agp_bridge->driver->agp_destroy_page(curr->pages[0],
							     AGP_PAGE_DESTROY_FREE);
		}
		agp_free_page_array(curr);
	}
	kfree(curr);
}
static int intel_gtt_setup_scratch_page(void)
{
	struct page *page;
	dma_addr_t dma_addr;

	page = alloc_page(GFP_KERNEL | GFP_DMA32 | __GFP_ZERO);
	if (page == NULL)
		return -ENOMEM;
	get_page(page);
	set_pages_uc(page, 1);

	if (intel_private.base.needs_dmar) {
		dma_addr = pci_map_page(intel_private.pcidev, page, 0,
					PAGE_SIZE, PCI_DMA_BIDIRECTIONAL);
		if (pci_dma_mapping_error(intel_private.pcidev, dma_addr))
			return -EINVAL;

		intel_private.scratch_page_dma = dma_addr;
	} else
		intel_private.scratch_page_dma = page_to_phys(page);

	intel_private.scratch_page = page;

	return 0;
}
static void i810_write_entry(dma_addr_t addr, unsigned int entry,
			     unsigned int flags)
{
	u32 pte_flags = I810_PTE_VALID;

	switch (flags) {
	case AGP_DCACHE_MEMORY:
		pte_flags |= I810_PTE_LOCAL;
		break;
	case AGP_USER_CACHED_MEMORY:
		pte_flags |= I830_PTE_SYSTEM_CACHED;
		break;
	}

	writel(addr | pte_flags, intel_private.gtt + entry);
}
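
/*
 * Illustrative PTE layout (i8xx era): bits 31:12 carry the page address,
 * the low bits carry flags. E.g. a hypothetical page at 0x12345000 mapped
 * as plain valid memory yields
 *
 *	writel(0x12345000 | I810_PTE_VALID, ...)  ->  pte 0x12345001
 *
 * (assuming I810_PTE_VALID is bit 0, per intel-agp.h).
 */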
static const struct aper_size_info_fixed intel_fake_agp_sizes[] = {
	{32, 8192, 3},
	{64, 16384, 4},
	{128, 32768, 5},
	{256, 65536, 6},
	{512, 131072, 7},
};
static unsigned int intel_gtt_stolen_size(void)
{
	u16 gmch_ctrl;
	u8 rdct;
	int local = 0;
	static const int ddt[4] = { 0, 16, 32, 64 };
	unsigned int stolen_size = 0;

	if (INTEL_GTT_GEN == 1)
		return 0; /* no stolen mem on i81x */

	pci_read_config_word(intel_private.bridge_dev,
			     I830_GMCH_CTRL, &gmch_ctrl);

	if (intel_private.bridge_dev->device == PCI_DEVICE_ID_INTEL_82830_HB ||
	    intel_private.bridge_dev->device == PCI_DEVICE_ID_INTEL_82845G_HB) {
		switch (gmch_ctrl & I830_GMCH_GMS_MASK) {
		case I830_GMCH_GMS_STOLEN_512:
			stolen_size = KB(512);
			break;
		case I830_GMCH_GMS_STOLEN_1024:
			stolen_size = MB(1);
			break;
		case I830_GMCH_GMS_STOLEN_8192:
			stolen_size = MB(8);
			break;
		case I830_GMCH_GMS_LOCAL:
			rdct = readb(intel_private.registers+I830_RDRAM_CHANNEL_TYPE);
			stolen_size = (I830_RDRAM_ND(rdct) + 1) *
					MB(ddt[I830_RDRAM_DDT(rdct)]);
			local = 1;
			break;
		default:
			stolen_size = 0;
			break;
		}
	} else if (INTEL_GTT_GEN == 6) {
		/*
		 * SandyBridge has a new memory control register at 0x50.w
		 */
		u16 snb_gmch_ctl;
		pci_read_config_word(intel_private.pcidev, SNB_GMCH_CTRL, &snb_gmch_ctl);
		switch (snb_gmch_ctl & SNB_GMCH_GMS_STOLEN_MASK) {
		case SNB_GMCH_GMS_STOLEN_32M:
			stolen_size = MB(32);
			break;
		case SNB_GMCH_GMS_STOLEN_64M:
			stolen_size = MB(64);
			break;
		case SNB_GMCH_GMS_STOLEN_96M:
			stolen_size = MB(96);
			break;
		case SNB_GMCH_GMS_STOLEN_128M:
			stolen_size = MB(128);
			break;
		case SNB_GMCH_GMS_STOLEN_160M:
			stolen_size = MB(160);
			break;
		case SNB_GMCH_GMS_STOLEN_192M:
			stolen_size = MB(192);
			break;
		case SNB_GMCH_GMS_STOLEN_224M:
			stolen_size = MB(224);
			break;
		case SNB_GMCH_GMS_STOLEN_256M:
			stolen_size = MB(256);
			break;
		case SNB_GMCH_GMS_STOLEN_288M:
			stolen_size = MB(288);
			break;
		case SNB_GMCH_GMS_STOLEN_320M:
			stolen_size = MB(320);
			break;
		case SNB_GMCH_GMS_STOLEN_352M:
			stolen_size = MB(352);
			break;
		case SNB_GMCH_GMS_STOLEN_384M:
			stolen_size = MB(384);
			break;
		case SNB_GMCH_GMS_STOLEN_416M:
			stolen_size = MB(416);
			break;
		case SNB_GMCH_GMS_STOLEN_448M:
			stolen_size = MB(448);
			break;
		case SNB_GMCH_GMS_STOLEN_480M:
			stolen_size = MB(480);
			break;
		case SNB_GMCH_GMS_STOLEN_512M:
			stolen_size = MB(512);
			break;
		}
	} else {
		switch (gmch_ctrl & I855_GMCH_GMS_MASK) {
		case I855_GMCH_GMS_STOLEN_1M:
			stolen_size = MB(1);
			break;
		case I855_GMCH_GMS_STOLEN_4M:
			stolen_size = MB(4);
			break;
		case I855_GMCH_GMS_STOLEN_8M:
			stolen_size = MB(8);
			break;
		case I855_GMCH_GMS_STOLEN_16M:
			stolen_size = MB(16);
			break;
		case I855_GMCH_GMS_STOLEN_32M:
			stolen_size = MB(32);
			break;
		case I915_GMCH_GMS_STOLEN_48M:
			stolen_size = MB(48);
			break;
		case I915_GMCH_GMS_STOLEN_64M:
			stolen_size = MB(64);
			break;
		case G33_GMCH_GMS_STOLEN_128M:
			stolen_size = MB(128);
			break;
		case G33_GMCH_GMS_STOLEN_256M:
			stolen_size = MB(256);
			break;
		case INTEL_GMCH_GMS_STOLEN_96M:
			stolen_size = MB(96);
			break;
		case INTEL_GMCH_GMS_STOLEN_160M:
			stolen_size = MB(160);
			break;
		case INTEL_GMCH_GMS_STOLEN_224M:
			stolen_size = MB(224);
			break;
		case INTEL_GMCH_GMS_STOLEN_352M:
			stolen_size = MB(352);
			break;
		default:
			stolen_size = 0;
			break;
		}
	}

	if (stolen_size > 0) {
		dev_info(&intel_private.bridge_dev->dev, "detected %dK %s memory\n",
		       stolen_size / KB(1), local ? "local" : "stolen");
	} else {
		dev_info(&intel_private.bridge_dev->dev,
		       "no pre-allocated video memory detected\n");
		stolen_size = 0;
	}

	return stolen_size;
}
static void i965_adjust_pgetbl_size(unsigned int size_flag)
{
	u32 pgetbl_ctl, pgetbl_ctl2;

	/* ensure that ppgtt is disabled */
	pgetbl_ctl2 = readl(intel_private.registers+I965_PGETBL_CTL2);
	pgetbl_ctl2 &= ~I810_PGETBL_ENABLED;
	writel(pgetbl_ctl2, intel_private.registers+I965_PGETBL_CTL2);

	/* write the new ggtt size */
	pgetbl_ctl = readl(intel_private.registers+I810_PGETBL_CTL);
	pgetbl_ctl &= ~I965_PGETBL_SIZE_MASK;
	pgetbl_ctl |= size_flag;
	writel(pgetbl_ctl, intel_private.registers+I810_PGETBL_CTL);
}
static unsigned int i965_gtt_total_entries(void)
{
	int size;
	u32 pgetbl_ctl;
	u16 gmch_ctl;

	pci_read_config_word(intel_private.bridge_dev,
			     I830_GMCH_CTRL, &gmch_ctl);

	if (INTEL_GTT_GEN == 5) {
		switch (gmch_ctl & G4x_GMCH_SIZE_MASK) {
		case G4x_GMCH_SIZE_1M:
		case G4x_GMCH_SIZE_VT_1M:
			i965_adjust_pgetbl_size(I965_PGETBL_SIZE_1MB);
			break;
		case G4x_GMCH_SIZE_VT_1_5M:
			i965_adjust_pgetbl_size(I965_PGETBL_SIZE_1_5MB);
			break;
		case G4x_GMCH_SIZE_2M:
		case G4x_GMCH_SIZE_VT_2M:
			i965_adjust_pgetbl_size(I965_PGETBL_SIZE_2MB);
			break;
		}
	}

	pgetbl_ctl = readl(intel_private.registers+I810_PGETBL_CTL);

	switch (pgetbl_ctl & I965_PGETBL_SIZE_MASK) {
	case I965_PGETBL_SIZE_128KB:
		size = KB(128);
		break;
	case I965_PGETBL_SIZE_256KB:
		size = KB(256);
		break;
	case I965_PGETBL_SIZE_512KB:
		size = KB(512);
		break;
	/* GTT pagetable sizes bigger than 512KB are not possible on G33! */
	case I965_PGETBL_SIZE_1MB:
		size = KB(1024);
		break;
	case I965_PGETBL_SIZE_2MB:
		size = KB(2048);
		break;
	case I965_PGETBL_SIZE_1_5MB:
		size = KB(1024 + 512);
		break;
	default:
		dev_info(&intel_private.pcidev->dev,
			 "unknown page table size, assuming 512KB\n");
		size = KB(512);
	}

	return size / 4;
}
static unsigned int intel_gtt_total_entries(void)
{
	int size;

	if (IS_G33 || INTEL_GTT_GEN == 4 || INTEL_GTT_GEN == 5)
		return i965_gtt_total_entries();
	else if (INTEL_GTT_GEN == 6) {
		u16 snb_gmch_ctl;

		pci_read_config_word(intel_private.pcidev, SNB_GMCH_CTRL, &snb_gmch_ctl);
		switch (snb_gmch_ctl & SNB_GTT_SIZE_MASK) {
		default:
		case SNB_GTT_SIZE_0M:
			printk(KERN_ERR "Bad GTT size mask: 0x%04x.\n", snb_gmch_ctl);
			size = MB(0);
			break;
		case SNB_GTT_SIZE_1M:
			size = MB(1);
			break;
		case SNB_GTT_SIZE_2M:
			size = MB(2);
			break;
		}
		return size/4;
	} else {
		/* On previous hardware, the GTT size was just what was
		 * required to map the aperture.
		 */
		return intel_private.base.gtt_mappable_entries;
	}
}
static unsigned int intel_gtt_mappable_entries(void)
{
	unsigned int aperture_size;

	if (INTEL_GTT_GEN == 1) {
		u32 smram_miscc;

		pci_read_config_dword(intel_private.bridge_dev,
				      I810_SMRAM_MISCC, &smram_miscc);

		if ((smram_miscc & I810_GFX_MEM_WIN_SIZE)
				== I810_GFX_MEM_WIN_32M)
			aperture_size = MB(32);
		else
			aperture_size = MB(64);
	} else if (INTEL_GTT_GEN == 2) {
		u16 gmch_ctrl;

		pci_read_config_word(intel_private.bridge_dev,
				     I830_GMCH_CTRL, &gmch_ctrl);

		if ((gmch_ctrl & I830_GMCH_MEM_MASK) == I830_GMCH_MEM_64M)
			aperture_size = MB(64);
		else
			aperture_size = MB(128);
	} else {
		/* 9xx supports large sizes, just look at the length */
		aperture_size = pci_resource_len(intel_private.pcidev, 2);
	}

	return aperture_size >> PAGE_SHIFT;
}
static void intel_gtt_teardown_scratch_page(void)
{
	set_pages_wb(intel_private.scratch_page, 1);
	pci_unmap_page(intel_private.pcidev, intel_private.scratch_page_dma,
		       PAGE_SIZE, PCI_DMA_BIDIRECTIONAL);
	put_page(intel_private.scratch_page);
	__free_page(intel_private.scratch_page);
}
static void intel_gtt_cleanup(void)
{
	intel_private.driver->cleanup();

	iounmap(intel_private.gtt);
	iounmap(intel_private.registers);

	intel_gtt_teardown_scratch_page();
}
static int intel_gtt_init(void)
{
	u32 gtt_map_size;
	int ret;

	ret = intel_private.driver->setup();
	if (ret != 0)
		return ret;

	intel_private.base.gtt_mappable_entries = intel_gtt_mappable_entries();
	intel_private.base.gtt_total_entries = intel_gtt_total_entries();

	/* save the PGETBL reg for resume */
	intel_private.PGETBL_save =
		readl(intel_private.registers+I810_PGETBL_CTL)
			& ~I810_PGETBL_ENABLED;
	/* we only ever restore the register when enabling the PGTBL... */
	if (HAS_PGTBL_EN)
		intel_private.PGETBL_save |= I810_PGETBL_ENABLED;

	dev_info(&intel_private.bridge_dev->dev,
		 "detected gtt size: %dK total, %dK mappable\n",
		 intel_private.base.gtt_total_entries * 4,
		 intel_private.base.gtt_mappable_entries * 4);

	gtt_map_size = intel_private.base.gtt_total_entries * 4;

	intel_private.gtt = ioremap(intel_private.gtt_bus_addr,
				    gtt_map_size);
	if (!intel_private.gtt) {
		intel_private.driver->cleanup();
		iounmap(intel_private.registers);
		return -ENOMEM;
	}

	global_cache_flush();   /* FIXME: ? */

	intel_private.base.stolen_size = intel_gtt_stolen_size();

	intel_private.base.needs_dmar = USE_PCI_DMA_API && INTEL_GTT_GEN > 2;

	ret = intel_gtt_setup_scratch_page();
	if (ret != 0) {
		intel_gtt_cleanup();
		return ret;
	}

	return 0;
}
static int intel_fake_agp_fetch_size(void)
{
	int num_sizes = ARRAY_SIZE(intel_fake_agp_sizes);
	unsigned int aper_size;
	int i;

	aper_size = (intel_private.base.gtt_mappable_entries << PAGE_SHIFT)
		    / MB(1);

	for (i = 0; i < num_sizes; i++) {
		if (aper_size == intel_fake_agp_sizes[i].size) {
			agp_bridge->current_size =
				(void *) (intel_fake_agp_sizes + i);
			return aper_size;
		}
	}

	return 0;
}
static void i830_cleanup(void)
{
}
/* The chipset_flush interface needs to get data that has already been
 * flushed out of the CPU all the way out to main memory, because the GPU
 * doesn't snoop those buffers.
 *
 * The 8xx series doesn't have the same lovely interface for flushing the
 * chipset write buffers that the later chips do. According to the 865
 * specs, it's 64 octwords, or 1KB. So, to get those previous things in
 * that buffer out, we just fill 1KB and clflush it out, on the assumption
 * that it'll push whatever was in there out. It appears to work.
 */
static void i830_chipset_flush(void)
{
	unsigned long timeout = jiffies + msecs_to_jiffies(1000);

	/* Forcibly evict everything from the CPU write buffers.
	 * clflush appears to be insufficient.
	 */
	wbinvd_on_all_cpus();

	/* So far we've only seen documentation for this magic bit on the
	 * 855GM; we hope it exists for the other gen2 chipsets...
	 *
	 * Also works as advertised on my 845G.
	 */
	writel(readl(intel_private.registers+I830_HIC) | (1<<31),
	       intel_private.registers+I830_HIC);

	while (readl(intel_private.registers+I830_HIC) & (1<<31)) {
		if (time_after(jiffies, timeout))
			break;

		udelay(50);
	}
}
static void i830_write_entry(dma_addr_t addr, unsigned int entry,
			     unsigned int flags)
{
	u32 pte_flags = I810_PTE_VALID;

	if (flags == AGP_USER_CACHED_MEMORY)
		pte_flags |= I830_PTE_SYSTEM_CACHED;

	writel(addr | pte_flags, intel_private.gtt + entry);
}
static bool intel_enable_gtt(void)
{
	u32 gma_addr;
	u8 __iomem *reg;

	if (INTEL_GTT_GEN <= 2)
		pci_read_config_dword(intel_private.pcidev, I810_GMADDR,
				      &gma_addr);
	else
		pci_read_config_dword(intel_private.pcidev, I915_GMADDR,
				      &gma_addr);

	intel_private.gma_bus_addr = (gma_addr & PCI_BASE_ADDRESS_MEM_MASK);

	if (INTEL_GTT_GEN >= 6)
		return true;

	if (INTEL_GTT_GEN == 2) {
		u16 gmch_ctrl;

		pci_read_config_word(intel_private.bridge_dev,
				     I830_GMCH_CTRL, &gmch_ctrl);
		gmch_ctrl |= I830_GMCH_ENABLED;
		pci_write_config_word(intel_private.bridge_dev,
				      I830_GMCH_CTRL, gmch_ctrl);

		pci_read_config_word(intel_private.bridge_dev,
				     I830_GMCH_CTRL, &gmch_ctrl);
		if ((gmch_ctrl & I830_GMCH_ENABLED) == 0) {
			dev_err(&intel_private.pcidev->dev,
				"failed to enable the GTT: GMCH_CTRL=%x\n",
				gmch_ctrl);
			return false;
		}
	}

	/* On the resume path we may be adjusting the PGTBL value, so
	 * be paranoid and flush all chipset write buffers...
	 */
	if (INTEL_GTT_GEN >= 3)
		writel(0, intel_private.registers+GFX_FLSH_CNTL);

	reg = intel_private.registers+I810_PGETBL_CTL;
	writel(intel_private.PGETBL_save, reg);
	if (HAS_PGTBL_EN && (readl(reg) & I810_PGETBL_ENABLED) == 0) {
		dev_err(&intel_private.pcidev->dev,
			"failed to enable the GTT: PGETBL=%x [expected %x]\n",
			readl(reg), intel_private.PGETBL_save);
		return false;
	}

	if (INTEL_GTT_GEN >= 3)
		writel(0, intel_private.registers+GFX_FLSH_CNTL);

	return true;
}
static int i830_setup(void)
{
	u32 reg_addr;

	pci_read_config_dword(intel_private.pcidev, I810_MMADDR, &reg_addr);
	reg_addr &= 0xfff80000;

	intel_private.registers = ioremap(reg_addr, KB(64));
	if (!intel_private.registers)
		return -ENOMEM;

	intel_private.gtt_bus_addr = reg_addr + I810_PTE_BASE;

	return 0;
}
static int intel_fake_agp_create_gatt_table(struct agp_bridge_data *bridge)
{
	agp_bridge->gatt_table_real = NULL;
	agp_bridge->gatt_table = NULL;
	agp_bridge->gatt_bus_addr = 0;

	return 0;
}
static int intel_fake_agp_free_gatt_table(struct agp_bridge_data *bridge)
{
	return 0;
}
static int intel_fake_agp_configure(void)
{
	if (!intel_enable_gtt())
		return -EIO;

	intel_private.clear_fake_agp = true;
	agp_bridge->gart_bus_addr = intel_private.gma_bus_addr;

	return 0;
}
static bool i830_check_flags(unsigned int flags)
{
	switch (flags) {
	case 0:
	case AGP_PHYS_MEMORY:
	case AGP_USER_CACHED_MEMORY:
	case AGP_USER_MEMORY:
		return true;
	}

	return false;
}
void intel_gtt_insert_sg_entries(struct scatterlist *sg_list,
				 int sg_len,
				 unsigned int pg_start,
				 unsigned int flags)
{
	struct scatterlist *sg;
	unsigned int len, m;
	int i, j;

	j = pg_start;

	/* sg may merge pages, but we have to separate
	 * per-page addresses for the GTT */
	for_each_sg(sg_list, sg, sg_len, i) {
		len = sg_dma_len(sg) >> PAGE_SHIFT;
		for (m = 0; m < len; m++) {
			dma_addr_t addr = sg_dma_address(sg) + (m << PAGE_SHIFT);
			intel_private.driver->write_entry(addr,
							  j, flags);
			j++;
		}
	}
	readl(intel_private.gtt+j-1);
}
EXPORT_SYMBOL(intel_gtt_insert_sg_entries);
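
/*
 * Example of the per-page splitting above (hypothetical numbers): a
 * merged 16KB segment with sg_dma_address() == 0x10000000 produces four
 * PTE writes, for 0x10000000, 0x10001000, 0x10002000 and 0x10003000.
 */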
void intel_gtt_insert_pages(unsigned int first_entry, unsigned int num_entries,
			    struct page **pages, unsigned int flags)
{
	int i, j;

	for (i = 0, j = first_entry; i < num_entries; i++, j++) {
		dma_addr_t addr = page_to_phys(pages[i]);
		intel_private.driver->write_entry(addr,
						  j, flags);
	}
	readl(intel_private.gtt+j-1);
}
EXPORT_SYMBOL(intel_gtt_insert_pages);
static int intel_fake_agp_insert_entries(struct agp_memory *mem,
					 off_t pg_start, int type)
{
	int ret = -EINVAL;

	if (intel_private.base.do_idle_maps)
		return -ENODEV;

	if (intel_private.clear_fake_agp) {
		int start = intel_private.base.stolen_size / PAGE_SIZE;
		int end = intel_private.base.gtt_mappable_entries;
		intel_gtt_clear_range(start, end - start);
		intel_private.clear_fake_agp = false;
	}

	if (INTEL_GTT_GEN == 1 && type == AGP_DCACHE_MEMORY)
		return i810_insert_dcache_entries(mem, pg_start, type);

	if (mem->page_count == 0)
		goto out;

	if (pg_start + mem->page_count > intel_private.base.gtt_total_entries)
		goto out_err;

	if (type != mem->type)
		goto out_err;

	if (!intel_private.driver->check_flags(type))
		goto out_err;

	if (!mem->is_flushed)
		global_cache_flush();

	if (intel_private.base.needs_dmar) {
		ret = intel_gtt_map_memory(mem->pages, mem->page_count,
					   &mem->sg_list, &mem->num_sg);
		if (ret != 0)
			return ret;

		intel_gtt_insert_sg_entries(mem->sg_list, mem->num_sg,
					    pg_start, type);
	} else
		intel_gtt_insert_pages(pg_start, mem->page_count, mem->pages,
				       type);

out:
	ret = 0;
out_err:
	mem->is_flushed = true;
	return ret;
}
void intel_gtt_clear_range(unsigned int first_entry, unsigned int num_entries)
{
	unsigned int i;

	for (i = first_entry; i < (first_entry + num_entries); i++) {
		intel_private.driver->write_entry(intel_private.scratch_page_dma,
						  i, 0);
	}
	readl(intel_private.gtt+i-1);
}
EXPORT_SYMBOL(intel_gtt_clear_range);
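
/*
 * Note that "clearing" redirects the entries at the scratch page rather
 * than writing invalid PTEs. E.g. unbinding an object that occupied 10
 * entries starting at entry 42:
 *
 *	intel_gtt_clear_range(42, 10);
 */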
static int intel_fake_agp_remove_entries(struct agp_memory *mem,
					 off_t pg_start, int type)
{
	if (mem->page_count == 0)
		return 0;

	if (intel_private.base.do_idle_maps)
		return -ENODEV;

	intel_gtt_clear_range(pg_start, mem->page_count);

	if (intel_private.base.needs_dmar) {
		intel_gtt_unmap_memory(mem->sg_list, mem->num_sg);
		mem->sg_list = NULL;
		mem->num_sg = 0;
	}

	return 0;
}
static struct agp_memory *intel_fake_agp_alloc_by_type(size_t pg_count,
						       int type)
{
	struct agp_memory *new;

	if (type == AGP_DCACHE_MEMORY && INTEL_GTT_GEN == 1) {
		if (pg_count != intel_private.num_dcache_entries)
			return NULL;

		new = agp_create_memory(1);
		if (new == NULL)
			return NULL;

		new->type = AGP_DCACHE_MEMORY;
		new->page_count = pg_count;
		new->num_scratch_pages = 0;
		agp_free_page_array(new);
		return new;
	}
	if (type == AGP_PHYS_MEMORY)
		return alloc_agpphysmem_i8xx(pg_count, type);
	/* always return NULL for other allocation types for now */
	return NULL;
}
static int intel_alloc_chipset_flush_resource(void)
{
	int ret;
	ret = pci_bus_alloc_resource(intel_private.bridge_dev->bus, &intel_private.ifp_resource, PAGE_SIZE,
				     PAGE_SIZE, PCIBIOS_MIN_MEM, 0,
				     pcibios_align_resource, intel_private.bridge_dev);

	return ret;
}
static void intel_i915_setup_chipset_flush(void)
{
	int ret;
	u32 temp;

	pci_read_config_dword(intel_private.bridge_dev, I915_IFPADDR, &temp);
	if (!(temp & 0x1)) {
		intel_alloc_chipset_flush_resource();
		intel_private.resource_valid = 1;
		pci_write_config_dword(intel_private.bridge_dev, I915_IFPADDR, (intel_private.ifp_resource.start & 0xffffffff) | 0x1);
	} else {
		temp &= ~1;

		intel_private.resource_valid = 1;
		intel_private.ifp_resource.start = temp;
		intel_private.ifp_resource.end = temp + PAGE_SIZE;
		ret = request_resource(&iomem_resource, &intel_private.ifp_resource);
		/* some BIOSes reserve this area in a pnp resource, some don't */
		if (ret)
			intel_private.resource_valid = 0;
	}
}
static void intel_i965_g33_setup_chipset_flush(void)
{
	u32 temp_hi, temp_lo;
	int ret;

	pci_read_config_dword(intel_private.bridge_dev, I965_IFPADDR + 4, &temp_hi);
	pci_read_config_dword(intel_private.bridge_dev, I965_IFPADDR, &temp_lo);

	if (!(temp_lo & 0x1)) {

		intel_alloc_chipset_flush_resource();

		intel_private.resource_valid = 1;
		pci_write_config_dword(intel_private.bridge_dev, I965_IFPADDR + 4,
			upper_32_bits(intel_private.ifp_resource.start));
		pci_write_config_dword(intel_private.bridge_dev, I965_IFPADDR, (intel_private.ifp_resource.start & 0xffffffff) | 0x1);
	} else {
		u64 l64;

		temp_lo &= ~0x1;
		l64 = ((u64)temp_hi << 32) | temp_lo;

		intel_private.resource_valid = 1;
		intel_private.ifp_resource.start = l64;
		intel_private.ifp_resource.end = l64 + PAGE_SIZE;
		ret = request_resource(&iomem_resource, &intel_private.ifp_resource);
		/* some BIOSes reserve this area in a pnp resource, some don't */
		if (ret)
			intel_private.resource_valid = 0;
	}
}
static void intel_i9xx_setup_flush(void)
{
	/* return if already configured */
	if (intel_private.ifp_resource.start)
		return;

	if (INTEL_GTT_GEN == 6)
		return;

	/* setup a resource for this object */
	intel_private.ifp_resource.name = "Intel Flush Page";
	intel_private.ifp_resource.flags = IORESOURCE_MEM;

	/* Setup chipset flush for 915 */
	if (IS_G33 || INTEL_GTT_GEN >= 4) {
		intel_i965_g33_setup_chipset_flush();
	} else {
		intel_i915_setup_chipset_flush();
	}

	if (intel_private.ifp_resource.start)
		intel_private.i9xx_flush_page = ioremap_nocache(intel_private.ifp_resource.start, PAGE_SIZE);
	if (!intel_private.i9xx_flush_page)
		dev_err(&intel_private.pcidev->dev,
			"can't ioremap flush page - no chipset flushing\n");
}
static void i9xx_cleanup(void)
{
	if (intel_private.i9xx_flush_page)
		iounmap(intel_private.i9xx_flush_page);
	if (intel_private.resource_valid)
		release_resource(&intel_private.ifp_resource);
	intel_private.ifp_resource.start = 0;
	intel_private.resource_valid = 0;
}
static void i9xx_chipset_flush(void)
{
	if (intel_private.i9xx_flush_page)
		writel(1, intel_private.i9xx_flush_page);
}
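
/* The write above is what triggers the chipset write-buffer flush; the
 * value written appears to be irrelevant, 1 is arbitrary. */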
static void i965_write_entry(dma_addr_t addr,
			     unsigned int entry,
			     unsigned int flags)
{
	u32 pte_flags;

	pte_flags = I810_PTE_VALID;
	if (flags == AGP_USER_CACHED_MEMORY)
		pte_flags |= I830_PTE_SYSTEM_CACHED;

	/* Shift high bits down */
	addr |= (addr >> 28) & 0xf0;
	writel(addr | pte_flags, intel_private.gtt + entry);
}
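
/*
 * Worked example of the fold-down above (hypothetical address): for
 * addr = 0x340000000, (addr >> 28) & 0xf0 == 0x30, so physical address
 * bits 35:32 end up in bits 7:4 of the 32-bit PTE.
 */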
static bool gen6_check_flags(unsigned int flags)
{
	return true;
}
static void gen6_write_entry(dma_addr_t addr, unsigned int entry,
			     unsigned int flags)
{
	unsigned int type_mask = flags & ~AGP_USER_CACHED_MEMORY_GFDT;
	unsigned int gfdt = flags & AGP_USER_CACHED_MEMORY_GFDT;
	u32 pte_flags;

	if (type_mask == AGP_USER_MEMORY)
		pte_flags = GEN6_PTE_UNCACHED | I810_PTE_VALID;
	else if (type_mask == AGP_USER_CACHED_MEMORY_LLC_MLC) {
		pte_flags = GEN6_PTE_LLC_MLC | I810_PTE_VALID;
		if (gfdt)
			pte_flags |= GEN6_PTE_GFDT;
	} else { /* set 'normal'/'cached' to LLC by default */
		pte_flags = GEN6_PTE_LLC | I810_PTE_VALID;
		if (gfdt)
			pte_flags |= GEN6_PTE_GFDT;
	}

	/* gen6 has bit11-4 for physical addr bit39-32 */
	addr |= (addr >> 28) & 0xff0;
	writel(addr | pte_flags, intel_private.gtt + entry);
}
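
/*
 * As in i965_write_entry(), but gen6 folds physical address bits 39:32
 * into PTE bits 11:4: e.g. for a hypothetical addr = 0x2500000000,
 * (addr >> 28) & 0xff0 == 0x250.
 */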
static void gen6_cleanup(void)
{
}
/* Certain Gen5 chipsets require idling the GPU before
 * unmapping anything from the GTT when VT-d is enabled.
 */
static inline int needs_idle_maps(void)
{
#ifdef CONFIG_INTEL_IOMMU
	const unsigned short gpu_devid = intel_private.pcidev->device;
	extern int intel_iommu_gfx_mapped;

	/* Query intel_iommu to see if we need the workaround. Presumably that
	 * was loaded first.
	 */
	if ((gpu_devid == PCI_DEVICE_ID_INTEL_IRONLAKE_M_HB ||
	     gpu_devid == PCI_DEVICE_ID_INTEL_IRONLAKE_M_IG) &&
	     intel_iommu_gfx_mapped)
		return 1;
#endif
	return 0;
}
static int i9xx_setup(void)
{
	u32 reg_addr;

	pci_read_config_dword(intel_private.pcidev, I915_MMADDR, &reg_addr);

	reg_addr &= 0xfff80000;

	intel_private.registers = ioremap(reg_addr, 128 * 4096);
	if (!intel_private.registers)
		return -ENOMEM;

	if (INTEL_GTT_GEN == 3) {
		u32 gtt_addr;

		pci_read_config_dword(intel_private.pcidev,
				      I915_PTEADDR, &gtt_addr);
		intel_private.gtt_bus_addr = gtt_addr;
	} else {
		u32 gtt_offset;

		switch (INTEL_GTT_GEN) {
		case 5:
		case 6:
			gtt_offset = MB(2);
			break;
		case 4:
		default:
			gtt_offset = KB(512);
			break;
		}
		intel_private.gtt_bus_addr = reg_addr + gtt_offset;
	}

	if (needs_idle_maps())
		intel_private.base.do_idle_maps = 1;

	intel_i9xx_setup_flush();

	return 0;
}
static const struct agp_bridge_driver intel_fake_agp_driver = {
	.owner = THIS_MODULE,
	.size_type = FIXED_APER_SIZE,
	.aperture_sizes = intel_fake_agp_sizes,
	.num_aperture_sizes = ARRAY_SIZE(intel_fake_agp_sizes),
	.configure = intel_fake_agp_configure,
	.fetch_size = intel_fake_agp_fetch_size,
	.cleanup = intel_gtt_cleanup,
	.agp_enable = intel_fake_agp_enable,
	.cache_flush = global_cache_flush,
	.create_gatt_table = intel_fake_agp_create_gatt_table,
	.free_gatt_table = intel_fake_agp_free_gatt_table,
	.insert_memory = intel_fake_agp_insert_entries,
	.remove_memory = intel_fake_agp_remove_entries,
	.alloc_by_type = intel_fake_agp_alloc_by_type,
	.free_by_type = intel_i810_free_by_type,
	.agp_alloc_page = agp_generic_alloc_page,
	.agp_alloc_pages = agp_generic_alloc_pages,
	.agp_destroy_page = agp_generic_destroy_page,
	.agp_destroy_pages = agp_generic_destroy_pages,
	.agp_type_to_mask_type = agp_generic_type_to_mask_type,
};
static const struct intel_gtt_driver i81x_gtt_driver = {
	.gen = 1,
	.has_pgtbl_enable = 1,
	.dma_mask_size = 32,
	.setup = i810_setup,
	.cleanup = i810_cleanup,
	.check_flags = i830_check_flags,
	.write_entry = i810_write_entry,
};
static const struct intel_gtt_driver i8xx_gtt_driver = {
	.gen = 2,
	.has_pgtbl_enable = 1,
	.setup = i830_setup,
	.cleanup = i830_cleanup,
	.write_entry = i830_write_entry,
	.dma_mask_size = 32,
	.check_flags = i830_check_flags,
	.chipset_flush = i830_chipset_flush,
};
static const struct intel_gtt_driver i915_gtt_driver = {
	.gen = 3,
	.has_pgtbl_enable = 1,
	.setup = i9xx_setup,
	.cleanup = i9xx_cleanup,
	/* i945 is the last gpu to need phys mem (for overlay and cursors). */
	.write_entry = i830_write_entry,
	.dma_mask_size = 32,
	.check_flags = i830_check_flags,
	.chipset_flush = i9xx_chipset_flush,
};
static const struct intel_gtt_driver g33_gtt_driver = {
	.gen = 3,
	.is_g33 = 1,
	.setup = i9xx_setup,
	.cleanup = i9xx_cleanup,
	.write_entry = i965_write_entry,
	.dma_mask_size = 36,
	.check_flags = i830_check_flags,
	.chipset_flush = i9xx_chipset_flush,
};
static const struct intel_gtt_driver pineview_gtt_driver = {
	.gen = 3,
	.is_pineview = 1, .is_g33 = 1,
	.setup = i9xx_setup,
	.cleanup = i9xx_cleanup,
	.write_entry = i965_write_entry,
	.dma_mask_size = 36,
	.check_flags = i830_check_flags,
	.chipset_flush = i9xx_chipset_flush,
};
static const struct intel_gtt_driver i965_gtt_driver = {
	.gen = 4,
	.has_pgtbl_enable = 1,
	.setup = i9xx_setup,
	.cleanup = i9xx_cleanup,
	.write_entry = i965_write_entry,
	.dma_mask_size = 36,
	.check_flags = i830_check_flags,
	.chipset_flush = i9xx_chipset_flush,
};
static const struct intel_gtt_driver g4x_gtt_driver = {
	.gen = 5,
	.setup = i9xx_setup,
	.cleanup = i9xx_cleanup,
	.write_entry = i965_write_entry,
	.dma_mask_size = 36,
	.check_flags = i830_check_flags,
	.chipset_flush = i9xx_chipset_flush,
};
static const struct intel_gtt_driver ironlake_gtt_driver = {
	.gen = 5,
	.is_ironlake = 1,
	.setup = i9xx_setup,
	.cleanup = i9xx_cleanup,
	.write_entry = i965_write_entry,
	.dma_mask_size = 36,
	.check_flags = i830_check_flags,
	.chipset_flush = i9xx_chipset_flush,
};
static const struct intel_gtt_driver sandybridge_gtt_driver = {
	.gen = 6,
	.setup = i9xx_setup,
	.cleanup = gen6_cleanup,
	.write_entry = gen6_write_entry,
	.dma_mask_size = 40,
	.check_flags = gen6_check_flags,
	.chipset_flush = i9xx_chipset_flush,
};
/* Table to describe Intel GMCH and AGP/PCIE GART drivers. At least one of
 * driver and gmch_driver must be non-null, and find_gmch will determine
 * which one should be used if a gmch_chip_id is present.
 */
static const struct intel_gtt_driver_description {
	unsigned int gmch_chip_id;
	char *name;
	const struct intel_gtt_driver *gtt_driver;
} intel_gtt_chipsets[] = {
	{ PCI_DEVICE_ID_INTEL_82810_IG1, "i810",
		&i81x_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_82810_IG3, "i810",
		&i81x_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_82810E_IG, "i810",
		&i81x_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_82815_CGC, "i815",
		&i81x_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_82830_CGC, "830M",
		&i8xx_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_82845G_IG, "845G",
		&i8xx_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_82854_IG, "854",
		&i8xx_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_82855GM_IG, "855GM",
		&i8xx_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_82865_IG, "865",
		&i8xx_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_E7221_IG, "E7221 (i915)",
		&i915_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_82915G_IG, "915G",
		&i915_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_82915GM_IG, "915GM",
		&i915_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_82945G_IG, "945G",
		&i915_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_82945GM_IG, "945GM",
		&i915_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_82945GME_IG, "945GME",
		&i915_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_82946GZ_IG, "946GZ",
		&i965_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_82G35_IG, "G35",
		&i965_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_82965Q_IG, "965Q",
		&i965_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_82965G_IG, "965G",
		&i965_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_82965GM_IG, "965GM",
		&i965_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_82965GME_IG, "965GME/GLE",
		&i965_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_G33_IG, "G33",
		&g33_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_Q35_IG, "Q35",
		&g33_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_Q33_IG, "Q33",
		&g33_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_PINEVIEW_M_IG, "GMA3150",
		&pineview_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_PINEVIEW_IG, "GMA3150",
		&pineview_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_GM45_IG, "GM45",
		&g4x_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_EAGLELAKE_IG, "Eaglelake",
		&g4x_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_Q45_IG, "Q45/Q43",
		&g4x_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_G45_IG, "G45/G43",
		&g4x_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_B43_IG, "B43",
		&g4x_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_B43_1_IG, "B43",
		&g4x_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_G41_IG, "G41",
		&g4x_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_IRONLAKE_D_IG,
	    "HD Graphics", &ironlake_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_IRONLAKE_M_IG,
	    "HD Graphics", &ironlake_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_SANDYBRIDGE_GT1_IG,
	    "Sandybridge", &sandybridge_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_SANDYBRIDGE_GT2_IG,
	    "Sandybridge", &sandybridge_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_SANDYBRIDGE_GT2_PLUS_IG,
	    "Sandybridge", &sandybridge_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_SANDYBRIDGE_M_GT1_IG,
	    "Sandybridge", &sandybridge_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_SANDYBRIDGE_M_GT2_IG,
	    "Sandybridge", &sandybridge_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_SANDYBRIDGE_M_GT2_PLUS_IG,
	    "Sandybridge", &sandybridge_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_SANDYBRIDGE_S_IG,
	    "Sandybridge", &sandybridge_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_IVYBRIDGE_GT1_IG,
	    "Ivybridge", &sandybridge_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_IVYBRIDGE_GT2_IG,
	    "Ivybridge", &sandybridge_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_IVYBRIDGE_M_GT1_IG,
	    "Ivybridge", &sandybridge_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_IVYBRIDGE_M_GT2_IG,
	    "Ivybridge", &sandybridge_gtt_driver },
	{ PCI_DEVICE_ID_INTEL_IVYBRIDGE_S_GT1_IG,
	    "Ivybridge", &sandybridge_gtt_driver },
	{ 0, NULL, NULL }
};
static int find_gmch(u16 device)
{
	struct pci_dev *gmch_device;

	gmch_device = pci_get_device(PCI_VENDOR_ID_INTEL, device, NULL);
	if (gmch_device && PCI_FUNC(gmch_device->devfn) != 0) {
		gmch_device = pci_get_device(PCI_VENDOR_ID_INTEL,
					     device, gmch_device);
	}

	if (!gmch_device)
		return 0;

	intel_private.pcidev = gmch_device;
	return 1;
}
int intel_gmch_probe(struct pci_dev *pdev,
		     struct agp_bridge_data *bridge)
{
	int i, mask;
	intel_private.driver = NULL;

	for (i = 0; intel_gtt_chipsets[i].name != NULL; i++) {
		if (find_gmch(intel_gtt_chipsets[i].gmch_chip_id)) {
			intel_private.driver =
				intel_gtt_chipsets[i].gtt_driver;
			break;
		}
	}

	if (!intel_private.driver)
		return 0;

	bridge->driver = &intel_fake_agp_driver;
	bridge->dev_private_data = &intel_private;
	bridge->dev = pdev;

	intel_private.bridge_dev = pci_dev_get(pdev);

	dev_info(&pdev->dev, "Intel %s Chipset\n", intel_gtt_chipsets[i].name);

	mask = intel_private.driver->dma_mask_size;
	if (pci_set_dma_mask(intel_private.pcidev, DMA_BIT_MASK(mask)))
		dev_err(&intel_private.pcidev->dev,
			"set gfx device dma mask %d-bit failed!\n", mask);
	else
		pci_set_consistent_dma_mask(intel_private.pcidev,
					    DMA_BIT_MASK(mask));

	if (intel_gtt_init() != 0)
		return 0;

	return 1;
}
EXPORT_SYMBOL(intel_gmch_probe);
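
/*
 * Illustrative call sequence from a parent driver (assuming the
 * nonzero-on-success convention above):
 *
 *	if (intel_gmch_probe(pdev, bridge)) {
 *		const struct intel_gtt *info = intel_gtt_get();
 *		...
 *		intel_gmch_remove(pdev);
 *	}
 */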
const struct intel_gtt *intel_gtt_get(void)
{
	return &intel_private.base;
}
EXPORT_SYMBOL(intel_gtt_get);
void intel_gtt_chipset_flush(void)
{
	if (intel_private.driver->chipset_flush)
		intel_private.driver->chipset_flush();
}
EXPORT_SYMBOL(intel_gtt_chipset_flush);
void intel_gmch_remove(struct pci_dev *pdev)
{
	if (intel_private.pcidev)
		pci_dev_put(intel_private.pcidev);
	if (intel_private.bridge_dev)
		pci_dev_put(intel_private.bridge_dev);
}
EXPORT_SYMBOL(intel_gmch_remove);
MODULE_AUTHOR("Dave Jones <davej@redhat.com>");
MODULE_LICENSE("GPL and additional rights");