blob: 4b7e3d8b01ddfdeb5b1e49bbdfc4519e2b102ac1 [file] [log] [blame]
Glauber Costa459121c92008-04-08 13:20:43 -03001#include <linux/dma-mapping.h>
Joerg Roedel2118d0c2009-01-09 15:13:15 +01002#include <linux/dma-debug.h>
Glauber Costacb5867a2008-04-08 13:20:51 -03003#include <linux/dmar.h>
Glauber Costa116890d2008-04-08 13:20:54 -03004#include <linux/bootmem.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +09005#include <linux/gfp.h>
Glauber Costabca5c092008-04-08 13:20:53 -03006#include <linux/pci.h>
Catalin Marinasacde31d2009-08-27 14:29:20 +01007#include <linux/kmemleak.h>
Glauber Costacb5867a2008-04-08 13:20:51 -03008
Glauber Costa116890d2008-04-08 13:20:54 -03009#include <asm/proto.h>
10#include <asm/dma.h>
FUJITA Tomonori46a7fa22008-07-11 10:23:42 +090011#include <asm/iommu.h>
Joerg Roedel1d9b16d2008-11-27 18:39:15 +010012#include <asm/gart.h>
Glauber Costacb5867a2008-04-08 13:20:51 -030013#include <asm/calgary.h>
Joerg Roedela69ca342008-06-26 21:28:08 +020014#include <asm/amd_iommu.h>
Ingo Molnarb4941a92009-11-10 14:37:58 +010015#include <asm/x86_init.h>
Glauber Costa459121c92008-04-08 13:20:43 -030016
Fenghua Yu3b15e582008-10-23 16:51:00 -070017static int forbid_dac __read_mostly;
18
FUJITA Tomonoria3b28ee2009-11-14 20:46:36 +090019struct dma_map_ops *dma_ops = &nommu_dma_ops;
Glauber Costa85c246e2008-04-08 13:20:50 -030020EXPORT_SYMBOL(dma_ops);
21
Dmitri Vorobievb4cdc432008-04-28 03:15:58 +040022static int iommu_sac_force __read_mostly;
Glauber Costa8e0c3792008-04-08 13:20:55 -030023
Glauber Costaf9c258d2008-04-08 13:20:52 -030024#ifdef CONFIG_IOMMU_DEBUG
25int panic_on_overflow __read_mostly = 1;
26int force_iommu __read_mostly = 1;
27#else
28int panic_on_overflow __read_mostly = 0;
29int force_iommu __read_mostly = 0;
30#endif
31
Glauber Costafae9a0d2008-04-08 13:20:56 -030032int iommu_merge __read_mostly = 0;
33
34int no_iommu __read_mostly;
35/* Set this to 1 if there is a HW IOMMU in the system */
36int iommu_detected __read_mostly = 0;
37
Joerg Roedelac0101d2009-09-01 16:00:35 +020038/*
39 * This variable becomes 1 if iommu=pt is passed on the kernel command line.
Marin Mitove3be7852009-10-03 20:45:02 +030040 * If this variable is 1, IOMMU implementations do no DMA translation for
Joerg Roedelac0101d2009-09-01 16:00:35 +020041 * devices and allow every device to access to whole physical memory. This is
Justin P. Mattockfb637f32010-01-14 22:16:16 -080042 * useful if a user wants to use an IOMMU only for KVM device assignment to
Joerg Roedelac0101d2009-09-01 16:00:35 +020043 * guests and not for driver dma translation.
44 */
45int iommu_pass_through __read_mostly;
Fenghua Yuaed5d5f2009-04-30 17:57:11 -070046
Jan Beulicheb647132009-11-08 12:12:14 +010047/* Dummy device used for NULL arguments (normally ISA). */
Joerg Roedel6c505ce2008-08-19 16:32:45 +020048struct device x86_dma_fallback_dev = {
Kay Sievers1a927132008-10-30 02:17:49 +010049 .init_name = "fallback device",
Jan Beulicheb647132009-11-08 12:12:14 +010050 .coherent_dma_mask = ISA_DMA_BIT_MASK,
Joerg Roedel6c505ce2008-08-19 16:32:45 +020051 .dma_mask = &x86_dma_fallback_dev.coherent_dma_mask,
Glauber Costa098cb7f2008-04-09 13:18:10 -030052};
Joerg Roedel6c505ce2008-08-19 16:32:45 +020053EXPORT_SYMBOL(x86_dma_fallback_dev);
Glauber Costa098cb7f2008-04-09 13:18:10 -030054
/* Number of entries preallocated for DMA-API debugging (32768) */
#define PREALLOC_DMA_DEBUG_ENTRIES (1 << 15)
57
Glauber Costa459121c92008-04-08 13:20:43 -030058int dma_set_mask(struct device *dev, u64 mask)
59{
60 if (!dev->dma_mask || !dma_supported(dev, mask))
61 return -EIO;
62
63 *dev->dma_mask = mask;
64
65 return 0;
66}
67EXPORT_SYMBOL(dma_set_mask);
68
Yinghai Luc252a5b2010-02-10 01:20:19 -080069#if defined(CONFIG_X86_64) && !defined(CONFIG_NUMA)
Glauber Costa116890d2008-04-08 13:20:54 -030070static __initdata void *dma32_bootmem_ptr;
71static unsigned long dma32_bootmem_size __initdata = (128ULL<<20);
72
73static int __init parse_dma32_size_opt(char *p)
74{
75 if (!p)
76 return -EINVAL;
77 dma32_bootmem_size = memparse(p, &p);
78 return 0;
79}
80early_param("dma32_size", parse_dma32_size_opt);
81
82void __init dma32_reserve_bootmem(void)
83{
84 unsigned long size, align;
Yinghai Luc987d122008-06-24 22:14:09 -070085 if (max_pfn <= MAX_DMA32_PFN)
Glauber Costa116890d2008-04-08 13:20:54 -030086 return;
87
Yinghai Lu7677b2e2008-04-14 20:40:37 -070088 /*
89 * check aperture_64.c allocate_aperture() for reason about
90 * using 512M as goal
91 */
Glauber Costa116890d2008-04-08 13:20:54 -030092 align = 64ULL<<20;
Joerg Roedel1ddb5512008-07-25 16:48:55 +020093 size = roundup(dma32_bootmem_size, align);
Glauber Costa116890d2008-04-08 13:20:54 -030094 dma32_bootmem_ptr = __alloc_bootmem_nopanic(size, align,
Yinghai Lu7677b2e2008-04-14 20:40:37 -070095 512ULL<<20);
Catalin Marinasacde31d2009-08-27 14:29:20 +010096 /*
97 * Kmemleak should not scan this block as it may not be mapped via the
98 * kernel direct mapping.
99 */
100 kmemleak_ignore(dma32_bootmem_ptr);
Glauber Costa116890d2008-04-08 13:20:54 -0300101 if (dma32_bootmem_ptr)
102 dma32_bootmem_size = size;
103 else
104 dma32_bootmem_size = 0;
105}
106static void __init dma32_free_bootmem(void)
107{
Glauber Costa116890d2008-04-08 13:20:54 -0300108
Yinghai Luc987d122008-06-24 22:14:09 -0700109 if (max_pfn <= MAX_DMA32_PFN)
Glauber Costa116890d2008-04-08 13:20:54 -0300110 return;
111
112 if (!dma32_bootmem_ptr)
113 return;
114
Yinghai Lu330fce22008-04-19 01:31:45 -0700115 free_bootmem(__pa(dma32_bootmem_ptr), dma32_bootmem_size);
Glauber Costa116890d2008-04-08 13:20:54 -0300116
117 dma32_bootmem_ptr = NULL;
118 dma32_bootmem_size = 0;
119}
Yinghai Luc252a5b2010-02-10 01:20:19 -0800120#else
121void __init dma32_reserve_bootmem(void)
122{
123}
124static void __init dma32_free_bootmem(void)
125{
126}
127
Jeremy Fitzhardingecfb80c92008-12-16 12:17:36 -0800128#endif
Glauber Costa116890d2008-04-08 13:20:54 -0300129
130void __init pci_iommu_alloc(void)
131{
132 /* free the range so iommu could get some range less than 4G */
133 dma32_free_bootmem();
Yinghai Luc252a5b2010-02-10 01:20:19 -0800134
FUJITA Tomonori186a2502009-12-15 20:47:56 +0900135 if (pci_swiotlb_detect())
136 goto out;
Jeremy Fitzhardingecfb80c92008-12-16 12:17:36 -0800137
Glauber Costa116890d2008-04-08 13:20:54 -0300138 gart_iommu_hole_init();
Glauber Costa116890d2008-04-08 13:20:54 -0300139
Glauber Costa116890d2008-04-08 13:20:54 -0300140 detect_calgary();
Glauber Costa116890d2008-04-08 13:20:54 -0300141
142 detect_intel_iommu();
143
FUJITA Tomonori75f1cdf2009-11-10 19:46:20 +0900144 /* needs to be called after gart_iommu_hole_init */
Joerg Roedela69ca342008-06-26 21:28:08 +0200145 amd_iommu_detect();
FUJITA Tomonori186a2502009-12-15 20:47:56 +0900146out:
147 pci_swiotlb_init();
Glauber Costa116890d2008-04-08 13:20:54 -0300148}
FUJITA Tomonori8978b742008-07-29 13:38:53 +0900149
FUJITA Tomonori9f6ac572008-09-24 20:48:35 +0900150void *dma_generic_alloc_coherent(struct device *dev, size_t size,
151 dma_addr_t *dma_addr, gfp_t flag)
152{
153 unsigned long dma_mask;
154 struct page *page;
155 dma_addr_t addr;
156
157 dma_mask = dma_alloc_coherent_mask(dev, flag);
158
159 flag |= __GFP_ZERO;
160again:
161 page = alloc_pages_node(dev_to_node(dev), flag, get_order(size));
162 if (!page)
163 return NULL;
164
165 addr = page_to_phys(page);
FUJITA Tomonoria4c2baa2009-07-10 10:04:55 +0900166 if (addr + size > dma_mask) {
FUJITA Tomonori9f6ac572008-09-24 20:48:35 +0900167 __free_pages(page, get_order(size));
168
Yang Hongyang284901a2009-04-06 19:01:15 -0700169 if (dma_mask < DMA_BIT_MASK(32) && !(flag & GFP_DMA)) {
FUJITA Tomonori9f6ac572008-09-24 20:48:35 +0900170 flag = (flag & ~GFP_DMA32) | GFP_DMA;
171 goto again;
172 }
173
174 return NULL;
175 }
176
177 *dma_addr = addr;
178 return page_address(page);
179}
180
Glauber Costafae9a0d2008-04-08 13:20:56 -0300181/*
182 * See <Documentation/x86_64/boot-options.txt> for the iommu kernel parameter
183 * documentation.
184 */
185static __init int iommu_setup(char *p)
186{
187 iommu_merge = 1;
188
189 if (!p)
190 return -EINVAL;
191
192 while (*p) {
193 if (!strncmp(p, "off", 3))
194 no_iommu = 1;
195 /* gart_parse_options has more force support */
196 if (!strncmp(p, "force", 5))
197 force_iommu = 1;
198 if (!strncmp(p, "noforce", 7)) {
199 iommu_merge = 0;
200 force_iommu = 0;
201 }
202
203 if (!strncmp(p, "biomerge", 8)) {
Glauber Costafae9a0d2008-04-08 13:20:56 -0300204 iommu_merge = 1;
205 force_iommu = 1;
206 }
207 if (!strncmp(p, "panic", 5))
208 panic_on_overflow = 1;
209 if (!strncmp(p, "nopanic", 7))
210 panic_on_overflow = 0;
211 if (!strncmp(p, "merge", 5)) {
212 iommu_merge = 1;
213 force_iommu = 1;
214 }
215 if (!strncmp(p, "nomerge", 7))
216 iommu_merge = 0;
217 if (!strncmp(p, "forcesac", 8))
218 iommu_sac_force = 1;
219 if (!strncmp(p, "allowdac", 8))
220 forbid_dac = 0;
221 if (!strncmp(p, "nodac", 5))
Tejun Heo2ae8bb72009-10-26 15:41:46 +0100222 forbid_dac = 1;
Glauber Costafae9a0d2008-04-08 13:20:56 -0300223 if (!strncmp(p, "usedac", 6)) {
224 forbid_dac = -1;
225 return 1;
226 }
227#ifdef CONFIG_SWIOTLB
228 if (!strncmp(p, "soft", 4))
229 swiotlb = 1;
David Woodhouse3238c0c2009-07-01 18:56:16 +0100230#endif
Alex Williamson80286872009-07-30 16:15:18 -0600231 if (!strncmp(p, "pt", 2))
Fenghua Yu4ed0d3e2009-04-24 17:30:20 -0700232 iommu_pass_through = 1;
Glauber Costafae9a0d2008-04-08 13:20:56 -0300233
Glauber Costafae9a0d2008-04-08 13:20:56 -0300234 gart_parse_options(p);
Glauber Costafae9a0d2008-04-08 13:20:56 -0300235
236#ifdef CONFIG_CALGARY_IOMMU
237 if (!strncmp(p, "calgary", 7))
238 use_calgary = 1;
239#endif /* CONFIG_CALGARY_IOMMU */
240
241 p += strcspn(p, ",");
242 if (*p == ',')
243 ++p;
244 }
245 return 0;
246}
247early_param("iommu", iommu_setup);
248
Glauber Costa8e0c3792008-04-08 13:20:55 -0300249int dma_supported(struct device *dev, u64 mask)
250{
FUJITA Tomonori160c1d82009-01-05 23:59:02 +0900251 struct dma_map_ops *ops = get_dma_ops(dev);
FUJITA Tomonori8d8bb392008-07-25 19:44:49 -0700252
Glauber Costa8e0c3792008-04-08 13:20:55 -0300253#ifdef CONFIG_PCI
254 if (mask > 0xffffffff && forbid_dac > 0) {
Greg Kroah-Hartmanfc3a8822008-05-02 06:02:41 +0200255 dev_info(dev, "PCI: Disallowing DAC for device\n");
Glauber Costa8e0c3792008-04-08 13:20:55 -0300256 return 0;
257 }
258#endif
259
FUJITA Tomonori8d8bb392008-07-25 19:44:49 -0700260 if (ops->dma_supported)
261 return ops->dma_supported(dev, mask);
Glauber Costa8e0c3792008-04-08 13:20:55 -0300262
263 /* Copied from i386. Doesn't make much sense, because it will
264 only work for pci_alloc_coherent.
265 The caller just has to use GFP_DMA in this case. */
Yang Hongyang2f4f27d2009-04-06 19:01:18 -0700266 if (mask < DMA_BIT_MASK(24))
Glauber Costa8e0c3792008-04-08 13:20:55 -0300267 return 0;
268
269 /* Tell the device to use SAC when IOMMU force is on. This
270 allows the driver to use cheaper accesses in some cases.
271
272 Problem with this is that if we overflow the IOMMU area and
273 return DAC as fallback address the device may not handle it
274 correctly.
275
276 As a special case some controllers have a 39bit address
277 mode that is as efficient as 32bit (aic79xx). Don't force
278 SAC for these. Assume all masks <= 40 bits are of this
279 type. Normally this doesn't make any difference, but gives
280 more gentle handling of IOMMU overflow. */
Yang Hongyang50cf1562009-04-06 19:01:14 -0700281 if (iommu_sac_force && (mask >= DMA_BIT_MASK(40))) {
Greg Kroah-Hartmanfc3a8822008-05-02 06:02:41 +0200282 dev_info(dev, "Force SAC with mask %Lx\n", mask);
Glauber Costa8e0c3792008-04-08 13:20:55 -0300283 return 0;
284 }
285
286 return 1;
287}
288EXPORT_SYMBOL(dma_supported);
289
Glauber Costacb5867a2008-04-08 13:20:51 -0300290static int __init pci_iommu_init(void)
291{
Joerg Roedel2118d0c2009-01-09 15:13:15 +0100292 dma_debug_init(PREALLOC_DMA_DEBUG_ENTRIES);
293
Joerg Roedel86f31952009-03-16 17:50:28 +0100294#ifdef CONFIG_PCI
295 dma_debug_add_bus(&pci_bus_type);
296#endif
FUJITA Tomonorid07c1be2009-11-10 19:46:12 +0900297 x86_init.iommu.iommu_init();
298
FUJITA Tomonori75f1cdf2009-11-10 19:46:20 +0900299 if (swiotlb) {
300 printk(KERN_INFO "PCI-DMA: "
301 "Using software bounce buffering for IO (SWIOTLB)\n");
302 swiotlb_print_info();
303 } else
304 swiotlb_free();
305
Glauber Costacb5867a2008-04-08 13:20:51 -0300306 return 0;
307}
Glauber Costacb5867a2008-04-08 13:20:51 -0300308/* Must execute after PCI subsystem */
David Woodhouse9a821b22009-10-12 12:59:29 +0100309rootfs_initcall(pci_iommu_init);
Fenghua Yu3b15e582008-10-23 16:51:00 -0700310
#ifdef CONFIG_PCI
/*
 * Many VIA bridges seem to corrupt data for DAC. Disable it here.
 *
 * The quirk only acts while forbid_dac is still 0, so an explicit
 * "iommu=" DAC setting that changed the flag is left alone.
 */
static __devinit void via_no_dac(struct pci_dev *dev)
{
	if (forbid_dac != 0)
		return;

	if ((dev->class >> 8) != PCI_CLASS_BRIDGE_PCI)
		return;

	dev_info(&dev->dev, "disabling DAC on VIA PCI bridge\n");
	forbid_dac = 1;
}
DECLARE_PCI_FIXUP_FINAL(PCI_VENDOR_ID_VIA, PCI_ANY_ID, via_no_dac);
#endif