blob: 1c8a25db24d2d2e2dc0c7fddec9b316a8873c971 [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
Russell King0ddbccd2008-09-25 15:59:19 +01002 * linux/arch/arm/mm/dma-mapping.c
Linus Torvalds1da177e2005-04-16 15:20:36 -07003 *
4 * Copyright (C) 2000-2004 Russell King
5 *
6 * This program is free software; you can redistribute it and/or modify
7 * it under the terms of the GNU General Public License version 2 as
8 * published by the Free Software Foundation.
9 *
10 * DMA uncached mapping support.
11 */
12#include <linux/module.h>
13#include <linux/mm.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090014#include <linux/gfp.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070015#include <linux/errno.h>
16#include <linux/list.h>
17#include <linux/init.h>
18#include <linux/device.h>
19#include <linux/dma-mapping.h>
Marek Szyprowskid4398df2011-12-29 13:09:51 +010020#include <linux/dma-contiguous.h>
Nicolas Pitre39af22a2010-12-15 15:14:45 -050021#include <linux/highmem.h>
Marek Szyprowskid4398df2011-12-29 13:09:51 +010022#include <linux/memblock.h>
Jon Medhurst99d17172011-08-02 17:28:27 +010023#include <linux/slab.h>
Marek Szyprowskibebe3ac2012-05-16 15:48:21 +020024#include <linux/iommu.h>
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +020025#include <linux/io.h>
Marek Szyprowskibebe3ac2012-05-16 15:48:21 +020026#include <linux/vmalloc.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070027
Lennert Buytenhek23759dc2006-04-02 00:07:39 +010028#include <asm/memory.h>
Nicolas Pitre43377452009-03-12 22:52:09 -040029#include <asm/highmem.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070030#include <asm/cacheflush.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070031#include <asm/tlbflush.h>
Kevin Hilman37134cd2006-01-12 16:12:21 +000032#include <asm/sizes.h>
Jon Medhurst99d17172011-08-02 17:28:27 +010033#include <asm/mach/arch.h>
Marek Szyprowskid4398df2011-12-29 13:09:51 +010034#include <asm/mach/map.h>
35#include <asm/system_info.h>
36#include <asm/dma-contiguous.h>
Marek Szyprowskibebe3ac2012-05-16 15:48:21 +020037#include <asm/dma-iommu.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070038
Russell King022ae532011-07-08 21:26:59 +010039#include "mm.h"
40
Marek Szyprowski75cd6512012-02-10 19:55:20 +010041/*
42 * The DMA API is built upon the notion of "buffer ownership". A buffer
43 * is either exclusively owned by the CPU (and therefore may be accessed
44 * by it) or exclusively owned by the DMA device. These helper functions
45 * represent the transitions between these two ownership states.
46 *
47 * Note, however, that on later ARMs, this notion does not work due to
48 * speculative prefetches. We model our approach on the assumption that
49 * the CPU does do speculative prefetches, which means we clean caches
50 * before transfers and delay cache invalidation until transfer completion.
51 *
Marek Szyprowski75cd6512012-02-10 19:55:20 +010052 */
Marek Szyprowskiabe2a2f2012-02-10 19:55:20 +010053static void __dma_page_cpu_to_dev(struct page *, unsigned long,
Marek Szyprowski75cd6512012-02-10 19:55:20 +010054 size_t, enum dma_data_direction);
Marek Szyprowskiabe2a2f2012-02-10 19:55:20 +010055static void __dma_page_dev_to_cpu(struct page *, unsigned long,
Marek Szyprowski75cd6512012-02-10 19:55:20 +010056 size_t, enum dma_data_direction);
57
Marek Szyprowskif6fe2822012-02-10 19:55:20 +010058/**
59 * arm_dma_map_page - map a portion of a page for streaming DMA
60 * @dev: valid struct device pointer, or NULL for ISA and EISA-like devices
61 * @page: page that buffer resides in
62 * @offset: offset into page for start of buffer
63 * @size: size of buffer to map
64 * @dir: DMA transfer direction
65 *
66 * Ensure that any data held in the cache is appropriately discarded
67 * or written back.
68 *
69 * The device owns this memory once this call has completed. The CPU
70 * can regain ownership by calling dma_unmap_page().
71 */
Marek Szyprowskiabe2a2f2012-02-10 19:55:20 +010072static dma_addr_t arm_dma_map_page(struct device *dev, struct page *page,
Marek Szyprowskif6fe2822012-02-10 19:55:20 +010073 unsigned long offset, size_t size, enum dma_data_direction dir,
74 struct dma_attrs *attrs)
75{
Marek Szyprowskiabe2a2f2012-02-10 19:55:20 +010076 if (!arch_is_coherent())
77 __dma_page_cpu_to_dev(page, offset, size, dir);
78 return pfn_to_dma(dev, page_to_pfn(page)) + offset;
Marek Szyprowskif6fe2822012-02-10 19:55:20 +010079}
80
81/**
82 * arm_dma_unmap_page - unmap a buffer previously mapped through dma_map_page()
83 * @dev: valid struct device pointer, or NULL for ISA and EISA-like devices
84 * @handle: DMA address of buffer
85 * @size: size of buffer (same as passed to dma_map_page)
86 * @dir: DMA transfer direction (same as passed to dma_map_page)
87 *
88 * Unmap a page streaming mode DMA translation. The handle and size
89 * must match what was provided in the previous dma_map_page() call.
90 * All other usages are undefined.
91 *
92 * After this call, reads by the CPU to the buffer are guaranteed to see
93 * whatever the device wrote there.
94 */
Marek Szyprowskiabe2a2f2012-02-10 19:55:20 +010095static void arm_dma_unmap_page(struct device *dev, dma_addr_t handle,
Marek Szyprowskif6fe2822012-02-10 19:55:20 +010096 size_t size, enum dma_data_direction dir,
97 struct dma_attrs *attrs)
98{
Marek Szyprowskiabe2a2f2012-02-10 19:55:20 +010099 if (!arch_is_coherent())
100 __dma_page_dev_to_cpu(pfn_to_page(dma_to_pfn(dev, handle)),
101 handle & ~PAGE_MASK, size, dir);
Marek Szyprowskif6fe2822012-02-10 19:55:20 +0100102}
103
Marek Szyprowskiabe2a2f2012-02-10 19:55:20 +0100104static void arm_dma_sync_single_for_cpu(struct device *dev,
Marek Szyprowskif6fe2822012-02-10 19:55:20 +0100105 dma_addr_t handle, size_t size, enum dma_data_direction dir)
106{
107 unsigned int offset = handle & (PAGE_SIZE - 1);
108 struct page *page = pfn_to_page(dma_to_pfn(dev, handle-offset));
Marek Szyprowskiabe2a2f2012-02-10 19:55:20 +0100109 if (!arch_is_coherent())
110 __dma_page_dev_to_cpu(page, offset, size, dir);
Marek Szyprowskif6fe2822012-02-10 19:55:20 +0100111}
112
Marek Szyprowskiabe2a2f2012-02-10 19:55:20 +0100113static void arm_dma_sync_single_for_device(struct device *dev,
Marek Szyprowskif6fe2822012-02-10 19:55:20 +0100114 dma_addr_t handle, size_t size, enum dma_data_direction dir)
115{
116 unsigned int offset = handle & (PAGE_SIZE - 1);
117 struct page *page = pfn_to_page(dma_to_pfn(dev, handle-offset));
Marek Szyprowskiabe2a2f2012-02-10 19:55:20 +0100118 if (!arch_is_coherent())
119 __dma_page_cpu_to_dev(page, offset, size, dir);
Marek Szyprowskif6fe2822012-02-10 19:55:20 +0100120}
121
122static int arm_dma_set_mask(struct device *dev, u64 dma_mask);
123
124struct dma_map_ops arm_dma_ops = {
Marek Szyprowskia93786a2012-05-16 18:31:23 +0200125 .alloc = arm_dma_alloc,
126 .free = arm_dma_free,
127 .mmap = arm_dma_mmap,
Marek Szyprowskif6fe2822012-02-10 19:55:20 +0100128 .map_page = arm_dma_map_page,
129 .unmap_page = arm_dma_unmap_page,
130 .map_sg = arm_dma_map_sg,
131 .unmap_sg = arm_dma_unmap_sg,
132 .sync_single_for_cpu = arm_dma_sync_single_for_cpu,
133 .sync_single_for_device = arm_dma_sync_single_for_device,
134 .sync_sg_for_cpu = arm_dma_sync_sg_for_cpu,
135 .sync_sg_for_device = arm_dma_sync_sg_for_device,
136 .set_dma_mask = arm_dma_set_mask,
137};
138EXPORT_SYMBOL(arm_dma_ops);
139
Catalin Marinasab6494f2009-07-24 12:35:02 +0100140static u64 get_coherent_dma_mask(struct device *dev)
141{
Russell King022ae532011-07-08 21:26:59 +0100142 u64 mask = (u64)arm_dma_limit;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700143
Catalin Marinasab6494f2009-07-24 12:35:02 +0100144 if (dev) {
145 mask = dev->coherent_dma_mask;
146
147 /*
148 * Sanity check the DMA mask - it must be non-zero, and
149 * must be able to be satisfied by a DMA allocation.
150 */
151 if (mask == 0) {
152 dev_warn(dev, "coherent DMA mask is unset\n");
153 return 0;
154 }
155
Russell King022ae532011-07-08 21:26:59 +0100156 if ((~mask) & (u64)arm_dma_limit) {
Catalin Marinasab6494f2009-07-24 12:35:02 +0100157 dev_warn(dev, "coherent DMA mask %#llx is smaller "
158 "than system GFP_DMA mask %#llx\n",
Russell King022ae532011-07-08 21:26:59 +0100159 mask, (u64)arm_dma_limit);
Catalin Marinasab6494f2009-07-24 12:35:02 +0100160 return 0;
161 }
162 }
163
164 return mask;
165}
166
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100167static void __dma_clear_buffer(struct page *page, size_t size)
168{
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100169 /*
170 * Ensure that the allocated pages are zeroed, and that any data
171 * lurking in the kernel direct-mapped region is invalidated.
172 */
Marek Szyprowski44d60d62013-01-16 16:31:22 +0100173 if (!PageHighMem(page)) {
174 void *ptr = page_address(page);
175 if (ptr) {
176 memset(ptr, 0, size);
177 dmac_flush_range(ptr, ptr + size);
178 outer_flush_range(__pa(ptr), __pa(ptr) + size);
179 }
180 } else {
181 phys_addr_t base = __pfn_to_phys(page_to_pfn(page));
182 phys_addr_t end = base + size;
183 while (size > 0) {
184 void *ptr = kmap_atomic(page);
185 memset(ptr, 0, PAGE_SIZE);
186 dmac_flush_range(ptr, ptr + PAGE_SIZE);
187 kunmap_atomic(ptr);
188 page++;
189 size -= PAGE_SIZE;
190 }
191 outer_flush_range(base, end);
Marek Szyprowskibebe3ac2012-05-16 15:48:21 +0200192 }
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100193}
194
Russell King7a9a32a2009-11-19 15:31:07 +0000195/*
196 * Allocate a DMA buffer for 'dev' of size 'size' using the
197 * specified gfp mask. Note that 'size' must be page aligned.
198 */
199static struct page *__dma_alloc_buffer(struct device *dev, size_t size, gfp_t gfp)
200{
201 unsigned long order = get_order(size);
202 struct page *page, *p, *e;
Russell King7a9a32a2009-11-19 15:31:07 +0000203
204 page = alloc_pages(gfp, order);
205 if (!page)
206 return NULL;
207
208 /*
209 * Now split the huge page and free the excess pages
210 */
211 split_page(page, order);
212 for (p = page + (size >> PAGE_SHIFT), e = page + (1 << order); p < e; p++)
213 __free_page(p);
214
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100215 __dma_clear_buffer(page, size);
Russell King7a9a32a2009-11-19 15:31:07 +0000216
217 return page;
218}
219
220/*
221 * Free a DMA buffer. 'size' must be page aligned.
222 */
223static void __dma_free_buffer(struct page *page, size_t size)
224{
225 struct page *e = page + (size >> PAGE_SHIFT);
226
227 while (page < e) {
228 __free_page(page);
229 page++;
230 }
231}
232
Catalin Marinasab6494f2009-07-24 12:35:02 +0100233#ifdef CONFIG_MMU
Linus Torvalds1da177e2005-04-16 15:20:36 -0700234#ifdef CONFIG_HUGETLB_PAGE
235#error ARM Coherent DMA allocator does not (yet) support huge TLB
236#endif
237
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +0200238static void *__alloc_remap_buffer(struct device *dev, size_t size, gfp_t gfp,
239 pgprot_t prot, struct page **ret_page,
240 const void *caller);
241
242static void *
243__dma_alloc_remap(struct page *page, size_t size, gfp_t gfp, pgprot_t prot,
244 const void *caller)
Russell King88c58f32009-11-19 16:46:02 +0000245{
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +0200246 struct vm_struct *area;
247 unsigned long addr;
Jon Medhurst99d17172011-08-02 17:28:27 +0100248
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +0200249 /*
250 * DMA allocation can be mapped to user space, so lets
251 * set VM_USERMAP flags too.
252 */
253 area = get_vm_area_caller(size, VM_ARM_DMA_CONSISTENT | VM_USERMAP,
254 caller);
255 if (!area)
256 return NULL;
257 addr = (unsigned long)area->addr;
258 area->phys_addr = __pfn_to_phys(page_to_pfn(page));
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100259
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +0200260 if (ioremap_page_range(addr, addr + size, area->phys_addr, prot)) {
261 vunmap((void *)addr);
262 return NULL;
Jon Medhurst99d17172011-08-02 17:28:27 +0100263 }
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +0200264 return (void *)addr;
Russell King88c58f32009-11-19 16:46:02 +0000265}
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +0200266
267static void __dma_free_remap(void *cpu_addr, size_t size, bool no_warn)
268{
269 unsigned int flags = VM_ARM_DMA_CONSISTENT | VM_USERMAP;
270 struct vm_struct *area = find_vm_area(cpu_addr);
271 if (!area || (area->flags & flags) != flags) {
272 if (!no_warn)
273 WARN(1, "trying to free invalid coherent area: %p\n",
274 cpu_addr);
275 return;
276 }
277 unmap_kernel_range((unsigned long)cpu_addr, size);
278 vunmap(cpu_addr);
279}
Russell King88c58f32009-11-19 16:46:02 +0000280
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100281static void *__alloc_from_contiguous(struct device *dev, size_t size,
Laura Abbott4f5b9de2012-10-29 13:38:25 -0700282 pgprot_t prot, struct page **ret_page,
Marek Szyprowski44d60d62013-01-16 16:31:22 +0100283 bool no_kernel_mapping, const void *caller);
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100284
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +0200285struct dma_pool {
286 size_t size;
287 spinlock_t lock;
288 unsigned long *bitmap;
289 unsigned long nr_pages;
290 void *vaddr;
291 struct page *page;
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100292};
293
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +0200294static struct dma_pool atomic_pool = {
295 .size = SZ_256K,
296};
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100297
298static int __init early_coherent_pool(char *p)
299{
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +0200300 atomic_pool.size = memparse(p, &p);
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100301 return 0;
302}
303early_param("coherent_pool", early_coherent_pool);
304
305/*
306 * Initialise the coherent pool for atomic allocations.
307 */
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +0200308static int __init atomic_pool_init(void)
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100309{
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +0200310 struct dma_pool *pool = &atomic_pool;
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100311 pgprot_t prot = pgprot_dmacoherent(pgprot_kernel);
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +0200312 unsigned long nr_pages = pool->size >> PAGE_SHIFT;
313 unsigned long *bitmap;
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100314 struct page *page;
315 void *ptr;
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +0200316 int bitmap_size = BITS_TO_LONGS(nr_pages) * sizeof(long);
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100317
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +0200318 bitmap = kzalloc(bitmap_size, GFP_KERNEL);
319 if (!bitmap)
320 goto no_bitmap;
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100321
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +0200322 if (IS_ENABLED(CONFIG_CMA))
323 ptr = __alloc_from_contiguous(NULL, pool->size, prot, &page,
324 false, atomic_pool_init);
325 else
326 ptr = __alloc_remap_buffer(NULL, pool->size, GFP_KERNEL, prot,
327 &page, NULL);
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100328 if (ptr) {
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +0200329 spin_lock_init(&pool->lock);
330 pool->vaddr = ptr;
331 pool->page = page;
332 pool->bitmap = bitmap;
333 pool->nr_pages = nr_pages;
334 pr_info("DMA: preallocated %u KiB pool for atomic coherent allocations\n",
335 (unsigned)pool->size / 1024);
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100336 return 0;
337 }
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +0200338 kfree(bitmap);
339no_bitmap:
340 pr_err("DMA: failed to allocate %u KiB pool for atomic coherent allocation\n",
341 (unsigned)pool->size / 1024);
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100342 return -ENOMEM;
343}
344/*
345 * CMA is activated by core_initcall, so we must be called after it.
346 */
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +0200347postcore_initcall(atomic_pool_init);
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100348
349struct dma_contig_early_reserve {
350 phys_addr_t base;
351 unsigned long size;
352};
353
354static struct dma_contig_early_reserve dma_mmu_remap[MAX_CMA_AREAS] __initdata;
355
356static int dma_mmu_remap_num __initdata;
357
358void __init dma_contiguous_early_fixup(phys_addr_t base, unsigned long size)
359{
360 dma_mmu_remap[dma_mmu_remap_num].base = base;
361 dma_mmu_remap[dma_mmu_remap_num].size = size;
362 dma_mmu_remap_num++;
363}
364
365void __init dma_contiguous_remap(void)
366{
367 int i;
368 for (i = 0; i < dma_mmu_remap_num; i++) {
369 phys_addr_t start = dma_mmu_remap[i].base;
370 phys_addr_t end = start + dma_mmu_remap[i].size;
371 struct map_desc map;
372 unsigned long addr;
373
374 if (end > arm_lowmem_limit)
375 end = arm_lowmem_limit;
376 if (start >= end)
Chris Brand8892fbb2012-08-07 14:01:14 +0200377 continue;
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100378
379 map.pfn = __phys_to_pfn(start);
380 map.virtual = __phys_to_virt(start);
381 map.length = end - start;
382 map.type = MT_MEMORY_DMA_READY;
383
384 /*
385 * Clear previous low-memory mapping
386 */
387 for (addr = __phys_to_virt(start); addr < __phys_to_virt(end);
Vitaly Andrianov808e3032012-05-14 13:49:56 -0400388 addr += PMD_SIZE)
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100389 pmd_clear(pmd_off_k(addr));
390
391 iotable_init(&map, 1);
392 }
393}
394
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100395static int __dma_update_pte(pte_t *pte, pgtable_t token, unsigned long addr,
396 void *data)
397{
398 struct page *page = virt_to_page(addr);
399 pgprot_t prot = *(pgprot_t *)data;
400
401 set_pte_ext(pte, mk_pte(page, prot), 0);
402 return 0;
403}
404
Laura Abbott4f5b9de2012-10-29 13:38:25 -0700405static int __dma_clear_pte(pte_t *pte, pgtable_t token, unsigned long addr,
406 void *data)
407{
408 pte_clear(&init_mm, addr, pte);
409 return 0;
410}
411
412static void __dma_remap(struct page *page, size_t size, pgprot_t prot,
413 bool no_kernel_map)
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100414{
415 unsigned long start = (unsigned long) page_address(page);
416 unsigned end = start + size;
Laura Abbott4f5b9de2012-10-29 13:38:25 -0700417 int (*func)(pte_t *pte, pgtable_t token, unsigned long addr,
418 void *data);
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100419
Laura Abbott4f5b9de2012-10-29 13:38:25 -0700420 if (no_kernel_map)
421 func = __dma_clear_pte;
422 else
423 func = __dma_update_pte;
424
425 apply_to_page_range(&init_mm, start, size, func, &prot);
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100426 dsb();
427 flush_tlb_kernel_range(start, end);
428}
429
430static void *__alloc_remap_buffer(struct device *dev, size_t size, gfp_t gfp,
431 pgprot_t prot, struct page **ret_page,
432 const void *caller)
433{
434 struct page *page;
435 void *ptr;
436 page = __dma_alloc_buffer(dev, size, gfp);
437 if (!page)
438 return NULL;
439
440 ptr = __dma_alloc_remap(page, size, gfp, prot, caller);
441 if (!ptr) {
442 __dma_free_buffer(page, size);
443 return NULL;
444 }
445
446 *ret_page = page;
447 return ptr;
448}
449
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +0200450static void *__alloc_from_pool(size_t size, struct page **ret_page)
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100451{
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +0200452 struct dma_pool *pool = &atomic_pool;
453 unsigned int count = PAGE_ALIGN(size) >> PAGE_SHIFT;
454 unsigned int pageno;
455 unsigned long flags;
456 void *ptr = NULL;
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100457 size_t align;
458
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +0200459 if (!pool->vaddr) {
460 WARN(1, "coherent pool not initialised!\n");
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100461 return NULL;
462 }
463
464 /*
465 * Align the region allocation - allocations from pool are rather
466 * small, so align them to their order in pages, minimum is a page
467 * size. This helps reduce fragmentation of the DMA space.
468 */
469 align = PAGE_SIZE << get_order(size);
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +0200470
471 spin_lock_irqsave(&pool->lock, flags);
472 pageno = bitmap_find_next_zero_area(pool->bitmap, pool->nr_pages,
473 0, count, (1 << align) - 1);
474 if (pageno < pool->nr_pages) {
475 bitmap_set(pool->bitmap, pageno, count);
476 ptr = pool->vaddr + PAGE_SIZE * pageno;
477 *ret_page = pool->page + pageno;
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100478 }
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +0200479 spin_unlock_irqrestore(&pool->lock, flags);
480
481 return ptr;
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100482}
483
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +0200484static int __free_from_pool(void *start, size_t size)
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100485{
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +0200486 struct dma_pool *pool = &atomic_pool;
487 unsigned long pageno, count;
488 unsigned long flags;
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100489
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +0200490 if (start < pool->vaddr || start > pool->vaddr + pool->size)
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100491 return 0;
492
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +0200493 if (start + size > pool->vaddr + pool->size) {
494 WARN(1, "freeing wrong coherent size from pool\n");
495 return 0;
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100496 }
497
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +0200498 pageno = (start - pool->vaddr) >> PAGE_SHIFT;
499 count = size >> PAGE_SHIFT;
500
501 spin_lock_irqsave(&pool->lock, flags);
502 bitmap_clear(pool->bitmap, pageno, count);
503 spin_unlock_irqrestore(&pool->lock, flags);
504
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100505 return 1;
506}
507
Laura Abbott5f06ec82013-01-16 18:23:19 -0800508#define NO_KERNEL_MAPPING_DUMMY 0x2222
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100509static void *__alloc_from_contiguous(struct device *dev, size_t size,
Laura Abbott4f5b9de2012-10-29 13:38:25 -0700510 pgprot_t prot, struct page **ret_page,
Marek Szyprowski44d60d62013-01-16 16:31:22 +0100511 bool no_kernel_mapping,
512 const void *caller)
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100513{
514 unsigned long order = get_order(size);
515 size_t count = size >> PAGE_SHIFT;
516 struct page *page;
Marek Szyprowski44d60d62013-01-16 16:31:22 +0100517 void *ptr;
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100518
519 page = dma_alloc_from_contiguous(dev, count, order);
520 if (!page)
521 return NULL;
522
523 __dma_clear_buffer(page, size);
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100524
Marek Szyprowski44d60d62013-01-16 16:31:22 +0100525 if (!PageHighMem(page)) {
526 __dma_remap(page, size, prot, no_kernel_mapping);
527 ptr = page_address(page);
528 } else {
Laura Abbott5f06ec82013-01-16 18:23:19 -0800529 if (no_kernel_mapping) {
530 /*
531 * Something non-NULL needs to be returned here. Give
532 * back a dummy address that is unmapped to catch
533 * clients trying to use the address incorrectly
534 */
535 ptr = (void *)NO_KERNEL_MAPPING_DUMMY;
536 } else {
537 ptr = __dma_alloc_remap(page, size, GFP_KERNEL, prot,
538 caller);
539 if (!ptr) {
540 dma_release_from_contiguous(dev, page, count);
541 return NULL;
542 }
Marek Szyprowski44d60d62013-01-16 16:31:22 +0100543 }
544 }
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100545 *ret_page = page;
Marek Szyprowski44d60d62013-01-16 16:31:22 +0100546 return ptr;
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100547}
548
549static void __free_from_contiguous(struct device *dev, struct page *page,
Marek Szyprowski44d60d62013-01-16 16:31:22 +0100550 void *cpu_addr, size_t size)
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100551{
Marek Szyprowski44d60d62013-01-16 16:31:22 +0100552 if (!PageHighMem(page))
553 __dma_remap(page, size, pgprot_kernel, false);
554 else
Laura Abbott5f06ec82013-01-16 18:23:19 -0800555 __dma_free_remap(cpu_addr, size, true);
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100556 dma_release_from_contiguous(dev, page, size >> PAGE_SHIFT);
557}
558
Marek Szyprowskia93786a2012-05-16 18:31:23 +0200559static inline pgprot_t __get_dma_pgprot(struct dma_attrs *attrs, pgprot_t prot)
560{
Laura Abbottb2034022012-10-29 11:54:38 -0700561 if (dma_get_attr(DMA_ATTR_WRITE_COMBINE, attrs))
562 prot = pgprot_writecombine(prot);
563 else if (dma_get_attr(DMA_ATTR_STRONGLY_ORDERED, attrs))
564 prot = pgprot_stronglyordered(prot);
565 /* if non-consistent just pass back what was given */
566 else if (!dma_get_attr(DMA_ATTR_NON_CONSISTENT, attrs))
567 prot = pgprot_dmacoherent(prot);
568
Marek Szyprowskia93786a2012-05-16 18:31:23 +0200569 return prot;
570}
571
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100572#define nommu() 0
573
Catalin Marinasab6494f2009-07-24 12:35:02 +0100574#else /* !CONFIG_MMU */
Russell King695ae0a2009-11-19 16:31:39 +0000575
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100576#define nommu() 1
577
578#define __alloc_remap_buffer(dev, size, gfp, prot, ret, c) NULL
579#define __alloc_from_pool(dev, size, ret_page, c) NULL
Laura Abbott4f5b9de2012-10-29 13:38:25 -0700580#define __alloc_from_contiguous(dev, size, prot, ret, w) NULL
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100581#define __free_from_pool(cpu_addr, size) 0
582#define __free_from_contiguous(dev, page, size) do { } while (0)
583#define __dma_free_remap(cpu_addr, size) do { } while (0)
Marek Szyprowskia93786a2012-05-16 18:31:23 +0200584#define __get_dma_pgprot(attrs, prot) __pgprot(0)
Russell King31ebf942009-11-19 21:12:17 +0000585
586#endif /* CONFIG_MMU */
587
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100588static void *__alloc_simple_buffer(struct device *dev, size_t size, gfp_t gfp,
589 struct page **ret_page)
Catalin Marinasab6494f2009-07-24 12:35:02 +0100590{
Russell King04da5692009-11-19 15:54:45 +0000591 struct page *page;
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100592 page = __dma_alloc_buffer(dev, size, gfp);
593 if (!page)
594 return NULL;
595
596 *ret_page = page;
597 return page_address(page);
598}
599
600
601
602static void *__dma_alloc(struct device *dev, size_t size, dma_addr_t *handle,
Laura Abbott4f5b9de2012-10-29 13:38:25 -0700603 gfp_t gfp, pgprot_t prot, const void *caller,
604 bool no_kernel_mapping)
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100605{
606 u64 mask = get_coherent_dma_mask(dev);
607 struct page *page;
Russell King31ebf942009-11-19 21:12:17 +0000608 void *addr;
Catalin Marinasab6494f2009-07-24 12:35:02 +0100609
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100610#ifdef CONFIG_DMA_API_DEBUG
611 u64 limit = (mask + 1) & ~mask;
612 if (limit && size >= limit) {
613 dev_warn(dev, "coherent allocation too big (requested %#x mask %#llx)\n",
614 size, mask);
615 return NULL;
616 }
617#endif
618
619 if (!mask)
620 return NULL;
621
622 if (mask < 0xffffffffULL)
623 gfp |= GFP_DMA;
624
Sumit Bhattacharyaea2e7052011-11-24 00:47:12 +0100625 /*
626 * Following is a work-around (a.k.a. hack) to prevent pages
627 * with __GFP_COMP being passed to split_page() which cannot
628 * handle them. The real problem is that this flag probably
629 * should be 0 on ARM as it is not supported on this
630 * platform; see CONFIG_HUGETLBFS.
631 */
632 gfp &= ~(__GFP_COMP);
633
Marek Szyprowski1dc8f002012-02-29 14:45:28 +0100634 *handle = DMA_ERROR_CODE;
Russell King04da5692009-11-19 15:54:45 +0000635 size = PAGE_ALIGN(size);
636
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100637 if (arch_is_coherent() || nommu())
638 addr = __alloc_simple_buffer(dev, size, gfp, &page);
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +0200639 else if (gfp & GFP_ATOMIC)
640 addr = __alloc_from_pool(size, &page);
Marek Szyprowski5ee6b062012-05-30 10:48:29 +0200641 else if (!IS_ENABLED(CONFIG_CMA))
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100642 addr = __alloc_remap_buffer(dev, size, gfp, prot, &page, caller);
Russell King31ebf942009-11-19 21:12:17 +0000643 else
Laura Abbott4f5b9de2012-10-29 13:38:25 -0700644 addr = __alloc_from_contiguous(dev, size, prot, &page,
Marek Szyprowski44d60d62013-01-16 16:31:22 +0100645 no_kernel_mapping, caller);
Russell King31ebf942009-11-19 21:12:17 +0000646
647 if (addr)
Russell King9eedd962011-01-03 00:00:17 +0000648 *handle = pfn_to_dma(dev, page_to_pfn(page));
Russell King31ebf942009-11-19 21:12:17 +0000649
650 return addr;
Catalin Marinasab6494f2009-07-24 12:35:02 +0100651}
Russell King695ae0a2009-11-19 16:31:39 +0000652
Linus Torvalds1da177e2005-04-16 15:20:36 -0700653/*
654 * Allocate DMA-coherent memory space and return both the kernel remapped
655 * virtual and bus address for that space.
656 */
Marek Szyprowskia93786a2012-05-16 18:31:23 +0200657void *arm_dma_alloc(struct device *dev, size_t size, dma_addr_t *handle,
658 gfp_t gfp, struct dma_attrs *attrs)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700659{
Marek Szyprowskia93786a2012-05-16 18:31:23 +0200660 pgprot_t prot = __get_dma_pgprot(attrs, pgprot_kernel);
Dmitry Baryshkov1fe53262008-07-18 13:30:14 +0400661 void *memory;
Laura Abbott4f5b9de2012-10-29 13:38:25 -0700662 bool no_kernel_mapping = dma_get_attr(DMA_ATTR_NO_KERNEL_MAPPING,
663 attrs);
Dmitry Baryshkov1fe53262008-07-18 13:30:14 +0400664
665 if (dma_alloc_from_coherent(dev, size, handle, &memory))
666 return memory;
667
Marek Szyprowskia93786a2012-05-16 18:31:23 +0200668 return __dma_alloc(dev, size, handle, gfp, prot,
Laura Abbott4f5b9de2012-10-29 13:38:25 -0700669 __builtin_return_address(0), no_kernel_mapping);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700670}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700671
672/*
Marek Szyprowskia93786a2012-05-16 18:31:23 +0200673 * Create userspace mapping for the DMA-coherent memory.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700674 */
Marek Szyprowskia93786a2012-05-16 18:31:23 +0200675int arm_dma_mmap(struct device *dev, struct vm_area_struct *vma,
676 void *cpu_addr, dma_addr_t dma_addr, size_t size,
677 struct dma_attrs *attrs)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700678{
Catalin Marinasab6494f2009-07-24 12:35:02 +0100679 int ret = -ENXIO;
680#ifdef CONFIG_MMU
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100681 unsigned long pfn = dma_to_pfn(dev, dma_addr);
Marek Szyprowskia93786a2012-05-16 18:31:23 +0200682 vma->vm_page_prot = __get_dma_pgprot(attrs, vma->vm_page_prot);
Marek Szyprowskif504f8e2012-05-15 19:04:13 +0200683
684 if (dma_mmap_from_coherent(dev, vma, cpu_addr, size, &ret))
685 return ret;
686
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100687 ret = remap_pfn_range(vma, vma->vm_start,
688 pfn + vma->vm_pgoff,
689 vma->vm_end - vma->vm_start,
690 vma->vm_page_prot);
Catalin Marinasab6494f2009-07-24 12:35:02 +0100691#endif /* CONFIG_MMU */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700692
693 return ret;
694}
695
Linus Torvalds1da177e2005-04-16 15:20:36 -0700696/*
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100697 * Free a buffer as defined by the above mapping.
Linus Torvalds1da177e2005-04-16 15:20:36 -0700698 */
Marek Szyprowskia93786a2012-05-16 18:31:23 +0200699void arm_dma_free(struct device *dev, size_t size, void *cpu_addr,
700 dma_addr_t handle, struct dma_attrs *attrs)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700701{
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100702 struct page *page = pfn_to_page(dma_to_pfn(dev, handle));
Russell King5edf71a2005-11-25 15:52:51 +0000703
Dmitry Baryshkov1fe53262008-07-18 13:30:14 +0400704 if (dma_release_from_coherent(dev, get_order(size), cpu_addr))
705 return;
706
Russell King3e82d012009-11-19 15:38:12 +0000707 size = PAGE_ALIGN(size);
708
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100709 if (arch_is_coherent() || nommu()) {
710 __dma_free_buffer(page, size);
Aaro Koskinen39b0f202012-08-07 14:44:05 +0200711 } else if (__free_from_pool(cpu_addr, size)) {
712 return;
Marek Szyprowski5ee6b062012-05-30 10:48:29 +0200713 } else if (!IS_ENABLED(CONFIG_CMA)) {
Laura Abbott5f06ec82013-01-16 18:23:19 -0800714 __dma_free_remap(cpu_addr, size, false);
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100715 __dma_free_buffer(page, size);
716 } else {
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100717 /*
718 * Non-atomic allocations cannot be freed with IRQs disabled
719 */
720 WARN_ON(irqs_disabled());
Marek Szyprowski44d60d62013-01-16 16:31:22 +0100721 __free_from_contiguous(dev, page, cpu_addr, size);
Marek Szyprowskid4398df2011-12-29 13:09:51 +0100722 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700723}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700724
Russell King65af1912009-11-24 17:53:33 +0000725static void dma_cache_maint_page(struct page *page, unsigned long offset,
Russell Kinga9c91472009-11-26 16:19:58 +0000726 size_t size, enum dma_data_direction dir,
727 void (*op)(const void *, size_t, int))
Russell King65af1912009-11-24 17:53:33 +0000728{
Russell Kinge4e9dc82013-01-19 11:05:57 +0000729 unsigned long pfn;
730 size_t left = size;
731
732 pfn = page_to_pfn(page) + offset / PAGE_SIZE;
733 offset %= PAGE_SIZE;
734
Russell King65af1912009-11-24 17:53:33 +0000735 /*
736 * A single sg entry may refer to multiple physically contiguous
737 * pages. But we still need to process highmem pages individually.
738 * If highmem is not configured then the bulk of this loop gets
739 * optimized out.
740 */
Russell King65af1912009-11-24 17:53:33 +0000741 do {
742 size_t len = left;
Russell King93f1d622009-11-24 14:41:01 +0000743 void *vaddr;
744
Russell Kinge4e9dc82013-01-19 11:05:57 +0000745 page = pfn_to_page(pfn);
746
Russell King93f1d622009-11-24 14:41:01 +0000747 if (PageHighMem(page)) {
Russell Kinge4e9dc82013-01-19 11:05:57 +0000748 if (len + offset > PAGE_SIZE)
Russell King93f1d622009-11-24 14:41:01 +0000749 len = PAGE_SIZE - offset;
Russell King93f1d622009-11-24 14:41:01 +0000750 vaddr = kmap_high_get(page);
751 if (vaddr) {
752 vaddr += offset;
Russell Kinga9c91472009-11-26 16:19:58 +0000753 op(vaddr, len, dir);
Russell King93f1d622009-11-24 14:41:01 +0000754 kunmap_high(page);
Nicolas Pitre7e5a69e2010-03-29 21:46:02 +0100755 } else if (cache_is_vipt()) {
Nicolas Pitre39af22a2010-12-15 15:14:45 -0500756 /* unmapped pages might still be cached */
757 vaddr = kmap_atomic(page);
Nicolas Pitre7e5a69e2010-03-29 21:46:02 +0100758 op(vaddr + offset, len, dir);
Nicolas Pitre39af22a2010-12-15 15:14:45 -0500759 kunmap_atomic(vaddr);
Russell King93f1d622009-11-24 14:41:01 +0000760 }
761 } else {
762 vaddr = page_address(page) + offset;
Russell Kinga9c91472009-11-26 16:19:58 +0000763 op(vaddr, len, dir);
Russell King65af1912009-11-24 17:53:33 +0000764 }
Russell King65af1912009-11-24 17:53:33 +0000765 offset = 0;
Russell Kinge4e9dc82013-01-19 11:05:57 +0000766 pfn++;
Russell King65af1912009-11-24 17:53:33 +0000767 left -= len;
768 } while (left);
769}
770
Marek Szyprowskiabe2a2f2012-02-10 19:55:20 +0100771/*
772 * Make an area consistent for devices.
773 * Note: Drivers should NOT use this function directly, as it will break
774 * platforms with CONFIG_DMABOUNCE.
775 * Use the driver DMA support - see dma-mapping.h (dma_sync_*)
776 */
777static void __dma_page_cpu_to_dev(struct page *page, unsigned long off,
Russell King65af1912009-11-24 17:53:33 +0000778 size_t size, enum dma_data_direction dir)
779{
Nicolas Pitre43377452009-03-12 22:52:09 -0400780 unsigned long paddr;
Nicolas Pitre43377452009-03-12 22:52:09 -0400781
Russell Kinga9c91472009-11-26 16:19:58 +0000782 dma_cache_maint_page(page, off, size, dir, dmac_map_area);
Nicolas Pitre43377452009-03-12 22:52:09 -0400783
Russell King65af1912009-11-24 17:53:33 +0000784 paddr = page_to_phys(page) + off;
Russell King2ffe2da2009-10-31 16:52:16 +0000785 if (dir == DMA_FROM_DEVICE) {
786 outer_inv_range(paddr, paddr + size);
787 } else {
788 outer_clean_range(paddr, paddr + size);
789 }
790 /* FIXME: non-speculating: flush on bidirectional mappings? */
Nicolas Pitre43377452009-03-12 22:52:09 -0400791}
Russell King4ea0d732009-11-24 16:27:17 +0000792
Marek Szyprowskiabe2a2f2012-02-10 19:55:20 +0100793static void __dma_page_dev_to_cpu(struct page *page, unsigned long off,
Russell King4ea0d732009-11-24 16:27:17 +0000794 size_t size, enum dma_data_direction dir)
795{
Russell King2ffe2da2009-10-31 16:52:16 +0000796 unsigned long paddr = page_to_phys(page) + off;
797
798 /* FIXME: non-speculating: not required */
799 /* don't bother invalidating if DMA to device */
800 if (dir != DMA_TO_DEVICE)
801 outer_inv_range(paddr, paddr + size);
802
Russell Kinga9c91472009-11-26 16:19:58 +0000803 dma_cache_maint_page(page, off, size, dir, dmac_unmap_area);
Catalin Marinasc0177802010-09-13 15:57:36 +0100804
805 /*
806 * Mark the D-cache clean for this page to avoid extra flushing.
807 */
808 if (dir != DMA_TO_DEVICE && off == 0 && size >= PAGE_SIZE)
809 set_bit(PG_dcache_clean, &page->flags);
Russell King4ea0d732009-11-24 16:27:17 +0000810}
Nicolas Pitre43377452009-03-12 22:52:09 -0400811
Russell Kingafd1a322008-09-25 16:30:57 +0100812/**
Marek Szyprowski253a1402012-02-10 19:55:20 +0100813 * arm_dma_map_sg - map a set of SG buffers for streaming mode DMA
Russell Kingafd1a322008-09-25 16:30:57 +0100814 * @dev: valid struct device pointer, or NULL for ISA and EISA-like devices
815 * @sg: list of buffers
816 * @nents: number of buffers to map
817 * @dir: DMA transfer direction
818 *
819 * Map a set of buffers described by scatterlist in streaming mode for DMA.
820 * This is the scatter-gather version of the dma_map_single interface.
821 * Here the scatter gather list elements are each tagged with the
822 * appropriate dma address and length. They are obtained via
823 * sg_dma_{address,length}.
824 *
825 * Device ownership issues as mentioned for dma_map_single are the same
826 * here.
827 */
Marek Szyprowskif6fe2822012-02-10 19:55:20 +0100828int arm_dma_map_sg(struct device *dev, struct scatterlist *sg, int nents,
829 enum dma_data_direction dir, struct dma_attrs *attrs)
Russell Kingafd1a322008-09-25 16:30:57 +0100830{
Marek Szyprowski253a1402012-02-10 19:55:20 +0100831 struct dma_map_ops *ops = get_dma_ops(dev);
Russell Kingafd1a322008-09-25 16:30:57 +0100832 struct scatterlist *s;
Russell King01135d92008-09-25 21:05:02 +0100833 int i, j;
Russell Kingafd1a322008-09-25 16:30:57 +0100834
835 for_each_sg(sg, s, nents, i) {
Marek Szyprowskibebe3ac2012-05-16 15:48:21 +0200836#ifdef CONFIG_NEED_SG_DMA_LENGTH
837 s->dma_length = s->length;
838#endif
Marek Szyprowski253a1402012-02-10 19:55:20 +0100839 s->dma_address = ops->map_page(dev, sg_page(s), s->offset,
840 s->length, dir, attrs);
Russell King01135d92008-09-25 21:05:02 +0100841 if (dma_mapping_error(dev, s->dma_address))
842 goto bad_mapping;
Russell Kingafd1a322008-09-25 16:30:57 +0100843 }
Russell Kingafd1a322008-09-25 16:30:57 +0100844 return nents;
Russell King01135d92008-09-25 21:05:02 +0100845
846 bad_mapping:
847 for_each_sg(sg, s, i, j)
Marek Szyprowski253a1402012-02-10 19:55:20 +0100848 ops->unmap_page(dev, sg_dma_address(s), sg_dma_len(s), dir, attrs);
Russell King01135d92008-09-25 21:05:02 +0100849 return 0;
Russell Kingafd1a322008-09-25 16:30:57 +0100850}
Russell Kingafd1a322008-09-25 16:30:57 +0100851
852/**
Marek Szyprowski253a1402012-02-10 19:55:20 +0100853 * arm_dma_unmap_sg - unmap a set of SG buffers mapped by dma_map_sg
Russell Kingafd1a322008-09-25 16:30:57 +0100854 * @dev: valid struct device pointer, or NULL for ISA and EISA-like devices
855 * @sg: list of buffers
Linus Walleij0adfca62011-01-12 18:50:37 +0100856 * @nents: number of buffers to unmap (same as was passed to dma_map_sg)
Russell Kingafd1a322008-09-25 16:30:57 +0100857 * @dir: DMA transfer direction (same as was passed to dma_map_sg)
858 *
859 * Unmap a set of streaming mode DMA translations. Again, CPU access
860 * rules concerning calls here are the same as for dma_unmap_single().
861 */
Marek Szyprowskif6fe2822012-02-10 19:55:20 +0100862void arm_dma_unmap_sg(struct device *dev, struct scatterlist *sg, int nents,
863 enum dma_data_direction dir, struct dma_attrs *attrs)
Russell Kingafd1a322008-09-25 16:30:57 +0100864{
Marek Szyprowski253a1402012-02-10 19:55:20 +0100865 struct dma_map_ops *ops = get_dma_ops(dev);
Russell King01135d92008-09-25 21:05:02 +0100866 struct scatterlist *s;
Marek Szyprowski253a1402012-02-10 19:55:20 +0100867
Russell King01135d92008-09-25 21:05:02 +0100868 int i;
869
870 for_each_sg(sg, s, nents, i)
Marek Szyprowski253a1402012-02-10 19:55:20 +0100871 ops->unmap_page(dev, sg_dma_address(s), sg_dma_len(s), dir, attrs);
Russell Kingafd1a322008-09-25 16:30:57 +0100872}
Russell Kingafd1a322008-09-25 16:30:57 +0100873
874/**
Marek Szyprowski253a1402012-02-10 19:55:20 +0100875 * arm_dma_sync_sg_for_cpu
Russell Kingafd1a322008-09-25 16:30:57 +0100876 * @dev: valid struct device pointer, or NULL for ISA and EISA-like devices
877 * @sg: list of buffers
878 * @nents: number of buffers to map (returned from dma_map_sg)
879 * @dir: DMA transfer direction (same as was passed to dma_map_sg)
880 */
Marek Szyprowskif6fe2822012-02-10 19:55:20 +0100881void arm_dma_sync_sg_for_cpu(struct device *dev, struct scatterlist *sg,
Russell Kingafd1a322008-09-25 16:30:57 +0100882 int nents, enum dma_data_direction dir)
883{
Marek Szyprowski253a1402012-02-10 19:55:20 +0100884 struct dma_map_ops *ops = get_dma_ops(dev);
Russell Kingafd1a322008-09-25 16:30:57 +0100885 struct scatterlist *s;
886 int i;
887
Marek Szyprowski253a1402012-02-10 19:55:20 +0100888 for_each_sg(sg, s, nents, i)
889 ops->sync_single_for_cpu(dev, sg_dma_address(s), s->length,
890 dir);
Russell Kingafd1a322008-09-25 16:30:57 +0100891}
Russell Kingafd1a322008-09-25 16:30:57 +0100892
893/**
Marek Szyprowski253a1402012-02-10 19:55:20 +0100894 * arm_dma_sync_sg_for_device
Russell Kingafd1a322008-09-25 16:30:57 +0100895 * @dev: valid struct device pointer, or NULL for ISA and EISA-like devices
896 * @sg: list of buffers
897 * @nents: number of buffers to map (returned from dma_map_sg)
898 * @dir: DMA transfer direction (same as was passed to dma_map_sg)
899 */
Marek Szyprowskif6fe2822012-02-10 19:55:20 +0100900void arm_dma_sync_sg_for_device(struct device *dev, struct scatterlist *sg,
Russell Kingafd1a322008-09-25 16:30:57 +0100901 int nents, enum dma_data_direction dir)
902{
Marek Szyprowski253a1402012-02-10 19:55:20 +0100903 struct dma_map_ops *ops = get_dma_ops(dev);
Russell Kingafd1a322008-09-25 16:30:57 +0100904 struct scatterlist *s;
905 int i;
906
Marek Szyprowski253a1402012-02-10 19:55:20 +0100907 for_each_sg(sg, s, nents, i)
908 ops->sync_single_for_device(dev, sg_dma_address(s), s->length,
909 dir);
Russell Kingafd1a322008-09-25 16:30:57 +0100910}
Russell King24056f52011-01-03 11:29:28 +0000911
Russell King022ae532011-07-08 21:26:59 +0100912/*
913 * Return whether the given device DMA address mask can be supported
914 * properly. For example, if your device can only drive the low 24-bits
915 * during bus mastering, then you would pass 0x00ffffff as the mask
916 * to this function.
917 */
918int dma_supported(struct device *dev, u64 mask)
919{
920 if (mask < (u64)arm_dma_limit)
921 return 0;
922 return 1;
923}
924EXPORT_SYMBOL(dma_supported);
925
Marek Szyprowskif6fe2822012-02-10 19:55:20 +0100926static int arm_dma_set_mask(struct device *dev, u64 dma_mask)
Russell King022ae532011-07-08 21:26:59 +0100927{
928 if (!dev->dma_mask || !dma_supported(dev, dma_mask))
929 return -EIO;
930
Russell King022ae532011-07-08 21:26:59 +0100931 *dev->dma_mask = dma_mask;
Russell King022ae532011-07-08 21:26:59 +0100932
933 return 0;
934}
Russell King022ae532011-07-08 21:26:59 +0100935
Russell King24056f52011-01-03 11:29:28 +0000936#define PREALLOC_DMA_DEBUG_ENTRIES 4096
937
938static int __init dma_debug_do_init(void)
939{
940 dma_debug_init(PREALLOC_DMA_DEBUG_ENTRIES);
941 return 0;
942}
943fs_initcall(dma_debug_do_init);
Marek Szyprowskibebe3ac2012-05-16 15:48:21 +0200944
945#ifdef CONFIG_ARM_DMA_USE_IOMMU
946
947/* IOMMU */
948
949static inline dma_addr_t __alloc_iova(struct dma_iommu_mapping *mapping,
950 size_t size)
951{
952 unsigned int order = get_order(size);
953 unsigned int align = 0;
954 unsigned int count, start;
955 unsigned long flags;
956
957 count = ((PAGE_ALIGN(size) >> PAGE_SHIFT) +
958 (1 << mapping->order) - 1) >> mapping->order;
959
960 if (order > mapping->order)
961 align = (1 << (order - mapping->order)) - 1;
962
963 spin_lock_irqsave(&mapping->lock, flags);
964 start = bitmap_find_next_zero_area(mapping->bitmap, mapping->bits, 0,
965 count, align);
966 if (start > mapping->bits) {
967 spin_unlock_irqrestore(&mapping->lock, flags);
968 return DMA_ERROR_CODE;
969 }
970
971 bitmap_set(mapping->bitmap, start, count);
972 spin_unlock_irqrestore(&mapping->lock, flags);
973
974 return mapping->base + (start << (mapping->order + PAGE_SHIFT));
975}
976
977static inline void __free_iova(struct dma_iommu_mapping *mapping,
978 dma_addr_t addr, size_t size)
979{
980 unsigned int start = (addr - mapping->base) >>
981 (mapping->order + PAGE_SHIFT);
982 unsigned int count = ((size >> PAGE_SHIFT) +
983 (1 << mapping->order) - 1) >> mapping->order;
984 unsigned long flags;
985
986 spin_lock_irqsave(&mapping->lock, flags);
987 bitmap_clear(mapping->bitmap, start, count);
988 spin_unlock_irqrestore(&mapping->lock, flags);
989}
990
991static struct page **__iommu_alloc_buffer(struct device *dev, size_t size, gfp_t gfp)
992{
993 struct page **pages;
994 int count = size >> PAGE_SHIFT;
995 int array_size = count * sizeof(struct page *);
996 int i = 0;
997
998 if (array_size <= PAGE_SIZE)
999 pages = kzalloc(array_size, gfp);
1000 else
1001 pages = vzalloc(array_size);
1002 if (!pages)
1003 return NULL;
1004
1005 while (count) {
Marek Szyprowskib1fc9022012-06-21 11:48:11 +02001006 int j, order = __fls(count);
Marek Szyprowskibebe3ac2012-05-16 15:48:21 +02001007
1008 pages[i] = alloc_pages(gfp | __GFP_NOWARN, order);
1009 while (!pages[i] && order)
1010 pages[i] = alloc_pages(gfp | __GFP_NOWARN, --order);
1011 if (!pages[i])
1012 goto error;
1013
1014 if (order)
1015 split_page(pages[i], order);
1016 j = 1 << order;
1017 while (--j)
1018 pages[i + j] = pages[i] + j;
1019
1020 __dma_clear_buffer(pages[i], PAGE_SIZE << order);
1021 i += 1 << order;
1022 count -= 1 << order;
1023 }
1024
1025 return pages;
1026error:
1027 while (--i)
1028 if (pages[i])
1029 __free_pages(pages[i], 0);
1030 if (array_size < PAGE_SIZE)
1031 kfree(pages);
1032 else
1033 vfree(pages);
1034 return NULL;
1035}
1036
1037static int __iommu_free_buffer(struct device *dev, struct page **pages, size_t size)
1038{
1039 int count = size >> PAGE_SHIFT;
1040 int array_size = count * sizeof(struct page *);
1041 int i;
1042 for (i = 0; i < count; i++)
1043 if (pages[i])
1044 __free_pages(pages[i], 0);
1045 if (array_size < PAGE_SIZE)
1046 kfree(pages);
1047 else
1048 vfree(pages);
1049 return 0;
1050}
1051
1052/*
1053 * Create a CPU mapping for a specified pages
1054 */
1055static void *
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +02001056__iommu_alloc_remap(struct page **pages, size_t size, gfp_t gfp, pgprot_t prot,
1057 const void *caller)
Marek Szyprowskibebe3ac2012-05-16 15:48:21 +02001058{
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +02001059 unsigned int i, nr_pages = PAGE_ALIGN(size) >> PAGE_SHIFT;
1060 struct vm_struct *area;
1061 unsigned long p;
Marek Szyprowskibebe3ac2012-05-16 15:48:21 +02001062
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +02001063 area = get_vm_area_caller(size, VM_ARM_DMA_CONSISTENT | VM_USERMAP,
1064 caller);
1065 if (!area)
Marek Szyprowskibebe3ac2012-05-16 15:48:21 +02001066 return NULL;
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +02001067
1068 area->pages = pages;
1069 area->nr_pages = nr_pages;
1070 p = (unsigned long)area->addr;
1071
1072 for (i = 0; i < nr_pages; i++) {
1073 phys_addr_t phys = __pfn_to_phys(page_to_pfn(pages[i]));
1074 if (ioremap_page_range(p, p + PAGE_SIZE, phys, prot))
1075 goto err;
1076 p += PAGE_SIZE;
Marek Szyprowskibebe3ac2012-05-16 15:48:21 +02001077 }
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +02001078 return area->addr;
1079err:
1080 unmap_kernel_range((unsigned long)area->addr, size);
1081 vunmap(area->addr);
Marek Szyprowskibebe3ac2012-05-16 15:48:21 +02001082 return NULL;
1083}
1084
1085/*
1086 * Create a mapping in device IO address space for specified pages
1087 */
1088static dma_addr_t
1089__iommu_create_mapping(struct device *dev, struct page **pages, size_t size)
1090{
1091 struct dma_iommu_mapping *mapping = dev->archdata.mapping;
1092 unsigned int count = PAGE_ALIGN(size) >> PAGE_SHIFT;
1093 dma_addr_t dma_addr, iova;
1094 int i, ret = DMA_ERROR_CODE;
1095
1096 dma_addr = __alloc_iova(mapping, size);
1097 if (dma_addr == DMA_ERROR_CODE)
1098 return dma_addr;
1099
1100 iova = dma_addr;
1101 for (i = 0; i < count; ) {
1102 unsigned int next_pfn = page_to_pfn(pages[i]) + 1;
1103 phys_addr_t phys = page_to_phys(pages[i]);
1104 unsigned int len, j;
1105
1106 for (j = i + 1; j < count; j++, next_pfn++)
1107 if (page_to_pfn(pages[j]) != next_pfn)
1108 break;
1109
1110 len = (j - i) << PAGE_SHIFT;
1111 ret = iommu_map(mapping->domain, iova, phys, len, 0);
1112 if (ret < 0)
1113 goto fail;
1114 iova += len;
1115 i = j;
1116 }
1117 return dma_addr;
1118fail:
1119 iommu_unmap(mapping->domain, dma_addr, iova-dma_addr);
1120 __free_iova(mapping, dma_addr, size);
1121 return DMA_ERROR_CODE;
1122}
1123
1124static int __iommu_remove_mapping(struct device *dev, dma_addr_t iova, size_t size)
1125{
1126 struct dma_iommu_mapping *mapping = dev->archdata.mapping;
1127
1128 /*
1129 * add optional in-page offset from iova to size and align
1130 * result to page size
1131 */
1132 size = PAGE_ALIGN((iova & ~PAGE_MASK) + size);
1133 iova &= PAGE_MASK;
1134
1135 iommu_unmap(mapping->domain, iova, size);
1136 __free_iova(mapping, iova, size);
1137 return 0;
1138}
1139
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +02001140static struct page **__iommu_get_pages(void *cpu_addr)
1141{
1142 struct vm_struct *area;
1143
1144 area = find_vm_area(cpu_addr);
1145 if (area && (area->flags & VM_ARM_DMA_CONSISTENT))
1146 return area->pages;
1147 return NULL;
1148}
1149
Marek Szyprowskibebe3ac2012-05-16 15:48:21 +02001150static void *arm_iommu_alloc_attrs(struct device *dev, size_t size,
1151 dma_addr_t *handle, gfp_t gfp, struct dma_attrs *attrs)
1152{
1153 pgprot_t prot = __get_dma_pgprot(attrs, pgprot_kernel);
1154 struct page **pages;
1155 void *addr = NULL;
1156
1157 *handle = DMA_ERROR_CODE;
1158 size = PAGE_ALIGN(size);
1159
1160 pages = __iommu_alloc_buffer(dev, size, gfp);
1161 if (!pages)
1162 return NULL;
1163
1164 *handle = __iommu_create_mapping(dev, pages, size);
1165 if (*handle == DMA_ERROR_CODE)
1166 goto err_buffer;
1167
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +02001168 addr = __iommu_alloc_remap(pages, size, gfp, prot,
1169 __builtin_return_address(0));
Marek Szyprowskibebe3ac2012-05-16 15:48:21 +02001170 if (!addr)
1171 goto err_mapping;
1172
1173 return addr;
1174
1175err_mapping:
1176 __iommu_remove_mapping(dev, *handle, size);
1177err_buffer:
1178 __iommu_free_buffer(dev, pages, size);
1179 return NULL;
1180}
1181
1182static int arm_iommu_mmap_attrs(struct device *dev, struct vm_area_struct *vma,
1183 void *cpu_addr, dma_addr_t dma_addr, size_t size,
1184 struct dma_attrs *attrs)
1185{
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +02001186 unsigned long uaddr = vma->vm_start;
1187 unsigned long usize = vma->vm_end - vma->vm_start;
1188 struct page **pages = __iommu_get_pages(cpu_addr);
Marek Szyprowskibebe3ac2012-05-16 15:48:21 +02001189
1190 vma->vm_page_prot = __get_dma_pgprot(attrs, vma->vm_page_prot);
Marek Szyprowskibebe3ac2012-05-16 15:48:21 +02001191
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +02001192 if (!pages)
1193 return -ENXIO;
Marek Szyprowskibebe3ac2012-05-16 15:48:21 +02001194
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +02001195 do {
1196 int ret = vm_insert_page(vma, uaddr, *pages++);
1197 if (ret) {
1198 pr_err("Remapping memory failed: %d\n", ret);
1199 return ret;
1200 }
1201 uaddr += PAGE_SIZE;
1202 usize -= PAGE_SIZE;
1203 } while (usize > 0);
Marek Szyprowskibebe3ac2012-05-16 15:48:21 +02001204
Marek Szyprowskibebe3ac2012-05-16 15:48:21 +02001205 return 0;
1206}
1207
1208/*
1209 * free a page as defined by the above mapping.
1210 * Must not be called with IRQs disabled.
1211 */
1212void arm_iommu_free_attrs(struct device *dev, size_t size, void *cpu_addr,
1213 dma_addr_t handle, struct dma_attrs *attrs)
1214{
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +02001215 struct page **pages = __iommu_get_pages(cpu_addr);
Marek Szyprowskibebe3ac2012-05-16 15:48:21 +02001216 size = PAGE_ALIGN(size);
1217
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +02001218 if (!pages) {
1219 WARN(1, "trying to free invalid coherent area: %p\n", cpu_addr);
1220 return;
Marek Szyprowskibebe3ac2012-05-16 15:48:21 +02001221 }
Marek Szyprowskicb4d7a62012-07-30 09:11:33 +02001222
1223 unmap_kernel_range((unsigned long)cpu_addr, size);
1224 vunmap(cpu_addr);
1225
1226 __iommu_remove_mapping(dev, handle, size);
1227 __iommu_free_buffer(dev, pages, size);
Marek Szyprowskibebe3ac2012-05-16 15:48:21 +02001228}
1229
1230/*
1231 * Map a part of the scatter-gather list into contiguous io address space
1232 */
1233static int __map_sg_chunk(struct device *dev, struct scatterlist *sg,
1234 size_t size, dma_addr_t *handle,
1235 enum dma_data_direction dir)
1236{
1237 struct dma_iommu_mapping *mapping = dev->archdata.mapping;
1238 dma_addr_t iova, iova_base;
1239 int ret = 0;
1240 unsigned int count;
1241 struct scatterlist *s;
1242
1243 size = PAGE_ALIGN(size);
1244 *handle = DMA_ERROR_CODE;
1245
1246 iova_base = iova = __alloc_iova(mapping, size);
1247 if (iova == DMA_ERROR_CODE)
1248 return -ENOMEM;
1249
1250 for (count = 0, s = sg; count < (size >> PAGE_SHIFT); s = sg_next(s)) {
1251 phys_addr_t phys = page_to_phys(sg_page(s));
1252 unsigned int len = PAGE_ALIGN(s->offset + s->length);
1253
1254 if (!arch_is_coherent())
1255 __dma_page_cpu_to_dev(sg_page(s), s->offset, s->length, dir);
1256
1257 ret = iommu_map(mapping->domain, iova, phys, len, 0);
1258 if (ret < 0)
1259 goto fail;
1260 count += len >> PAGE_SHIFT;
1261 iova += len;
1262 }
1263 *handle = iova_base;
1264
1265 return 0;
1266fail:
1267 iommu_unmap(mapping->domain, iova_base, count * PAGE_SIZE);
1268 __free_iova(mapping, iova_base, size);
1269 return ret;
1270}
1271
1272/**
1273 * arm_iommu_map_sg - map a set of SG buffers for streaming mode DMA
1274 * @dev: valid struct device pointer
1275 * @sg: list of buffers
1276 * @nents: number of buffers to map
1277 * @dir: DMA transfer direction
1278 *
1279 * Map a set of buffers described by scatterlist in streaming mode for DMA.
1280 * The scatter gather list elements are merged together (if possible) and
1281 * tagged with the appropriate dma address and length. They are obtained via
1282 * sg_dma_{address,length}.
1283 */
1284int arm_iommu_map_sg(struct device *dev, struct scatterlist *sg, int nents,
1285 enum dma_data_direction dir, struct dma_attrs *attrs)
1286{
1287 struct scatterlist *s = sg, *dma = sg, *start = sg;
1288 int i, count = 0;
1289 unsigned int offset = s->offset;
1290 unsigned int size = s->offset + s->length;
1291 unsigned int max = dma_get_max_seg_size(dev);
1292
1293 for (i = 1; i < nents; i++) {
1294 s = sg_next(s);
1295
1296 s->dma_address = DMA_ERROR_CODE;
1297 s->dma_length = 0;
1298
1299 if (s->offset || (size & ~PAGE_MASK) || size + s->length > max) {
1300 if (__map_sg_chunk(dev, start, size, &dma->dma_address,
1301 dir) < 0)
1302 goto bad_mapping;
1303
1304 dma->dma_address += offset;
1305 dma->dma_length = size - offset;
1306
1307 size = offset = s->offset;
1308 start = s;
1309 dma = sg_next(dma);
1310 count += 1;
1311 }
1312 size += s->length;
1313 }
1314 if (__map_sg_chunk(dev, start, size, &dma->dma_address, dir) < 0)
1315 goto bad_mapping;
1316
1317 dma->dma_address += offset;
1318 dma->dma_length = size - offset;
1319
1320 return count+1;
1321
1322bad_mapping:
1323 for_each_sg(sg, s, count, i)
1324 __iommu_remove_mapping(dev, sg_dma_address(s), sg_dma_len(s));
1325 return 0;
1326}
1327
1328/**
1329 * arm_iommu_unmap_sg - unmap a set of SG buffers mapped by dma_map_sg
1330 * @dev: valid struct device pointer
1331 * @sg: list of buffers
1332 * @nents: number of buffers to unmap (same as was passed to dma_map_sg)
1333 * @dir: DMA transfer direction (same as was passed to dma_map_sg)
1334 *
1335 * Unmap a set of streaming mode DMA translations. Again, CPU access
1336 * rules concerning calls here are the same as for dma_unmap_single().
1337 */
1338void arm_iommu_unmap_sg(struct device *dev, struct scatterlist *sg, int nents,
1339 enum dma_data_direction dir, struct dma_attrs *attrs)
1340{
1341 struct scatterlist *s;
1342 int i;
1343
1344 for_each_sg(sg, s, nents, i) {
1345 if (sg_dma_len(s))
1346 __iommu_remove_mapping(dev, sg_dma_address(s),
1347 sg_dma_len(s));
1348 if (!arch_is_coherent())
1349 __dma_page_dev_to_cpu(sg_page(s), s->offset,
1350 s->length, dir);
1351 }
1352}
1353
1354/**
1355 * arm_iommu_sync_sg_for_cpu
1356 * @dev: valid struct device pointer
1357 * @sg: list of buffers
1358 * @nents: number of buffers to map (returned from dma_map_sg)
1359 * @dir: DMA transfer direction (same as was passed to dma_map_sg)
1360 */
1361void arm_iommu_sync_sg_for_cpu(struct device *dev, struct scatterlist *sg,
1362 int nents, enum dma_data_direction dir)
1363{
1364 struct scatterlist *s;
1365 int i;
1366
1367 for_each_sg(sg, s, nents, i)
1368 if (!arch_is_coherent())
1369 __dma_page_dev_to_cpu(sg_page(s), s->offset, s->length, dir);
1370
1371}
1372
1373/**
1374 * arm_iommu_sync_sg_for_device
1375 * @dev: valid struct device pointer
1376 * @sg: list of buffers
1377 * @nents: number of buffers to map (returned from dma_map_sg)
1378 * @dir: DMA transfer direction (same as was passed to dma_map_sg)
1379 */
1380void arm_iommu_sync_sg_for_device(struct device *dev, struct scatterlist *sg,
1381 int nents, enum dma_data_direction dir)
1382{
1383 struct scatterlist *s;
1384 int i;
1385
1386 for_each_sg(sg, s, nents, i)
1387 if (!arch_is_coherent())
1388 __dma_page_cpu_to_dev(sg_page(s), s->offset, s->length, dir);
1389}
1390
1391
1392/**
1393 * arm_iommu_map_page
1394 * @dev: valid struct device pointer
1395 * @page: page that buffer resides in
1396 * @offset: offset into page for start of buffer
1397 * @size: size of buffer to map
1398 * @dir: DMA transfer direction
1399 *
1400 * IOMMU aware version of arm_dma_map_page()
1401 */
1402static dma_addr_t arm_iommu_map_page(struct device *dev, struct page *page,
1403 unsigned long offset, size_t size, enum dma_data_direction dir,
1404 struct dma_attrs *attrs)
1405{
1406 struct dma_iommu_mapping *mapping = dev->archdata.mapping;
1407 dma_addr_t dma_addr;
1408 int ret, len = PAGE_ALIGN(size + offset);
1409
1410 if (!arch_is_coherent())
1411 __dma_page_cpu_to_dev(page, offset, size, dir);
1412
1413 dma_addr = __alloc_iova(mapping, len);
1414 if (dma_addr == DMA_ERROR_CODE)
1415 return dma_addr;
1416
1417 ret = iommu_map(mapping->domain, dma_addr, page_to_phys(page), len, 0);
1418 if (ret < 0)
1419 goto fail;
1420
1421 return dma_addr + offset;
1422fail:
1423 __free_iova(mapping, dma_addr, len);
1424 return DMA_ERROR_CODE;
1425}
1426
1427/**
1428 * arm_iommu_unmap_page
1429 * @dev: valid struct device pointer
1430 * @handle: DMA address of buffer
1431 * @size: size of buffer (same as passed to dma_map_page)
1432 * @dir: DMA transfer direction (same as passed to dma_map_page)
1433 *
1434 * IOMMU aware version of arm_dma_unmap_page()
1435 */
1436static void arm_iommu_unmap_page(struct device *dev, dma_addr_t handle,
1437 size_t size, enum dma_data_direction dir,
1438 struct dma_attrs *attrs)
1439{
1440 struct dma_iommu_mapping *mapping = dev->archdata.mapping;
1441 dma_addr_t iova = handle & PAGE_MASK;
1442 struct page *page = phys_to_page(iommu_iova_to_phys(mapping->domain, iova));
1443 int offset = handle & ~PAGE_MASK;
1444 int len = PAGE_ALIGN(size + offset);
1445
1446 if (!iova)
1447 return;
1448
1449 if (!arch_is_coherent())
1450 __dma_page_dev_to_cpu(page, offset, size, dir);
1451
1452 iommu_unmap(mapping->domain, iova, len);
1453 __free_iova(mapping, iova, len);
1454}
1455
1456static void arm_iommu_sync_single_for_cpu(struct device *dev,
1457 dma_addr_t handle, size_t size, enum dma_data_direction dir)
1458{
1459 struct dma_iommu_mapping *mapping = dev->archdata.mapping;
1460 dma_addr_t iova = handle & PAGE_MASK;
1461 struct page *page = phys_to_page(iommu_iova_to_phys(mapping->domain, iova));
1462 unsigned int offset = handle & ~PAGE_MASK;
1463
1464 if (!iova)
1465 return;
1466
1467 if (!arch_is_coherent())
1468 __dma_page_dev_to_cpu(page, offset, size, dir);
1469}
1470
1471static void arm_iommu_sync_single_for_device(struct device *dev,
1472 dma_addr_t handle, size_t size, enum dma_data_direction dir)
1473{
1474 struct dma_iommu_mapping *mapping = dev->archdata.mapping;
1475 dma_addr_t iova = handle & PAGE_MASK;
1476 struct page *page = phys_to_page(iommu_iova_to_phys(mapping->domain, iova));
1477 unsigned int offset = handle & ~PAGE_MASK;
1478
1479 if (!iova)
1480 return;
1481
1482 __dma_page_cpu_to_dev(page, offset, size, dir);
1483}
1484
1485struct dma_map_ops iommu_ops = {
1486 .alloc = arm_iommu_alloc_attrs,
1487 .free = arm_iommu_free_attrs,
1488 .mmap = arm_iommu_mmap_attrs,
1489
1490 .map_page = arm_iommu_map_page,
1491 .unmap_page = arm_iommu_unmap_page,
1492 .sync_single_for_cpu = arm_iommu_sync_single_for_cpu,
1493 .sync_single_for_device = arm_iommu_sync_single_for_device,
1494
1495 .map_sg = arm_iommu_map_sg,
1496 .unmap_sg = arm_iommu_unmap_sg,
1497 .sync_sg_for_cpu = arm_iommu_sync_sg_for_cpu,
1498 .sync_sg_for_device = arm_iommu_sync_sg_for_device,
1499};
1500
1501/**
1502 * arm_iommu_create_mapping
1503 * @bus: pointer to the bus holding the client device (for IOMMU calls)
1504 * @base: start address of the valid IO address space
1505 * @size: size of the valid IO address space
1506 * @order: accuracy of the IO addresses allocations
1507 *
1508 * Creates a mapping structure which holds information about used/unused
1509 * IO address ranges, which is required to perform memory allocation and
1510 * mapping with IOMMU aware functions.
1511 *
1512 * The client device need to be attached to the mapping with
1513 * arm_iommu_attach_device function.
1514 */
1515struct dma_iommu_mapping *
1516arm_iommu_create_mapping(struct bus_type *bus, dma_addr_t base, size_t size,
1517 int order)
1518{
1519 unsigned int count = size >> (PAGE_SHIFT + order);
1520 unsigned int bitmap_size = BITS_TO_LONGS(count) * sizeof(long);
1521 struct dma_iommu_mapping *mapping;
1522 int err = -ENOMEM;
1523
1524 if (!count)
1525 return ERR_PTR(-EINVAL);
1526
1527 mapping = kzalloc(sizeof(struct dma_iommu_mapping), GFP_KERNEL);
1528 if (!mapping)
1529 goto err;
1530
1531 mapping->bitmap = kzalloc(bitmap_size, GFP_KERNEL);
1532 if (!mapping->bitmap)
1533 goto err2;
1534
1535 mapping->base = base;
1536 mapping->bits = BITS_PER_BYTE * bitmap_size;
1537 mapping->order = order;
1538 spin_lock_init(&mapping->lock);
1539
1540 mapping->domain = iommu_domain_alloc(bus);
1541 if (!mapping->domain)
1542 goto err3;
1543
1544 kref_init(&mapping->kref);
1545 return mapping;
1546err3:
1547 kfree(mapping->bitmap);
1548err2:
1549 kfree(mapping);
1550err:
1551 return ERR_PTR(err);
1552}
1553
1554static void release_iommu_mapping(struct kref *kref)
1555{
1556 struct dma_iommu_mapping *mapping =
1557 container_of(kref, struct dma_iommu_mapping, kref);
1558
1559 iommu_domain_free(mapping->domain);
1560 kfree(mapping->bitmap);
1561 kfree(mapping);
1562}
1563
1564void arm_iommu_release_mapping(struct dma_iommu_mapping *mapping)
1565{
1566 if (mapping)
1567 kref_put(&mapping->kref, release_iommu_mapping);
1568}
1569
1570/**
1571 * arm_iommu_attach_device
1572 * @dev: valid struct device pointer
1573 * @mapping: io address space mapping structure (returned from
1574 * arm_iommu_create_mapping)
1575 *
1576 * Attaches specified io address space mapping to the provided device,
1577 * this replaces the dma operations (dma_map_ops pointer) with the
1578 * IOMMU aware version. More than one client might be attached to
1579 * the same io address space mapping.
1580 */
1581int arm_iommu_attach_device(struct device *dev,
1582 struct dma_iommu_mapping *mapping)
1583{
1584 int err;
1585
1586 err = iommu_attach_device(mapping->domain, dev);
1587 if (err)
1588 return err;
1589
1590 kref_get(&mapping->kref);
1591 dev->archdata.mapping = mapping;
1592 set_dma_ops(dev, &iommu_ops);
1593
1594 pr_info("Attached IOMMU controller to %s device.\n", dev_name(dev));
1595 return 0;
1596}
1597
1598#endif