| /* Copyright (c) 2011-2018, The Linux Foundation. All rights reserved. |
| * |
| * This program is free software; you can redistribute it and/or modify |
| * it under the terms of the GNU General Public License version 2 and |
| * only version 2 as published by the Free Software Foundation. |
| * |
| * This program is distributed in the hope that it will be useful, |
| * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
| * GNU General Public License for more details. |
| * |
| */ |
| #include <linux/types.h> |
| #include <linux/delay.h> |
| #include <linux/device.h> |
| #include <linux/spinlock.h> |
| #include <linux/genalloc.h> |
| #include <linux/slab.h> |
| #include <linux/iommu.h> |
| #include <linux/msm_kgsl.h> |
| #include <linux/ratelimit.h> |
| #include <linux/of_platform.h> |
| #include <soc/qcom/scm.h> |
| #include <soc/qcom/secure_buffer.h> |
| #include <linux/compat.h> |
| |
| #include "kgsl.h" |
| #include "kgsl_device.h" |
| #include "kgsl_mmu.h" |
| #include "kgsl_sharedmem.h" |
| #include "kgsl_iommu.h" |
| #include "adreno_pm4types.h" |
| #include "adreno.h" |
| #include "kgsl_trace.h" |
| #include "kgsl_pwrctrl.h" |
| |
| #define CP_APERTURE_REG 0 |
| #define CP_SMMU_APERTURE_ID 0x1B |
| |
| #define _IOMMU_PRIV(_mmu) (&((_mmu)->priv.iommu)) |
| |
| #define ADDR_IN_GLOBAL(_mmu, _a) \ |
| (((_a) >= KGSL_IOMMU_GLOBAL_MEM_BASE(_mmu)) && \ |
| ((_a) < (KGSL_IOMMU_GLOBAL_MEM_BASE(_mmu) + \ |
| KGSL_IOMMU_GLOBAL_MEM_SIZE))) |
| |
| /* |
| * Flag to set SMMU memory attributes required to |
| * enable system cache for GPU transactions. |
| */ |
| #ifndef IOMMU_USE_UPSTREAM_HINT |
| #define IOMMU_USE_UPSTREAM_HINT 0 |
| #endif |
| |
| static struct kgsl_mmu_pt_ops iommu_pt_ops; |
| static bool need_iommu_sync; |
| |
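| /* |
| * Byte offsets of each context bank register, one entry per register |
| * ID (KGSL_IOMMU_REG_MAX in total). kgsl_iommu_get_reg_ahbaddr() below |
| * adds one of these offsets to a context's AHB base so the register |
| * can be addressed in a type0 packet. |
| */ |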
| const unsigned int kgsl_iommu_reg_list[KGSL_IOMMU_REG_MAX] = { |
| 0x0, /* SCTLR */ |
| 0x20, /* TTBR0 */ |
| 0x34, /* CONTEXTIDR */ |
| 0x58, /* FSR */ |
| 0x60, /* FAR_0 */ |
| 0x618, /* TLBIALL */ |
| 0x008, /* RESUME */ |
| 0x68, /* FSYNR0 */ |
| 0x6C, /* FSYNR1 */ |
| 0x7F0, /* TLBSYNC */ |
| 0x7F4, /* TLBSTATUS */ |
| }; |
| |
| /* |
| * struct kgsl_iommu_addr_entry - entry in the kgsl_iommu_pt rbtree. |
| * @base: starting virtual address of the entry |
| * @size: size of the entry |
| * @node: the rbtree node |
| */ |
| struct kgsl_iommu_addr_entry { |
| uint64_t base; |
| uint64_t size; |
| struct rb_node node; |
| }; |
| |
| static struct kmem_cache *addr_entry_cache; |
| |
| /* |
| * There are certain memory allocations (ringbuffer, memstore, etc) that need to |
| * be present at the same address in every pagetable. We call these "global" |
| * pagetable entries. There are relatively few of these and they are mostly |
| * stable (defined at init time) but the actual number of globals can differ |
| * slightly depending on the target and implementation. |
| * |
| * Here we define an array and a simple allocator to keep track of the currently |
| * active global entries. Each entry is assigned a unique address inside of a |
| * MMU implementation specific "global" region. The addresses are assigned |
| * sequentially and never re-used to avoid having to go back and reprogram |
| * existing pagetables. The entire list of active entries is mapped into |
| * every new pagetable as it is created and unmapped as it is destroyed. |
| * |
| * Because there are relatively few entries and they are defined at boot time we |
| * don't need to go over the top to define a dynamic allocation scheme. It will |
| * be less wasteful to pick a static number with a little bit of growth |
| * potential. |
| */ |
| |
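| /* |
| * A minimal usage sketch (using names from this file): a global buffer |
| * is registered once at init time and is then mapped at the same GPU |
| * address into every pagetable created later: |
| * |
| * kgsl_iommu_add_global(mmu, &iommu->setstate, "setstate"); |
| * ... |
| * ret = kgsl_iommu_map_globals(pt); (for each new pagetable) |
| */ |
|  |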
| #define GLOBAL_PT_ENTRIES 32 |
| |
| struct global_pt_entry { |
| struct kgsl_memdesc *memdesc; |
| char name[32]; |
| }; |
| |
| static struct global_pt_entry global_pt_entries[GLOBAL_PT_ENTRIES]; |
| static int secure_global_size; |
| static int global_pt_count; |
| static uint64_t global_pt_alloc; |
| static struct kgsl_memdesc gpu_qdss_desc; |
| static struct kgsl_memdesc gpu_qtimer_desc; |
| |
| void kgsl_print_global_pt_entries(struct seq_file *s) |
| { |
| int i; |
| |
| for (i = 0; i < global_pt_count; i++) { |
| struct kgsl_memdesc *memdesc = global_pt_entries[i].memdesc; |
| |
| if (memdesc == NULL) |
| continue; |
| |
| seq_printf(s, "0x%pK-0x%pK %16llu %s\n", |
| (uint64_t *)(uintptr_t) memdesc->gpuaddr, |
| (uint64_t *)(uintptr_t) (memdesc->gpuaddr + |
| memdesc->size - 1), memdesc->size, |
| global_pt_entries[i].name); |
| } |
| } |
| |
| static void kgsl_iommu_unmap_globals(struct kgsl_pagetable *pagetable) |
| { |
| unsigned int i; |
| |
| for (i = 0; i < global_pt_count; i++) { |
| if (global_pt_entries[i].memdesc != NULL) |
| kgsl_mmu_unmap(pagetable, |
| global_pt_entries[i].memdesc); |
| } |
| } |
| |
| static int kgsl_iommu_map_globals(struct kgsl_pagetable *pagetable) |
| { |
| unsigned int i; |
| |
| for (i = 0; i < global_pt_count; i++) { |
| if (global_pt_entries[i].memdesc != NULL) { |
| int ret = kgsl_mmu_map(pagetable, |
| global_pt_entries[i].memdesc); |
| |
| if (ret) |
| return ret; |
| } |
| } |
| |
| return 0; |
| } |
| |
| void kgsl_iommu_unmap_global_secure_pt_entry(struct kgsl_device *device, |
| struct kgsl_memdesc *memdesc) |
| { |
| if (!kgsl_mmu_is_secured(&device->mmu) || memdesc == NULL) |
| return; |
| |
| /* Check if an empty memdesc got passed in */ |
| if ((memdesc->gpuaddr == 0) || (memdesc->size == 0)) |
| return; |
| |
| if (memdesc->pagetable) { |
| if (memdesc->pagetable->name == KGSL_MMU_SECURE_PT) |
| kgsl_mmu_unmap(memdesc->pagetable, memdesc); |
| } |
| } |
| |
| int kgsl_iommu_map_global_secure_pt_entry(struct kgsl_device *device, |
| struct kgsl_memdesc *entry) |
| { |
| int ret = 0; |
| |
| if (!kgsl_mmu_is_secured(&device->mmu)) |
| return -ENOTSUPP; |
| |
| if (entry != NULL) { |
| struct kgsl_pagetable *pagetable = device->mmu.securepagetable; |
|  |
| entry->pagetable = pagetable; |
| entry->gpuaddr = KGSL_IOMMU_SECURE_BASE(&device->mmu) + |
| secure_global_size; |
| |
| ret = kgsl_mmu_map(pagetable, entry); |
| if (ret == 0) |
| secure_global_size += entry->size; |
| } |
| return ret; |
| } |
| |
| static void kgsl_iommu_remove_global(struct kgsl_mmu *mmu, |
| struct kgsl_memdesc *memdesc) |
| { |
| int i; |
| |
| if (memdesc->gpuaddr == 0 || !(memdesc->priv & KGSL_MEMDESC_GLOBAL)) |
| return; |
| |
| for (i = 0; i < global_pt_count; i++) { |
| if (global_pt_entries[i].memdesc == memdesc) { |
| memdesc->gpuaddr = 0; |
| memdesc->priv &= ~KGSL_MEMDESC_GLOBAL; |
| global_pt_entries[i].memdesc = NULL; |
| return; |
| } |
| } |
| } |
| |
| static void kgsl_iommu_add_global(struct kgsl_mmu *mmu, |
| struct kgsl_memdesc *memdesc, const char *name) |
| { |
| if (memdesc->gpuaddr != 0) |
| return; |
| |
| /* Check that we can fit the global allocations */ |
| if (WARN_ON(global_pt_count >= GLOBAL_PT_ENTRIES) || |
| WARN_ON((global_pt_alloc + memdesc->size) >= |
| KGSL_IOMMU_GLOBAL_MEM_SIZE)) |
| return; |
| |
| memdesc->gpuaddr = KGSL_IOMMU_GLOBAL_MEM_BASE(mmu) + global_pt_alloc; |
| |
| memdesc->priv |= KGSL_MEMDESC_GLOBAL; |
| global_pt_alloc += memdesc->size; |
| |
| global_pt_entries[global_pt_count].memdesc = memdesc; |
| strlcpy(global_pt_entries[global_pt_count].name, name, |
| sizeof(global_pt_entries[global_pt_count].name)); |
| global_pt_count++; |
| } |
| |
| struct kgsl_memdesc *kgsl_iommu_get_qdss_global_entry(void) |
| { |
| return &gpu_qdss_desc; |
| } |
| |
| static void kgsl_setup_qdss_desc(struct kgsl_device *device) |
| { |
| int result = 0; |
| uint32_t gpu_qdss_entry[2]; |
| |
| if (!of_find_property(device->pdev->dev.of_node, |
| "qcom,gpu-qdss-stm", NULL)) |
| return; |
| |
| if (of_property_read_u32_array(device->pdev->dev.of_node, |
| "qcom,gpu-qdss-stm", gpu_qdss_entry, 2)) { |
| KGSL_CORE_ERR("Failed to read gpu qdss dts entry\n"); |
| return; |
| } |
| |
| gpu_qdss_desc.flags = 0; |
| gpu_qdss_desc.priv = 0; |
| gpu_qdss_desc.physaddr = gpu_qdss_entry[0]; |
| gpu_qdss_desc.size = gpu_qdss_entry[1]; |
| gpu_qdss_desc.pagetable = NULL; |
| gpu_qdss_desc.ops = NULL; |
| gpu_qdss_desc.dev = device->dev->parent; |
| gpu_qdss_desc.hostptr = NULL; |
| |
| result = memdesc_sg_dma(&gpu_qdss_desc, gpu_qdss_desc.physaddr, |
| gpu_qdss_desc.size); |
| if (result) { |
| KGSL_CORE_ERR("memdesc_sg_dma failed: %d\n", result); |
| return; |
| } |
| |
| kgsl_mmu_add_global(device, &gpu_qdss_desc, "gpu-qdss"); |
| } |
| |
| static inline void kgsl_cleanup_qdss_desc(struct kgsl_mmu *mmu) |
| { |
| kgsl_iommu_remove_global(mmu, &gpu_qdss_desc); |
| kgsl_sharedmem_free(&gpu_qdss_desc); |
| } |
| |
| struct kgsl_memdesc *kgsl_iommu_get_qtimer_global_entry(void) |
| { |
| return &gpu_qtimer_desc; |
| } |
| |
| static void kgsl_setup_qtimer_desc(struct kgsl_device *device) |
| { |
| int result = 0; |
| uint32_t gpu_qtimer_entry[2]; |
| |
| if (!of_find_property(device->pdev->dev.of_node, |
| "qcom,gpu-qtimer", NULL)) |
| return; |
| |
| if (of_property_read_u32_array(device->pdev->dev.of_node, |
| "qcom,gpu-qtimer", gpu_qtimer_entry, 2)) { |
| KGSL_CORE_ERR("Failed to read gpu qtimer dts entry\n"); |
| return; |
| } |
| |
| gpu_qtimer_desc.flags = 0; |
| gpu_qtimer_desc.priv = 0; |
| gpu_qtimer_desc.physaddr = gpu_qtimer_entry[0]; |
| gpu_qtimer_desc.size = gpu_qtimer_entry[1]; |
| gpu_qtimer_desc.pagetable = NULL; |
| gpu_qtimer_desc.ops = NULL; |
| gpu_qtimer_desc.dev = device->dev->parent; |
| gpu_qtimer_desc.hostptr = NULL; |
| |
| result = memdesc_sg_dma(&gpu_qtimer_desc, gpu_qtimer_desc.physaddr, |
| gpu_qtimer_desc.size); |
| if (result) { |
| KGSL_CORE_ERR("memdesc_sg_dma failed: %d\n", result); |
| return; |
| } |
| |
| kgsl_mmu_add_global(device, &gpu_qtimer_desc, "gpu-qtimer"); |
| } |
| |
| static inline void kgsl_cleanup_qtimer_desc(struct kgsl_mmu *mmu) |
| { |
| kgsl_iommu_remove_global(mmu, &gpu_qtimer_desc); |
| kgsl_sharedmem_free(&gpu_qtimer_desc); |
| } |
| |
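| /* |
| * On targets with the "qcom,gpu-quirk-iommu-sync" DT quirk (probed in |
| * kgsl_iommu_init() below) SMMU programming has to be serialized with |
| * the other holders of the shared kgsl_mmu_sync mutex; everywhere else |
| * need_iommu_sync stays false and these helpers are no-ops. |
| */ |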
| static inline void _iommu_sync_mmu_pc(bool lock) |
| { |
| if (!need_iommu_sync) |
| return; |
| |
| if (lock) |
| mutex_lock(&kgsl_mmu_sync); |
| else |
| mutex_unlock(&kgsl_mmu_sync); |
| } |
| |
| static void _detach_pt(struct kgsl_iommu_pt *iommu_pt, |
| struct kgsl_iommu_context *ctx) |
| { |
| if (iommu_pt->attached) { |
| _iommu_sync_mmu_pc(true); |
| iommu_detach_device(iommu_pt->domain, ctx->dev); |
| _iommu_sync_mmu_pc(false); |
| iommu_pt->attached = false; |
| } |
| } |
| |
| static int _attach_pt(struct kgsl_iommu_pt *iommu_pt, |
| struct kgsl_iommu_context *ctx) |
| { |
| int ret; |
| |
| if (iommu_pt->attached) |
| return 0; |
| |
| _iommu_sync_mmu_pc(true); |
| ret = iommu_attach_device(iommu_pt->domain, ctx->dev); |
| _iommu_sync_mmu_pc(false); |
| |
| if (ret == 0) |
| iommu_pt->attached = true; |
| |
| return ret; |
| } |
| |
| static int _iommu_map_sync_pc(struct kgsl_pagetable *pt, |
| uint64_t gpuaddr, phys_addr_t physaddr, |
| uint64_t size, unsigned int flags) |
| { |
| struct kgsl_iommu_pt *iommu_pt = pt->priv; |
| int ret; |
| |
| _iommu_sync_mmu_pc(true); |
| |
| ret = iommu_map(iommu_pt->domain, gpuaddr, physaddr, size, flags); |
| |
| _iommu_sync_mmu_pc(false); |
| |
| if (ret) { |
| KGSL_CORE_ERR("map err: 0x%016llX, 0x%llx, 0x%x, %d\n", |
| gpuaddr, size, flags, ret); |
| return -ENODEV; |
| } |
| |
| return 0; |
| } |
| |
| static int _iommu_unmap_sync_pc(struct kgsl_pagetable *pt, |
| uint64_t addr, uint64_t size) |
| { |
| struct kgsl_iommu_pt *iommu_pt = pt->priv; |
| size_t unmapped = 0; |
| |
| _iommu_sync_mmu_pc(true); |
| |
| unmapped = iommu_unmap(iommu_pt->domain, addr, size); |
| |
| _iommu_sync_mmu_pc(false); |
| |
| if (unmapped != size) { |
| KGSL_CORE_ERR("unmap err: 0x%016llx, 0x%llx, %zd\n", |
| addr, size, unmapped); |
| return -ENODEV; |
| } |
| |
| return 0; |
| } |
| |
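| /* |
| * Worked example (illustrative sizes): for an sg list with segment |
| * lengths 8K/16K/4K, offset = 12K and size = 8K, the loop below skips |
| * the whole first segment (offset_tmp becomes 4K), maps 8K starting |
| * 4K into the second segment, and stops once size reaches zero. |
| */ |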
| static int _iommu_map_sg_offset_sync_pc(struct kgsl_pagetable *pt, |
| uint64_t addr, struct scatterlist *sg, int nents, |
| uint64_t offset, uint64_t size, unsigned int flags) |
| { |
| struct kgsl_iommu_pt *iommu_pt = pt->priv; |
| uint64_t offset_tmp = offset; |
| uint64_t size_tmp = size; |
| size_t mapped = 0; |
| unsigned int i; |
| struct scatterlist *s; |
| phys_addr_t physaddr; |
| int ret; |
| |
| _iommu_sync_mmu_pc(true); |
| |
| for_each_sg(sg, s, nents, i) { |
| /* Iterate until we find the offset */ |
| if (offset_tmp >= s->length) { |
| offset_tmp -= s->length; |
| continue; |
| } |
| |
| /* How much mapping is needed in this sg? */ |
| if (size < s->length - offset_tmp) |
| size_tmp = size; |
| else |
| size_tmp = s->length - offset_tmp; |
| |
| /* Get the phys addr for the offset page */ |
| if (offset_tmp != 0) { |
| physaddr = page_to_phys(nth_page(sg_page(s), |
| offset_tmp >> PAGE_SHIFT)); |
| /* Reset offset_tmp */ |
| offset_tmp = 0; |
| } else |
| physaddr = page_to_phys(sg_page(s)); |
| |
| /* Do the map for this sg */ |
| ret = iommu_map(iommu_pt->domain, addr + mapped, |
| physaddr, size_tmp, flags); |
| if (ret) |
| break; |
| |
| mapped += size_tmp; |
| size -= size_tmp; |
| |
| if (size == 0) |
| break; |
| } |
| |
| _iommu_sync_mmu_pc(false); |
| |
| if (size != 0) { |
| /* Cleanup on error */ |
| _iommu_unmap_sync_pc(pt, addr, mapped); |
| KGSL_CORE_ERR( |
| "map sg offset err: 0x%016llX, %d, %x, %zd\n", |
| addr, nents, flags, mapped); |
| return -ENODEV; |
| } |
| |
| return 0; |
| } |
| |
| static int _iommu_map_sg_sync_pc(struct kgsl_pagetable *pt, |
| uint64_t addr, struct scatterlist *sg, int nents, |
| unsigned int flags) |
| { |
| struct kgsl_iommu_pt *iommu_pt = pt->priv; |
| size_t mapped; |
| |
| _iommu_sync_mmu_pc(true); |
| |
| mapped = iommu_map_sg(iommu_pt->domain, addr, sg, nents, flags); |
| |
| _iommu_sync_mmu_pc(false); |
| |
| if (mapped == 0) { |
| KGSL_CORE_ERR("map sg err: 0x%016llX, %d, %x, %zd\n", |
| addr, nents, flags, mapped); |
| return -ENODEV; |
| } |
| |
| return 0; |
| } |
| |
| /* |
| * One page allocation for a guard region to protect against over-zealous |
| * GPU pre-fetch |
| */ |
| |
| static struct page *kgsl_guard_page; |
| static struct kgsl_memdesc kgsl_secure_guard_page_memdesc; |
| |
| /* |
| * The dummy page is a placeholder/extra page to be used for sparse mappings. |
| * This page will be mapped to all virtual sparse bindings that are not |
| * physically backed. |
| */ |
| static struct page *kgsl_dummy_page; |
| |
| /* |
| * These functions help find the nearest allocated memory entries on |
| * either side of a faulting address. Knowing the nearby allocations |
| * gives a better idea of what should have been located in the |
| * faulting region. |
| */ |
| |
| /* |
| * A local structure to make it easy to store the interesting bits for the |
| * memory entries on either side of the faulting address |
| */ |
| |
| struct _mem_entry { |
| uint64_t gpuaddr; |
| uint64_t size; |
| uint64_t flags; |
| unsigned int priv; |
| int pending_free; |
| pid_t pid; |
| char name[32]; |
| }; |
| |
| static void _get_global_entries(uint64_t faultaddr, |
| struct _mem_entry *prev, |
| struct _mem_entry *next) |
| { |
| int i; |
| uint64_t prevaddr = 0; |
| struct global_pt_entry *p = NULL; |
| |
| uint64_t nextaddr = (uint64_t) -1; |
| struct global_pt_entry *n = NULL; |
| |
| for (i = 0; i < global_pt_count; i++) { |
| uint64_t addr; |
| |
| if (global_pt_entries[i].memdesc == NULL) |
| continue; |
| |
| addr = global_pt_entries[i].memdesc->gpuaddr; |
| if ((addr < faultaddr) && (addr > prevaddr)) { |
| prevaddr = addr; |
| p = &global_pt_entries[i]; |
| } |
| |
| if ((addr > faultaddr) && (addr < nextaddr)) { |
| nextaddr = addr; |
| n = &global_pt_entries[i]; |
| } |
| } |
| |
| if (p != NULL) { |
| prev->gpuaddr = p->memdesc->gpuaddr; |
| prev->size = p->memdesc->size; |
| prev->flags = p->memdesc->flags; |
| prev->priv = p->memdesc->priv; |
| prev->pid = 0; |
| strlcpy(prev->name, p->name, sizeof(prev->name)); |
| } |
| |
| if (n != NULL) { |
| next->gpuaddr = n->memdesc->gpuaddr; |
| next->size = n->memdesc->size; |
| next->flags = n->memdesc->flags; |
| next->priv = n->memdesc->priv; |
| next->pid = 0; |
| strlcpy(next->name, n->name, sizeof(next->name)); |
| } |
| } |
| |
| void __kgsl_get_memory_usage(struct _mem_entry *entry) |
| { |
| kgsl_get_memory_usage(entry->name, sizeof(entry->name), entry->flags); |
| } |
| |
| static void _get_entries(struct kgsl_process_private *private, |
| uint64_t faultaddr, struct _mem_entry *prev, |
| struct _mem_entry *next) |
| { |
| int id; |
| struct kgsl_mem_entry *entry; |
| |
| uint64_t prevaddr = 0; |
| struct kgsl_mem_entry *p = NULL; |
| |
| uint64_t nextaddr = (uint64_t) -1; |
| struct kgsl_mem_entry *n = NULL; |
| |
| idr_for_each_entry(&private->mem_idr, entry, id) { |
| uint64_t addr = entry->memdesc.gpuaddr; |
| |
| if ((addr < faultaddr) && (addr > prevaddr)) { |
| prevaddr = addr; |
| p = entry; |
| } |
| |
| if ((addr > faultaddr) && (addr < nextaddr)) { |
| nextaddr = addr; |
| n = entry; |
| } |
| } |
| |
| if (p != NULL) { |
| prev->gpuaddr = p->memdesc.gpuaddr; |
| prev->size = p->memdesc.size; |
| prev->flags = p->memdesc.flags; |
| prev->priv = p->memdesc.priv; |
| prev->pending_free = p->pending_free; |
| prev->pid = private->pid; |
| __kgsl_get_memory_usage(prev); |
| } |
| |
| if (n != NULL) { |
| next->gpuaddr = n->memdesc.gpuaddr; |
| next->size = n->memdesc.size; |
| next->flags = n->memdesc.flags; |
| next->priv = n->memdesc.priv; |
| next->pending_free = n->pending_free; |
| next->pid = private->pid; |
| __kgsl_get_memory_usage(next); |
| } |
| } |
| |
| static void _find_mem_entries(struct kgsl_mmu *mmu, uint64_t faultaddr, |
| struct _mem_entry *preventry, struct _mem_entry *nextentry, |
| struct kgsl_context *context) |
| { |
| struct kgsl_process_private *private; |
| |
| memset(preventry, 0, sizeof(*preventry)); |
| memset(nextentry, 0, sizeof(*nextentry)); |
| |
| /* Set the maximum possible size as an initial value */ |
| nextentry->gpuaddr = (uint64_t) -1; |
| |
| if (ADDR_IN_GLOBAL(mmu, faultaddr)) { |
| _get_global_entries(faultaddr, preventry, nextentry); |
| } else if (context) { |
| private = context->proc_priv; |
| spin_lock(&private->mem_lock); |
| _get_entries(private, faultaddr, preventry, nextentry); |
| spin_unlock(&private->mem_lock); |
| } |
| } |
| |
| static void _print_entry(struct kgsl_device *device, struct _mem_entry *entry) |
| { |
| KGSL_LOG_DUMP(device, |
| "[%016llX - %016llX] %s %s (pid = %d) (%s)\n", |
| entry->gpuaddr, |
| entry->gpuaddr + entry->size, |
| entry->priv & KGSL_MEMDESC_GUARD_PAGE ? "(+guard)" : "", |
| entry->pending_free ? "(pending free)" : "", |
| entry->pid, entry->name); |
| } |
| |
| static void _check_if_freed(struct kgsl_iommu_context *ctx, |
| uint64_t addr, pid_t ptname) |
| { |
| uint64_t gpuaddr = addr; |
| uint64_t size = 0; |
| uint64_t flags = 0; |
| pid_t pid; |
| |
| char name[32]; |
| |
| memset(name, 0, sizeof(name)); |
| |
| if (kgsl_memfree_find_entry(ptname, &gpuaddr, &size, &flags, &pid)) { |
| kgsl_get_memory_usage(name, sizeof(name) - 1, flags); |
| KGSL_LOG_DUMP(ctx->kgsldev, "---- premature free ----\n"); |
| KGSL_LOG_DUMP(ctx->kgsldev, |
| "[%8.8llX-%8.8llX] (%s) was already freed by pid %d\n", |
| gpuaddr, gpuaddr + size, name, pid); |
| } |
| } |
| |
| static bool |
| kgsl_iommu_uche_overfetch(struct kgsl_process_private *private, |
| uint64_t faultaddr) |
| { |
| int id; |
| struct kgsl_mem_entry *entry = NULL; |
| |
| spin_lock(&private->mem_lock); |
| idr_for_each_entry(&private->mem_idr, entry, id) { |
| struct kgsl_memdesc *m = &entry->memdesc; |
| |
| if ((faultaddr >= (m->gpuaddr + m->size)) |
| && (faultaddr < (m->gpuaddr + m->size + 64))) { |
| spin_unlock(&private->mem_lock); |
| return true; |
| } |
| } |
| spin_unlock(&private->mem_lock); |
| return false; |
| } |
| |
| /* |
| * Read pagefaults where the faulting address lies within the first 64 bytes |
| * of a page (UCHE line size is 64 bytes) and the fault page is preceded by a |
| * valid allocation are considered likely due to UCHE overfetch and suppressed. |
| */ |
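|  |
| /* |
| * Example: for a buffer ending at gpuaddr + size, a read fault anywhere |
| * in [gpuaddr + size, gpuaddr + size + 64) is treated as UCHE overfetch |
| * and suppressed by kgsl_iommu_uche_overfetch() above. |
| */ |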
| |
| static bool kgsl_iommu_suppress_pagefault(uint64_t faultaddr, int write, |
| struct kgsl_context *context) |
| { |
| /* |
| * If there is no context associated with the pagefault then this |
| * could be a fault on a global buffer. We do not suppress faults |
| * on global buffers as they are mainly accessed by the CP bypassing |
| * the UCHE. Also, write pagefaults are never suppressed. |
| */ |
| if (!context || write) |
| return false; |
| |
| return kgsl_iommu_uche_overfetch(context->proc_priv, faultaddr); |
| } |
| |
| static int kgsl_iommu_fault_handler(struct iommu_domain *domain, |
| struct device *dev, unsigned long addr, int flags, void *token) |
| { |
| int ret = 0; |
| struct kgsl_pagetable *pt = token; |
| struct kgsl_mmu *mmu = pt->mmu; |
| struct kgsl_iommu *iommu; |
| struct kgsl_iommu_context *ctx; |
| u64 ptbase; |
| u32 contextidr; |
| pid_t pid = 0; |
| pid_t ptname; |
| struct _mem_entry prev, next; |
| int write; |
| struct kgsl_device *device; |
| struct adreno_device *adreno_dev; |
| struct adreno_gpudev *gpudev; |
| unsigned int no_page_fault_log = 0; |
| unsigned int curr_context_id = 0; |
| struct kgsl_context *context; |
| char *fault_type = "unknown"; |
| |
| static DEFINE_RATELIMIT_STATE(_rs, |
| DEFAULT_RATELIMIT_INTERVAL, |
| DEFAULT_RATELIMIT_BURST); |
| |
| if (mmu == NULL) |
| return ret; |
| |
| iommu = _IOMMU_PRIV(mmu); |
| ctx = &iommu->ctx[KGSL_IOMMU_CONTEXT_USER]; |
| device = KGSL_MMU_DEVICE(mmu); |
| adreno_dev = ADRENO_DEVICE(device); |
| gpudev = ADRENO_GPU_DEVICE(adreno_dev); |
| |
| if (pt->name == KGSL_MMU_SECURE_PT) |
| ctx = &iommu->ctx[KGSL_IOMMU_CONTEXT_SECURE]; |
| |
| /* |
| * Set the fault bits and related state before any printks so that the |
| * fault handler knows it is dealing with a pagefault. |
| * Read the global current timestamp because we could be in the middle |
| * of an RB switch and hence the current RB may not be reliable, but |
| * the global one always will be. |
| */ |
| kgsl_sharedmem_readl(&device->memstore, &curr_context_id, |
| KGSL_MEMSTORE_OFFSET(KGSL_MEMSTORE_GLOBAL, current_context)); |
| |
| context = kgsl_context_get(device, curr_context_id); |
| |
| write = (flags & IOMMU_FAULT_WRITE) ? 1 : 0; |
| if (flags & IOMMU_FAULT_TRANSLATION) |
| fault_type = "translation"; |
| else if (flags & IOMMU_FAULT_PERMISSION) |
| fault_type = "permission"; |
| else if (flags & IOMMU_FAULT_EXTERNAL) |
| fault_type = "external"; |
| else if (flags & IOMMU_FAULT_TRANSACTION_STALLED) |
| fault_type = "transaction stalled"; |
| |
| if (kgsl_iommu_suppress_pagefault(addr, write, context)) { |
| iommu->pagefault_suppression_count++; |
| kgsl_context_put(context); |
| return ret; |
| } |
| |
| if (context != NULL) { |
| /* save pagefault timestamp for GFT */ |
| set_bit(KGSL_CONTEXT_PRIV_PAGEFAULT, &context->priv); |
| pid = context->proc_priv->pid; |
| } |
| |
| ctx->fault = 1; |
| |
| if (test_bit(KGSL_FT_PAGEFAULT_GPUHALT_ENABLE, |
| &adreno_dev->ft_pf_policy) && |
| (flags & IOMMU_FAULT_TRANSACTION_STALLED)) { |
| /* |
| * Turn off GPU IRQ so we don't get faults from it too. |
| * The device mutex must be held to change power state |
| */ |
| mutex_lock(&device->mutex); |
| kgsl_pwrctrl_change_state(device, KGSL_STATE_AWARE); |
| mutex_unlock(&device->mutex); |
| } |
| |
| ptbase = KGSL_IOMMU_GET_CTX_REG_Q(ctx, TTBR0); |
| contextidr = KGSL_IOMMU_GET_CTX_REG(ctx, CONTEXTIDR); |
| |
| ptname = MMU_FEATURE(mmu, KGSL_MMU_GLOBAL_PAGETABLE) ? |
| KGSL_MMU_GLOBAL_PT : pid; |
| /* |
| * The trace needs to be logged before searching the faulting |
| * address in the free list, as the search takes quite a long |
| * time and would delay the trace unnecessarily. |
| */ |
| trace_kgsl_mmu_pagefault(ctx->kgsldev, addr, |
| ptname, write ? "write" : "read"); |
| |
| if (test_bit(KGSL_FT_PAGEFAULT_LOG_ONE_PER_PAGE, |
| &adreno_dev->ft_pf_policy)) |
| no_page_fault_log = kgsl_mmu_log_fault_addr(mmu, ptbase, addr); |
| |
| if (!no_page_fault_log && __ratelimit(&_rs)) { |
| KGSL_MEM_CRIT(ctx->kgsldev, |
| "GPU PAGE FAULT: addr = %lX pid= %d\n", addr, ptname); |
| KGSL_MEM_CRIT(ctx->kgsldev, |
| "context=%s TTBR0=0x%llx CIDR=0x%x (%s %s fault)\n", |
| ctx->name, ptbase, contextidr, |
| write ? "write" : "read", fault_type); |
| |
| if (gpudev->iommu_fault_block) { |
| unsigned int fsynr1; |
| |
| fsynr1 = KGSL_IOMMU_GET_CTX_REG(ctx, FSYNR1); |
| KGSL_MEM_CRIT(ctx->kgsldev, |
| "FAULTING BLOCK: %s\n", |
| gpudev->iommu_fault_block(adreno_dev, |
| fsynr1)); |
| } |
| |
| /* Don't print the debug if this is a permissions fault */ |
| if (!(flags & IOMMU_FAULT_PERMISSION)) { |
| _check_if_freed(ctx, addr, ptname); |
| |
| KGSL_LOG_DUMP(ctx->kgsldev, |
| "---- nearby memory ----\n"); |
| |
| _find_mem_entries(mmu, addr, &prev, &next, context); |
| if (prev.gpuaddr) |
| _print_entry(ctx->kgsldev, &prev); |
| else |
| KGSL_LOG_DUMP(ctx->kgsldev, "*EMPTY*\n"); |
| |
| KGSL_LOG_DUMP(ctx->kgsldev, " <- fault @ %8.8lX\n", |
| addr); |
| |
| if (next.gpuaddr != (uint64_t) -1) |
| _print_entry(ctx->kgsldev, &next); |
| else |
| KGSL_LOG_DUMP(ctx->kgsldev, "*EMPTY*\n"); |
| } |
| } |
|  |
| /* |
| * We do not want the h/w to resume fetching data from an iommu |
| * that has faulted; stalling is better for debugging as it will |
| * stall the GPU and trigger a snapshot. Return an EBUSY error. |
| */ |
| if (test_bit(KGSL_FT_PAGEFAULT_GPUHALT_ENABLE, |
| &adreno_dev->ft_pf_policy) && |
| (flags & IOMMU_FAULT_TRANSACTION_STALLED)) { |
| uint32_t sctlr_val; |
| |
| ret = -EBUSY; |
| /* |
| * Disable context fault interrupts |
| * as we do not clear FSR in the ISR. |
| * Will be re-enabled after FSR is cleared. |
| */ |
| sctlr_val = KGSL_IOMMU_GET_CTX_REG(ctx, SCTLR); |
| sctlr_val &= ~(0x1 << KGSL_IOMMU_SCTLR_CFIE_SHIFT); |
| KGSL_IOMMU_SET_CTX_REG(ctx, SCTLR, sctlr_val); |
| |
| adreno_set_gpu_fault(adreno_dev, ADRENO_IOMMU_PAGE_FAULT); |
| /* Go ahead with recovery */ |
| adreno_dispatcher_schedule(device); |
| } |
| |
| kgsl_context_put(context); |
| return ret; |
| } |
| |
| /* |
| * kgsl_iommu_disable_clk() - Disable the IOMMU clocks |
| * @mmu: Pointer to the MMU structure |
| */ |
| static void kgsl_iommu_disable_clk(struct kgsl_mmu *mmu) |
| { |
| struct kgsl_iommu *iommu = _IOMMU_PRIV(mmu); |
| int j; |
| |
| atomic_dec(&iommu->clk_enable_count); |
| |
| /* |
| * Make sure the clk refcounts are good. An unbalance may |
| * cause the clocks to be off when we need them on. |
| */ |
| WARN_ON(atomic_read(&iommu->clk_enable_count) < 0); |
| |
| for (j = (KGSL_IOMMU_MAX_CLKS - 1); j >= 0; j--) |
| if (iommu->clks[j]) |
| clk_disable_unprepare(iommu->clks[j]); |
| } |
| |
| /* |
| * kgsl_iommu_clk_prepare_enable - Enable the specified IOMMU clock |
| * Try 4 times to enable it and then BUG() to facilitate debug |
| */ |
| static void kgsl_iommu_clk_prepare_enable(struct clk *clk) |
| { |
| int num_retries = 4; |
| |
| while (num_retries--) { |
| if (!clk_prepare_enable(clk)) |
| return; |
| } |
| |
| /* Failure is fatal so BUG() to facilitate debug */ |
| KGSL_CORE_ERR("IOMMU clock enable failed\n"); |
| BUG(); |
| } |
| |
| /* |
| * kgsl_iommu_enable_clk - Enable all the IOMMU clocks |
| * @mmu: Pointer to the MMU structure |
| */ |
| static void kgsl_iommu_enable_clk(struct kgsl_mmu *mmu) |
| { |
| int j; |
| struct kgsl_iommu *iommu = _IOMMU_PRIV(mmu); |
| |
| for (j = 0; j < KGSL_IOMMU_MAX_CLKS; j++) { |
| if (iommu->clks[j]) |
| kgsl_iommu_clk_prepare_enable(iommu->clks[j]); |
| } |
| atomic_inc(&iommu->clk_enable_count); |
| } |
| |
| /* kgsl_iommu_get_ttbr0 - Get TTBR0 setting for a pagetable */ |
| static u64 kgsl_iommu_get_ttbr0(struct kgsl_pagetable *pt) |
| { |
| struct kgsl_iommu_pt *iommu_pt = pt ? pt->priv : NULL; |
| |
| BUG_ON(iommu_pt == NULL); |
| |
| return iommu_pt->ttbr0; |
| } |
| |
| static bool kgsl_iommu_pt_equal(struct kgsl_mmu *mmu, |
| struct kgsl_pagetable *pt, |
| u64 ttbr0) |
| { |
| struct kgsl_iommu_pt *iommu_pt = pt ? pt->priv : NULL; |
| u64 domain_ttbr0; |
| |
| if (iommu_pt == NULL) |
| return 0; |
| |
| domain_ttbr0 = kgsl_iommu_get_ttbr0(pt); |
| |
| return (domain_ttbr0 == ttbr0); |
| } |
| |
| /* kgsl_iommu_get_contextidr - query CONTEXTIDR setting for a pagetable */ |
| static u32 kgsl_iommu_get_contextidr(struct kgsl_pagetable *pt) |
| { |
| struct kgsl_iommu_pt *iommu_pt = pt ? pt->priv : NULL; |
| |
| BUG_ON(iommu_pt == NULL); |
| |
| return iommu_pt->contextidr; |
| } |
| |
| /* |
| * kgsl_iommu_destroy_pagetable - Free up resources held by a pagetable |
| * @pt - Pointer to the pagetable which is to be freed |
| * |
| * Return - void |
| */ |
| static void kgsl_iommu_destroy_pagetable(struct kgsl_pagetable *pt) |
| { |
| struct kgsl_iommu_pt *iommu_pt = pt->priv; |
| struct kgsl_mmu *mmu = pt->mmu; |
| struct kgsl_iommu *iommu; |
| struct kgsl_iommu_context *ctx; |
| |
| /* |
| * Make sure all allocations are unmapped before destroying |
| * the pagetable |
| */ |
| WARN_ON(!list_empty(&pt->list)); |
| |
| iommu = _IOMMU_PRIV(mmu); |
| |
| if (pt->name == KGSL_MMU_SECURE_PT) { |
| ctx = &iommu->ctx[KGSL_IOMMU_CONTEXT_SECURE]; |
| } else { |
| ctx = &iommu->ctx[KGSL_IOMMU_CONTEXT_USER]; |
| kgsl_iommu_unmap_globals(pt); |
| } |
| |
| if (iommu_pt->domain) { |
| trace_kgsl_pagetable_destroy(iommu_pt->ttbr0, pt->name); |
| |
| _detach_pt(iommu_pt, ctx); |
| |
| iommu_domain_free(iommu_pt->domain); |
| } |
| |
| kfree(iommu_pt); |
| } |
| |
| static void setup_64bit_pagetable(struct kgsl_mmu *mmu, |
| struct kgsl_pagetable *pagetable, |
| struct kgsl_iommu_pt *pt) |
| { |
| if (mmu->secured && pagetable->name == KGSL_MMU_SECURE_PT) { |
| pt->compat_va_start = KGSL_IOMMU_SECURE_BASE(mmu); |
| pt->compat_va_end = KGSL_IOMMU_SECURE_END(mmu); |
| pt->va_start = KGSL_IOMMU_SECURE_BASE(mmu); |
| pt->va_end = KGSL_IOMMU_SECURE_END(mmu); |
| } else { |
| pt->compat_va_start = KGSL_IOMMU_SVM_BASE32; |
| pt->compat_va_end = KGSL_IOMMU_SECURE_BASE(mmu); |
| pt->va_start = KGSL_IOMMU_VA_BASE64; |
| pt->va_end = KGSL_IOMMU_VA_END64; |
| } |
| |
| if (pagetable->name != KGSL_MMU_GLOBAL_PT && |
| pagetable->name != KGSL_MMU_SECURE_PT) { |
| if (kgsl_is_compat_task()) { |
| pt->svm_start = KGSL_IOMMU_SVM_BASE32; |
| pt->svm_end = KGSL_IOMMU_SECURE_BASE(mmu); |
| } else { |
| pt->svm_start = KGSL_IOMMU_SVM_BASE64; |
| pt->svm_end = KGSL_IOMMU_SVM_END64; |
| } |
| } |
| } |
| |
| static void setup_32bit_pagetable(struct kgsl_mmu *mmu, |
| struct kgsl_pagetable *pagetable, |
| struct kgsl_iommu_pt *pt) |
| { |
| if (mmu->secured) { |
| if (pagetable->name == KGSL_MMU_SECURE_PT) { |
| pt->compat_va_start = KGSL_IOMMU_SECURE_BASE(mmu); |
| pt->compat_va_end = KGSL_IOMMU_SECURE_END(mmu); |
| pt->va_start = KGSL_IOMMU_SECURE_BASE(mmu); |
| pt->va_end = KGSL_IOMMU_SECURE_END(mmu); |
| } else { |
| pt->va_start = KGSL_IOMMU_SVM_BASE32; |
| pt->va_end = KGSL_IOMMU_SECURE_BASE(mmu); |
| pt->compat_va_start = pt->va_start; |
| pt->compat_va_end = pt->va_end; |
| } |
| } else { |
| pt->va_start = KGSL_IOMMU_SVM_BASE32; |
| pt->va_end = KGSL_IOMMU_GLOBAL_MEM_BASE(mmu); |
| pt->compat_va_start = pt->va_start; |
| pt->compat_va_end = pt->va_end; |
| } |
| |
| if (pagetable->name != KGSL_MMU_GLOBAL_PT && |
| pagetable->name != KGSL_MMU_SECURE_PT) { |
| pt->svm_start = KGSL_IOMMU_SVM_BASE32; |
| pt->svm_end = KGSL_IOMMU_SVM_END32; |
| } |
| } |
|  |
| static struct kgsl_iommu_pt * |
| _alloc_pt(struct device *dev, struct kgsl_mmu *mmu, struct kgsl_pagetable *pt) |
| { |
| struct kgsl_iommu_pt *iommu_pt; |
| struct bus_type *bus = kgsl_mmu_get_bus(dev); |
| |
| if (bus == NULL) |
| return ERR_PTR(-ENODEV); |
| |
| iommu_pt = kzalloc(sizeof(struct kgsl_iommu_pt), GFP_KERNEL); |
| if (iommu_pt == NULL) |
| return ERR_PTR(-ENOMEM); |
| |
| iommu_pt->domain = iommu_domain_alloc(bus); |
| if (iommu_pt->domain == NULL) { |
| kfree(iommu_pt); |
| return ERR_PTR(-ENODEV); |
| } |
| |
| pt->pt_ops = &iommu_pt_ops; |
| pt->priv = iommu_pt; |
| pt->fault_addr = ~0ULL; |
| iommu_pt->rbtree = RB_ROOT; |
| |
| if (MMU_FEATURE(mmu, KGSL_MMU_64BIT)) |
| setup_64bit_pagetable(mmu, pt, iommu_pt); |
| else |
| setup_32bit_pagetable(mmu, pt, iommu_pt); |
|  |
| return iommu_pt; |
| } |
| |
| static void _free_pt(struct kgsl_iommu_context *ctx, struct kgsl_pagetable *pt) |
| { |
| struct kgsl_iommu_pt *iommu_pt = pt->priv; |
| |
| pt->pt_ops = NULL; |
| pt->priv = NULL; |
| |
| if (iommu_pt == NULL) |
| return; |
| |
| _detach_pt(iommu_pt, ctx); |
| |
| if (iommu_pt->domain != NULL) |
| iommu_domain_free(iommu_pt->domain); |
| kfree(iommu_pt); |
| } |
| |
| static void _enable_gpuhtw_llc(struct kgsl_mmu *mmu, |
| struct kgsl_iommu_pt *iommu_pt) |
| { |
| struct kgsl_device *device = KGSL_MMU_DEVICE(mmu); |
| struct adreno_device *adreno_dev = ADRENO_DEVICE(device); |
| int gpuhtw_llc_enable = 1; |
| int ret; |
| |
| /* GPU pagetable walk LLC slice not enabled */ |
| if (!adreno_dev->gpuhtw_llc_slice) |
| return; |
| |
| /* Domain attribute to enable system cache for GPU pagetable walks */ |
| ret = iommu_domain_set_attr(iommu_pt->domain, |
| DOMAIN_ATTR_USE_UPSTREAM_HINT, &gpuhtw_llc_enable); |
| /* |
| * Warn that the system cache will not be used for GPU |
| * pagetable walks. This is not a fatal error. |
| */ |
| WARN_ONCE(ret, |
| "System cache not enabled for GPU pagetable walks: %d\n", ret); |
| } |
| |
| static int program_smmu_aperture(unsigned int cb, unsigned int aperture_reg) |
| { |
| struct scm_desc desc = {0}; |
| |
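| /* |
| * args[0] packs the context bank index into bits [7:0] and the |
| * aperture register ID into bits [15:8]; the remaining argument |
| * words are left as all-ones. |
| */ |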
| desc.args[0] = 0xFFFF0000 | ((aperture_reg & 0xff) << 8) | (cb & 0xff); |
| desc.args[1] = 0xFFFFFFFF; |
| desc.args[2] = 0xFFFFFFFF; |
| desc.args[3] = 0xFFFFFFFF; |
| desc.arginfo = SCM_ARGS(4); |
| |
| return scm_call2(SCM_SIP_FNID(SCM_SVC_MP, CP_SMMU_APERTURE_ID), &desc); |
| } |
| |
| static int _init_global_pt(struct kgsl_mmu *mmu, struct kgsl_pagetable *pt) |
| { |
| int ret = 0; |
| struct kgsl_iommu_pt *iommu_pt = NULL; |
| unsigned int cb_num; |
| struct kgsl_iommu *iommu = _IOMMU_PRIV(mmu); |
| struct kgsl_iommu_context *ctx = &iommu->ctx[KGSL_IOMMU_CONTEXT_USER]; |
| |
| iommu_pt = _alloc_pt(ctx->dev, mmu, pt); |
| |
| if (IS_ERR(iommu_pt)) |
| return PTR_ERR(iommu_pt); |
| |
| if (kgsl_mmu_is_perprocess(mmu)) { |
| ret = iommu_domain_set_attr(iommu_pt->domain, |
| DOMAIN_ATTR_PROCID, &pt->name); |
| if (ret) { |
| KGSL_CORE_ERR("set DOMAIN_ATTR_PROCID failed: %d\n", |
| ret); |
| goto done; |
| } |
| } |
| |
| _enable_gpuhtw_llc(mmu, iommu_pt); |
| |
| ret = _attach_pt(iommu_pt, ctx); |
| if (ret) |
| goto done; |
| |
| iommu_set_fault_handler(iommu_pt->domain, |
| kgsl_iommu_fault_handler, pt); |
| |
| ret = iommu_domain_get_attr(iommu_pt->domain, |
| DOMAIN_ATTR_CONTEXT_BANK, &cb_num); |
| if (ret) { |
| KGSL_CORE_ERR("get DOMAIN_ATTR_CONTEXT_BANK failed: %d\n", |
| ret); |
| goto done; |
| } |
| |
| if (!MMU_FEATURE(mmu, KGSL_MMU_GLOBAL_PAGETABLE) && |
| scm_is_call_available(SCM_SVC_MP, CP_SMMU_APERTURE_ID)) { |
| ret = program_smmu_aperture(cb_num, CP_APERTURE_REG); |
| if (ret) { |
| pr_err("SMMU aperture programming call failed with error %d\n", |
| ret); |
| goto done; |
| } |
| } |
| |
| ctx->cb_num = cb_num; |
| ctx->regbase = iommu->regbase + KGSL_IOMMU_CB0_OFFSET |
| + (cb_num << KGSL_IOMMU_CB_SHIFT); |
| |
| ret = iommu_domain_get_attr(iommu_pt->domain, |
| DOMAIN_ATTR_TTBR0, &iommu_pt->ttbr0); |
| if (ret) { |
| KGSL_CORE_ERR("get DOMAIN_ATTR_TTBR0 failed: %d\n", |
| ret); |
| goto done; |
| } |
| ret = iommu_domain_get_attr(iommu_pt->domain, |
| DOMAIN_ATTR_CONTEXTIDR, &iommu_pt->contextidr); |
| if (ret) { |
| KGSL_CORE_ERR("get DOMAIN_ATTR_CONTEXTIDR failed: %d\n", |
| ret); |
| goto done; |
| } |
| |
| ret = kgsl_iommu_map_globals(pt); |
| |
| done: |
| if (ret) |
| _free_pt(ctx, pt); |
| |
| return ret; |
| } |
| |
| static int _init_secure_pt(struct kgsl_mmu *mmu, struct kgsl_pagetable *pt) |
| { |
| int ret = 0; |
| struct kgsl_iommu_pt *iommu_pt = NULL; |
| struct kgsl_iommu *iommu = _IOMMU_PRIV(mmu); |
| struct kgsl_iommu_context *ctx = &iommu->ctx[KGSL_IOMMU_CONTEXT_SECURE]; |
| int secure_vmid = VMID_CP_PIXEL; |
| unsigned int cb_num; |
| |
| if (!mmu->secured) |
| return -EPERM; |
| |
| if (!MMU_FEATURE(mmu, KGSL_MMU_HYP_SECURE_ALLOC)) { |
| if (!kgsl_mmu_bus_secured(ctx->dev)) |
| return -EPERM; |
| } |
| |
| iommu_pt = _alloc_pt(ctx->dev, mmu, pt); |
| |
| if (IS_ERR(iommu_pt)) |
| return PTR_ERR(iommu_pt); |
| |
| ret = iommu_domain_set_attr(iommu_pt->domain, |
| DOMAIN_ATTR_SECURE_VMID, &secure_vmid); |
| if (ret) { |
| KGSL_CORE_ERR("set DOMAIN_ATTR_SECURE_VMID failed: %d\n", ret); |
| goto done; |
| } |
| |
| _enable_gpuhtw_llc(mmu, iommu_pt); |
| |
| ret = _attach_pt(iommu_pt, ctx); |
| |
| if (MMU_FEATURE(mmu, KGSL_MMU_HYP_SECURE_ALLOC)) |
| iommu_set_fault_handler(iommu_pt->domain, |
| kgsl_iommu_fault_handler, pt); |
| |
| ret = iommu_domain_get_attr(iommu_pt->domain, |
| DOMAIN_ATTR_CONTEXT_BANK, &cb_num); |
| if (ret) { |
| KGSL_CORE_ERR("get DOMAIN_ATTR_PROCID failed: %d\n", |
| ret); |
| goto done; |
| } |
| |
| ctx->cb_num = cb_num; |
| ctx->regbase = iommu->regbase + KGSL_IOMMU_CB0_OFFSET |
| + (cb_num << KGSL_IOMMU_CB_SHIFT); |
| |
| done: |
| if (ret) |
| _free_pt(ctx, pt); |
| return ret; |
| } |
| |
| static int _init_per_process_pt(struct kgsl_mmu *mmu, |
| struct kgsl_pagetable *pt) |
| { |
| int ret = 0; |
| struct kgsl_iommu_pt *iommu_pt = NULL; |
| struct kgsl_iommu *iommu = _IOMMU_PRIV(mmu); |
| struct kgsl_iommu_context *ctx = &iommu->ctx[KGSL_IOMMU_CONTEXT_USER]; |
| int dynamic = 1; |
| unsigned int cb_num = ctx->cb_num; |
| |
| iommu_pt = _alloc_pt(ctx->dev, mmu, pt); |
| |
| if (IS_ERR(iommu_pt)) |
| return PTR_ERR(iommu_pt); |
| |
| ret = iommu_domain_set_attr(iommu_pt->domain, |
| DOMAIN_ATTR_DYNAMIC, &dynamic); |
| if (ret) { |
| KGSL_CORE_ERR("set DOMAIN_ATTR_DYNAMIC failed: %d\n", ret); |
| goto done; |
| } |
| ret = iommu_domain_set_attr(iommu_pt->domain, |
| DOMAIN_ATTR_CONTEXT_BANK, &cb_num); |
| if (ret) { |
| KGSL_CORE_ERR("set DOMAIN_ATTR_CONTEXT_BANK failed: %d\n", ret); |
| goto done; |
| } |
| |
| ret = iommu_domain_set_attr(iommu_pt->domain, |
| DOMAIN_ATTR_PROCID, &pt->name); |
| if (ret) { |
| KGSL_CORE_ERR("set DOMAIN_ATTR_PROCID failed: %d\n", ret); |
| goto done; |
| } |
| |
| _enable_gpuhtw_llc(mmu, iommu_pt); |
| |
| ret = _attach_pt(iommu_pt, ctx); |
| if (ret) |
| goto done; |
| |
| /* now read back the attributes needed for self programming */ |
| ret = iommu_domain_get_attr(iommu_pt->domain, |
| DOMAIN_ATTR_TTBR0, &iommu_pt->ttbr0); |
| if (ret) { |
| KGSL_CORE_ERR("get DOMAIN_ATTR_TTBR0 failed: %d\n", ret); |
| goto done; |
| } |
| |
| ret = iommu_domain_get_attr(iommu_pt->domain, |
| DOMAIN_ATTR_CONTEXTIDR, &iommu_pt->contextidr); |
| if (ret) { |
| KGSL_CORE_ERR("get DOMAIN_ATTR_CONTEXTIDR failed: %d\n", ret); |
| goto done; |
| } |
| |
| ret = kgsl_iommu_map_globals(pt); |
| |
| done: |
| if (ret) |
| _free_pt(ctx, pt); |
| |
| return ret; |
| } |
| |
| /* kgsl_iommu_init_pt - Set up an IOMMU pagetable */ |
| static int kgsl_iommu_init_pt(struct kgsl_mmu *mmu, struct kgsl_pagetable *pt) |
| { |
| if (pt == NULL) |
| return -EINVAL; |
| |
| switch (pt->name) { |
| case KGSL_MMU_GLOBAL_PT: |
| return _init_global_pt(mmu, pt); |
| |
| case KGSL_MMU_SECURE_PT: |
| return _init_secure_pt(mmu, pt); |
| |
| default: |
| return _init_per_process_pt(mmu, pt); |
| } |
| } |
| |
| static struct kgsl_pagetable *kgsl_iommu_getpagetable(struct kgsl_mmu *mmu, |
| unsigned long name) |
| { |
| struct kgsl_pagetable *pt; |
| |
| if (!kgsl_mmu_is_perprocess(mmu) && (name != KGSL_MMU_SECURE_PT)) { |
| name = KGSL_MMU_GLOBAL_PT; |
| if (mmu->defaultpagetable != NULL) |
| return mmu->defaultpagetable; |
| } |
| |
| pt = kgsl_get_pagetable(name); |
| if (pt == NULL) |
| pt = kgsl_mmu_createpagetableobject(mmu, name); |
| |
| return pt; |
| } |
| |
| /* |
| * kgsl_iommu_get_reg_ahbaddr - Returns the AHB address of the register |
| * @mmu - Pointer to mmu structure |
| * @id - The context ID of the IOMMU ctx |
| * @reg - The register for which address is required |
| * |
| * Return - The address of register which can be used in type0 packet |
| */ |
| static unsigned int kgsl_iommu_get_reg_ahbaddr(struct kgsl_mmu *mmu, |
| int id, unsigned int reg) |
| { |
| struct kgsl_iommu *iommu = _IOMMU_PRIV(mmu); |
| struct kgsl_iommu_context *ctx = &iommu->ctx[id]; |
| |
| return ctx->gpu_offset + kgsl_iommu_reg_list[reg]; |
| } |
| |
| static void _detach_context(struct kgsl_iommu_context *ctx) |
| { |
| struct kgsl_iommu_pt *iommu_pt; |
| |
| if (ctx->default_pt == NULL) |
| return; |
| |
| iommu_pt = ctx->default_pt->priv; |
| |
| _detach_pt(iommu_pt, ctx); |
| |
| ctx->default_pt = NULL; |
| } |
| |
| static void kgsl_iommu_close(struct kgsl_mmu *mmu) |
| { |
| struct kgsl_iommu *iommu = _IOMMU_PRIV(mmu); |
| int i; |
| |
| for (i = 0; i < KGSL_IOMMU_CONTEXT_MAX; i++) |
| _detach_context(&iommu->ctx[i]); |
| |
| kgsl_mmu_putpagetable(mmu->defaultpagetable); |
| mmu->defaultpagetable = NULL; |
| |
| kgsl_mmu_putpagetable(mmu->securepagetable); |
| mmu->securepagetable = NULL; |
| |
| if (iommu->regbase != NULL) |
| iounmap(iommu->regbase); |
| |
| kgsl_sharedmem_free(&kgsl_secure_guard_page_memdesc); |
| |
| if (kgsl_guard_page != NULL) { |
| __free_page(kgsl_guard_page); |
| kgsl_guard_page = NULL; |
| } |
| |
| if (kgsl_dummy_page != NULL) { |
| __free_page(kgsl_dummy_page); |
| kgsl_dummy_page = NULL; |
| } |
| |
| kgsl_iommu_remove_global(mmu, &iommu->setstate); |
| kgsl_sharedmem_free(&iommu->setstate); |
| kgsl_cleanup_qdss_desc(mmu); |
| kgsl_cleanup_qtimer_desc(mmu); |
| } |
| |
| static int _setstate_alloc(struct kgsl_device *device, |
| struct kgsl_iommu *iommu) |
| { |
| int ret; |
| |
| ret = kgsl_sharedmem_alloc_contig(device, &iommu->setstate, PAGE_SIZE); |
| |
| if (!ret) { |
| /* Mark the setstate memory as read only */ |
| iommu->setstate.flags |= KGSL_MEMFLAGS_GPUREADONLY; |
| |
| kgsl_sharedmem_set(device, &iommu->setstate, 0, 0, PAGE_SIZE); |
| } |
| |
| return ret; |
| } |
| |
| static int kgsl_iommu_init(struct kgsl_mmu *mmu) |
| { |
| struct kgsl_device *device = KGSL_MMU_DEVICE(mmu); |
| struct kgsl_iommu *iommu = _IOMMU_PRIV(mmu); |
| struct kgsl_iommu_context *ctx = &iommu->ctx[KGSL_IOMMU_CONTEXT_USER]; |
| int status; |
| |
| mmu->features |= KGSL_MMU_PAGED; |
| |
| if (ctx->name == NULL) { |
| KGSL_CORE_ERR("dt: gfx3d0_user context bank not found\n"); |
| return -EINVAL; |
| } |
| |
| status = _setstate_alloc(device, iommu); |
| if (status) |
| return status; |
| |
| /* check requirements for per process pagetables */ |
| if (ctx->gpu_offset == UINT_MAX) { |
| KGSL_CORE_ERR("missing qcom,gpu-offset forces global pt\n"); |
| mmu->features |= KGSL_MMU_GLOBAL_PAGETABLE; |
| } |
| |
| if (iommu->version == 1 && iommu->micro_mmu_ctrl == UINT_MAX) { |
| KGSL_CORE_ERR( |
| "missing qcom,micro-mmu-control forces global pt\n"); |
| mmu->features |= KGSL_MMU_GLOBAL_PAGETABLE; |
| } |
| |
| /* Check to see if we need to do the IOMMU sync dance */ |
| need_iommu_sync = of_property_read_bool(device->pdev->dev.of_node, |
| "qcom,gpu-quirk-iommu-sync"); |
| |
| iommu->regbase = ioremap(iommu->regstart, iommu->regsize); |
| if (iommu->regbase == NULL) { |
| KGSL_CORE_ERR("Could not map IOMMU registers 0x%lx:0x%x\n", |
| iommu->regstart, iommu->regsize); |
| status = -ENOMEM; |
| goto done; |
| } |
| |
| if (addr_entry_cache == NULL) { |
| addr_entry_cache = KMEM_CACHE(kgsl_iommu_addr_entry, 0); |
| if (addr_entry_cache == NULL) { |
| status = -ENOMEM; |
| goto done; |
| } |
| } |
| |
| kgsl_iommu_add_global(mmu, &iommu->setstate, "setstate"); |
| kgsl_setup_qdss_desc(device); |
| kgsl_setup_qtimer_desc(device); |
| |
| if (!mmu->secured) |
| goto done; |
| |
| mmu->securepagetable = kgsl_mmu_getpagetable(mmu, |
| KGSL_MMU_SECURE_PT); |
| if (IS_ERR(mmu->securepagetable)) { |
| status = PTR_ERR(mmu->securepagetable); |
| mmu->securepagetable = NULL; |
| } else if (mmu->securepagetable == NULL) { |
| status = -ENOMEM; |
| } |
| |
| done: |
| if (status) |
| kgsl_iommu_close(mmu); |
| |
| return status; |
| } |
| |
| static int _setup_user_context(struct kgsl_mmu *mmu) |
| { |
| int ret = 0; |
| struct kgsl_iommu *iommu = _IOMMU_PRIV(mmu); |
| struct kgsl_iommu_context *ctx = &iommu->ctx[KGSL_IOMMU_CONTEXT_USER]; |
| struct kgsl_device *device = KGSL_MMU_DEVICE(mmu); |
| struct adreno_device *adreno_dev = ADRENO_DEVICE(device); |
| struct kgsl_iommu_pt *iommu_pt = NULL; |
| unsigned int sctlr_val; |
| |
| if (mmu->defaultpagetable == NULL) { |
| mmu->defaultpagetable = kgsl_mmu_getpagetable(mmu, |
| KGSL_MMU_GLOBAL_PT); |
| /* if we don't have a default pagetable, nothing will work */ |
| if (IS_ERR(mmu->defaultpagetable)) { |
| ret = PTR_ERR(mmu->defaultpagetable); |
| mmu->defaultpagetable = NULL; |
| return ret; |
| } else if (mmu->defaultpagetable == NULL) { |
| return -ENOMEM; |
| } |
| } |
| |
| iommu_pt = mmu->defaultpagetable->priv; |
| if (iommu_pt == NULL) |
| return -ENODEV; |
| |
| ret = _attach_pt(iommu_pt, ctx); |
| if (ret) |
| return ret; |
| |
| ctx->default_pt = mmu->defaultpagetable; |
| |
| kgsl_iommu_enable_clk(mmu); |
| |
| sctlr_val = KGSL_IOMMU_GET_CTX_REG(ctx, SCTLR); |
| |
| /* |
| * If pagefault policy is GPUHALT_ENABLE, |
| * 1) Program CFCFG to 1 to enable STALL mode |
| * 2) Program HUPCF to 0 (Stall or terminate subsequent |
| * transactions in the presence of an outstanding fault) |
| * else |
| * 1) Program CFCFG to 0 to disable STALL mode (0=Terminate) |
| * 2) Program HUPCF to 1 (Process subsequent transactions |
| * independently of any outstanding fault) |
| */ |
| |
| if (test_bit(KGSL_FT_PAGEFAULT_GPUHALT_ENABLE, |
| &adreno_dev->ft_pf_policy)) { |
| sctlr_val |= (0x1 << KGSL_IOMMU_SCTLR_CFCFG_SHIFT); |
| sctlr_val &= ~(0x1 << KGSL_IOMMU_SCTLR_HUPCF_SHIFT); |
| } else { |
| sctlr_val &= ~(0x1 << KGSL_IOMMU_SCTLR_CFCFG_SHIFT); |
| sctlr_val |= (0x1 << KGSL_IOMMU_SCTLR_HUPCF_SHIFT); |
| } |
| KGSL_IOMMU_SET_CTX_REG(ctx, SCTLR, sctlr_val); |
| kgsl_iommu_disable_clk(mmu); |
| |
| return 0; |
| } |
| |
| static int _setup_secure_context(struct kgsl_mmu *mmu) |
| { |
| int ret; |
| struct kgsl_iommu *iommu = _IOMMU_PRIV(mmu); |
| struct kgsl_iommu_context *ctx = &iommu->ctx[KGSL_IOMMU_CONTEXT_SECURE]; |
| unsigned int cb_num; |
| |
| struct kgsl_iommu_pt *iommu_pt; |
| |
| if (ctx->dev == NULL || !mmu->secured) |
| return 0; |
| |
| if (mmu->securepagetable == NULL) |
| return -ENOMEM; |
| |
| iommu_pt = mmu->securepagetable->priv; |
| |
| ret = _attach_pt(iommu_pt, ctx); |
| if (ret) |
| goto done; |
| |
| ctx->default_pt = mmu->securepagetable; |
| |
| ret = iommu_domain_get_attr(iommu_pt->domain, DOMAIN_ATTR_CONTEXT_BANK, |
| &cb_num); |
| if (ret) { |
| KGSL_CORE_ERR("get CONTEXT_BANK attr, err %d\n", ret); |
| goto done; |
| } |
| ctx->cb_num = cb_num; |
| done: |
| if (ret) |
| _detach_context(ctx); |
| return ret; |
| } |
| |
| static int kgsl_iommu_set_pt(struct kgsl_mmu *mmu, struct kgsl_pagetable *pt); |
| |
| static int kgsl_iommu_start(struct kgsl_mmu *mmu) |
| { |
| int status; |
| struct kgsl_iommu *iommu = _IOMMU_PRIV(mmu); |
| |
| status = _setup_user_context(mmu); |
| if (status) |
| return status; |
| |
| status = _setup_secure_context(mmu); |
| if (status) { |
| _detach_context(&iommu->ctx[KGSL_IOMMU_CONTEXT_USER]); |
| return status; |
| } |
| |
| /* Make sure the hardware is programmed to the default pagetable */ |
| return kgsl_iommu_set_pt(mmu, mmu->defaultpagetable); |
| } |
| |
| static int |
| kgsl_iommu_unmap_offset(struct kgsl_pagetable *pt, |
| struct kgsl_memdesc *memdesc, uint64_t addr, |
| uint64_t offset, uint64_t size) |
| { |
| if (size == 0 || (size + offset) > kgsl_memdesc_footprint(memdesc)) |
| return -EINVAL; |
| /* |
| * All GPU addresses as assigned are page aligned, but some |
| * functions perturb the gpuaddr with an offset, so apply the |
| * mask here to make sure we have the right address. |
| */ |
| |
| addr = PAGE_ALIGN(addr); |
| if (addr == 0) |
| return -EINVAL; |
| |
| return _iommu_unmap_sync_pc(pt, addr + offset, size); |
| } |
| |
| static int |
| kgsl_iommu_unmap(struct kgsl_pagetable *pt, struct kgsl_memdesc *memdesc) |
| { |
| if (memdesc->size == 0 || memdesc->gpuaddr == 0) |
| return -EINVAL; |
| |
| return kgsl_iommu_unmap_offset(pt, memdesc, memdesc->gpuaddr, 0, |
| kgsl_memdesc_footprint(memdesc)); |
| } |
| |
| /** |
| * _iommu_map_guard_page - Map iommu guard page |
| * @pt - Pointer to kgsl pagetable structure |
| * @memdesc - memdesc to add guard page |
| * @gpuaddr - GPU addr of guard page |
| * @protflags - flags for mapping |
| * |
| * Return 0 on success, error on map fail |
| */ |
| static int _iommu_map_guard_page(struct kgsl_pagetable *pt, |
| struct kgsl_memdesc *memdesc, |
| uint64_t gpuaddr, |
| unsigned int protflags) |
| { |
| phys_addr_t physaddr; |
| |
| if (!kgsl_memdesc_has_guard_page(memdesc)) |
| return 0; |
| |
| /* |
| * Allocate a guard page for secure buffers. |
| * This has to be done after we attach an smmu pagetable. |
| * Allocate the guard page when the first secure buffer is |
| * mapped to save 1MB of memory if CPZ is not used. |
| */ |
| if (kgsl_memdesc_is_secured(memdesc)) { |
| struct scatterlist *sg; |
| unsigned int sgp_size = pt->mmu->secure_align_mask + 1; |
| |
| if (!kgsl_secure_guard_page_memdesc.sgt) { |
| if (kgsl_allocate_user(KGSL_MMU_DEVICE(pt->mmu), |
| &kgsl_secure_guard_page_memdesc, |
| sgp_size, KGSL_MEMFLAGS_SECURE)) { |
| KGSL_CORE_ERR( |
| "Secure guard page alloc failed\n"); |
| return -ENOMEM; |
| } |
| } |
| |
| sg = kgsl_secure_guard_page_memdesc.sgt->sgl; |
| physaddr = page_to_phys(sg_page(sg)); |
| } else { |
| if (kgsl_guard_page == NULL) { |
| kgsl_guard_page = alloc_page(GFP_KERNEL | __GFP_ZERO | |
| __GFP_NORETRY | __GFP_HIGHMEM); |
| if (kgsl_guard_page == NULL) |
| return -ENOMEM; |
| } |
| |
| physaddr = page_to_phys(kgsl_guard_page); |
| } |
| |
| return _iommu_map_sync_pc(pt, gpuaddr, physaddr, |
| kgsl_memdesc_guard_page_size(memdesc), |
| protflags & ~IOMMU_WRITE); |
| } |
| |
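| /* |
| * For example, a GPU-readonly, IO-coherent buffer resolves to |
| * IOMMU_READ | IOMMU_NOEXEC | IOMMU_CACHE | IOMMU_USE_UPSTREAM_HINT: |
| * GPUREADONLY strips IOMMU_WRITE and IOCOHERENT adds IOMMU_CACHE on |
| * top of the defaults below. |
| */ |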
| static unsigned int _get_protection_flags(struct kgsl_memdesc *memdesc) |
| { |
| unsigned int flags = IOMMU_READ | IOMMU_WRITE | |
| IOMMU_NOEXEC | IOMMU_USE_UPSTREAM_HINT; |
| |
| if (memdesc->flags & KGSL_MEMFLAGS_GPUREADONLY) |
| flags &= ~IOMMU_WRITE; |
| |
| if (memdesc->priv & KGSL_MEMDESC_PRIVILEGED) |
| flags |= IOMMU_PRIV; |
| |
| if (memdesc->flags & KGSL_MEMFLAGS_IOCOHERENT) |
| flags |= IOMMU_CACHE; |
| |
| return flags; |
| } |
| |
| static int |
| kgsl_iommu_map(struct kgsl_pagetable *pt, |
| struct kgsl_memdesc *memdesc) |
| { |
| int ret; |
| uint64_t addr = memdesc->gpuaddr; |
| uint64_t size = memdesc->size; |
| unsigned int flags = _get_protection_flags(memdesc); |
| struct sg_table *sgt = NULL; |
| |
| /* |
| * For paged memory allocated through kgsl, memdesc->pages is not NULL. |
| * Allocate sgt here just for its map operation. Contiguous memory |
| * already has its sgt, so no need to allocate it here. |
| */ |
| if (memdesc->pages != NULL) |
| sgt = kgsl_alloc_sgt_from_pages(memdesc); |
| else |
| sgt = memdesc->sgt; |
| |
| if (IS_ERR(sgt)) |
| return PTR_ERR(sgt); |
| |
| ret = _iommu_map_sg_sync_pc(pt, addr, sgt->sgl, sgt->nents, flags); |
| if (ret) |
| goto done; |
| |
| ret = _iommu_map_guard_page(pt, memdesc, addr + size, flags); |
| if (ret) |
| _iommu_unmap_sync_pc(pt, addr, size); |
| |
| done: |
| if (memdesc->pages != NULL) |
| kgsl_free_sgt(sgt); |
| |
| return ret; |
| } |
| |
| static int kgsl_iommu_sparse_dummy_map(struct kgsl_pagetable *pt, |
| struct kgsl_memdesc *memdesc, uint64_t offset, uint64_t size) |
| { |
| int ret = 0, i; |
| struct page **pages = NULL; |
| struct sg_table sgt; |
| int count = size >> PAGE_SHIFT; |
| |
| /* verify the offset is within our range */ |
| if (size + offset > memdesc->size) |
| return -EINVAL; |
| |
| if (kgsl_dummy_page == NULL) { |
| kgsl_dummy_page = alloc_page(GFP_KERNEL | __GFP_ZERO | |
| __GFP_HIGHMEM); |
| if (kgsl_dummy_page == NULL) |
| return -ENOMEM; |
| } |
| |
| pages = kcalloc(count, sizeof(struct page *), GFP_KERNEL); |
| if (pages == NULL) |
| return -ENOMEM; |
| |
| for (i = 0; i < count; i++) |
| pages[i] = kgsl_dummy_page; |
| |
| ret = sg_alloc_table_from_pages(&sgt, pages, count, |
| 0, size, GFP_KERNEL); |
| if (ret == 0) { |
| ret = _iommu_map_sg_sync_pc(pt, memdesc->gpuaddr + offset, |
| sgt.sgl, sgt.nents, IOMMU_READ | IOMMU_NOEXEC); |
| sg_free_table(&sgt); |
| } |
| |
| kfree(pages); |
| |
| return ret; |
| } |
| |
| static int _map_to_one_page(struct kgsl_pagetable *pt, uint64_t addr, |
| struct kgsl_memdesc *memdesc, uint64_t physoffset, |
| uint64_t size, unsigned int map_flags) |
| { |
| int ret = 0, i; |
| int pg_sz = kgsl_memdesc_get_pagesize(memdesc); |
| int count = size >> PAGE_SHIFT; |
| struct page *page = NULL; |
| struct page **pages = NULL; |
| struct sg_page_iter sg_iter; |
| struct sg_table sgt; |
| |
| /* Find the page that corresponds to physoffset */ |
| if (memdesc->pages != NULL) |
| page = memdesc->pages[physoffset >> PAGE_SHIFT]; |
| else { |
| for_each_sg_page(memdesc->sgt->sgl, &sg_iter, |
| memdesc->sgt->nents, physoffset >> PAGE_SHIFT) { |
| page = sg_page_iter_page(&sg_iter); |
| break; |
| } |
| } |
| |
| if (page == NULL) |
| return -EINVAL; |
| |
| pages = kcalloc(count, sizeof(struct page *), GFP_KERNEL); |
| if (pages == NULL) |
| return -ENOMEM; |
| |
| for (i = 0; i < count; i++) { |
| if (pg_sz != PAGE_SIZE) { |
| struct page *tmp_page = page; |
| int j; |
| |
| for (j = 0; j < 16; j++, tmp_page += PAGE_SIZE) |
| pages[i++] = tmp_page; |
| } else |
| pages[i] = page; |
| } |
| |
| ret = sg_alloc_table_from_pages(&sgt, pages, count, |
| 0, size, GFP_KERNEL); |
| if (ret == 0) { |
| ret = _iommu_map_sg_sync_pc(pt, addr, sgt.sgl, |
| sgt.nents, map_flags); |
| sg_free_table(&sgt); |
| } |
| |
| kfree(pages); |
| |
| return ret; |
| } |
| |
| static int kgsl_iommu_map_offset(struct kgsl_pagetable *pt, |
| uint64_t virtaddr, uint64_t virtoffset, |
| struct kgsl_memdesc *memdesc, uint64_t physoffset, |
| uint64_t size, uint64_t feature_flag) |
| { |
| int pg_sz; |
| unsigned int protflags = _get_protection_flags(memdesc); |
| int ret; |
| struct sg_table *sgt = NULL; |
| |
| pg_sz = kgsl_memdesc_get_pagesize(memdesc); |
| if (!IS_ALIGNED(virtaddr | virtoffset | physoffset | size, pg_sz)) |
| return -EINVAL; |
| |
| if (size == 0) |
| return -EINVAL; |
| |
| if (!(feature_flag & KGSL_SPARSE_BIND_MULTIPLE_TO_PHYS) && |
| size + physoffset > kgsl_memdesc_footprint(memdesc)) |
| return -EINVAL; |
| |
| /* |
| * For paged memory allocated through kgsl, memdesc->pages is not NULL. |
| * Allocate sgt here just for its map operation. Contiguous memory |
| * already has its sgt, so no need to allocate it here. |
| */ |
| if (memdesc->pages != NULL) |
| sgt = kgsl_alloc_sgt_from_pages(memdesc); |
| else |
| sgt = memdesc->sgt; |
| |
| if (IS_ERR(sgt)) |
| return PTR_ERR(sgt); |
| |
| if (feature_flag & KGSL_SPARSE_BIND_MULTIPLE_TO_PHYS) |
| ret = _map_to_one_page(pt, virtaddr + virtoffset, |
| memdesc, physoffset, size, protflags); |
| else |
| ret = _iommu_map_sg_offset_sync_pc(pt, virtaddr + virtoffset, |
| sgt->sgl, sgt->nents, |
| physoffset, size, protflags); |
| |
| if (memdesc->pages != NULL) |
| kgsl_free_sgt(sgt); |
| |
| return ret; |
| } |
| |
| /* This function must be called with context bank attached */ |
| static void kgsl_iommu_clear_fsr(struct kgsl_mmu *mmu) |
| { |
| struct kgsl_iommu *iommu = _IOMMU_PRIV(mmu); |
| struct kgsl_iommu_context *ctx = &iommu->ctx[KGSL_IOMMU_CONTEXT_USER]; |
| unsigned int sctlr_val; |
| |
| if (ctx->default_pt != NULL) { |
| kgsl_iommu_enable_clk(mmu); |
| KGSL_IOMMU_SET_CTX_REG(ctx, FSR, 0xffffffff); |
| /* |
| * Re-enable context fault interrupts after clearing |
| * FSR to prevent the interrupt from firing repeatedly |
| */ |
| sctlr_val = KGSL_IOMMU_GET_CTX_REG(ctx, SCTLR); |
| sctlr_val |= (0x1 << KGSL_IOMMU_SCTLR_CFIE_SHIFT); |
| KGSL_IOMMU_SET_CTX_REG(ctx, SCTLR, sctlr_val); |
| /* |
| * Make sure the above register writes |
| * are not reordered across the barrier |
| * as we use writel_relaxed to write them |
| */ |
| wmb(); |
| kgsl_iommu_disable_clk(mmu); |
| } |
| } |
| |
| static void kgsl_iommu_pagefault_resume(struct kgsl_mmu *mmu) |
| { |
| struct kgsl_iommu *iommu = _IOMMU_PRIV(mmu); |
| struct kgsl_iommu_context *ctx = &iommu->ctx[KGSL_IOMMU_CONTEXT_USER]; |
| |
| if (ctx->default_pt != NULL && ctx->fault) { |
| /* |
| * Write 1 to RESUME.TnR to terminate the |
| * stalled transaction. |
| */ |
| KGSL_IOMMU_SET_CTX_REG(ctx, RESUME, 1); |
| /* |
| * Make sure the above register writes |
| * are not reordered across the barrier |
| * as we use writel_relaxed to write them |
| */ |
| wmb(); |
| ctx->fault = 0; |
| } |
| } |
| |
| static void kgsl_iommu_stop(struct kgsl_mmu *mmu) |
| { |
| struct kgsl_iommu *iommu = _IOMMU_PRIV(mmu); |
| int i; |
| |
| /* |
| * If the iommu supports retention, we don't need |
| * to detach when stopping. |
| */ |
| if (!MMU_FEATURE(mmu, KGSL_MMU_RETENTION)) { |
| for (i = 0; i < KGSL_IOMMU_CONTEXT_MAX; i++) |
| _detach_context(&iommu->ctx[i]); |
| } |
| } |
| |
| static u64 |
| kgsl_iommu_get_current_ttbr0(struct kgsl_mmu *mmu) |
| { |
| u64 val; |
| struct kgsl_iommu *iommu = _IOMMU_PRIV(mmu); |
| /* |
| * We cannot enable or disable the clocks in interrupt context; this |
| * function is called from interrupt context if there is an AXI error |
| */ |
| if (in_interrupt()) |
| return 0; |
| |
| kgsl_iommu_enable_clk(mmu); |
| val = KGSL_IOMMU_GET_CTX_REG_Q(&iommu->ctx[KGSL_IOMMU_CONTEXT_USER], |
| TTBR0); |
| kgsl_iommu_disable_clk(mmu); |
| return val; |
| } |
| |
| /* |
| * kgsl_iommu_set_pt - Change the IOMMU pagetable of the primary context bank |
| * @mmu - Pointer to mmu structure |
| * @pt - Pagetable to switch to |
| * |
| * Set the new pagetable for the IOMMU by writing directly to the IOMMU |
| * registers from the CPU |
| * |
| * Return - 0 on success |
| */ |
| static int kgsl_iommu_set_pt(struct kgsl_mmu *mmu, struct kgsl_pagetable *pt) |
| { |
| struct kgsl_iommu *iommu = _IOMMU_PRIV(mmu); |
| struct kgsl_iommu_context *ctx = &iommu->ctx[KGSL_IOMMU_CONTEXT_USER]; |
| uint64_t ttbr0, temp; |
| unsigned int contextidr; |
| unsigned long wait_for_flush; |
| |
| if ((pt != mmu->defaultpagetable) && !kgsl_mmu_is_perprocess(mmu)) |
| return 0; |
| |
| kgsl_iommu_enable_clk(mmu); |
| |
| ttbr0 = kgsl_mmu_pagetable_get_ttbr0(pt); |
| contextidr = kgsl_mmu_pagetable_get_contextidr(pt); |
| |
| KGSL_IOMMU_SET_CTX_REG_Q(ctx, TTBR0, ttbr0); |
| KGSL_IOMMU_SET_CTX_REG(ctx, CONTEXTIDR, contextidr); |
| |
| /* memory barrier before reading TTBR0 register */ |
| mb(); |
| temp = KGSL_IOMMU_GET_CTX_REG_Q(ctx, TTBR0); |
| |
| KGSL_IOMMU_SET_CTX_REG(ctx, TLBIALL, 1); |
| /* make sure the TLBIALL write completes before we wait */ |
| mb(); |
| /* |
| * Wait for the flush to complete by polling the flush |
| * status bit of the TLBSTATUS register for no more than |
| * 2 seconds. After that just give up; at that point the |
| * SMMU h/w is likely stuck and will eventually cause the |
| * GPU to hang or bring the system down. |
| */ |
| wait_for_flush = jiffies + msecs_to_jiffies(2000); |
| KGSL_IOMMU_SET_CTX_REG(ctx, TLBSYNC, 0); |
| while (KGSL_IOMMU_GET_CTX_REG(ctx, TLBSTATUS) & |
| (KGSL_IOMMU_CTX_TLBSTATUS_SACTIVE)) { |
| if (time_after(jiffies, wait_for_flush)) { |
| KGSL_DRV_WARN(KGSL_MMU_DEVICE(mmu), |
| "Wait limit reached for IOMMU tlb flush\n"); |
| break; |
| } |
| cpu_relax(); |
| } |
| |
| kgsl_iommu_disable_clk(mmu); |
| return 0; |
| } |
| |
| /* |
| * kgsl_iommu_set_pf_policy() - Set the pagefault policy for IOMMU |
| * @mmu: Pointer to mmu structure |
| * @pf_policy: The pagefault policy to set |
| * |
| * If the new policy indicated by pf_policy is the same as the current |
| * policy then return immediately; otherwise program the new policy |
| */ |
| static int kgsl_iommu_set_pf_policy(struct kgsl_mmu *mmu, |
| unsigned long pf_policy) |
| { |
| struct kgsl_iommu *iommu = _IOMMU_PRIV(mmu); |
| struct kgsl_iommu_context *ctx = &iommu->ctx[KGSL_IOMMU_CONTEXT_USER]; |
| struct kgsl_device *device = KGSL_MMU_DEVICE(mmu); |
| struct adreno_device *adreno_dev = ADRENO_DEVICE(device); |
| |
| if ((adreno_dev->ft_pf_policy & |
| BIT(KGSL_FT_PAGEFAULT_GPUHALT_ENABLE)) == |
| (pf_policy & BIT(KGSL_FT_PAGEFAULT_GPUHALT_ENABLE))) |
| return 0; |
| |
| /* If not attached, policy will be updated during the next attach */ |
| if (ctx->default_pt != NULL) { |
| unsigned int sctlr_val; |
| |
| kgsl_iommu_enable_clk(mmu); |
| |
| sctlr_val = KGSL_IOMMU_GET_CTX_REG(ctx, SCTLR); |
| |
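| /* |
|  * CFCFG = 1 stalls the context bank on a pagefault so the GPU can be |
|  * halted and the fault inspected; CFCFG = 0 terminates the faulting |
|  * transaction instead. HUPCF controls whether accesses that hit in |
|  * the TLB may proceed while a fault is pending. |
|  */ |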
| if (test_bit(KGSL_FT_PAGEFAULT_GPUHALT_ENABLE, &pf_policy)) { |
| sctlr_val |= (0x1 << KGSL_IOMMU_SCTLR_CFCFG_SHIFT); |
| sctlr_val &= ~(0x1 << KGSL_IOMMU_SCTLR_HUPCF_SHIFT); |
| } else { |
| sctlr_val &= ~(0x1 << KGSL_IOMMU_SCTLR_CFCFG_SHIFT); |
| sctlr_val |= (0x1 << KGSL_IOMMU_SCTLR_HUPCF_SHIFT); |
| } |
| |
| KGSL_IOMMU_SET_CTX_REG(ctx, SCTLR, sctlr_val); |
| |
| kgsl_iommu_disable_clk(mmu); |
| } |
| |
| return 0; |
| } |
| |
| static struct kgsl_protected_registers * |
| kgsl_iommu_get_prot_regs(struct kgsl_mmu *mmu) |
| { |
| struct kgsl_iommu *iommu = _IOMMU_PRIV(mmu); |
| |
| return &iommu->protect; |
| } |
| |
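| /* Find the rbtree entry whose base address exactly matches gpuaddr */ |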
| static struct kgsl_iommu_addr_entry *_find_gpuaddr( |
| struct kgsl_pagetable *pagetable, uint64_t gpuaddr) |
| { |
| struct kgsl_iommu_pt *pt = pagetable->priv; |
| struct rb_node *node = pt->rbtree.rb_node; |
| |
| while (node != NULL) { |
| struct kgsl_iommu_addr_entry *entry = rb_entry(node, |
| struct kgsl_iommu_addr_entry, node); |
| |
| if (gpuaddr < entry->base) |
| node = node->rb_left; |
| else if (gpuaddr > entry->base) |
| node = node->rb_right; |
| else |
| return entry; |
| } |
| |
| return NULL; |
| } |
| |
| static int _remove_gpuaddr(struct kgsl_pagetable *pagetable, |
| uint64_t gpuaddr) |
| { |
| struct kgsl_iommu_pt *pt = pagetable->priv; |
| struct kgsl_iommu_addr_entry *entry; |
| |
| entry = _find_gpuaddr(pagetable, gpuaddr); |
| |
| if (entry != NULL) { |
| rb_erase(&entry->node, &pt->rbtree); |
| kmem_cache_free(addr_entry_cache, entry); |
| return 0; |
| } |
| |
| WARN(1, "Couldn't remove gpuaddr: 0x%llx\n", gpuaddr); |
| return -EINVAL; |
| } |
| |
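| /* Insert a new [gpuaddr, gpuaddr + size) entry, keyed by base address */ |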
| static int _insert_gpuaddr(struct kgsl_pagetable *pagetable, |
| uint64_t gpuaddr, uint64_t size) |
| { |
| struct kgsl_iommu_pt *pt = pagetable->priv; |
| struct rb_node **node, *parent = NULL; |
| struct kgsl_iommu_addr_entry *new = |
| kmem_cache_alloc(addr_entry_cache, GFP_ATOMIC); |
| |
| if (new == NULL) |
| return -ENOMEM; |
| |
| new->base = gpuaddr; |
| new->size = size; |
| |
| node = &pt->rbtree.rb_node; |
| |
| while (*node != NULL) { |
| struct kgsl_iommu_addr_entry *this; |
| |
| parent = *node; |
| this = rb_entry(parent, struct kgsl_iommu_addr_entry, node); |
| |
| if (new->base < this->base) |
| node = &parent->rb_left; |
| else if (new->base > this->base) |
| node = &parent->rb_right; |
| else { |
| /* Duplicate entry */ |
| WARN(1, "duplicate gpuaddr: 0x%llx\n", gpuaddr); |
| return -EEXIST; |
| } |
| } |
| |
| rb_link_node(&new->node, parent, node); |
| rb_insert_color(&new->node, &pt->rbtree); |
| |
| return 0; |
| } |
| |
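| /* |
|  * First-fit, bottom-up search of the rbtree of allocated ranges. As an |
|  * illustration (hypothetical values): with entries [0x1000, 0x3000) and |
|  * [0x8000, 0x9000), a request for size 0x2000 with align 0x1000 in the |
|  * range [0x0, 0x10000) skips the 0x1000-byte gap at 0x0 and returns |
|  * 0x3000, the start of the first gap large enough to fit. |
|  */ |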
| static uint64_t _get_unmapped_area(struct kgsl_pagetable *pagetable, |
| uint64_t bottom, uint64_t top, uint64_t size, |
| uint64_t align) |
| { |
| struct kgsl_iommu_pt *pt = pagetable->priv; |
| struct rb_node *node = rb_first(&pt->rbtree); |
| uint64_t start; |
| |
| bottom = ALIGN(bottom, align); |
| start = bottom; |
| |
| while (node != NULL) { |
| uint64_t gap; |
| struct kgsl_iommu_addr_entry *entry = rb_entry(node, |
| struct kgsl_iommu_addr_entry, node); |
| |
| /* |
| * Skip any entries that are outside of the range, but make sure |
| * to account for some that might straddle the lower bound |
| */ |
| if (entry->base < bottom) { |
| if (entry->base + entry->size > bottom) |
| start = ALIGN(entry->base + entry->size, align); |
| node = rb_next(node); |
| continue; |
| } |
| |
| /* Stop if we went over the top */ |
| if (entry->base >= top) |
| break; |
| |
| /* Make sure there is a gap to consider */ |
| if (start < entry->base) { |
| gap = entry->base - start; |
| |
| if (gap >= size) |
| return start; |
| } |
| |
| /* Stop if there is no more room in the region */ |
| if (entry->base + entry->size >= top) |
| return (uint64_t) -ENOMEM; |
| |
| /* Start the next cycle at the end of the current entry */ |
| start = ALIGN(entry->base + entry->size, align); |
| node = rb_next(node); |
| } |
| |
| if (start + size <= top) |
| return start; |
| |
| return (uint64_t) -ENOMEM; |
| } |
| |
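| /* |
|  * Top-down variant of the gap search: walk the rbtree from the highest |
|  * entry and try to place the allocation at the top of each gap. With a |
|  * power-of-two align, (addr & ~(align - 1)) rounds addr down to an |
|  * align boundary; e.g. (hypothetical values) end = 0x9000, size = |
|  * 0x1000, align = 0x1000 gives chunk = (0x9000 - 0x1000) & ~0xfff = |
|  * 0x8000. |
|  */ |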
| static uint64_t _get_unmapped_area_topdown(struct kgsl_pagetable *pagetable, |
| uint64_t bottom, uint64_t top, uint64_t size, |
| uint64_t align) |
| { |
| struct kgsl_iommu_pt *pt = pagetable->priv; |
| struct rb_node *node; |
| uint64_t end = top; |
| uint64_t mask = ~(align - 1); |
| struct kgsl_iommu_addr_entry *entry; |
| |
| /* Make sure that the bottom is correctly aligned */ |
| bottom = ALIGN(bottom, align); |
| |
| /* Make sure the requested size will fit in the range */ |
| if (size > (top - bottom)) |
| return (uint64_t) -ENOMEM; |
| |
| /* Walk backwards through the tree to find the highest entry in range */ |
| for (node = rb_last(&pt->rbtree); node != NULL; node = rb_prev(node)) { |
| entry = rb_entry(node, struct kgsl_iommu_addr_entry, node); |
| if (entry->base < top) |
| break; |
| } |
| |
| while (node != NULL) { |
| uint64_t offset; |
| |
| entry = rb_entry(node, struct kgsl_iommu_addr_entry, node); |
| |
| /* If the entire entry is below the range the search is over */ |
| if ((entry->base + entry->size) < bottom) |
| break; |
| |
| /* Get the top of the entry properly aligned */ |
| offset = ALIGN(entry->base + entry->size, align); |
| |
| /* |
| * Try to allocate the memory from the top of the gap, |
| * making sure that it fits between the top of this entry and |
| * the bottom of the previous one |
| */ |
| |
| if ((end > size) && (offset < end)) { |
| uint64_t chunk = (end - size) & mask; |
| |
| if (chunk >= offset) |
| return chunk; |
| } |
| |
| /* |
| * If we get here and the current entry is outside of the range |
| * then we are officially out of room |
| */ |
| |
| if (entry->base < bottom) |
| return (uint64_t) -ENOMEM; |
| |
| /* Set the top of the gap to the current entry->base */ |
| end = entry->base; |
| |
| /* And move on to the next lower entry */ |
| node = rb_prev(node); |
| } |
| |
| /* If we get here then there are no more entries in the region */ |
| if ((end > size) && (((end - size) & mask) >= bottom)) |
| return (end - size) & mask; |
| |
| return (uint64_t) -ENOMEM; |
| } |
| |
| static uint64_t kgsl_iommu_find_svm_region(struct kgsl_pagetable *pagetable, |
| uint64_t start, uint64_t end, uint64_t size, |
| uint64_t alignment) |
| { |
| uint64_t addr; |
| |
| /* Reject a degenerate (empty or inverted) search range */ |
| if (WARN(end <= start, "Bad search range: 0x%llx-0x%llx", start, end)) |
| return (uint64_t) -EINVAL; |
| |
| spin_lock(&pagetable->lock); |
| addr = _get_unmapped_area_topdown(pagetable, |
| start, end, size, alignment); |
| spin_unlock(&pagetable->lock); |
| return addr; |
| } |
| |
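| /* |
|  * Reserve a caller-chosen SVM range: walk the rbtree and fail if |
|  * [gpuaddr, gpuaddr + size) overlaps an existing entry or the global |
|  * region. |
|  */ |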
| static int kgsl_iommu_set_svm_region(struct kgsl_pagetable *pagetable, |
| uint64_t gpuaddr, uint64_t size) |
| { |
| int ret = -ENOMEM; |
| struct kgsl_iommu_pt *pt = pagetable->priv; |
| struct rb_node *node; |
| |
| /* Make sure the requested address doesn't fall in the global range */ |
| if (ADDR_IN_GLOBAL(pagetable->mmu, gpuaddr) || |
| ADDR_IN_GLOBAL(pagetable->mmu, gpuaddr + size)) |
| return -ENOMEM; |
| |
| spin_lock(&pagetable->lock); |
| node = pt->rbtree.rb_node; |
| |
| while (node != NULL) { |
| uint64_t start, end; |
| struct kgsl_iommu_addr_entry *entry = rb_entry(node, |
| struct kgsl_iommu_addr_entry, node); |
| |
| start = entry->base; |
| end = entry->base + entry->size; |
| |
| if (gpuaddr + size <= start) |
| node = node->rb_left; |
| else if (end <= gpuaddr) |
| node = node->rb_right; |
| else |
| goto out; |
| } |
| |
| ret = _insert_gpuaddr(pagetable, gpuaddr, size); |
| out: |
| spin_unlock(&pagetable->lock); |
| return ret; |
| } |
| |
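| /* |
|  * Assign a GPU virtual address for memdesc from the pagetable's normal |
|  * or compat VA range and reserve it in the rbtree. |
|  */ |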
| static int kgsl_iommu_get_gpuaddr(struct kgsl_pagetable *pagetable, |
| struct kgsl_memdesc *memdesc) |
| { |
| struct kgsl_iommu_pt *pt = pagetable->priv; |
| int ret = 0; |
| uint64_t addr, start, end, size; |
| unsigned int align; |
| |
| if (WARN_ON(kgsl_memdesc_use_cpu_map(memdesc))) |
| return -EINVAL; |
| |
| if (memdesc->flags & KGSL_MEMFLAGS_SECURE && |
| pagetable->name != KGSL_MMU_SECURE_PT) |
| return -EINVAL; |
| |
| size = kgsl_memdesc_footprint(memdesc); |
| |
| align = 1 << kgsl_memdesc_get_align(memdesc); |
| |
| if (memdesc->flags & KGSL_MEMFLAGS_FORCE_32BIT) { |
| start = pt->compat_va_start; |
| end = pt->compat_va_end; |
| } else { |
| start = pt->va_start; |
| end = pt->va_end; |
| } |
| |
| /* |
| * When mapping secure buffers, adjust the start of the va range |
| * to the end of secure global buffers. |
| */ |
| if (kgsl_memdesc_is_secured(memdesc)) |
| start += secure_global_size; |
| |
| spin_lock(&pagetable->lock); |
| |
| addr = _get_unmapped_area(pagetable, start, end, size, align); |
| |
| if (addr == (uint64_t) -ENOMEM) { |
| ret = -ENOMEM; |
| goto out; |
| } |
| |
| ret = _insert_gpuaddr(pagetable, addr, size); |
| if (ret == 0) { |
| memdesc->gpuaddr = addr; |
| memdesc->pagetable = pagetable; |
| } |
| |
| out: |
| spin_unlock(&pagetable->lock); |
| return ret; |
| } |
| |
| static void kgsl_iommu_put_gpuaddr(struct kgsl_memdesc *memdesc) |
| { |
| if (memdesc->pagetable == NULL) |
| return; |
| |
| spin_lock(&memdesc->pagetable->lock); |
| |
| _remove_gpuaddr(memdesc->pagetable, memdesc->gpuaddr); |
| |
| spin_unlock(&memdesc->pagetable->lock); |
| } |
| |
| static int kgsl_iommu_svm_range(struct kgsl_pagetable *pagetable, |
| uint64_t *lo, uint64_t *hi, uint64_t memflags) |
| { |
| struct kgsl_iommu_pt *pt = pagetable->priv; |
| bool gpu_compat = (memflags & KGSL_MEMFLAGS_FORCE_32BIT) != 0; |
| |
| if (lo != NULL) |
| *lo = gpu_compat ? pt->compat_va_start : pt->svm_start; |
| if (hi != NULL) |
| *hi = gpu_compat ? pt->compat_va_end : pt->svm_end; |
| |
| return 0; |
| } |
| |
| static bool kgsl_iommu_addr_in_range(struct kgsl_pagetable *pagetable, |
| uint64_t gpuaddr) |
| { |
| struct kgsl_iommu_pt *pt = pagetable->priv; |
| |
| if (gpuaddr == 0) |
| return false; |
| |
| if (gpuaddr >= pt->va_start && gpuaddr < pt->va_end) |
| return true; |
| |
| if (gpuaddr >= pt->compat_va_start && gpuaddr < pt->compat_va_end) |
| return true; |
| |
| if (gpuaddr >= pt->svm_start && gpuaddr < pt->svm_end) |
| return true; |
| |
| return false; |
| } |
| |
| static const struct { |
| int id; |
| char *name; |
| } kgsl_iommu_cbs[] = { |
| { KGSL_IOMMU_CONTEXT_USER, "gfx3d_user", }, |
| { KGSL_IOMMU_CONTEXT_SECURE, "gfx3d_secure" }, |
| { KGSL_IOMMU_CONTEXT_SECURE, "gfx3d_secure_alt" }, |
| }; |
| |
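| /* |
|  * Each context bank is described by a child node of the kgsl-smmu |
|  * device. A minimal sketch of such a node (the compatible string, node |
|  * name and properties are the ones parsed below; the values and the |
|  * phandle are illustrative): |
|  * |
|  *	gfx3d_user: gfx3d_user { |
|  *		compatible = "qcom,smmu-kgsl-cb"; |
|  *		iommus = <&kgsl_smmu 0>; |
|  *		qcom,gpu-offset = <0xa000>; |
|  *	}; |
|  */ |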
| static int _kgsl_iommu_cb_probe(struct kgsl_device *device, |
| struct kgsl_iommu *iommu, struct device_node *node) |
| { |
| struct platform_device *pdev = of_find_device_by_node(node); |
| struct kgsl_iommu_context *ctx = NULL; |
| struct adreno_device *adreno_dev = ADRENO_DEVICE(device); |
| int i; |
| |
| for (i = 0; i < ARRAY_SIZE(kgsl_iommu_cbs); i++) { |
| if (!strcmp(node->name, kgsl_iommu_cbs[i].name)) { |
| int id = kgsl_iommu_cbs[i].id; |
| |
| if (ADRENO_QUIRK(adreno_dev, |
| ADRENO_QUIRK_MMU_SECURE_CB_ALT)) { |
| if (!strcmp(node->name, "gfx3d_secure")) |
| continue; |
| } else if (!strcmp(node->name, "gfx3d_secure_alt")) |
| continue; |
| |
| ctx = &iommu->ctx[id]; |
| ctx->id = id; |
| ctx->cb_num = -1; |
| ctx->name = kgsl_iommu_cbs[i].name; |
| |
| break; |
| } |
| } |
| |
| if (ctx == NULL) { |
| KGSL_CORE_ERR("dt: Unused context label %s\n", node->name); |
| return 0; |
| } |
| |
| if (ctx->id == KGSL_IOMMU_CONTEXT_SECURE) |
| device->mmu.secured = true; |
| |
| /* this property won't be found for all context banks */ |
| if (of_property_read_u32(node, "qcom,gpu-offset", &ctx->gpu_offset)) |
| ctx->gpu_offset = UINT_MAX; |
| |
| ctx->kgsldev = device; |
| |
| /* With the arm-smmu driver we'll have the right device pointer here. */ |
| if (of_find_property(node, "iommus", NULL)) { |
| ctx->dev = &pdev->dev; |
| } else { |
| ctx->dev = kgsl_mmu_get_ctx(ctx->name); |
| |
| if (IS_ERR(ctx->dev)) |
| return PTR_ERR(ctx->dev); |
| } |
| |
| return 0; |
| } |
| |
| static const struct { |
| char *feature; |
| unsigned long bit; |
| } kgsl_iommu_features[] = { |
| { "qcom,retention", KGSL_MMU_RETENTION }, |
| { "qcom,global_pt", KGSL_MMU_GLOBAL_PAGETABLE }, |
| { "qcom,hyp_secure_alloc", KGSL_MMU_HYP_SECURE_ALLOC }, |
| { "qcom,force-32bit", KGSL_MMU_FORCE_32BIT }, |
| }; |
| |
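| /* |
|  * Optional MMU features are boolean properties on the kgsl-smmu node |
|  * itself; a sketch (node name illustrative, properties from the table |
|  * above): |
|  * |
|  *	kgsl_smmu { |
|  *		compatible = "qcom,kgsl-smmu-v2"; |
|  *		qcom,retention; |
|  *		qcom,hyp_secure_alloc; |
|  *	}; |
|  */ |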
| static int _kgsl_iommu_probe(struct kgsl_device *device, |
| struct device_node *node) |
| { |
| const char *cname; |
| struct property *prop; |
| u32 reg_val[2]; |
| int i = 0; |
| struct kgsl_iommu *iommu = KGSL_IOMMU_PRIV(device); |
| struct device_node *child; |
| struct platform_device *pdev = of_find_device_by_node(node); |
| |
| memset(iommu, 0, sizeof(*iommu)); |
| |
| if (of_device_is_compatible(node, "qcom,kgsl-smmu-v1")) |
| iommu->version = 1; |
| else |
| iommu->version = 2; |
| |
| if (of_property_read_u32_array(node, "reg", reg_val, 2)) { |
| KGSL_CORE_ERR("dt: Unable to read KGSL IOMMU register range\n"); |
| return -EINVAL; |
| } |
| iommu->regstart = reg_val[0]; |
| iommu->regsize = reg_val[1]; |
| |
| /* Protecting the SMMU registers is mandatory */ |
| if (of_property_read_u32_array(node, "qcom,protect", reg_val, 2)) { |
| KGSL_CORE_ERR("dt: no iommu protection range specified\n"); |
| return -EINVAL; |
| } |
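| /* |
|  * The protect region is given in bytes and converted to a dword index |
|  * plus a log2 dword count. For example (hypothetical values), |
|  * qcom,protect = <0xa000 0x1000> yields base = 0xa000 / 4 = 0x2800 and |
|  * range = ilog2(0x1000 / 4) = 10. |
|  */ |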
| iommu->protect.base = reg_val[0] / sizeof(u32); |
| iommu->protect.range = ilog2(reg_val[1] / sizeof(u32)); |
| |
| of_property_for_each_string(node, "clock-names", prop, cname) { |
| struct clk *c = devm_clk_get(&pdev->dev, cname); |
| |
| if (IS_ERR(c)) { |
| KGSL_CORE_ERR("dt: Couldn't get clock: %s\n", cname); |
| return -ENODEV; |
| } |
| if (i >= KGSL_IOMMU_MAX_CLKS) { |
| KGSL_CORE_ERR("dt: too many clocks defined.\n"); |
| return -EINVAL; |
| } |
| |
| iommu->clks[i] = c; |
| ++i; |
| } |
| |
| for (i = 0; i < ARRAY_SIZE(kgsl_iommu_features); i++) { |
| if (of_property_read_bool(node, kgsl_iommu_features[i].feature)) |
| device->mmu.features |= kgsl_iommu_features[i].bit; |
| } |
| |
| if (of_property_read_u32(node, "qcom,micro-mmu-control", |
| &iommu->micro_mmu_ctrl)) |
| iommu->micro_mmu_ctrl = UINT_MAX; |
| |
| if (of_property_read_u32(node, "qcom,secure_align_mask", |
| &device->mmu.secure_align_mask)) |
| device->mmu.secure_align_mask = 0xfff; |
| |
| /* Fill out the rest of the devices in the node */ |
| of_platform_populate(node, NULL, NULL, &pdev->dev); |
| |
| for_each_child_of_node(node, child) { |
| int ret; |
| |
| if (!of_device_is_compatible(child, "qcom,smmu-kgsl-cb")) |
| continue; |
| |
| ret = _kgsl_iommu_cb_probe(device, iommu, child); |
| if (ret) |
| return ret; |
| } |
| |
| return 0; |
| } |
| |
| static const struct { |
| char *compat; |
| int (*probe)(struct kgsl_device *device, struct device_node *node); |
| } kgsl_dt_devices[] = { |
| { "qcom,kgsl-smmu-v1", _kgsl_iommu_probe }, |
| { "qcom,kgsl-smmu-v2", _kgsl_iommu_probe }, |
| }; |
| |
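| /* Find the first SMMU node with a compatible string we recognize */ |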
| static int kgsl_iommu_probe(struct kgsl_device *device) |
| { |
| int i; |
| |
| for (i = 0; i < ARRAY_SIZE(kgsl_dt_devices); i++) { |
| struct device_node *node; |
| |
| node = of_find_compatible_node(device->pdev->dev.of_node, |
| NULL, kgsl_dt_devices[i].compat); |
| |
| if (node != NULL) |
| return kgsl_dt_devices[i].probe(device, node); |
| } |
| |
| return -ENODEV; |
| } |
| |
| struct kgsl_mmu_ops kgsl_iommu_ops = { |
| .mmu_init = kgsl_iommu_init, |
| .mmu_close = kgsl_iommu_close, |
| .mmu_start = kgsl_iommu_start, |
| .mmu_stop = kgsl_iommu_stop, |
| .mmu_set_pt = kgsl_iommu_set_pt, |
| .mmu_clear_fsr = kgsl_iommu_clear_fsr, |
| .mmu_get_current_ttbr0 = kgsl_iommu_get_current_ttbr0, |
| .mmu_enable_clk = kgsl_iommu_enable_clk, |
| .mmu_disable_clk = kgsl_iommu_disable_clk, |
| .mmu_get_reg_ahbaddr = kgsl_iommu_get_reg_ahbaddr, |
| .mmu_pt_equal = kgsl_iommu_pt_equal, |
| .mmu_set_pf_policy = kgsl_iommu_set_pf_policy, |
| .mmu_pagefault_resume = kgsl_iommu_pagefault_resume, |
| .mmu_get_prot_regs = kgsl_iommu_get_prot_regs, |
| .mmu_init_pt = kgsl_iommu_init_pt, |
| .mmu_add_global = kgsl_iommu_add_global, |
| .mmu_remove_global = kgsl_iommu_remove_global, |
| .mmu_getpagetable = kgsl_iommu_getpagetable, |
| .mmu_get_qdss_global_entry = kgsl_iommu_get_qdss_global_entry, |
| .mmu_get_qtimer_global_entry = kgsl_iommu_get_qtimer_global_entry, |
| .probe = kgsl_iommu_probe, |
| }; |
| |
| static struct kgsl_mmu_pt_ops iommu_pt_ops = { |
| .mmu_map = kgsl_iommu_map, |
| .mmu_unmap = kgsl_iommu_unmap, |
| .mmu_destroy_pagetable = kgsl_iommu_destroy_pagetable, |
| .get_ttbr0 = kgsl_iommu_get_ttbr0, |
| .get_contextidr = kgsl_iommu_get_contextidr, |
| .get_gpuaddr = kgsl_iommu_get_gpuaddr, |
| .put_gpuaddr = kgsl_iommu_put_gpuaddr, |
| .set_svm_region = kgsl_iommu_set_svm_region, |
| .find_svm_region = kgsl_iommu_find_svm_region, |
| .svm_range = kgsl_iommu_svm_range, |
| .addr_in_range = kgsl_iommu_addr_in_range, |
| .mmu_map_offset = kgsl_iommu_map_offset, |
| .mmu_unmap_offset = kgsl_iommu_unmap_offset, |
| .mmu_sparse_dummy_map = kgsl_iommu_sparse_dummy_map, |
| }; |