/* Copyright (c) 2011-2015, The Linux Foundation. All rights reserved.
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 and
 * only version 2 as published by the Free Software Foundation.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
 * GNU General Public License for more details.
 *
 */

/*
 * NOTE: the angle-bracket header names were lost from this listing; the list
 * below is reconstructed from the symbols this file uses and is an assumption,
 * not the original include list.
 */
#include <linux/types.h>
#include <linux/device.h>
#include <linux/spinlock.h>
#include <linux/slab.h>
#include <linux/iommu.h>
#include <linux/ratelimit.h>
#include <linux/compat.h>
#ifdef CONFIG_MSM_IOMMU
#include <linux/qcom_iommu.h>
#endif
#include <linux/of_platform.h>
#include <linux/io.h>
#include <soc/qcom/secure_buffer.h>

#include "kgsl.h"
#include "kgsl_device.h"
#include "kgsl_mmu.h"
#include "kgsl_sharedmem.h"
#include "kgsl_iommu.h"
#include "adreno_pm4types.h"
#include "adreno.h"
#include "kgsl_trace.h"
#include "kgsl_cffdump.h"
#include "kgsl_pwrctrl.h"

static struct kgsl_mmu_pt_ops iommu_pt_ops;

const unsigned int kgsl_iommu_reg_list[KGSL_IOMMU_REG_MAX] = {
	0x0,	/* SCTLR */
	0x20,	/* TTBR0 */
	0x34,	/* CONTEXTIDR */
	0x58,	/* FSR */
	0x60,	/* FAR_0 */
	0x618,	/* TLBIALL */
	0x008,	/* RESUME */
	0x68,	/* FSYNR0 */
	0x6C,	/* FSYNR1 */
	0x7F0,	/* TLBSYNC */
	0x7F4,	/* TLBSTATUS */
};

/*
 * struct kgsl_iommu_addr_entry - entry in the kgsl_iommu_pt rbtree.
 * @base: starting virtual address of the entry
 * @size: size of the entry
 * @node: the rbtree node
 */
struct kgsl_iommu_addr_entry {
	uint64_t base;
	uint64_t size;
	struct rb_node node;
};

static struct kmem_cache *addr_entry_cache;

static inline void _iommu_sync_mmu_pc(struct kgsl_device *device, bool lock)
{
	struct adreno_device *adreno_dev = ADRENO_DEVICE(device);

	if (!ADRENO_FEATURE(adreno_dev, ADRENO_SYNC_SMMU_PC))
		return;

	if (lock)
		mutex_lock(&device->mutex_mmu_sync);
	else
		mutex_unlock(&device->mutex_mmu_sync);
}

static void _detach_pt(struct kgsl_iommu_pt *iommu_pt,
		struct kgsl_iommu_context *ctx, struct kgsl_device *device)
{
	if (iommu_pt->attached) {
		_iommu_sync_mmu_pc(device, true);
		iommu_detach_device(iommu_pt->domain, ctx->dev);
		_iommu_sync_mmu_pc(device, false);
		iommu_pt->attached = false;
	}
}

static int _attach_pt(struct kgsl_iommu_pt *iommu_pt,
		struct kgsl_iommu_context *ctx, struct kgsl_device *device)
{
	int ret;

	if (iommu_pt->attached)
		return 0;

	_iommu_sync_mmu_pc(device, true);
	ret = iommu_attach_device(iommu_pt->domain, ctx->dev);
	_iommu_sync_mmu_pc(device, false);

	if (ret == 0)
		iommu_pt->attached = true;
	else
		KGSL_CORE_ERR("iommu_attach_device(%s) failed: %d\n",
				ctx->name, ret);

	return ret;
}

/*
 * One page allocation for a guard region to protect against over-zealous
 * GPU pre-fetch
 */
static struct page *kgsl_guard_page;
static struct kgsl_memdesc kgsl_secure_guard_page_memdesc;

/* These functions help find the nearest allocated memory entries on either side
 * of a faulting address.
If we know the nearby allocations memory we can * get a better determination of what we think should have been located in the * faulting region */ /* * A local structure to make it easy to store the interesting bits for the * memory entries on either side of the faulting address */ struct _mem_entry { uint64_t gpuaddr; uint64_t size; uint64_t flags; unsigned int priv; int pending_free; pid_t pid; }; static void _get_entries(struct kgsl_process_private *private, uint64_t faultaddr, struct _mem_entry *prev, struct _mem_entry *next) { int id; struct kgsl_mem_entry *entry; uint64_t prevaddr = 0; struct kgsl_mem_entry *p = NULL; uint64_t nextaddr = (uint64_t) -1; struct kgsl_mem_entry *n = NULL; idr_for_each_entry(&private->mem_idr, entry, id) { uint64_t addr = entry->memdesc.gpuaddr; if ((addr < faultaddr) && (addr > prevaddr)) { prevaddr = addr; p = entry; } if ((addr > faultaddr) && (addr < nextaddr)) { nextaddr = addr; n = entry; } } if (p != NULL) { prev->gpuaddr = p->memdesc.gpuaddr; prev->size = p->memdesc.size; prev->flags = p->memdesc.flags; prev->priv = p->memdesc.priv; prev->pending_free = p->pending_free; prev->pid = private->pid; } if (n != NULL) { next->gpuaddr = n->memdesc.gpuaddr; next->size = n->memdesc.size; next->flags = n->memdesc.flags; next->priv = n->memdesc.priv; next->pending_free = n->pending_free; next->pid = private->pid; } } static void _find_mem_entries(struct kgsl_mmu *mmu, uint64_t faultaddr, phys_addr_t ptbase, struct _mem_entry *preventry, struct _mem_entry *nextentry) { struct kgsl_process_private *private = NULL, *p; int id = kgsl_mmu_get_ptname_from_ptbase(mmu, ptbase); memset(preventry, 0, sizeof(*preventry)); memset(nextentry, 0, sizeof(*nextentry)); /* Set the maximum possible size as an initial value */ nextentry->gpuaddr = (uint64_t) -1; mutex_lock(&kgsl_driver.process_mutex); list_for_each_entry(p, &kgsl_driver.process_list, list) { if (p->pagetable && (p->pagetable->name == id)) { if (kgsl_process_private_get(p)) private = p; break; } } mutex_unlock(&kgsl_driver.process_mutex); if (private != NULL) { spin_lock(&private->mem_lock); _get_entries(private, faultaddr, preventry, nextentry); spin_unlock(&private->mem_lock); kgsl_process_private_put(private); } } static void _print_entry(struct kgsl_device *device, struct _mem_entry *entry) { char name[32]; memset(name, 0, sizeof(name)); kgsl_get_memory_usage(name, sizeof(name) - 1, entry->flags); KGSL_LOG_DUMP(device, "[%016llX - %016llX] %s %s (pid = %d) (%s)\n", entry->gpuaddr, entry->gpuaddr + entry->size, entry->priv & KGSL_MEMDESC_GUARD_PAGE ? "(+guard)" : "", entry->pending_free ? 
"(pending free)" : "", entry->pid, name); } static void _check_if_freed(struct kgsl_iommu_context *ctx, uint64_t addr, pid_t ptname) { uint64_t gpuaddr = addr; uint64_t size = 0; uint64_t flags = 0; pid_t pid; char name[32]; memset(name, 0, sizeof(name)); if (kgsl_memfree_find_entry(ptname, &gpuaddr, &size, &flags, &pid)) { kgsl_get_memory_usage(name, sizeof(name) - 1, flags); KGSL_LOG_DUMP(ctx->kgsldev, "---- premature free ----\n"); KGSL_LOG_DUMP(ctx->kgsldev, "[%8.8llX-%8.8llX] (%s) was already freed by pid %d\n", gpuaddr, gpuaddr + size, name, pid); } } static int kgsl_iommu_fault_handler(struct iommu_domain *domain, struct device *dev, unsigned long addr, int flags, void *token) { int ret = 0; struct kgsl_pagetable *pt = token; struct kgsl_mmu *mmu = pt->mmu; struct kgsl_iommu *iommu; struct kgsl_iommu_context *ctx; u64 ptbase; u32 contextidr; pid_t ptname; struct _mem_entry prev, next; int write; struct kgsl_device *device; struct adreno_device *adreno_dev; unsigned int no_page_fault_log = 0; unsigned int curr_context_id = 0; struct kgsl_context *context; char *fault_type = "unknown"; static DEFINE_RATELIMIT_STATE(_rs, DEFAULT_RATELIMIT_INTERVAL, DEFAULT_RATELIMIT_BURST); if (mmu == NULL || mmu->priv == NULL) return ret; iommu = mmu->priv; ctx = &iommu->ctx[KGSL_IOMMU_CONTEXT_USER]; device = mmu->device; adreno_dev = ADRENO_DEVICE(device); if (pt->name == KGSL_MMU_SECURE_PT) ctx = &iommu->ctx[KGSL_IOMMU_CONTEXT_SECURE]; /* * set the fault bits and stuff before any printks so that if fault * handler runs then it will know it's dealing with a pagefault. * Read the global current timestamp because we could be in middle of * RB switch and hence the cur RB may not be reliable but global * one will always be reliable */ kgsl_sharedmem_readl(&device->memstore, &curr_context_id, KGSL_MEMSTORE_OFFSET(KGSL_MEMSTORE_GLOBAL, current_context)); context = kgsl_context_get(device, curr_context_id); if (context != NULL) { /* save pagefault timestamp for GFT */ set_bit(KGSL_CONTEXT_PRIV_PAGEFAULT, &context->priv); kgsl_context_put(context); context = NULL; } ctx->fault = 1; if (test_bit(KGSL_FT_PAGEFAULT_GPUHALT_ENABLE, &adreno_dev->ft_pf_policy) && (flags & IOMMU_FAULT_TRANSACTION_STALLED)) { /* * Turn off GPU IRQ so we don't get faults from it too. * The device mutex must be held to change power state */ mutex_lock(&device->mutex); kgsl_pwrctrl_change_state(device, KGSL_STATE_AWARE); mutex_unlock(&device->mutex); } write = (flags & IOMMU_FAULT_WRITE) ? 1 : 0; if (flags & IOMMU_FAULT_TRANSLATION) fault_type = "translation"; else if (flags & IOMMU_FAULT_PERMISSION) fault_type = "permission"; ptbase = KGSL_IOMMU_GET_CTX_REG_Q(ctx, TTBR0); contextidr = KGSL_IOMMU_GET_CTX_REG(ctx, CONTEXTIDR); ptname = kgsl_mmu_get_ptname_from_ptbase(mmu, ptbase); if (test_bit(KGSL_FT_PAGEFAULT_LOG_ONE_PER_PAGE, &adreno_dev->ft_pf_policy)) no_page_fault_log = kgsl_mmu_log_fault_addr(mmu, ptbase, addr); if (!no_page_fault_log && __ratelimit(&_rs)) { KGSL_MEM_CRIT(ctx->kgsldev, "GPU PAGE FAULT: addr = %lX pid= %d\n", addr, ptname); KGSL_MEM_CRIT(ctx->kgsldev, "context=%s TTBR0=0x%llx CIDR=0x%x (%s %s fault)\n", ctx->name, ptbase, contextidr, write ? 
"write" : "read", fault_type); /* Don't print the debug if this is a permissions fault */ if (!(flags & IOMMU_FAULT_PERMISSION)) { _check_if_freed(ctx, addr, ptname); KGSL_LOG_DUMP(ctx->kgsldev, "---- nearby memory ----\n"); _find_mem_entries(mmu, addr, ptbase, &prev, &next); if (prev.gpuaddr) _print_entry(ctx->kgsldev, &prev); else KGSL_LOG_DUMP(ctx->kgsldev, "*EMPTY*\n"); KGSL_LOG_DUMP(ctx->kgsldev, " <- fault @ %8.8lX\n", addr); if (next.gpuaddr != (uint64_t) -1) _print_entry(ctx->kgsldev, &next); else KGSL_LOG_DUMP(ctx->kgsldev, "*EMPTY*\n"); } } trace_kgsl_mmu_pagefault(ctx->kgsldev, addr, kgsl_mmu_get_ptname_from_ptbase(mmu, ptbase), write ? "write" : "read"); /* * We do not want the h/w to resume fetching data from an iommu * that has faulted, this is better for debugging as it will stall * the GPU and trigger a snapshot. Return EBUSY error. */ if (test_bit(KGSL_FT_PAGEFAULT_GPUHALT_ENABLE, &adreno_dev->ft_pf_policy) && (flags & IOMMU_FAULT_TRANSACTION_STALLED)) { uint32_t sctlr_val; ret = -EBUSY; /* Disable context fault interrupts */ sctlr_val = KGSL_IOMMU_GET_CTX_REG(ctx, SCTLR); sctlr_val &= ~(0x1 << KGSL_IOMMU_SCTLR_CFIE_SHIFT); KGSL_IOMMU_SET_CTX_REG(ctx, SCTLR, sctlr_val); adreno_set_gpu_fault(adreno_dev, ADRENO_IOMMU_PAGE_FAULT); /* Go ahead with recovery*/ adreno_dispatcher_schedule(device); } return ret; } /* * kgsl_iommu_disable_clk() - Disable iommu clocks * Disable IOMMU clocks */ static void kgsl_iommu_disable_clk(struct kgsl_mmu *mmu) { struct kgsl_iommu *iommu = mmu->priv; int j; atomic_dec(&iommu->clk_enable_count); BUG_ON(atomic_read(&iommu->clk_enable_count) < 0); for (j = (KGSL_IOMMU_MAX_CLKS - 1); j >= 0; j--) if (iommu->clks[j]) clk_disable_unprepare(iommu->clks[j]); } /* * kgsl_iommu_enable_clk_prepare_enable - Enable the specified IOMMU clock * Try 4 times to enable it and then BUG() for debug */ static void kgsl_iommu_clk_prepare_enable(struct clk *clk) { int num_retries = 4; while (num_retries--) { if (!clk_prepare_enable(clk)) return; } /* Failure is fatal so BUG() to facilitate debug */ KGSL_CORE_ERR("IOMMU clock enable failed\n"); BUG(); } /* * kgsl_iommu_enable_clk - Enable iommu clocks * Enable all the IOMMU clocks */ static void kgsl_iommu_enable_clk(struct kgsl_mmu *mmu) { int j; struct kgsl_iommu *iommu = mmu->priv; for (j = 0; j < KGSL_IOMMU_MAX_CLKS; j++) { if (iommu->clks[j]) kgsl_iommu_clk_prepare_enable(iommu->clks[j]); } atomic_inc(&iommu->clk_enable_count); } /* kgsl_iommu_get_ttbr0 - Get TTBR0 setting for a pagetable */ static u64 kgsl_iommu_get_ttbr0(struct kgsl_pagetable *pt) { struct kgsl_iommu_pt *iommu_pt = pt ? pt->priv : NULL; BUG_ON(iommu_pt == NULL); return iommu_pt->ttbr0; } /* kgsl_iommu_get_contextidr - query CONTEXTIDR setting for a pagetable */ static u32 kgsl_iommu_get_contextidr(struct kgsl_pagetable *pt) { struct kgsl_iommu_pt *iommu_pt = pt ? 
pt->priv : NULL; BUG_ON(iommu_pt == NULL); return iommu_pt->contextidr; } /* * kgsl_iommu_destroy_pagetable - Free up reaources help by a pagetable * @mmu_specific_pt - Pointer to pagetable which is to be freed * * Return - void */ static void kgsl_iommu_destroy_pagetable(struct kgsl_pagetable *pt) { struct kgsl_iommu_pt *iommu_pt = pt->priv; struct kgsl_mmu *mmu = pt->mmu; struct kgsl_iommu *iommu; struct kgsl_iommu_context *ctx; BUG_ON(!list_empty(&pt->list)); iommu = mmu->priv; if (KGSL_MMU_SECURE_PT == pt->name) ctx = &iommu->ctx[KGSL_IOMMU_CONTEXT_SECURE]; else ctx = &iommu->ctx[KGSL_IOMMU_CONTEXT_USER]; if (iommu_pt->domain) { trace_kgsl_pagetable_destroy(iommu_pt->ttbr0, pt->name); _detach_pt(iommu_pt, ctx, mmu->device); iommu_domain_free(iommu_pt->domain); } kfree(iommu_pt); } /* currently only the MSM_IOMMU driver supports secure iommu */ #ifdef CONFIG_MSM_IOMMU static inline struct bus_type * get_secure_bus(void) { return &msm_iommu_sec_bus_type; } #else static inline struct bus_type * get_secure_bus(void) { return NULL; } #endif static void setup_64bit_pagetable(struct kgsl_mmu *mmu, struct kgsl_pagetable *pagetable, struct kgsl_iommu_pt *pt) { if (mmu->secured && pagetable->name == KGSL_MMU_SECURE_PT) { pt->compat_va_start = KGSL_IOMMU_SECURE_BASE; pt->compat_va_end = KGSL_IOMMU_SECURE_END; pt->va_start = KGSL_IOMMU_SECURE_BASE; pt->va_end = KGSL_IOMMU_SECURE_END; } else { pt->compat_va_start = KGSL_IOMMU_SVM_BASE32; pt->compat_va_end = KGSL_IOMMU_SVM_END32; pt->va_start = KGSL_IOMMU_VA_BASE64; pt->va_end = KGSL_IOMMU_VA_END64; } if (pagetable->name != KGSL_MMU_GLOBAL_PT && pagetable->name != KGSL_MMU_SECURE_PT) { if (is_compat_task()) { pt->svm_start = KGSL_IOMMU_SVM_BASE32; pt->svm_end = KGSL_IOMMU_SVM_END32; } else { pt->svm_start = KGSL_IOMMU_SVM_BASE64; pt->svm_end = KGSL_IOMMU_SVM_END64; } } } static void setup_32bit_pagetable(struct kgsl_mmu *mmu, struct kgsl_pagetable *pagetable, struct kgsl_iommu_pt *pt) { if (mmu->secured) { if (pagetable->name == KGSL_MMU_SECURE_PT) { pt->compat_va_start = KGSL_IOMMU_SECURE_BASE; pt->compat_va_end = KGSL_IOMMU_SECURE_END; pt->va_start = KGSL_IOMMU_SECURE_BASE; pt->va_end = KGSL_IOMMU_SECURE_END; } else { pt->va_start = KGSL_IOMMU_SVM_BASE32; pt->va_end = KGSL_IOMMU_SECURE_BASE; pt->compat_va_start = pt->va_start; pt->compat_va_end = pt->va_end; } } else { pt->va_start = KGSL_IOMMU_SVM_BASE32; pt->va_end = KGSL_MMU_GLOBAL_MEM_BASE; pt->compat_va_start = pt->va_start; pt->compat_va_end = pt->va_end; } if (pagetable->name != KGSL_MMU_GLOBAL_PT && pagetable->name != KGSL_MMU_SECURE_PT) { pt->svm_start = KGSL_IOMMU_SVM_BASE32; pt->svm_end = KGSL_IOMMU_SVM_END32; } } static struct kgsl_iommu_pt * _alloc_pt(struct bus_type *bus, struct kgsl_mmu *mmu, struct kgsl_pagetable *pt) { struct kgsl_iommu_pt *iommu_pt; iommu_pt = kzalloc(sizeof(struct kgsl_iommu_pt), GFP_KERNEL); if (iommu_pt == NULL) return NULL; iommu_pt->domain = iommu_domain_alloc(bus); if (iommu_pt->domain == NULL) { kfree(iommu_pt); return NULL; } pt->pt_ops = &iommu_pt_ops; pt->priv = iommu_pt; iommu_pt->rbtree = RB_ROOT; if (MMU_FEATURE(mmu, KGSL_MMU_64BIT)) setup_64bit_pagetable(mmu, pt, iommu_pt); else setup_32bit_pagetable(mmu, pt, iommu_pt); return iommu_pt; } static void _free_pt(struct kgsl_iommu_context *ctx, struct kgsl_pagetable *pt, struct kgsl_device *device) { struct kgsl_iommu_pt *iommu_pt = pt->priv; pt->pt_ops = NULL; pt->priv = NULL; if (iommu_pt == NULL) return; _detach_pt(iommu_pt, ctx, device); if (iommu_pt->domain != NULL) 
iommu_domain_free(iommu_pt->domain); kfree(iommu_pt); } static int _init_global_pt(struct kgsl_mmu *mmu, struct kgsl_pagetable *pt) { int ret = 0; struct kgsl_iommu_pt *iommu_pt = NULL; int disable_htw = !MMU_FEATURE(mmu, KGSL_MMU_COHERENT_HTW); unsigned int cb_num; struct kgsl_iommu *iommu = mmu->priv; struct kgsl_iommu_context *ctx = &iommu->ctx[KGSL_IOMMU_CONTEXT_USER]; iommu_pt = _alloc_pt(&platform_bus_type, mmu, pt); if (!iommu_pt) return -ENOMEM; iommu_domain_set_attr(iommu_pt->domain, DOMAIN_ATTR_COHERENT_HTW_DISABLE, &disable_htw); if (kgsl_mmu_is_perprocess(mmu)) { ret = iommu_domain_set_attr(iommu_pt->domain, DOMAIN_ATTR_PROCID, &pt->name); if (ret) { KGSL_CORE_ERR("set DOMAIN_ATTR_PROCID failed: %d\n", ret); goto done; } } ret = _attach_pt(iommu_pt, ctx, mmu->device); if (ret) goto done; iommu_set_fault_handler(iommu_pt->domain, kgsl_iommu_fault_handler, pt); ret = iommu_domain_get_attr(iommu_pt->domain, DOMAIN_ATTR_CONTEXT_BANK, &cb_num); if (ret) { KGSL_CORE_ERR("get DOMAIN_ATTR_PROCID failed: %d\n", ret); goto done; } ctx->cb_num = cb_num; ctx->regbase = iommu->regbase + KGSL_IOMMU_CB0_OFFSET + (cb_num << KGSL_IOMMU_CB_SHIFT); ret = iommu_domain_get_attr(iommu_pt->domain, DOMAIN_ATTR_TTBR0, &iommu_pt->ttbr0); if (ret) { KGSL_CORE_ERR("get DOMAIN_ATTR_TTBR0 failed: %d\n", ret); goto done; } ret = iommu_domain_get_attr(iommu_pt->domain, DOMAIN_ATTR_CONTEXTIDR, &iommu_pt->contextidr); if (ret) { KGSL_CORE_ERR("get DOMAIN_ATTR_CONTEXTIDR failed: %d\n", ret); goto done; } done: if (ret) _free_pt(ctx, pt, mmu->device); return ret; } static int _init_secure_pt(struct kgsl_mmu *mmu, struct kgsl_pagetable *pt) { int ret = 0; struct kgsl_iommu_pt *iommu_pt = NULL; struct bus_type *bus = &platform_bus_type; struct kgsl_iommu *iommu = mmu->priv; int disable_htw = !MMU_FEATURE(mmu, KGSL_MMU_COHERENT_HTW); struct kgsl_iommu_context *ctx = &iommu->ctx[KGSL_IOMMU_CONTEXT_SECURE]; int secure_vmid = VMID_CP_PIXEL; unsigned int cb_num; if (!mmu->secured) return -EPERM; if (!MMU_FEATURE(mmu, KGSL_MMU_HYP_SECURE_ALLOC)) { bus = get_secure_bus(); if (bus == NULL) return -EPERM; } iommu_pt = _alloc_pt(bus, mmu, pt); if (iommu_pt == NULL) return -ENOMEM; iommu_domain_set_attr(iommu_pt->domain, DOMAIN_ATTR_COHERENT_HTW_DISABLE, &disable_htw); ret = iommu_domain_set_attr(iommu_pt->domain, DOMAIN_ATTR_SECURE_VMID, &secure_vmid); if (ret) { KGSL_CORE_ERR("set DOMAIN_ATTR_SECURE_VMID failed: %d\n", ret); goto done; } ret = _attach_pt(iommu_pt, ctx, mmu->device); if (MMU_FEATURE(mmu, KGSL_MMU_HYP_SECURE_ALLOC)) iommu_set_fault_handler(iommu_pt->domain, kgsl_iommu_fault_handler, pt); ret = iommu_domain_get_attr(iommu_pt->domain, DOMAIN_ATTR_CONTEXT_BANK, &cb_num); if (ret) { KGSL_CORE_ERR("get DOMAIN_ATTR_PROCID failed: %d\n", ret); goto done; } ctx->cb_num = cb_num; ctx->regbase = iommu->regbase + KGSL_IOMMU_CB0_OFFSET + (cb_num << KGSL_IOMMU_CB_SHIFT); done: if (ret) _free_pt(ctx, pt, mmu->device); return ret; } static int _init_per_process_pt(struct kgsl_mmu *mmu, struct kgsl_pagetable *pt) { int ret = 0; struct kgsl_iommu_pt *iommu_pt = NULL; struct kgsl_iommu *iommu = mmu->priv; struct kgsl_iommu_context *ctx = &iommu->ctx[KGSL_IOMMU_CONTEXT_USER]; int dynamic = 1; unsigned int cb_num = ctx->cb_num; int disable_htw = !MMU_FEATURE(mmu, KGSL_MMU_COHERENT_HTW); iommu_pt = _alloc_pt(&platform_bus_type, mmu, pt); if (!iommu_pt) return -ENOMEM; ret = iommu_domain_set_attr(iommu_pt->domain, DOMAIN_ATTR_DYNAMIC, &dynamic); if (ret) { KGSL_CORE_ERR("set DOMAIN_ATTR_DYNAMIC failed: %d\n", ret); goto done; } 
ret = iommu_domain_set_attr(iommu_pt->domain, DOMAIN_ATTR_CONTEXT_BANK, &cb_num); if (ret) { KGSL_CORE_ERR("set DOMAIN_ATTR_CONTEXT_BANK failed: %d\n", ret); goto done; } ret = iommu_domain_set_attr(iommu_pt->domain, DOMAIN_ATTR_PROCID, &pt->name); if (ret) { KGSL_CORE_ERR("set DOMAIN_ATTR_PROCID failed: %d\n", ret); goto done; } iommu_domain_set_attr(iommu_pt->domain, DOMAIN_ATTR_COHERENT_HTW_DISABLE, &disable_htw); ret = _attach_pt(iommu_pt, ctx, mmu->device); if (ret) goto done; /* now read back the attributes needed for self programming */ ret = iommu_domain_get_attr(iommu_pt->domain, DOMAIN_ATTR_TTBR0, &iommu_pt->ttbr0); if (ret) { KGSL_CORE_ERR("get DOMAIN_ATTR_TTBR0 failed: %d\n", ret); goto done; } ret = iommu_domain_get_attr(iommu_pt->domain, DOMAIN_ATTR_CONTEXTIDR, &iommu_pt->contextidr); if (ret) { KGSL_CORE_ERR("get DOMAIN_ATTR_CONTEXTIDR failed: %d\n", ret); goto done; } done: if (ret) _free_pt(ctx, pt, mmu->device); return ret; } /* kgsl_iommu_init_pt - Set up an IOMMU pagetable */ static int kgsl_iommu_init_pt(struct kgsl_mmu *mmu, struct kgsl_pagetable *pt) { if (pt == NULL) return -EINVAL; switch (pt->name) { case KGSL_MMU_GLOBAL_PT: return _init_global_pt(mmu, pt); case KGSL_MMU_SECURE_PT: return _init_secure_pt(mmu, pt); default: return _init_per_process_pt(mmu, pt); } } #ifndef CONFIG_MSM_IOMMU static struct device *msm_iommu_get_ctx(const char *name) { return ERR_PTR(-ENODEV); } #endif /* * _get_iommu_ctxs - Get device pointer to IOMMU contexts * @mmu - Pointer to mmu device * * Return - 0 on success else error code */ static int _get_iommu_ctxs(struct kgsl_mmu *mmu) { struct kgsl_iommu *iommu = mmu->priv; struct kgsl_iommu_context *ctx; int i; int ret = 0; for (i = 0; i < KGSL_IOMMU_CONTEXT_MAX; i++) { ctx = &iommu->ctx[i]; /* skip contexts not found in dt */ if (ctx->name == NULL) continue; ctx->kgsldev = mmu->device; if (ctx->dev != NULL) continue; /* * The old iommu driver requires that we query the context bank * device rather than getting it from dt. */ ctx->dev = msm_iommu_get_ctx(ctx->name); if (IS_ERR_OR_NULL(ctx->dev)) { ret = (!ctx->dev) ? 
-EINVAL : PTR_ERR(ctx->dev); memset(ctx, 0, sizeof(*ctx)); KGSL_CORE_ERR("ctx %s: msm_iommu_get_ctx err: %d\n", ctx->name, ret); break; } } return ret; } /* * kgsl_iommu_get_reg_ahbaddr - Returns the ahb address of the register * @mmu - Pointer to mmu structure * @id - The context ID of the IOMMU ctx * @reg - The register for which address is required * * Return - The address of register which can be used in type0 packet */ static unsigned int kgsl_iommu_get_reg_ahbaddr(struct kgsl_mmu *mmu, enum kgsl_iommu_context_id id, enum kgsl_iommu_reg_map reg) { unsigned int result; struct kgsl_iommu *iommu = mmu->priv; struct kgsl_iommu_context *ctx = &iommu->ctx[id]; result = ctx->gpu_offset + kgsl_iommu_reg_list[reg]; return result; } static int kgsl_iommu_init(struct kgsl_mmu *mmu) { /* * intialize device mmu * * call this with the global lock held */ int status = 0; struct kgsl_iommu *iommu = mmu->priv; struct kgsl_iommu_context *ctx = &iommu->ctx[KGSL_IOMMU_CONTEXT_USER]; if (ctx->name == NULL) { KGSL_CORE_ERR("dt: gfx3d0_user context bank not found\n"); return -EINVAL; } /* check requirements for per process pagetables */ if (ctx->gpu_offset == UINT_MAX) { KGSL_CORE_ERR("missing qcom,gpu-offset forces global pt\n"); mmu->features |= KGSL_MMU_GLOBAL_PAGETABLE; } if (iommu->version == 1 && iommu->micro_mmu_ctrl == UINT_MAX) { KGSL_CORE_ERR( "missing qcom,micro-mmu-control forces global pt\n"); mmu->features |= KGSL_MMU_GLOBAL_PAGETABLE; } iommu->regbase = ioremap(iommu->regstart, iommu->regsize); if (iommu->regbase == NULL) { KGSL_CORE_ERR("Could not map IOMMU registers 0x%lx:0x%x\n", iommu->regstart, iommu->regsize); return -ENOMEM; } status = _get_iommu_ctxs(mmu); if (status) goto done; if (addr_entry_cache == NULL) { addr_entry_cache = KMEM_CACHE(kgsl_iommu_addr_entry, 0); if (addr_entry_cache == NULL) { status = -ENOMEM; goto done; } } if (kgsl_guard_page == NULL) { kgsl_guard_page = alloc_page(GFP_KERNEL | __GFP_ZERO | __GFP_HIGHMEM); if (kgsl_guard_page == NULL) { status = -ENOMEM; goto done; } } done: return status; } static void _detach_context(struct kgsl_iommu_context *ctx, struct kgsl_device *device) { struct kgsl_iommu_pt *iommu_pt; if (ctx->default_pt == NULL) return; iommu_pt = ctx->default_pt->priv; _detach_pt(iommu_pt, ctx, device); ctx->default_pt = NULL; } static int _setup_user_context(struct kgsl_mmu *mmu) { int ret; struct kgsl_iommu *iommu = mmu->priv; struct kgsl_iommu_context *ctx = &iommu->ctx[KGSL_IOMMU_CONTEXT_USER]; struct adreno_device *adreno_dev = ADRENO_DEVICE(mmu->device); struct kgsl_iommu_pt *iommu_pt = NULL; unsigned int sctlr_val; if (mmu->defaultpagetable == NULL) { mmu->defaultpagetable = kgsl_mmu_getpagetable(mmu, KGSL_MMU_GLOBAL_PT); /* if we don't have a default pagetable, nothing will work */ if (IS_ERR(mmu->defaultpagetable)) { ret = PTR_ERR(mmu->defaultpagetable); mmu->defaultpagetable = NULL; return ret; } else if (mmu->defaultpagetable == NULL) { return -ENOMEM; } } iommu_pt = mmu->defaultpagetable->priv; ret = _attach_pt(iommu_pt, ctx, mmu->device); if (ret) return ret; kgsl_iommu_enable_clk(mmu); KGSL_IOMMU_SET_CTX_REG(ctx, TLBIALL, 1); sctlr_val = KGSL_IOMMU_GET_CTX_REG(ctx, SCTLR); /* * For IOMMU V1, if pagefault policy is GPUHALT_ENABLE, * 1) Program CFCFG to 1 to enable STALL mode * 2) Program HUPCF to 0 (Stall or terminate subsequent * transactions in the presence of an outstanding fault) * else * 1) Program CFCFG to 0 to disable STALL mode (0=Terminate) * 2) Program HUPCF to 1 (Process subsequent transactions * independently of any 
outstanding fault) */ sctlr_val = KGSL_IOMMU_GET_CTX_REG(ctx, SCTLR); if (test_bit(KGSL_FT_PAGEFAULT_GPUHALT_ENABLE, &adreno_dev->ft_pf_policy)) { sctlr_val |= (0x1 << KGSL_IOMMU_SCTLR_CFCFG_SHIFT); sctlr_val &= ~(0x1 << KGSL_IOMMU_SCTLR_HUPCF_SHIFT); } else { sctlr_val &= ~(0x1 << KGSL_IOMMU_SCTLR_CFCFG_SHIFT); sctlr_val |= (0x1 << KGSL_IOMMU_SCTLR_HUPCF_SHIFT); } KGSL_IOMMU_SET_CTX_REG(ctx, SCTLR, sctlr_val); kgsl_iommu_disable_clk(mmu); if (ret) _detach_context(ctx, mmu->device); return ret; } static int _setup_secure_context(struct kgsl_mmu *mmu) { int ret; struct kgsl_iommu *iommu = mmu->priv; struct kgsl_iommu_context *ctx = &iommu->ctx[KGSL_IOMMU_CONTEXT_SECURE]; unsigned int cb_num; struct kgsl_iommu_pt *iommu_pt; if (ctx->dev == NULL || !mmu->secured) return 0; if (mmu->securepagetable == NULL) { mmu->securepagetable = kgsl_mmu_getpagetable(mmu, KGSL_MMU_SECURE_PT); if (IS_ERR(mmu->securepagetable)) { ret = PTR_ERR(mmu->securepagetable); mmu->securepagetable = NULL; return ret; } else if (mmu->securepagetable == NULL) { return -ENOMEM; } } iommu_pt = mmu->securepagetable->priv; ret = _attach_pt(iommu_pt, ctx, mmu->device); if (ret) goto done; ctx->default_pt = mmu->securepagetable; ret = iommu_domain_get_attr(iommu_pt->domain, DOMAIN_ATTR_CONTEXT_BANK, &cb_num); if (ret) { KGSL_CORE_ERR("get CONTEXT_BANK attr, err %d\n", ret); goto done; } ctx->cb_num = cb_num; done: if (ret) _detach_context(ctx, mmu->device); return ret; } static int kgsl_iommu_start(struct kgsl_mmu *mmu) { int status; struct kgsl_iommu *iommu = mmu->priv; struct kgsl_iommu_context *ctx = &iommu->ctx[KGSL_IOMMU_CONTEXT_USER]; status = _setup_user_context(mmu); if (status) return status; status = _setup_secure_context(mmu); if (status) _detach_context(&iommu->ctx[KGSL_IOMMU_CONTEXT_USER], mmu->device); else { kgsl_iommu_enable_clk(mmu); KGSL_IOMMU_SET_CTX_REG(ctx, TLBIALL, 1); kgsl_iommu_disable_clk(mmu); } return status; } static int kgsl_iommu_unmap(struct kgsl_pagetable *pt, struct kgsl_memdesc *memdesc) { struct kgsl_device *device = pt->mmu->device; int ret = 0; uint64_t range = memdesc->size; size_t unmapped = 0; struct kgsl_iommu_pt *iommu_pt = pt->priv; /* All GPU addresses as assigned are page aligned, but some functions purturb the gpuaddr with an offset, so apply the mask here to make sure we have the right address */ uint64_t gpuaddr = PAGE_ALIGN(memdesc->gpuaddr); if (range == 0 || gpuaddr == 0) return 0; if (kgsl_memdesc_has_guard_page(memdesc)) range += kgsl_memdesc_guard_page_size(pt->mmu, memdesc); if (kgsl_memdesc_is_secured(memdesc)) { if (!kgsl_mmu_is_secured(pt->mmu)) return -EINVAL; mutex_lock(&device->mutex); ret = kgsl_active_count_get(device); if (!ret) { _iommu_sync_mmu_pc(device, true); unmapped = iommu_unmap(iommu_pt->domain, gpuaddr, range); _iommu_sync_mmu_pc(device, false); kgsl_active_count_put(device); } mutex_unlock(&device->mutex); } else { _iommu_sync_mmu_pc(device, true); unmapped = iommu_unmap(iommu_pt->domain, gpuaddr, range); _iommu_sync_mmu_pc(device, false); } if (unmapped != range) { KGSL_CORE_ERR( "iommu_unmap(%p, %llx, %lld) failed with unmapped size: %zd\n", iommu_pt->domain, gpuaddr, range, unmapped); return -EINVAL; } return ret; } /** * _iommu_add_guard_page - Add iommu guard page * @pt - Pointer to kgsl pagetable structure * @memdesc - memdesc to add guard page * @gpuaddr - GPU addr of guard page * @protflags - flags for mapping * * Return 0 on success, error on map fail */ static int _iommu_add_guard_page(struct kgsl_pagetable *pt, struct kgsl_memdesc *memdesc, 
uint64_t gpuaddr, unsigned int protflags) { struct kgsl_iommu_pt *iommu_pt = pt->priv; phys_addr_t physaddr = page_to_phys(kgsl_guard_page); int ret; if (kgsl_memdesc_has_guard_page(memdesc)) { /* * Allocate guard page for secure buffers. * This has to be done after we attach a smmu pagetable. * Allocate the guard page when first secure buffer is. * mapped to save 1MB of memory if CPZ is not used. */ if (kgsl_memdesc_is_secured(memdesc)) { struct scatterlist *sg; unsigned int sgp_size = pt->mmu->secure_align_mask + 1; if (!kgsl_secure_guard_page_memdesc.sgt) { if (kgsl_allocate_user(pt->mmu->device, &kgsl_secure_guard_page_memdesc, pt, sgp_size, sgp_size, KGSL_MEMFLAGS_SECURE)) { KGSL_CORE_ERR( "Secure guard page alloc failed\n"); return -ENOMEM; } } sg = kgsl_secure_guard_page_memdesc.sgt->sgl; physaddr = page_to_phys(sg_page(sg)); } _iommu_sync_mmu_pc(pt->mmu->device, true); ret = iommu_map(iommu_pt->domain, gpuaddr, physaddr, kgsl_memdesc_guard_page_size(pt->mmu, memdesc), protflags & ~IOMMU_WRITE); _iommu_sync_mmu_pc(pt->mmu->device, false); if (ret) { KGSL_CORE_ERR( "iommu_map(%p, addr %016llX, flags %x) err: %d\n", iommu_pt->domain, gpuaddr, protflags & ~IOMMU_WRITE, ret); return ret; } } return 0; } static int kgsl_iommu_map(struct kgsl_pagetable *pt, struct kgsl_memdesc *memdesc) { int ret = 0; uint64_t addr = memdesc->gpuaddr; struct kgsl_iommu_pt *iommu_pt = pt->priv; uint64_t size = memdesc->size; unsigned int flags = 0; struct kgsl_device *device = pt->mmu->device; size_t mapped = 0; BUG_ON(NULL == iommu_pt); flags = IOMMU_READ | IOMMU_WRITE | IOMMU_NOEXEC; /* Set up the protection for the page(s) */ if (memdesc->flags & KGSL_MEMFLAGS_GPUREADONLY) flags &= ~IOMMU_WRITE; if (memdesc->priv & KGSL_MEMDESC_PRIVILEGED) flags |= IOMMU_PRIV; if (kgsl_memdesc_is_secured(memdesc)) { if (!kgsl_mmu_is_secured(pt->mmu)) return -EINVAL; mutex_lock(&device->mutex); ret = kgsl_active_count_get(device); if (!ret) { _iommu_sync_mmu_pc(device, true); mapped = iommu_map_sg(iommu_pt->domain, addr, memdesc->sgt->sgl, memdesc->sgt->nents, flags); _iommu_sync_mmu_pc(device, false); kgsl_active_count_put(device); } mutex_unlock(&device->mutex); } else { _iommu_sync_mmu_pc(device, true); mapped = iommu_map_sg(iommu_pt->domain, addr, memdesc->sgt->sgl, memdesc->sgt->nents, flags); _iommu_sync_mmu_pc(device, false); } if (mapped != size) { KGSL_CORE_ERR("iommu_map_sg(%p, %016llX, %lld, %x) err: %zd\n", iommu_pt->domain, addr, size, flags, mapped); return -ENODEV; } ret = _iommu_add_guard_page(pt, memdesc, addr + size, flags); if (ret) { /* cleanup the partial mapping */ _iommu_sync_mmu_pc(device, true); iommu_unmap(iommu_pt->domain, addr, size); _iommu_sync_mmu_pc(device, false); } return ret; } /* This function must be called with context bank attached */ static void kgsl_iommu_clear_fsr(struct kgsl_mmu *mmu) { struct kgsl_iommu *iommu = mmu->priv; struct kgsl_iommu_context *ctx = &iommu->ctx[KGSL_IOMMU_CONTEXT_USER]; if (ctx->default_pt != NULL) { kgsl_iommu_enable_clk(mmu); KGSL_IOMMU_SET_CTX_REG(ctx, FSR, 0xffffffff); kgsl_iommu_disable_clk(mmu); } } static void kgsl_iommu_pagefault_resume(struct kgsl_mmu *mmu) { struct kgsl_iommu *iommu = mmu->priv; struct kgsl_iommu_context *ctx = &iommu->ctx[KGSL_IOMMU_CONTEXT_USER]; unsigned int sctlr_val; if (ctx->default_pt != NULL && ctx->fault) { /* * Write 1 to RESUME.TnR to terminate the * stalled transaction. 
Also, re-enable * context fault interrupts by writing 1 * to SCTLR.CFIE */ sctlr_val = KGSL_IOMMU_GET_CTX_REG(ctx, SCTLR); sctlr_val |= (0x1 << KGSL_IOMMU_SCTLR_CFIE_SHIFT); KGSL_IOMMU_SET_CTX_REG(ctx, RESUME, 1); KGSL_IOMMU_SET_CTX_REG(ctx, SCTLR, sctlr_val); /* * Make sure the above register writes * are not reordered across the barrier * as we use writel_relaxed to write them */ wmb(); ctx->fault = 0; } } static void kgsl_iommu_stop(struct kgsl_mmu *mmu) { int i; struct kgsl_iommu *iommu = mmu->priv; /* * If the iommu supports retention, we don't need * to detach when stopping. */ if (!MMU_FEATURE(mmu, KGSL_MMU_RETENTION)) { for (i = 0; i < KGSL_IOMMU_CONTEXT_MAX; i++) _detach_context(&iommu->ctx[i], mmu->device); } } static int kgsl_iommu_close(struct kgsl_mmu *mmu) { struct kgsl_iommu *iommu = mmu->priv; int i; for (i = 0; i < KGSL_IOMMU_CONTEXT_MAX; i++) _detach_context(&iommu->ctx[i], mmu->device); if (mmu->defaultpagetable != NULL) { kgsl_mmu_putpagetable(mmu->defaultpagetable); mmu->defaultpagetable = NULL; } if (mmu->securepagetable != NULL) { kgsl_mmu_putpagetable(mmu->securepagetable); mmu->securepagetable = NULL; } if (iommu->regbase != NULL) iounmap(iommu->regbase); kgsl_sharedmem_free(&kgsl_secure_guard_page_memdesc); if (kgsl_guard_page != NULL) { __free_page(kgsl_guard_page); kgsl_guard_page = NULL; } return 0; } static u64 kgsl_iommu_get_current_ttbr0(struct kgsl_mmu *mmu) { u64 val; struct kgsl_iommu *iommu = mmu->priv; /* * We cannot enable or disable the clocks in interrupt context, this * function is called from interrupt context if there is an axi error */ if (in_interrupt()) return 0; kgsl_iommu_enable_clk(mmu); val = KGSL_IOMMU_GET_CTX_REG_Q(&iommu->ctx[KGSL_IOMMU_CONTEXT_USER], TTBR0); kgsl_iommu_disable_clk(mmu); return val; } /* * kgsl_iommu_set_pt - Change the IOMMU pagetable of the primary context bank * @mmu - Pointer to mmu structure * @pt - Pagetable to switch to * * Set the new pagetable for the IOMMU by doing direct register writes * to the IOMMU registers through the cpu * * Return - void */ static int kgsl_iommu_set_pt(struct kgsl_mmu *mmu, struct kgsl_pagetable *pt) { struct kgsl_iommu *iommu = mmu->priv; struct kgsl_iommu_context *ctx = &iommu->ctx[KGSL_IOMMU_CONTEXT_USER]; int ret = 0; uint64_t ttbr0, temp; unsigned int contextidr; unsigned long wait_for_flush; /* * If using a global pagetable, we can skip all this * because the pagetable will be set up by the iommu * driver and never changed at runtime. */ if (!kgsl_mmu_is_perprocess(mmu)) return 0; kgsl_iommu_enable_clk(mmu); ttbr0 = kgsl_mmu_pagetable_get_ttbr0(pt); contextidr = kgsl_mmu_pagetable_get_contextidr(pt); /* * Taking the liberty to spin idle since this codepath * is invoked when we can spin safely for it to be idle */ ret = adreno_spin_idle(mmu->device); if (ret) return ret; KGSL_IOMMU_SET_CTX_REG_Q(ctx, TTBR0, ttbr0); KGSL_IOMMU_SET_CTX_REG(ctx, CONTEXTIDR, contextidr); mb(); temp = KGSL_IOMMU_GET_CTX_REG_Q(ctx, TTBR0); KGSL_IOMMU_SET_CTX_REG(ctx, TLBIALL, 1); /* make sure the TBLI write completes before we wait */ mb(); /* * Wait for flush to complete by polling the flush * status bit of TLBSTATUS register for not more than * 2 s. After 2s just exit, at that point the SMMU h/w * may be stuck and will eventually cause GPU to hang * or bring the system down. 
*/ wait_for_flush = jiffies + msecs_to_jiffies(2000); KGSL_IOMMU_SET_CTX_REG(ctx, TLBSYNC, 0); while (KGSL_IOMMU_GET_CTX_REG(ctx, TLBSTATUS) & (KGSL_IOMMU_CTX_TLBSTATUS_SACTIVE)) { if (time_after(jiffies, wait_for_flush)) { KGSL_DRV_WARN(mmu->device, "Wait limit reached for IOMMU tlb flush\n"); break; } cpu_relax(); } /* Disable smmu clock */ kgsl_iommu_disable_clk(mmu); return ret; } /* * kgsl_iommu_set_pf_policy() - Set the pagefault policy for IOMMU * @mmu: Pointer to mmu structure * @pf_policy: The pagefault polict to set * * Check if the new policy indicated by pf_policy is same as current * policy, if same then return else set the policy */ static int kgsl_iommu_set_pf_policy(struct kgsl_mmu *mmu, unsigned long pf_policy) { struct kgsl_iommu *iommu = mmu->priv; struct kgsl_iommu_context *ctx = &iommu->ctx[KGSL_IOMMU_CONTEXT_USER]; struct adreno_device *adreno_dev = ADRENO_DEVICE(mmu->device); int ret = 0; unsigned int sctlr_val; if ((adreno_dev->ft_pf_policy & BIT(KGSL_FT_PAGEFAULT_GPUHALT_ENABLE)) == (pf_policy & BIT(KGSL_FT_PAGEFAULT_GPUHALT_ENABLE))) return 0; /* If not attached, policy will be updated during the next attach */ if (ctx->default_pt != NULL) { /* Need to idle device before changing options */ ret = mmu->device->ftbl->idle(mmu->device); if (ret) return ret; kgsl_iommu_enable_clk(mmu); sctlr_val = KGSL_IOMMU_GET_CTX_REG(ctx, SCTLR); if (test_bit(KGSL_FT_PAGEFAULT_GPUHALT_ENABLE, &pf_policy)) { sctlr_val |= (0x1 << KGSL_IOMMU_SCTLR_CFCFG_SHIFT); sctlr_val &= ~(0x1 << KGSL_IOMMU_SCTLR_HUPCF_SHIFT); } else { sctlr_val &= ~(0x1 << KGSL_IOMMU_SCTLR_CFCFG_SHIFT); sctlr_val |= (0x1 << KGSL_IOMMU_SCTLR_HUPCF_SHIFT); } KGSL_IOMMU_SET_CTX_REG(ctx, SCTLR, sctlr_val); kgsl_iommu_disable_clk(mmu); } return ret; } static struct kgsl_protected_registers * kgsl_iommu_get_prot_regs(struct kgsl_mmu *mmu) { struct kgsl_iommu *iommu = mmu->priv; return &iommu->protect; } static struct kgsl_iommu_addr_entry *_find_gpuaddr( struct kgsl_pagetable *pagetable, uint64_t gpuaddr) { struct kgsl_iommu_pt *pt = pagetable->priv; struct rb_node *node = pt->rbtree.rb_node; while (node != NULL) { struct kgsl_iommu_addr_entry *entry = rb_entry(node, struct kgsl_iommu_addr_entry, node); if (gpuaddr < entry->base) node = node->rb_left; else if (gpuaddr > entry->base) node = node->rb_right; else return entry; } return NULL; } static int _remove_gpuaddr(struct kgsl_pagetable *pagetable, uint64_t gpuaddr) { struct kgsl_iommu_pt *pt = pagetable->priv; struct kgsl_iommu_addr_entry *entry; entry = _find_gpuaddr(pagetable, gpuaddr); if (entry != NULL) { rb_erase(&entry->node, &pt->rbtree); kmem_cache_free(addr_entry_cache, entry); return 0; } return -ENOMEM; } static int _insert_gpuaddr(struct kgsl_pagetable *pagetable, uint64_t gpuaddr, uint64_t size) { struct kgsl_iommu_pt *pt = pagetable->priv; struct rb_node **node, *parent = NULL; struct kgsl_iommu_addr_entry *new = kmem_cache_alloc(addr_entry_cache, GFP_ATOMIC); if (new == NULL) return -ENOMEM; new->base = gpuaddr; new->size = size; node = &pt->rbtree.rb_node; while (*node != NULL) { struct kgsl_iommu_addr_entry *this; parent = *node; this = rb_entry(parent, struct kgsl_iommu_addr_entry, node); if (new->base < this->base) node = &parent->rb_left; else if (new->base > this->base) node = &parent->rb_right; else BUG(); } rb_link_node(&new->node, parent, node); rb_insert_color(&new->node, &pt->rbtree); return 0; } static uint64_t _get_unmapped_area(struct kgsl_pagetable *pagetable, uint64_t bottom, uint64_t top, uint64_t size, uint64_t align) { struct 
kgsl_iommu_pt *pt = pagetable->priv; struct rb_node *node = rb_first(&pt->rbtree); uint64_t start; bottom = ALIGN(bottom, align); start = bottom; while (node != NULL) { uint64_t gap; struct kgsl_iommu_addr_entry *entry = rb_entry(node, struct kgsl_iommu_addr_entry, node); /* * Skip any entries that are outside of the range, but make sure * to account for some that might straddle the lower bound */ if (entry->base < bottom) { if (entry->base + entry->size > bottom) start = ALIGN(entry->base + entry->size, align); node = rb_next(node); continue; } /* Stop if we went over the top */ if (entry->base >= top) break; /* Make sure there is a gap to consider */ if (start < entry->base) { gap = entry->base - start; if (gap >= size) return start; } /* Stop if there is no more room in the region */ if (entry->base + entry->size >= top) return (uint64_t) -ENOMEM; /* Start the next cycle at the end of the current entry */ start = ALIGN(entry->base + entry->size, align); node = rb_next(node); } if (start + size <= top) return start; return (uint64_t) -ENOMEM; } static uint64_t _get_unmapped_area_topdown(struct kgsl_pagetable *pagetable, uint64_t bottom, uint64_t top, uint64_t size, uint64_t align) { struct kgsl_iommu_pt *pt = pagetable->priv; struct rb_node *node = rb_last(&pt->rbtree); uint64_t end = top; uint64_t mask = ~(align - 1); struct kgsl_iommu_addr_entry *entry; /* Make sure that the bottom is correctly aligned */ bottom = ALIGN(bottom, align); /* Make sure the requested size will fit in the range */ if (size > (top - bottom)) return -ENOMEM; /* Walk back through the list to find the highest entry in the range */ for (node = rb_last(&pt->rbtree); node != NULL; node = rb_prev(node)) { entry = rb_entry(node, struct kgsl_iommu_addr_entry, node); if (entry->base < top) break; } while (node != NULL) { uint64_t offset; entry = rb_entry(node, struct kgsl_iommu_addr_entry, node); /* If the entire entry is below the range the search is over */ if ((entry->base + entry->size) < bottom) break; /* Get the top of the entry properly aligned */ offset = ALIGN(entry->base + entry->size, align); /* * Try to allocate the memory from the top of the gap, * making sure that it fits between the top of this entry and * the bottom of the previous one */ if ((end > size) && (offset < end)) { uint64_t chunk = (end - size) & mask; if (chunk >= offset) return chunk; } /* * If we get here and the current entry is outside of the range * then we are officially out of room */ if (entry->base < bottom) return (uint64_t) -ENOMEM; /* Set the top of the gap to the current entry->base */ end = entry->base; /* And move on to the next lower entry */ node = rb_prev(node); } /* If we get here then there are no more entries in the region */ if ((end > size) && (((end - size) & mask) >= bottom)) return (end - size) & mask; return (uint64_t) -ENOMEM; } static uint64_t kgsl_iommu_find_svm_region(struct kgsl_pagetable *pagetable, uint64_t start, uint64_t end, uint64_t size, uint64_t alignment) { uint64_t addr; /* Avoid black holes */ BUG_ON(end <= start); spin_lock(&pagetable->lock); addr = _get_unmapped_area_topdown(pagetable, start, end, size, alignment); spin_unlock(&pagetable->lock); return addr; } #define ADDR_IN_GLOBAL(_a) \ (((_a) >= KGSL_MMU_GLOBAL_MEM_BASE) && \ ((_a) < (KGSL_MMU_GLOBAL_MEM_BASE + KGSL_MMU_GLOBAL_MEM_SIZE))) static int kgsl_iommu_set_svm_region(struct kgsl_pagetable *pagetable, uint64_t gpuaddr, uint64_t size) { int ret = -ENOMEM; struct kgsl_iommu_pt *pt = pagetable->priv; struct rb_node *node; /* Make sure the 
requested address doesn't fall in the global range */ if (ADDR_IN_GLOBAL(gpuaddr) || ADDR_IN_GLOBAL(gpuaddr + size)) return -ENOMEM; spin_lock(&pagetable->lock); node = pt->rbtree.rb_node; while (node != NULL) { uint64_t start, end; struct kgsl_iommu_addr_entry *entry = rb_entry(node, struct kgsl_iommu_addr_entry, node); start = entry->base; end = entry->base + entry->size; if (gpuaddr + size <= start) node = node->rb_left; else if (end <= gpuaddr) node = node->rb_right; else goto out; } ret = _insert_gpuaddr(pagetable, gpuaddr, size); out: spin_unlock(&pagetable->lock); return ret; } static int kgsl_iommu_get_gpuaddr(struct kgsl_pagetable *pagetable, struct kgsl_memdesc *memdesc) { struct kgsl_iommu_pt *pt = pagetable->priv; int ret = 0; uint64_t addr, start, end; uint64_t size = memdesc->size; unsigned int align; BUG_ON(kgsl_memdesc_use_cpu_map(memdesc)); if (memdesc->flags & KGSL_MEMFLAGS_SECURE && pagetable->name != KGSL_MMU_SECURE_PT) return -EINVAL; if (kgsl_memdesc_has_guard_page(memdesc)) size += kgsl_memdesc_guard_page_size(pagetable->mmu, memdesc); align = 1 << kgsl_memdesc_get_align(memdesc); if (memdesc->flags & KGSL_MEMFLAGS_FORCE_32BIT) { start = pt->compat_va_start; end = pt->compat_va_end; } else { start = pt->va_start; end = pt->va_end; } spin_lock(&pagetable->lock); addr = _get_unmapped_area(pagetable, start, end, size, align); if (addr == (uint64_t) -ENOMEM) { ret = -ENOMEM; goto out; } ret = _insert_gpuaddr(pagetable, addr, size); if (ret == 0) memdesc->gpuaddr = addr; out: spin_unlock(&pagetable->lock); return ret; } static void kgsl_iommu_put_gpuaddr(struct kgsl_pagetable *pagetable, struct kgsl_memdesc *memdesc) { spin_lock(&pagetable->lock); if (_remove_gpuaddr(pagetable, memdesc->gpuaddr)) BUG(); spin_unlock(&pagetable->lock); } static int kgsl_iommu_svm_range(struct kgsl_pagetable *pagetable, uint64_t *lo, uint64_t *hi, uint64_t memflags) { struct kgsl_iommu_pt *pt = pagetable->priv; bool gpu_compat = (memflags & KGSL_MEMFLAGS_FORCE_32BIT) != 0; if (lo != NULL) *lo = gpu_compat ? pt->compat_va_start : pt->svm_start; if (hi != NULL) *hi = gpu_compat ? 
		pt->compat_va_end : pt->svm_end;

	return 0;
}

static bool kgsl_iommu_addr_in_range(struct kgsl_pagetable *pagetable,
		uint64_t gpuaddr)
{
	struct kgsl_iommu_pt *pt = pagetable->priv;

	if (gpuaddr == 0)
		return false;

	if (gpuaddr >= pt->va_start && gpuaddr < pt->va_end)
		return true;

	if (gpuaddr >= pt->compat_va_start && gpuaddr < pt->compat_va_end)
		return true;

	if (gpuaddr >= pt->svm_start && gpuaddr < pt->svm_end)
		return true;

	return false;
}

struct kgsl_mmu_ops kgsl_iommu_ops = {
	.mmu_init = kgsl_iommu_init,
	.mmu_close = kgsl_iommu_close,
	.mmu_start = kgsl_iommu_start,
	.mmu_stop = kgsl_iommu_stop,
	.mmu_set_pt = kgsl_iommu_set_pt,
	.mmu_clear_fsr = kgsl_iommu_clear_fsr,
	.mmu_get_current_ttbr0 = kgsl_iommu_get_current_ttbr0,
	.mmu_enable_clk = kgsl_iommu_enable_clk,
	.mmu_disable_clk = kgsl_iommu_disable_clk,
	.mmu_get_reg_ahbaddr = kgsl_iommu_get_reg_ahbaddr,
	.mmu_set_pf_policy = kgsl_iommu_set_pf_policy,
	.mmu_pagefault_resume = kgsl_iommu_pagefault_resume,
	.mmu_get_prot_regs = kgsl_iommu_get_prot_regs,
	.mmu_init_pt = kgsl_iommu_init_pt,
};

static struct kgsl_mmu_pt_ops iommu_pt_ops = {
	.mmu_map = kgsl_iommu_map,
	.mmu_unmap = kgsl_iommu_unmap,
	.mmu_destroy_pagetable = kgsl_iommu_destroy_pagetable,
	.get_ttbr0 = kgsl_iommu_get_ttbr0,
	.get_contextidr = kgsl_iommu_get_contextidr,
	.get_gpuaddr = kgsl_iommu_get_gpuaddr,
	.put_gpuaddr = kgsl_iommu_put_gpuaddr,
	.set_svm_region = kgsl_iommu_set_svm_region,
	.find_svm_region = kgsl_iommu_find_svm_region,
	.svm_range = kgsl_iommu_svm_range,
	.addr_in_range = kgsl_iommu_addr_in_range,
};
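
/*
 * Illustrative, self-contained userspace sketch of the gap-search strategy
 * used by _get_unmapped_area() and _get_unmapped_area_topdown() above. The
 * driver walks an rbtree of kgsl_iommu_addr_entry nodes; here a sorted array
 * of {base, size} ranges stands in for the tree and the bookkeeping is
 * simplified. All demo_* names are hypothetical and this is not part of the
 * driver; compile it separately.
 */
#include <stdint.h>
#include <stdio.h>

struct demo_range {		/* stand-in for struct kgsl_iommu_addr_entry */
	uint64_t base;
	uint64_t size;
};

#define DEMO_ALIGN(v, a)	(((v) + (a) - 1) & ~((uint64_t)(a) - 1))

/* Bottom-up: lowest aligned address in [bottom, top) that fits 'size' between
 * existing ranges, or (uint64_t)-1 on failure. 'used' is sorted by base, as an
 * in-order rbtree walk would produce. */
static uint64_t demo_find_bottom_up(const struct demo_range *used, int n,
		uint64_t bottom, uint64_t top, uint64_t size, uint64_t align)
{
	uint64_t start = DEMO_ALIGN(bottom, align);
	int i;

	for (i = 0; i < n; i++) {
		/* ranges straddling 'bottom' push the start point upward */
		if (used[i].base < bottom) {
			if (used[i].base + used[i].size > bottom)
				start = DEMO_ALIGN(used[i].base + used[i].size,
						align);
			continue;
		}
		if (used[i].base >= top)
			break;
		if (start < used[i].base && used[i].base - start >= size)
			return start;
		start = DEMO_ALIGN(used[i].base + used[i].size, align);
	}
	return (start + size <= top) ? start : (uint64_t)-1;
}

/* Top-down: highest aligned address that fits, mirroring how SVM regions are
 * carved from the top of the range. */
static uint64_t demo_find_top_down(const struct demo_range *used, int n,
		uint64_t bottom, uint64_t top, uint64_t size, uint64_t align)
{
	uint64_t mask = ~(align - 1);
	uint64_t end = top;
	int i;

	for (i = n - 1; i >= 0; i--) {
		uint64_t chunk;

		if (used[i].base >= top)
			continue;
		if (used[i].base + used[i].size <= bottom)
			break;
		/* try the gap between this range and the current ceiling */
		chunk = (end - size) & mask;
		if (end >= size && chunk >= used[i].base + used[i].size &&
		    chunk + size <= end)
			return chunk;
		end = used[i].base;
	}
	if (end >= size && ((end - size) & mask) >= bottom)
		return (end - size) & mask;
	return (uint64_t)-1;
}

int main(void)
{
	const struct demo_range used[] = {
		{ 0x10000, 0x4000 },	/* one mapping at 64K */
		{ 0x20000, 0x8000 },	/* another at 128K */
	};

	printf("bottom-up : 0x%llx\n",
		(unsigned long long)demo_find_bottom_up(used, 2,
			0x10000, 0x40000, 0x2000, 0x1000));
	printf("top-down  : 0x%llx\n",
		(unsigned long long)demo_find_top_down(used, 2,
			0x10000, 0x40000, 0x2000, 0x1000));
	return 0;
}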
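
/*
 * Illustrative sketch of the SCTLR bit programming done in
 * _setup_user_context() and kgsl_iommu_set_pf_policy(). The real shift values
 * come from kgsl_iommu.h; the ones below are assumed from the ARM SMMU
 * context-bank SCTLR layout (CFIE=6, CFCFG=7, HUPCF=8) and are placeholders
 * only. The helper is a pure function so the two policies can be compared
 * without touching hardware; compile separately from the driver.
 */
#include <stdbool.h>
#include <stdint.h>
#include <stdio.h>

#define DEMO_SCTLR_CFIE_SHIFT	6	/* context fault interrupt enable */
#define DEMO_SCTLR_CFCFG_SHIFT	7	/* stall (1) vs terminate (0) on fault */
#define DEMO_SCTLR_HUPCF_SHIFT	8	/* allow hits under a pending fault */

/*
 * GPUHALT enabled:  stall the faulting transaction (CFCFG=1) and block later
 *                   transactions (HUPCF=0) so a snapshot can capture the
 *                   offending state intact.
 * GPUHALT disabled: terminate the faulting transaction (CFCFG=0) and let
 *                   later transactions proceed (HUPCF=1).
 */
static uint32_t demo_apply_pf_policy(uint32_t sctlr, bool gpuhalt_enable)
{
	if (gpuhalt_enable) {
		sctlr |= (1u << DEMO_SCTLR_CFCFG_SHIFT);
		sctlr &= ~(1u << DEMO_SCTLR_HUPCF_SHIFT);
	} else {
		sctlr &= ~(1u << DEMO_SCTLR_CFCFG_SHIFT);
		sctlr |= (1u << DEMO_SCTLR_HUPCF_SHIFT);
	}
	return sctlr;
}

int main(void)
{
	uint32_t sctlr = (1u << DEMO_SCTLR_CFIE_SHIFT);	/* faults interrupt */

	printf("halt policy:      0x%x\n", demo_apply_pf_policy(sctlr, true));
	printf("terminate policy: 0x%x\n", demo_apply_pf_policy(sctlr, false));
	return 0;
}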
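
/*
 * Self-contained sketch of the neighbour search that _get_entries() runs when
 * a pagefault is reported: scan every allocation and keep the closest one
 * below and the closest one above the faulting address, so the log can show
 * what surrounds the bad access. The driver iterates an idr of kgsl_mem_entry
 * objects; a plain array of {gpuaddr, size} pairs (demo_alloc, hypothetical)
 * stands in for it here. Compile separately from the driver.
 */
#include <stdint.h>
#include <stdio.h>

struct demo_alloc {		/* stand-in for struct kgsl_mem_entry */
	uint64_t gpuaddr;
	uint64_t size;
};

/* Writes the indices of the nearest allocations below/above 'fault', or -1. */
static void demo_nearest(const struct demo_alloc *a, int n, uint64_t fault,
		int *below, int *above)
{
	uint64_t prevaddr = 0;
	uint64_t nextaddr = (uint64_t)-1;
	int i;

	*below = *above = -1;
	for (i = 0; i < n; i++) {
		if (a[i].gpuaddr < fault && a[i].gpuaddr > prevaddr) {
			prevaddr = a[i].gpuaddr;
			*below = i;
		}
		if (a[i].gpuaddr > fault && a[i].gpuaddr < nextaddr) {
			nextaddr = a[i].gpuaddr;
			*above = i;
		}
	}
}

int main(void)
{
	const struct demo_alloc allocs[] = {
		{ 0x100000, 0x1000 },
		{ 0x300000, 0x2000 },
		{ 0x500000, 0x1000 },
	};
	int below, above;

	demo_nearest(allocs, 3, 0x302800, &below, &above);
	if (below >= 0)
		printf("below: 0x%llx\n",
			(unsigned long long)allocs[below].gpuaddr);
	if (above >= 0)
		printf("above: 0x%llx\n",
			(unsigned long long)allocs[above].gpuaddr);
	return 0;
}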
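
/*
 * Sketch of the bounded TLB-flush wait in kgsl_iommu_set_pt(): kick TLBSYNC,
 * then poll the TLBSTATUS active bit until it clears or a 2-second deadline
 * expires. In the kernel the deadline comes from jiffies and the registers are
 * real MMIO; here CLOCK_MONOTONIC and two fake register helpers
 * (demo_write_tlbsync/demo_read_tlbstatus, both hypothetical, with an assumed
 * bit position) stand in so the control flow can be compiled and run on its
 * own, separately from the driver.
 */
#include <stdbool.h>
#include <stdint.h>
#include <stdio.h>
#include <time.h>

#define DEMO_TLBSTATUS_SACTIVE	(1u << 0)	/* assumed bit position */

static unsigned int fake_status = DEMO_TLBSTATUS_SACTIVE;
static int polls_left = 3;	/* pretend the flush finishes after 3 polls */

static void demo_write_tlbsync(void)
{
	/* an MMIO write to the TLBSYNC register in the real driver */
}

static unsigned int demo_read_tlbstatus(void)
{
	if (polls_left-- <= 0)
		fake_status &= ~DEMO_TLBSTATUS_SACTIVE;
	return fake_status;
}

static double demo_now(void)
{
	struct timespec ts;

	clock_gettime(CLOCK_MONOTONIC, &ts);
	return ts.tv_sec + ts.tv_nsec / 1e9;
}

/* Returns true if the flush completed, false if we gave up after 2 seconds. */
static bool demo_wait_for_tlb_flush(void)
{
	double deadline = demo_now() + 2.0;

	demo_write_tlbsync();
	while (demo_read_tlbstatus() & DEMO_TLBSTATUS_SACTIVE) {
		if (demo_now() > deadline)
			return false;	/* SMMU may be wedged; bail out */
	}
	return true;
}

int main(void)
{
	printf("flush %s\n",
		demo_wait_for_tlb_flush() ? "completed" : "timed out");
	return 0;
}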