65d4418c50
Prior to commit 092edaddb660 ("iommu: Support mm PASID 1:n with sva domains") the code allowed a SVA handle to be bound multiple times to the same (mm, device) pair. This was alluded to in the kdoc comment, but we had understood this to be more a remark about allowing multiple devices, not a literal same-driver re-opening the same SVA. It turns out uacce and idxd were both relying on the core code to handle reference counting for same-device same-mm scenarios. As this looks hard to resolve in the drivers bring it back to the core code. The new design has changed the meaning of the domain->users refcount to refer to the number of devices that are sharing that domain for the same mm. This is part of the design to lift the SVA domain de-duplication out of the drivers. Return the old behavior by explicitly de-duplicating the struct iommu_sva handle. The same (mm, device) will return the same handle pointer and the core code will handle tracking this. The last unbind of the handle will destroy it. Fixes: 092edaddb660 ("iommu: Support mm PASID 1:n with sva domains") Reported-by: Zhangfei Gao <zhangfei.gao@linaro.org> Closes: https://lore.kernel.org/all/20240221110658.529-1-zhangfei.gao@linaro.org/ Tested-by: Zhangfei Gao <zhangfei.gao@linaro.org> Signed-off-by: Jason Gunthorpe <jgg@nvidia.com> Reviewed-by: Lu Baolu <baolu.lu@linux.intel.com> Link: https://lore.kernel.org/r/0-v1-9455fc497a6f+3b4-iommu_sva_sharing_jgg@nvidia.com Signed-off-by: Joerg Roedel <jroedel@suse.de>
247 lines
6.1 KiB
C
247 lines
6.1 KiB
C
// SPDX-License-Identifier: GPL-2.0
|
|
/*
|
|
* Helpers for IOMMU drivers implementing SVA
|
|
*/
|
|
#include <linux/mmu_context.h>
|
|
#include <linux/mutex.h>
|
|
#include <linux/sched/mm.h>
|
|
#include <linux/iommu.h>
|
|
|
|
#include "iommu-sva.h"
|
|
|
|
static DEFINE_MUTEX(iommu_sva_lock);
|
|
|
|
/* Allocate a PASID for the mm within range (inclusive) */
|
|
static struct iommu_mm_data *iommu_alloc_mm_data(struct mm_struct *mm, struct device *dev)
|
|
{
|
|
struct iommu_mm_data *iommu_mm;
|
|
ioasid_t pasid;
|
|
|
|
lockdep_assert_held(&iommu_sva_lock);
|
|
|
|
if (!arch_pgtable_dma_compat(mm))
|
|
return ERR_PTR(-EBUSY);
|
|
|
|
iommu_mm = mm->iommu_mm;
|
|
/* Is a PASID already associated with this mm? */
|
|
if (iommu_mm) {
|
|
if (iommu_mm->pasid >= dev->iommu->max_pasids)
|
|
return ERR_PTR(-EOVERFLOW);
|
|
return iommu_mm;
|
|
}
|
|
|
|
iommu_mm = kzalloc(sizeof(struct iommu_mm_data), GFP_KERNEL);
|
|
if (!iommu_mm)
|
|
return ERR_PTR(-ENOMEM);
|
|
|
|
pasid = iommu_alloc_global_pasid(dev);
|
|
if (pasid == IOMMU_PASID_INVALID) {
|
|
kfree(iommu_mm);
|
|
return ERR_PTR(-ENOSPC);
|
|
}
|
|
iommu_mm->pasid = pasid;
|
|
INIT_LIST_HEAD(&iommu_mm->sva_domains);
|
|
INIT_LIST_HEAD(&iommu_mm->sva_handles);
|
|
/*
|
|
* Make sure the write to mm->iommu_mm is not reordered in front of
|
|
* initialization to iommu_mm fields. If it does, readers may see a
|
|
* valid iommu_mm with uninitialized values.
|
|
*/
|
|
smp_store_release(&mm->iommu_mm, iommu_mm);
|
|
return iommu_mm;
|
|
}
|
|
|
|
/**
|
|
* iommu_sva_bind_device() - Bind a process address space to a device
|
|
* @dev: the device
|
|
* @mm: the mm to bind, caller must hold a reference to mm_users
|
|
*
|
|
* Create a bond between device and address space, allowing the device to
|
|
* access the mm using the PASID returned by iommu_sva_get_pasid(). If a
|
|
* bond already exists between @device and @mm, an additional internal
|
|
* reference is taken. Caller must call iommu_sva_unbind_device()
|
|
* to release each reference.
|
|
*
|
|
* iommu_dev_enable_feature(dev, IOMMU_DEV_FEAT_SVA) must be called first, to
|
|
* initialize the required SVA features.
|
|
*
|
|
* On error, returns an ERR_PTR value.
|
|
*/
|
|
struct iommu_sva *iommu_sva_bind_device(struct device *dev, struct mm_struct *mm)
|
|
{
|
|
struct iommu_mm_data *iommu_mm;
|
|
struct iommu_domain *domain;
|
|
struct iommu_sva *handle;
|
|
int ret;
|
|
|
|
mutex_lock(&iommu_sva_lock);
|
|
|
|
/* Allocate mm->pasid if necessary. */
|
|
iommu_mm = iommu_alloc_mm_data(mm, dev);
|
|
if (IS_ERR(iommu_mm)) {
|
|
ret = PTR_ERR(iommu_mm);
|
|
goto out_unlock;
|
|
}
|
|
|
|
list_for_each_entry(handle, &mm->iommu_mm->sva_handles, handle_item) {
|
|
if (handle->dev == dev) {
|
|
refcount_inc(&handle->users);
|
|
mutex_unlock(&iommu_sva_lock);
|
|
return handle;
|
|
}
|
|
}
|
|
|
|
handle = kzalloc(sizeof(*handle), GFP_KERNEL);
|
|
if (!handle) {
|
|
ret = -ENOMEM;
|
|
goto out_unlock;
|
|
}
|
|
|
|
/* Search for an existing domain. */
|
|
list_for_each_entry(domain, &mm->iommu_mm->sva_domains, next) {
|
|
ret = iommu_attach_device_pasid(domain, dev, iommu_mm->pasid);
|
|
if (!ret) {
|
|
domain->users++;
|
|
goto out;
|
|
}
|
|
}
|
|
|
|
/* Allocate a new domain and set it on device pasid. */
|
|
domain = iommu_sva_domain_alloc(dev, mm);
|
|
if (!domain) {
|
|
ret = -ENOMEM;
|
|
goto out_free_handle;
|
|
}
|
|
|
|
ret = iommu_attach_device_pasid(domain, dev, iommu_mm->pasid);
|
|
if (ret)
|
|
goto out_free_domain;
|
|
domain->users = 1;
|
|
refcount_set(&handle->users, 1);
|
|
list_add(&domain->next, &mm->iommu_mm->sva_domains);
|
|
list_add(&handle->handle_item, &mm->iommu_mm->sva_handles);
|
|
|
|
out:
|
|
mutex_unlock(&iommu_sva_lock);
|
|
handle->dev = dev;
|
|
handle->domain = domain;
|
|
return handle;
|
|
|
|
out_free_domain:
|
|
iommu_domain_free(domain);
|
|
out_free_handle:
|
|
kfree(handle);
|
|
out_unlock:
|
|
mutex_unlock(&iommu_sva_lock);
|
|
return ERR_PTR(ret);
|
|
}
|
|
EXPORT_SYMBOL_GPL(iommu_sva_bind_device);
|
|
|
|
/**
|
|
* iommu_sva_unbind_device() - Remove a bond created with iommu_sva_bind_device
|
|
* @handle: the handle returned by iommu_sva_bind_device()
|
|
*
|
|
* Put reference to a bond between device and address space. The device should
|
|
* not be issuing any more transaction for this PASID. All outstanding page
|
|
* requests for this PASID must have been flushed to the IOMMU.
|
|
*/
|
|
void iommu_sva_unbind_device(struct iommu_sva *handle)
|
|
{
|
|
struct iommu_domain *domain = handle->domain;
|
|
struct iommu_mm_data *iommu_mm = domain->mm->iommu_mm;
|
|
struct device *dev = handle->dev;
|
|
|
|
mutex_lock(&iommu_sva_lock);
|
|
if (!refcount_dec_and_test(&handle->users)) {
|
|
mutex_unlock(&iommu_sva_lock);
|
|
return;
|
|
}
|
|
list_del(&handle->handle_item);
|
|
|
|
iommu_detach_device_pasid(domain, dev, iommu_mm->pasid);
|
|
if (--domain->users == 0) {
|
|
list_del(&domain->next);
|
|
iommu_domain_free(domain);
|
|
}
|
|
mutex_unlock(&iommu_sva_lock);
|
|
kfree(handle);
|
|
}
|
|
EXPORT_SYMBOL_GPL(iommu_sva_unbind_device);
|
|
|
|
u32 iommu_sva_get_pasid(struct iommu_sva *handle)
|
|
{
|
|
struct iommu_domain *domain = handle->domain;
|
|
|
|
return mm_get_enqcmd_pasid(domain->mm);
|
|
}
|
|
EXPORT_SYMBOL_GPL(iommu_sva_get_pasid);
|
|
|
|
/*
|
|
* I/O page fault handler for SVA
|
|
*/
|
|
enum iommu_page_response_code
|
|
iommu_sva_handle_iopf(struct iommu_fault *fault, void *data)
|
|
{
|
|
vm_fault_t ret;
|
|
struct vm_area_struct *vma;
|
|
struct mm_struct *mm = data;
|
|
unsigned int access_flags = 0;
|
|
unsigned int fault_flags = FAULT_FLAG_REMOTE;
|
|
struct iommu_fault_page_request *prm = &fault->prm;
|
|
enum iommu_page_response_code status = IOMMU_PAGE_RESP_INVALID;
|
|
|
|
if (!(prm->flags & IOMMU_FAULT_PAGE_REQUEST_PASID_VALID))
|
|
return status;
|
|
|
|
if (!mmget_not_zero(mm))
|
|
return status;
|
|
|
|
mmap_read_lock(mm);
|
|
|
|
vma = vma_lookup(mm, prm->addr);
|
|
if (!vma)
|
|
/* Unmapped area */
|
|
goto out_put_mm;
|
|
|
|
if (prm->perm & IOMMU_FAULT_PERM_READ)
|
|
access_flags |= VM_READ;
|
|
|
|
if (prm->perm & IOMMU_FAULT_PERM_WRITE) {
|
|
access_flags |= VM_WRITE;
|
|
fault_flags |= FAULT_FLAG_WRITE;
|
|
}
|
|
|
|
if (prm->perm & IOMMU_FAULT_PERM_EXEC) {
|
|
access_flags |= VM_EXEC;
|
|
fault_flags |= FAULT_FLAG_INSTRUCTION;
|
|
}
|
|
|
|
if (!(prm->perm & IOMMU_FAULT_PERM_PRIV))
|
|
fault_flags |= FAULT_FLAG_USER;
|
|
|
|
if (access_flags & ~vma->vm_flags)
|
|
/* Access fault */
|
|
goto out_put_mm;
|
|
|
|
ret = handle_mm_fault(vma, prm->addr, fault_flags, NULL);
|
|
status = ret & VM_FAULT_ERROR ? IOMMU_PAGE_RESP_INVALID :
|
|
IOMMU_PAGE_RESP_SUCCESS;
|
|
|
|
out_put_mm:
|
|
mmap_read_unlock(mm);
|
|
mmput(mm);
|
|
|
|
return status;
|
|
}
|
|
|
|
void mm_pasid_drop(struct mm_struct *mm)
|
|
{
|
|
struct iommu_mm_data *iommu_mm = mm->iommu_mm;
|
|
|
|
if (!iommu_mm)
|
|
return;
|
|
|
|
iommu_free_global_pasid(iommu_mm->pasid);
|
|
kfree(iommu_mm);
|
|
}
|