a0d198f79a
Fix arithmetic and logic errors in hfi1_can_pin_pages() that would allow hfi1 to attempt pinning pages in cases where it should not because of resource limits or lack of required capability. Fixes: 2c97ce4f3c29 ("IB/hfi1: Add pin query function") Link: https://lore.kernel.org/r/167656658362.2223096.10954762619837718026.stgit@awfm-02.cornelisnetworks.com Signed-off-by: Brendan Cunningham <bcunningham@cornelisnetworks.com> Signed-off-by: Patrick Kelsey <pat.kelsey@cornelisnetworks.com> Signed-off-by: Dennis Dalessandro <dennis.dalessandro@cornelisnetworks.com> Signed-off-by: Jason Gunthorpe <jgg@nvidia.com>
104 lines
3.1 KiB
C
104 lines
3.1 KiB
C
// SPDX-License-Identifier: GPL-2.0 or BSD-3-Clause
|
|
/*
|
|
* Copyright(c) 2015-2017 Intel Corporation.
|
|
*/
|
|
|
|
#include <linux/mm.h>
|
|
#include <linux/sched/signal.h>
|
|
#include <linux/device.h>
|
|
#include <linux/module.h>
|
|
|
|
#include "hfi.h"
|
|
|
|
static unsigned long cache_size = 256;
|
|
module_param(cache_size, ulong, S_IRUGO | S_IWUSR);
|
|
MODULE_PARM_DESC(cache_size, "Send and receive side cache size limit (in MB)");
|
|
|
|
/*
|
|
* Determine whether the caller can pin pages.
|
|
*
|
|
* This function should be used in the implementation of buffer caches.
|
|
* The cache implementation should call this function prior to attempting
|
|
* to pin buffer pages in order to determine whether they should do so.
|
|
* The function computes cache limits based on the configured ulimit and
|
|
* cache size. Use of this function is especially important for caches
|
|
* which are not limited in any other way (e.g. by HW resources) and, thus,
|
|
* could keeping caching buffers.
|
|
*
|
|
*/
|
|
bool hfi1_can_pin_pages(struct hfi1_devdata *dd, struct mm_struct *mm,
|
|
u32 nlocked, u32 npages)
|
|
{
|
|
unsigned long ulimit_pages;
|
|
unsigned long cache_limit_pages;
|
|
unsigned int usr_ctxts;
|
|
|
|
/*
|
|
* Perform RLIMIT_MEMLOCK based checks unless CAP_IPC_LOCK is present.
|
|
*/
|
|
if (!capable(CAP_IPC_LOCK)) {
|
|
ulimit_pages =
|
|
DIV_ROUND_DOWN_ULL(rlimit(RLIMIT_MEMLOCK), PAGE_SIZE);
|
|
|
|
/*
|
|
* Pinning these pages would exceed this process's locked memory
|
|
* limit.
|
|
*/
|
|
if (atomic64_read(&mm->pinned_vm) + npages > ulimit_pages)
|
|
return false;
|
|
|
|
/*
|
|
* Only allow 1/4 of the user's RLIMIT_MEMLOCK to be used for HFI
|
|
* caches. This fraction is then equally distributed among all
|
|
* existing user contexts. Note that if RLIMIT_MEMLOCK is
|
|
* 'unlimited' (-1), the value of this limit will be > 2^42 pages
|
|
* (2^64 / 2^12 / 2^8 / 2^2).
|
|
*
|
|
* The effectiveness of this check may be reduced if I/O occurs on
|
|
* some user contexts before all user contexts are created. This
|
|
* check assumes that this process is the only one using this
|
|
* context (e.g., the corresponding fd was not passed to another
|
|
* process for concurrent access) as there is no per-context,
|
|
* per-process tracking of pinned pages. It also assumes that each
|
|
* user context has only one cache to limit.
|
|
*/
|
|
usr_ctxts = dd->num_rcv_contexts - dd->first_dyn_alloc_ctxt;
|
|
if (nlocked + npages > (ulimit_pages / usr_ctxts / 4))
|
|
return false;
|
|
}
|
|
|
|
/*
|
|
* Pinning these pages would exceed the size limit for this cache.
|
|
*/
|
|
cache_limit_pages = cache_size * (1024 * 1024) / PAGE_SIZE;
|
|
if (nlocked + npages > cache_limit_pages)
|
|
return false;
|
|
|
|
return true;
|
|
}
|
|
|
|
int hfi1_acquire_user_pages(struct mm_struct *mm, unsigned long vaddr, size_t npages,
|
|
bool writable, struct page **pages)
|
|
{
|
|
int ret;
|
|
unsigned int gup_flags = FOLL_LONGTERM | (writable ? FOLL_WRITE : 0);
|
|
|
|
ret = pin_user_pages_fast(vaddr, npages, gup_flags, pages);
|
|
if (ret < 0)
|
|
return ret;
|
|
|
|
atomic64_add(ret, &mm->pinned_vm);
|
|
|
|
return ret;
|
|
}
|
|
|
|
void hfi1_release_user_pages(struct mm_struct *mm, struct page **p,
|
|
size_t npages, bool dirty)
|
|
{
|
|
unpin_user_pages_dirty_lock(p, npages, dirty);
|
|
|
|
if (mm) { /* during close after signal, mm can be NULL */
|
|
atomic64_sub(npages, &mm->pinned_vm);
|
|
}
|
|
}
|