badc28d492
The debugfs_remove_recursive() is invoked by unregister_shrinker(), which is holding the write lock of shrinker_rwsem. It will waits for the handler of debugfs file complete. The handler also needs to hold the read lock of shrinker_rwsem to do something. So it may cause the following deadlock: CPU0 CPU1 debugfs_file_get() shrinker_debugfs_count_show()/shrinker_debugfs_scan_write() unregister_shrinker() --> down_write(&shrinker_rwsem); debugfs_remove_recursive() // wait for (A) --> wait_for_completion(); // wait for (B) --> down_read_killable(&shrinker_rwsem) debugfs_file_put() -- (A) up_write() -- (B) The down_read_killable() can be killed, so that the above deadlock can be recovered. But it still requires an extra kill action, otherwise it will block all subsequent shrinker-related operations, so it's better to fix it. [akpm@linux-foundation.org: fix CONFIG_SHRINKER_DEBUG=n stub] Link: https://lkml.kernel.org/r/20230202105612.64641-1-zhengqi.arch@bytedance.com Fixes: 5035ebc644ae ("mm: shrinkers: introduce debugfs interface for memory shrinkers") Signed-off-by: Qi Zheng <zhengqi.arch@bytedance.com> Reviewed-by: Roman Gushchin <roman.gushchin@linux.dev> Cc: Kent Overstreet <kent.overstreet@gmail.com> Cc: Muchun Song <songmuchun@bytedance.com> Cc: <stable@vger.kernel.org> Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
290 lines
6.2 KiB
C
290 lines
6.2 KiB
C
// SPDX-License-Identifier: GPL-2.0
|
|
#include <linux/idr.h>
|
|
#include <linux/slab.h>
|
|
#include <linux/debugfs.h>
|
|
#include <linux/seq_file.h>
|
|
#include <linux/shrinker.h>
|
|
#include <linux/memcontrol.h>
|
|
|
|
/* defined in vmscan.c */
|
|
extern struct rw_semaphore shrinker_rwsem;
|
|
extern struct list_head shrinker_list;
|
|
|
|
static DEFINE_IDA(shrinker_debugfs_ida);
|
|
static struct dentry *shrinker_debugfs_root;
|
|
|
|
static unsigned long shrinker_count_objects(struct shrinker *shrinker,
|
|
struct mem_cgroup *memcg,
|
|
unsigned long *count_per_node)
|
|
{
|
|
unsigned long nr, total = 0;
|
|
int nid;
|
|
|
|
for_each_node(nid) {
|
|
if (nid == 0 || (shrinker->flags & SHRINKER_NUMA_AWARE)) {
|
|
struct shrink_control sc = {
|
|
.gfp_mask = GFP_KERNEL,
|
|
.nid = nid,
|
|
.memcg = memcg,
|
|
};
|
|
|
|
nr = shrinker->count_objects(shrinker, &sc);
|
|
if (nr == SHRINK_EMPTY)
|
|
nr = 0;
|
|
} else {
|
|
nr = 0;
|
|
}
|
|
|
|
count_per_node[nid] = nr;
|
|
total += nr;
|
|
}
|
|
|
|
return total;
|
|
}
|
|
|
|
static int shrinker_debugfs_count_show(struct seq_file *m, void *v)
|
|
{
|
|
struct shrinker *shrinker = m->private;
|
|
unsigned long *count_per_node;
|
|
struct mem_cgroup *memcg;
|
|
unsigned long total;
|
|
bool memcg_aware;
|
|
int ret, nid;
|
|
|
|
count_per_node = kcalloc(nr_node_ids, sizeof(unsigned long), GFP_KERNEL);
|
|
if (!count_per_node)
|
|
return -ENOMEM;
|
|
|
|
ret = down_read_killable(&shrinker_rwsem);
|
|
if (ret) {
|
|
kfree(count_per_node);
|
|
return ret;
|
|
}
|
|
rcu_read_lock();
|
|
|
|
memcg_aware = shrinker->flags & SHRINKER_MEMCG_AWARE;
|
|
|
|
memcg = mem_cgroup_iter(NULL, NULL, NULL);
|
|
do {
|
|
if (memcg && !mem_cgroup_online(memcg))
|
|
continue;
|
|
|
|
total = shrinker_count_objects(shrinker,
|
|
memcg_aware ? memcg : NULL,
|
|
count_per_node);
|
|
if (total) {
|
|
seq_printf(m, "%lu", mem_cgroup_ino(memcg));
|
|
for_each_node(nid)
|
|
seq_printf(m, " %lu", count_per_node[nid]);
|
|
seq_putc(m, '\n');
|
|
}
|
|
|
|
if (!memcg_aware) {
|
|
mem_cgroup_iter_break(NULL, memcg);
|
|
break;
|
|
}
|
|
|
|
if (signal_pending(current)) {
|
|
mem_cgroup_iter_break(NULL, memcg);
|
|
ret = -EINTR;
|
|
break;
|
|
}
|
|
} while ((memcg = mem_cgroup_iter(NULL, memcg, NULL)) != NULL);
|
|
|
|
rcu_read_unlock();
|
|
up_read(&shrinker_rwsem);
|
|
|
|
kfree(count_per_node);
|
|
return ret;
|
|
}
|
|
DEFINE_SHOW_ATTRIBUTE(shrinker_debugfs_count);
|
|
|
|
static int shrinker_debugfs_scan_open(struct inode *inode, struct file *file)
|
|
{
|
|
file->private_data = inode->i_private;
|
|
return nonseekable_open(inode, file);
|
|
}
|
|
|
|
static ssize_t shrinker_debugfs_scan_write(struct file *file,
|
|
const char __user *buf,
|
|
size_t size, loff_t *pos)
|
|
{
|
|
struct shrinker *shrinker = file->private_data;
|
|
unsigned long nr_to_scan = 0, ino, read_len;
|
|
struct shrink_control sc = {
|
|
.gfp_mask = GFP_KERNEL,
|
|
};
|
|
struct mem_cgroup *memcg = NULL;
|
|
int nid;
|
|
char kbuf[72];
|
|
ssize_t ret;
|
|
|
|
read_len = size < (sizeof(kbuf) - 1) ? size : (sizeof(kbuf) - 1);
|
|
if (copy_from_user(kbuf, buf, read_len))
|
|
return -EFAULT;
|
|
kbuf[read_len] = '\0';
|
|
|
|
if (sscanf(kbuf, "%lu %d %lu", &ino, &nid, &nr_to_scan) != 3)
|
|
return -EINVAL;
|
|
|
|
if (nid < 0 || nid >= nr_node_ids)
|
|
return -EINVAL;
|
|
|
|
if (nr_to_scan == 0)
|
|
return size;
|
|
|
|
if (shrinker->flags & SHRINKER_MEMCG_AWARE) {
|
|
memcg = mem_cgroup_get_from_ino(ino);
|
|
if (!memcg || IS_ERR(memcg))
|
|
return -ENOENT;
|
|
|
|
if (!mem_cgroup_online(memcg)) {
|
|
mem_cgroup_put(memcg);
|
|
return -ENOENT;
|
|
}
|
|
} else if (ino != 0) {
|
|
return -EINVAL;
|
|
}
|
|
|
|
ret = down_read_killable(&shrinker_rwsem);
|
|
if (ret) {
|
|
mem_cgroup_put(memcg);
|
|
return ret;
|
|
}
|
|
|
|
sc.nid = nid;
|
|
sc.memcg = memcg;
|
|
sc.nr_to_scan = nr_to_scan;
|
|
sc.nr_scanned = nr_to_scan;
|
|
|
|
shrinker->scan_objects(shrinker, &sc);
|
|
|
|
up_read(&shrinker_rwsem);
|
|
mem_cgroup_put(memcg);
|
|
|
|
return size;
|
|
}
|
|
|
|
static const struct file_operations shrinker_debugfs_scan_fops = {
|
|
.owner = THIS_MODULE,
|
|
.open = shrinker_debugfs_scan_open,
|
|
.write = shrinker_debugfs_scan_write,
|
|
};
|
|
|
|
int shrinker_debugfs_add(struct shrinker *shrinker)
|
|
{
|
|
struct dentry *entry;
|
|
char buf[128];
|
|
int id;
|
|
|
|
lockdep_assert_held(&shrinker_rwsem);
|
|
|
|
/* debugfs isn't initialized yet, add debugfs entries later. */
|
|
if (!shrinker_debugfs_root)
|
|
return 0;
|
|
|
|
id = ida_alloc(&shrinker_debugfs_ida, GFP_KERNEL);
|
|
if (id < 0)
|
|
return id;
|
|
shrinker->debugfs_id = id;
|
|
|
|
snprintf(buf, sizeof(buf), "%s-%d", shrinker->name, id);
|
|
|
|
/* create debugfs entry */
|
|
entry = debugfs_create_dir(buf, shrinker_debugfs_root);
|
|
if (IS_ERR(entry)) {
|
|
ida_free(&shrinker_debugfs_ida, id);
|
|
return PTR_ERR(entry);
|
|
}
|
|
shrinker->debugfs_entry = entry;
|
|
|
|
debugfs_create_file("count", 0220, entry, shrinker,
|
|
&shrinker_debugfs_count_fops);
|
|
debugfs_create_file("scan", 0440, entry, shrinker,
|
|
&shrinker_debugfs_scan_fops);
|
|
return 0;
|
|
}
|
|
|
|
int shrinker_debugfs_rename(struct shrinker *shrinker, const char *fmt, ...)
|
|
{
|
|
struct dentry *entry;
|
|
char buf[128];
|
|
const char *new, *old;
|
|
va_list ap;
|
|
int ret = 0;
|
|
|
|
va_start(ap, fmt);
|
|
new = kvasprintf_const(GFP_KERNEL, fmt, ap);
|
|
va_end(ap);
|
|
|
|
if (!new)
|
|
return -ENOMEM;
|
|
|
|
down_write(&shrinker_rwsem);
|
|
|
|
old = shrinker->name;
|
|
shrinker->name = new;
|
|
|
|
if (shrinker->debugfs_entry) {
|
|
snprintf(buf, sizeof(buf), "%s-%d", shrinker->name,
|
|
shrinker->debugfs_id);
|
|
|
|
entry = debugfs_rename(shrinker_debugfs_root,
|
|
shrinker->debugfs_entry,
|
|
shrinker_debugfs_root, buf);
|
|
if (IS_ERR(entry))
|
|
ret = PTR_ERR(entry);
|
|
else
|
|
shrinker->debugfs_entry = entry;
|
|
}
|
|
|
|
up_write(&shrinker_rwsem);
|
|
|
|
kfree_const(old);
|
|
|
|
return ret;
|
|
}
|
|
EXPORT_SYMBOL(shrinker_debugfs_rename);
|
|
|
|
struct dentry *shrinker_debugfs_remove(struct shrinker *shrinker)
|
|
{
|
|
struct dentry *entry = shrinker->debugfs_entry;
|
|
|
|
lockdep_assert_held(&shrinker_rwsem);
|
|
|
|
kfree_const(shrinker->name);
|
|
shrinker->name = NULL;
|
|
|
|
if (entry) {
|
|
ida_free(&shrinker_debugfs_ida, shrinker->debugfs_id);
|
|
shrinker->debugfs_entry = NULL;
|
|
}
|
|
|
|
return entry;
|
|
}
|
|
|
|
static int __init shrinker_debugfs_init(void)
|
|
{
|
|
struct shrinker *shrinker;
|
|
struct dentry *dentry;
|
|
int ret = 0;
|
|
|
|
dentry = debugfs_create_dir("shrinker", NULL);
|
|
if (IS_ERR(dentry))
|
|
return PTR_ERR(dentry);
|
|
shrinker_debugfs_root = dentry;
|
|
|
|
/* Create debugfs entries for shrinkers registered at boot */
|
|
down_write(&shrinker_rwsem);
|
|
list_for_each_entry(shrinker, &shrinker_list, list)
|
|
if (!shrinker->debugfs_entry) {
|
|
ret = shrinker_debugfs_add(shrinker);
|
|
if (ret)
|
|
break;
|
|
}
|
|
up_write(&shrinker_rwsem);
|
|
|
|
return ret;
|
|
}
|
|
late_initcall(shrinker_debugfs_init);
|