mirror of
git://sourceware.org/git/lvm2.git
synced 2024-12-22 17:35:59 +03:00
c631be7684
Read the complete content of /proc/self/maps into one buffer, without reallocation in the middle of reading, before doing any mlock/munlock operation on these lines - as some of them get changed. With the previous implementation we read some mappings twice ([stack]).
411 lines
10 KiB
C
411 lines
10 KiB
C
/*
|
|
* Copyright (C) 2003-2004 Sistina Software, Inc. All rights reserved.
|
|
* Copyright (C) 2004-2006 Red Hat, Inc. All rights reserved.
|
|
*
|
|
* This file is part of LVM2.
|
|
*
|
|
* This copyrighted material is made available to anyone wishing to use,
|
|
* modify, copy, or redistribute it subject to the terms and conditions
|
|
* of the GNU Lesser General Public License v.2.1.
|
|
*
|
|
* You should have received a copy of the GNU Lesser General Public License
|
|
* along with this program; if not, write to the Free Software Foundation,
|
|
* Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
|
|
*/
|
|
|
|
#include "lib.h"
|
|
#include "memlock.h"
|
|
#include "defaults.h"
|
|
#include "config.h"
|
|
#include "toolcontext.h"
|
|
|
|
#include <limits.h>
|
|
#include <fcntl.h>
|
|
#include <unistd.h>
|
|
#include <sys/mman.h>
|
|
#include <sys/time.h>
|
|
#include <sys/resource.h>
|
|
|
|
#ifndef DEVMAPPER_SUPPORT
|
|
|
|
/* Built without DEVMAPPER_SUPPORT: taking a memory lock is a no-op. */
void memlock_inc(struct cmd_context *cmd)
{
}
|
|
/* Built without DEVMAPPER_SUPPORT: dropping a memory lock is a no-op. */
void memlock_dec(struct cmd_context *cmd)
{
}
|
|
/* Built without DEVMAPPER_SUPPORT: memory is never reported as locked. */
int memlock(void)
{
	const int lock_count = 0;

	return lock_count;
}
|
|
/* Built without DEVMAPPER_SUPPORT: there is no locking state to set up. */
void memlock_init(struct cmd_context *cmd)
{
}
|
|
|
|
#else /* DEVMAPPER_SUPPORT */
|
|
|
|
/* Sizes (in bytes) of the areas touched by _allocate_memory() */
static size_t _size_stack;		/* set by memlock_init() */
static size_t _size_malloc_tmp;		/* set by memlock_init() */
static size_t _size_malloc = 2000000;

/* Heap block obtained in _allocate_memory(), freed in _release_memory() */
static void *_malloc_mem = NULL;

/* Lock reference counters: regular users and daemon users */
static int _memlock_count = 0;
static int _memlock_count_daemon = 0;

/* Priority saved while locked, and priority applied while locked */
static int _priority;
static int _default_priority;
|
|
|
|
/* Maps that are unconditionally ignored, whatever filter is configured */
static const char * const _ignore_maps[] = {
	"[vdso]",
	"[vsyscall]",
};
|
|
|
|
/*
 * Built-in blacklist of maps, used by _maps_line() only when no
 * activation/mlock_filter is configured.
 */
static const char * const _blacklist_maps[] = {
	"locale/locale-archive",
	"gconv/gconv-modules.cache",
	"/libreadline.so.",	/* not using readline during mlock */
	"/libncurses.so.",	/* not using ncurses during mlock */
	"/libdl-",		/* not using dlopen,dlsym during mlock */
	/* "/libdevmapper-event.so" */
};
|
|
|
|
/* Direction of a pass over the process maps */
typedef enum {
	LVM_MLOCK,
	LVM_MUNLOCK
} lvmlock_t;

/* Non-zero when mlockall()/munlockall() is used instead of per-map locking */
static unsigned _use_mlockall;

/* State for reading the maps file */
static int _maps_fd;
static size_t _maps_len = 8192;	/* Initial buffer size for reading /proc/self/maps */
static char *_maps_buffer;
static char _procselfmaps[PATH_MAX] = "";
#define SELF_MAPS "/self/maps"

static size_t _mstats;	/* statistic for maps locking */
|
|
|
|
/*
 * Write the value 1 into one long-sized slot at the start of every page-sized
 * step of the region [mem, mem + size).
 *
 * A slot is written only while at least sizeof(long) + 1 bytes remain from its
 * start to the end of the region, so regions of sizeof(long) bytes or fewer
 * are left untouched.  The region's previous content at those slots is
 * overwritten, so this is only suitable for freshly obtained memory.
 *
 * mem  - start of the region; NULL is ignored
 * size - length of the region in bytes
 */
static void _touch_memory(void *mem, size_t size)
{
	size_t pagesize = lvm_getpagesize();
	char *base = mem;
	size_t off;

	/* A zero step would never advance; nothing sensible can be touched */
	if (!base || !pagesize)
		return;

	/*
	 * Walk by offset rather than by pointer so that no pointer outside
	 * the region is ever formed, even when size < sizeof(long).
	 */
	for (off = 0; size > sizeof(long) && off < size - sizeof(long);
	     off += pagesize)
		*(long *) (base + off) = 1;
}
|
|
|
|
static void _allocate_memory(void)
|
|
{
|
|
void *stack_mem, *temp_malloc_mem;
|
|
|
|
if ((stack_mem = alloca(_size_stack)))
|
|
_touch_memory(stack_mem, _size_stack);
|
|
|
|
if ((temp_malloc_mem = malloc(_size_malloc_tmp)))
|
|
_touch_memory(temp_malloc_mem, _size_malloc_tmp);
|
|
|
|
if ((_malloc_mem = malloc(_size_malloc)))
|
|
_touch_memory(_malloc_mem, _size_malloc);
|
|
|
|
free(temp_malloc_mem);
|
|
}
|
|
|
|
static void _release_memory(void)
|
|
{
|
|
free(_malloc_mem);
|
|
}
|
|
|
|
/*
|
|
* mlock/munlock memory areas from /proc/self/maps
|
|
* format described in kernel/Documentation/filesystem/proc.txt
|
|
*/
|
|
static int _maps_line(struct cmd_context *cmd, lvmlock_t lock,
|
|
const char* line, size_t* mstats)
|
|
{
|
|
const struct config_node *cn;
|
|
struct config_value *cv;
|
|
long from, to;
|
|
int pos, i;
|
|
char fr, fw, fx, fp;
|
|
size_t sz;
|
|
|
|
if (sscanf(line, "%lx-%lx %c%c%c%c%n",
|
|
&from, &to, &fr, &fw, &fx, &fp, &pos) != 6) {
|
|
log_error("Failed to parse maps line: %s", line);
|
|
return 0;
|
|
}
|
|
|
|
/* Select readable maps */
|
|
if (fr != 'r') {
|
|
log_debug("%s area unreadable %s : Skipping.",
|
|
(lock == LVM_MLOCK) ? "mlock" : "munlock", line);
|
|
return 1;
|
|
}
|
|
|
|
/* always ignored areas */
|
|
for (i = 0; i < sizeof(_ignore_maps) / sizeof(_ignore_maps[0]); ++i)
|
|
if (strstr(line + pos, _ignore_maps[i])) {
|
|
log_debug("mlock ignore filter '%s' matches '%s': Skipping.",
|
|
_ignore_maps[i], line);
|
|
return 1;
|
|
}
|
|
|
|
sz = to - from;
|
|
if (!(cn = find_config_tree_node(cmd, "activation/mlock_filter"))) {
|
|
/* If no blacklist configured, use an internal set */
|
|
for (i = 0; i < sizeof(_blacklist_maps) / sizeof(_blacklist_maps[0]); ++i)
|
|
if (strstr(line + pos, _blacklist_maps[i])) {
|
|
log_debug("mlock default filter '%s' matches '%s': Skipping.",
|
|
_blacklist_maps[i], line);
|
|
return 1;
|
|
}
|
|
} else {
|
|
for (cv = cn->v; cv; cv = cv->next) {
|
|
if ((cv->type != CFG_STRING) || !cv->v.str[0])
|
|
continue;
|
|
if (strstr(line + pos, cv->v.str)) {
|
|
log_debug("mlock_filter '%s' matches '%s': Skipping.",
|
|
cv->v.str, line);
|
|
return 1;
|
|
}
|
|
}
|
|
}
|
|
|
|
*mstats += sz;
|
|
log_debug("%s %10ldKiB %12lx - %12lx %c%c%c%c%s",
|
|
(lock == LVM_MLOCK) ? "mlock" : "munlock",
|
|
((long)sz + 1023) / 1024, from, to, fr, fw, fx, fp, line + pos);
|
|
|
|
if (lock == LVM_MLOCK) {
|
|
if (mlock((const void*)from, sz) < 0) {
|
|
log_sys_error("mlock", line);
|
|
return 0;
|
|
}
|
|
} else {
|
|
if (munlock((const void*)from, sz) < 0) {
|
|
log_sys_error("munlock", line);
|
|
return 0;
|
|
}
|
|
}
|
|
|
|
return 1;
|
|
}
|
|
|
|
/*
 * Lock or unlock the process memory.
 *
 * With _use_mlockall set this is a single mlockall()/munlockall() call
 * (and fails if MCL_CURRENT is not available); *mstats is not touched
 * in that case.
 *
 * Otherwise the whole maps file behind _maps_fd is read into _maps_buffer
 * in one pass - the buffer is grown and the file re-read from the start
 * until it fits, so no reallocation happens in the middle of reading - and
 * each newline-terminated line is handed to _maps_line().
 *
 * cmd    - command context passed through to _maps_line()
 * lock   - LVM_MLOCK or LVM_MUNLOCK
 * mstats - reset to 0, then accumulates the bytes processed
 *
 * Returns 1 on success, 0 if anything failed.  A failing line does not
 * stop processing of the remaining lines.
 */
static int _memlock_maps(struct cmd_context *cmd, lvmlock_t lock, size_t *mstats)
{
	char *line, *line_end;
	char *new_buffer;
	size_t len, new_len;
	ssize_t n;
	int ret = 1;

	if (_use_mlockall) {
#ifdef MCL_CURRENT
		if (lock == LVM_MLOCK) {
			if (mlockall(MCL_CURRENT | MCL_FUTURE)) {
				log_sys_error("mlockall", "");
				return 0;
			}
		} else {
			if (munlockall()) {
				log_sys_error("munlockall", "");
				return 0;
			}
		}
		return 1;
#else
		return 0;
#endif
	}

	/* Force libc.mo load */
	if (lock == LVM_MLOCK)
		(void)strerror(0);
	/* Reset statistic counters */
	*mstats = 0;

	/* read mapping into a single memory chunk without reallocation
	 * in the middle of reading maps file */
	for (len = 0;;) {
		if (!_maps_buffer || len >= _maps_len) {
			/*
			 * Commit the new pointer and size only on success, so
			 * that a failed realloc neither leaks the old buffer
			 * nor leaves _maps_len larger than the allocation.
			 */
			new_len = _maps_buffer ? _maps_len * 2 : _maps_len;
			if (!(new_buffer = dm_realloc(_maps_buffer, new_len))) {
				log_error("Allocation of maps buffer failed");
				return 0;
			}
			_maps_buffer = new_buffer;
			_maps_len = new_len;
		}
		if (lseek(_maps_fd, 0, SEEK_SET) == (off_t) -1) {
			log_sys_error("lseek", _procselfmaps);
			return 0;
		}
		for (len = 0 ; len < _maps_len; len += n) {
			if (!(n = read(_maps_fd, _maps_buffer + len, _maps_len - len))) {
				_maps_buffer[len] = '\0';
				break; /* EOF */
			}
			if (n == -1)
				return_0;
		}
		/* A completely full buffer has no room for the terminator */
		if (len < _maps_len)  /* fits in buffer */
			break;
	}

	line = _maps_buffer;

	while ((line_end = strchr(line, '\n'))) {
		*line_end = '\0'; /* remove \n */
		if (!_maps_line(cmd, lock, line, mstats))
			ret = 0;
		line = line_end + 1;
	}

	log_debug("%socked %ld bytes",
		  (lock == LVM_MLOCK) ? "L" : "Unl", (long)*mstats);

	return ret;
}
|
|
|
|
/* Stop memory getting swapped out */
|
|
static void _lock_mem(struct cmd_context *cmd)
|
|
{
|
|
_allocate_memory();
|
|
|
|
/*
|
|
* For daemon we need to use mlockall()
|
|
* so even future adition of thread which may not even use lvm lib
|
|
* will not block memory locked thread
|
|
* Note: assuming _memlock_count_daemon is updated before _memlock_count
|
|
*/
|
|
_use_mlockall = _memlock_count_daemon ? 1 :
|
|
find_config_tree_bool(cmd, "activation/use_mlockall", DEFAULT_USE_MLOCKALL);
|
|
|
|
if (!_use_mlockall) {
|
|
if (!*_procselfmaps &&
|
|
dm_snprintf(_procselfmaps, sizeof(_procselfmaps),
|
|
"%s" SELF_MAPS, cmd->proc_dir) < 0) {
|
|
log_error("proc_dir too long");
|
|
return;
|
|
}
|
|
|
|
if (!(_maps_fd = open(_procselfmaps, O_RDONLY))) {
|
|
log_sys_error("open", _procselfmaps);
|
|
return;
|
|
}
|
|
}
|
|
|
|
log_very_verbose("Locking memory");
|
|
if (!_memlock_maps(cmd, LVM_MLOCK, &_mstats))
|
|
stack;
|
|
|
|
errno = 0;
|
|
if (((_priority = getpriority(PRIO_PROCESS, 0)) == -1) && errno)
|
|
log_sys_error("getpriority", "");
|
|
else
|
|
if (setpriority(PRIO_PROCESS, 0, _default_priority))
|
|
log_error("setpriority %d failed: %s",
|
|
_default_priority, strerror(errno));
|
|
}
|
|
|
|
static void _unlock_mem(struct cmd_context *cmd)
|
|
{
|
|
size_t unlock_mstats;
|
|
|
|
log_very_verbose("Unlocking memory");
|
|
|
|
if (!_memlock_maps(cmd, LVM_MUNLOCK, &unlock_mstats))
|
|
stack;
|
|
|
|
if (!_use_mlockall) {
|
|
if (close(_maps_fd))
|
|
log_sys_error("close", _procselfmaps);
|
|
dm_free(_maps_buffer);
|
|
_maps_buffer = NULL;
|
|
if (_mstats < unlock_mstats)
|
|
log_error(INTERNAL_ERROR "Maps lock %ld < unlock %ld",
|
|
(long)_mstats, (long)unlock_mstats);
|
|
}
|
|
|
|
if (setpriority(PRIO_PROCESS, 0, _priority))
|
|
log_error("setpriority %u failed: %s", _priority,
|
|
strerror(errno));
|
|
_release_memory();
|
|
}
|
|
|
|
static void _lock_mem_if_needed(struct cmd_context *cmd)
|
|
{
|
|
if ((_memlock_count + _memlock_count_daemon) == 1)
|
|
_lock_mem(cmd);
|
|
}
|
|
|
|
static void _unlock_mem_if_possible(struct cmd_context *cmd)
|
|
{
|
|
if ((_memlock_count + _memlock_count_daemon) == 0)
|
|
_unlock_mem(cmd);
|
|
}
|
|
|
|
void memlock_inc(struct cmd_context *cmd)
|
|
{
|
|
++_memlock_count;
|
|
_lock_mem_if_needed(cmd);
|
|
log_debug("memlock_count inc to %d", _memlock_count);
|
|
}
|
|
|
|
void memlock_dec(struct cmd_context *cmd)
|
|
{
|
|
if (!_memlock_count)
|
|
log_error(INTERNAL_ERROR "_memlock_count has dropped below 0.");
|
|
--_memlock_count;
|
|
_unlock_mem_if_possible(cmd);
|
|
log_debug("memlock_count dec to %d", _memlock_count);
|
|
}
|
|
|
|
/*
|
|
* The memlock_*_daemon functions will force the mlockall() call that we need
|
|
* to stay in memory, but they will have no effect on device scans (unlike
|
|
* normal memlock_inc and memlock_dec). Memory is kept locked as long as either
|
|
* of memlock or memlock_daemon is in effect.
|
|
*/
|
|
|
|
void memlock_inc_daemon(struct cmd_context *cmd)
|
|
{
|
|
++_memlock_count_daemon;
|
|
if (_memlock_count_daemon == 1 && _memlock_count > 0)
|
|
log_error(INTERNAL_ERROR "_memlock_inc_daemon used after _memlock_inc.");
|
|
_lock_mem_if_needed(cmd);
|
|
log_debug("memlock_count_daemon inc to %d", _memlock_count_daemon);
|
|
}
|
|
|
|
void memlock_dec_daemon(struct cmd_context *cmd)
|
|
{
|
|
if (!_memlock_count_daemon)
|
|
log_error(INTERNAL_ERROR "_memlock_count_daemon has dropped below 0.");
|
|
--_memlock_count_daemon;
|
|
_unlock_mem_if_possible(cmd);
|
|
log_debug("memlock_count_daemon dec to %d", _memlock_count_daemon);
|
|
}
|
|
|
|
/*
|
|
* This disregards the daemon (dmeventd) locks, since we use memlock() to check
|
|
* whether it is safe to run a device scan, which would normally coincide with
|
|
* !memlock() -- but the daemon global memory lock breaks this assumption, so
|
|
* we do not take those into account here.
|
|
*/
|
|
int memlock(void)
|
|
{
|
|
return _memlock_count;
|
|
}
|
|
|
|
void memlock_init(struct cmd_context *cmd)
|
|
{
|
|
_size_stack = find_config_tree_int(cmd,
|
|
"activation/reserved_stack",
|
|
DEFAULT_RESERVED_STACK) * 1024;
|
|
_size_malloc_tmp = find_config_tree_int(cmd,
|
|
"activation/reserved_memory",
|
|
DEFAULT_RESERVED_MEMORY) * 1024;
|
|
_default_priority = find_config_tree_int(cmd,
|
|
"activation/process_priority",
|
|
DEFAULT_PROCESS_PRIORITY);
|
|
}
|
|
|
|
#endif
|