/* * Copyright (C) 2005-2007 Red Hat, Inc. All rights reserved. * * This file is part of the device-mapper userspace tools. * * This copyrighted material is made available to anyone wishing to use, * modify, copy, or redistribute it subject to the terms and conditions * of the GNU Lesser General Public License v.2.1. * * You should have received a copy of the GNU Lesser General Public License * along with this program; if not, write to the Free Software Foundation, * Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA */ /* * dmeventd - dm event daemon to monitor active mapped devices */ #define _GNU_SOURCE #define _FILE_OFFSET_BITS 64 #include "libdevmapper.h" #include "libdevmapper-event.h" #include "list.h" #include "dmeventd.h" //#include "libmultilog.h" #include "log.h" #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include /* for htonl, ntohl */ #ifdef linux #include #endif /* We must use syslog for now, because multilog is not yet implemented */ #include static volatile sig_atomic_t _exit_now = 0; /* set to '1' when signal is given to exit */ static volatile sig_atomic_t _thread_registries_empty = 1; /* registries are empty initially */ /* List (un)link macros. */ #define LINK(x, head) list_add(head, &(x)->list) #define LINK_DSO(dso) LINK(dso, &_dso_registry) #define LINK_THREAD(thread) LINK(thread, &_thread_registry) #define UNLINK(x) list_del(&(x)->list) #define UNLINK_DSO(x) UNLINK(x) #define UNLINK_THREAD(x) UNLINK(x) #define DAEMON_NAME "dmeventd" /* Global mutex for list accesses. */ static pthread_mutex_t _global_mutex; #define DM_THREAD_RUNNING 0 #define DM_THREAD_SHUTDOWN 1 #define DM_THREAD_DONE 2 /* Data kept about a DSO. */ struct dso_data { struct list list; char *dso_name; /* DSO name (eg, "evms", "dmraid", "lvm2"). */ void *dso_handle; /* Opaque handle as returned from dlopen(). */ unsigned int ref_count; /* Library reference count. */ /* * Event processing. * * The DSO can do whatever appropriate steps if an event happens * such as changing the mapping in case a mirror fails, update * the application metadata etc. */ void (*process_event)(const char *device, enum dm_event_type event); /* * Device registration. * * When an application registers a device for an event, the DSO * can carry out appropriate steps so that a later call to * the process_event() function is sane (eg, read metadata * and activate a mapping). */ int (*register_device)(const char *device); /* * Device unregistration. * * In case all devices of a mapping (eg, RAID10) are unregistered * for events, the DSO can recognize this and carry out appropriate * steps (eg, deactivate mapping, metadata update). */ int (*unregister_device)(const char *device); }; static LIST_INIT(_dso_registry); /* Structure to keep parsed register variables from client message. */ struct message_data { char *dso_name; /* Name of DSO. */ char *device_path; /* Mapped device path. */ union { char *str; /* Events string as fetched from message. */ enum dm_event_type field; /* Events bitfield. */ } events; union { char *str; uint32_t secs; } timeout; struct dm_event_daemon_message *msg; /* Pointer to message buffer. */ }; /* * Housekeeping of thread+device states. * * One thread per mapped device which can block on it until an event * occurs and the event processing function of the DSO gets called. */ struct thread_status { struct list list; pthread_t thread; struct dso_data *dso_data;/* DSO this thread accesses. */ char *device_path; /* Mapped device path. */ uint32_t event_nr; /* event number */ int processing; /* Set when event is being processed */ int status; /* running/shutdown/done */ enum dm_event_type events; /* bitfield for event filter. */ enum dm_event_type current_events;/* bitfield for occured events. */ enum dm_event_type processed_events;/* bitfield for processed events. */ time_t next_time; uint32_t timeout; struct list timeout_list; }; static LIST_INIT(_thread_registry); static LIST_INIT(_thread_registry_unused); static int _timeout_running; static LIST_INIT(timeout_registry); static pthread_mutex_t _timeout_mutex = PTHREAD_MUTEX_INITIALIZER; static pthread_cond_t _timeout_cond = PTHREAD_COND_INITIALIZER; /* Allocate/free the status structure for a monitoring thread. */ static struct thread_status *alloc_thread_status(struct message_data *data, struct dso_data *dso_data) { struct thread_status *ret = (typeof(ret)) dm_malloc(sizeof(*ret)); if (ret) { if (!memset(ret, 0, sizeof(*ret)) || !(ret->device_path = dm_strdup(data->device_path))) { dm_free(ret); ret = NULL; } else { ret->dso_data = dso_data; ret->events = data->events.field; ret->timeout = data->timeout.secs; list_init(&ret->timeout_list); } } return ret; } static void free_thread_status(struct thread_status *thread) { dm_free(thread->device_path); dm_free(thread); } /* Allocate/free DSO data. */ static struct dso_data *alloc_dso_data(struct message_data *data) { struct dso_data *ret = (typeof(ret)) dm_malloc(sizeof(*ret)); if (!ret) return NULL; if (!memset(ret, 0, sizeof(*ret)) || !(ret->dso_name = dm_strdup(data->dso_name))) { dm_free(ret); return NULL; } return ret; } static void free_dso_data(struct dso_data *data) { dm_free(data->dso_name); dm_free(data); } /* * Fetch a string off src and duplicate it into *ptr. * Pay attention to 0 lenght strings. */ /* FIXME: move to separate module to share with the client lib. */ static const char delimiter = ' '; static int fetch_string(char **ptr, char **src) { int ret = 0; char *p; size_t len; if ((p = strchr(*src, delimiter))) *p = 0; if ((*ptr = dm_strdup(*src))) { if ((len = strlen(*ptr))) *src += len; else { dm_free(*ptr); *ptr = NULL; } (*src)++; ret = 1; } if (p) *p = delimiter; return ret; } /* Free message memory. */ static void free_message(struct message_data *message_data) { if (message_data->dso_name) dm_free(message_data->dso_name); if (message_data->device_path) dm_free(message_data->device_path); } /* Parse a register message from the client. */ static int parse_message(struct message_data *message_data) { int ret = 0; char *p = message_data->msg->data; struct dm_event_daemon_message *msg = message_data->msg; if (!msg->data) return 0; /* * Retrieve application identifier, mapped device * path and events # string from message. */ if (fetch_string(&message_data->dso_name, &p) && fetch_string(&message_data->device_path, &p) && fetch_string(&message_data->events.str, &p) && fetch_string(&message_data->timeout.str, &p)) { if (message_data->events.str) { enum dm_event_type i = atoi(message_data->events.str); /* * Free string representaion of events. * Not needed an more. */ dm_free(message_data->events.str); message_data->events.field = i; } if (message_data->timeout.str) { uint32_t secs = atoi(message_data->timeout.str); dm_free(message_data->timeout.str); message_data->timeout.secs = secs ? secs : DM_EVENT_DEFAULT_TIMEOUT; } ret = 1; } dm_free(msg->data); msg->data = NULL; msg->size = 0; return ret; }; /* Global mutex to lock access to lists et al. */ static int lock_mutex(void) { return pthread_mutex_lock(&_global_mutex); } static int unlock_mutex(void) { return pthread_mutex_unlock(&_global_mutex); } /* Store pid in pidfile. */ static int storepid(int lf) { int len; char pid[8]; if ((len = snprintf(pid, sizeof(pid), "%u\n", getpid())) < 0) return 0; if (len > (int) sizeof(pid)) len = (int) sizeof(pid); if (write(lf, pid, (size_t) len) != len) return 0; fsync(lf); return 1; } /* FIXME This is unreliable: should use DM_DEVICE_INFO ioctl instead. */ /* Check, if a device exists. */ static int device_exists(char *device) { struct stat st_buf; char path2[PATH_MAX]; if (!device || !*device) return 0; if (device[0] == '/') /* absolute path */ return !stat(device, &st_buf) && S_ISBLK(st_buf.st_mode); if (PATH_MAX <= snprintf(path2, PATH_MAX, "%s/%s", dm_dir(), device)) return 0; return !stat(path2, &st_buf) && S_ISBLK(st_buf.st_mode); } /* * Find an existing thread for a device. * * Mutex must be held when calling this. */ static struct thread_status *lookup_thread_status(struct message_data *data) { struct thread_status *thread; list_iterate_items(thread, &_thread_registry) if (!strcmp(data->device_path, thread->device_path)) return thread; return NULL; } /* Cleanup at exit. */ static void exit_dm_lib(void) { dm_lib_release(); dm_lib_exit(); } static void exit_timeout(void *unused) { _timeout_running = 0; pthread_mutex_unlock(&_timeout_mutex); } /* Wake up monitor threads every so often. */ static void *timeout_thread(void *unused) { struct timespec timeout; time_t curr_time; timeout.tv_nsec = 0; pthread_cleanup_push(exit_timeout, NULL); pthread_mutex_lock(&_timeout_mutex); while (!list_empty(&timeout_registry)) { struct thread_status *thread; timeout.tv_sec = (time_t)-1; curr_time = time(NULL); list_iterate_items_gen(thread, &timeout_registry, timeout_list) { if (thread->next_time < curr_time) { thread->next_time = curr_time + thread->timeout; pthread_kill(thread->thread, SIGALRM); } if (thread->next_time < timeout.tv_sec) timeout.tv_sec = thread->next_time; } pthread_cond_timedwait(&_timeout_cond, &_timeout_mutex, &timeout); } pthread_cleanup_pop(1); return NULL; } static int register_for_timeout(struct thread_status *thread) { int ret = 0; pthread_mutex_lock(&_timeout_mutex); thread->next_time = time(NULL) + thread->timeout; if (list_empty(&thread->timeout_list)) { list_add(&timeout_registry, &thread->timeout_list); if (_timeout_running) pthread_cond_signal(&_timeout_cond); } if (!_timeout_running) { pthread_t timeout_id; if (!(ret = -pthread_create(&timeout_id, NULL, timeout_thread, NULL))) _timeout_running = 1; } pthread_mutex_unlock(&_timeout_mutex); return ret; } static void unregister_for_timeout(struct thread_status *thread) { pthread_mutex_lock(&_timeout_mutex); if (!list_empty(&thread->timeout_list)) { list_del(&thread->timeout_list); list_init(&thread->timeout_list); } pthread_mutex_unlock(&_timeout_mutex); } static void no_intr_log(int level, const char *file, int line, const char *f, ...) { va_list ap; if (errno == EINTR) return; if (level > _LOG_WARN) return; va_start(ap, f); if (level < _LOG_WARN) vfprintf(stderr, f, ap); else vprintf(f, ap); va_end(ap); if (level < _LOG_WARN) fprintf(stderr, "\n"); else fprintf(stdout, "\n"); } static sigset_t unblock_sigalrm(void) { sigset_t set, old; sigemptyset(&set); sigaddset(&set, SIGALRM); pthread_sigmask(SIG_UNBLOCK, &set, &old); return old; } #define DM_WAIT_RETRY 0 #define DM_WAIT_INTR 1 #define DM_WAIT_FATAL 2 /* Wait on a device until an event occurs. */ static int event_wait(struct thread_status *thread) { sigset_t set; int ret = DM_WAIT_RETRY; /* void *next = NULL; char *params, *target_type; uint64_t start, length; */ struct dm_task *dmt; struct dm_info info; if (!(dmt = dm_task_create(DM_DEVICE_WAITEVENT))) return DM_WAIT_RETRY; if (!(ret = dm_task_set_name(dmt, dm_basename(thread->device_path))) || !(ret = dm_task_set_event_nr(dmt, thread->event_nr))) goto out; /* * This is so that you can break out of waiting on an event, * either for a timeout event, or to cancel the thread. */ set = unblock_sigalrm(); dm_log_init(no_intr_log); errno = 0; if ((ret = dm_task_run(dmt))) { thread->current_events |= DM_EVENT_DEVICE_ERROR; ret = DM_WAIT_INTR; /* * FIXME: I am setting processed_events to zero here * because it is causing problems. for example, the * mirror target emits a signal for INSYNC, then * subsequent events (device failures) are not handled */ thread->processed_events = 0; if ((ret = dm_task_get_info(dmt, &info))) thread->event_nr = info.event_nr; } else if (thread->events & DM_EVENT_TIMEOUT && errno == EINTR) { thread->current_events |= DM_EVENT_TIMEOUT; ret = DM_WAIT_INTR; thread->processed_events = 0; } else { /* FIXME replace with log_* macro */ syslog(LOG_NOTICE, "dm_task_run failed, errno = %d, %s", errno, strerror(errno)); if (errno == ENXIO) { /* FIXME replace with log_* macro */ syslog(LOG_ERR, "%s disappeared, detaching", thread->device_path); ret = DM_WAIT_FATAL; } } pthread_sigmask(SIG_SETMASK, &set, NULL); dm_log_init(NULL); out: dm_task_destroy(dmt); return ret; } /* Register a device with the DSO. */ static int do_register_device(struct thread_status *thread) { return thread->dso_data->register_device(thread->device_path); } /* Unregister a device with the DSO. */ static int do_unregister_device(struct thread_status *thread) { return thread->dso_data->unregister_device(thread->device_path); } /* Process an event in the DSO. */ static void do_process_event(struct thread_status *thread) { thread->dso_data->process_event(thread->device_path, thread->current_events); } /* Thread cleanup handler to unregister device. */ static void monitor_unregister(void *arg) { struct thread_status *thread = arg; if (!do_unregister_device(thread)) syslog(LOG_ERR, "%s: %s unregister failed\n", __func__, thread->device_path); } /* Device monitoring thread. */ static void *monitor_thread(void *arg) { struct thread_status *thread = arg; int wait_error = 0; pthread_setcanceltype(PTHREAD_CANCEL_DEFERRED, NULL); pthread_cleanup_push(monitor_unregister, thread); /* Wait for do_process_request() to finish its task. */ lock_mutex(); thread->status = DM_THREAD_RUNNING; unlock_mutex(); /* Loop forever awaiting/analyzing device events. */ while (1) { thread->current_events = 0; wait_error = event_wait(thread); if (wait_error == DM_WAIT_RETRY) continue; /* FIXME Give a DSO a chance to clean up. */ if (wait_error == DM_WAIT_FATAL) break; /* * Check against filter. * * If there's current events delivered from event_wait() AND * the device got registered for those events AND * those events haven't been processed yet, call * the DSO's process_event() handler. * * FIXME: when does processed_events get cleared? What if * the same type of event happens later... after the first * was handled properly? */ lock_mutex(); if (thread->status == DM_THREAD_SHUTDOWN) { unlock_mutex(); break; } unlock_mutex(); if (thread->events & thread->current_events & ~thread->processed_events) { lock_mutex(); thread->processing = 1; unlock_mutex(); do_process_event(thread); thread->processed_events |= thread->current_events; lock_mutex(); thread->processing = 0; unlock_mutex(); } } lock_mutex(); thread->status = DM_THREAD_DONE; unlock_mutex(); pthread_cleanup_pop(0); return NULL; } /* Create a device monitoring thread. */ /* FIXME: call this with mutex hold ? */ static int create_thread(struct thread_status *thread) { return pthread_create(&thread->thread, NULL, monitor_thread, thread); } static int terminate_thread(struct thread_status *thread) { int ret; if ((ret = pthread_cancel(thread->thread))) return ret; return pthread_kill(thread->thread, SIGALRM); } /* DSO reference counting. */ static void lib_get(struct dso_data *data) { data->ref_count++; } static void lib_put(struct dso_data *data) { if (!--data->ref_count) { dlclose(data->dso_handle); UNLINK_DSO(data); free_dso_data(data); } } /* Find DSO data. */ static struct dso_data *lookup_dso(struct message_data *data) { struct dso_data *dso_data, *ret = NULL; lock_mutex(); list_iterate_items(dso_data, &_dso_registry) if (!strcmp(data->dso_name, dso_data->dso_name)) { lib_get(dso_data); ret = dso_data; break; } unlock_mutex(); return ret; } /* Lookup DSO symbols we need. */ static int lookup_symbol(void *dl, struct dso_data *data, void **symbol, const char *name) { if ((*symbol = dlsym(dl, name))) return 1; return 0; } static int lookup_symbols(void *dl, struct dso_data *data) { return lookup_symbol(dl, data, (void*) &data->process_event, "process_event") && lookup_symbol(dl, data, (void*) &data->register_device, "register_device") && lookup_symbol(dl, data, (void*) &data->unregister_device, "unregister_device"); } /* Load an application specific DSO. */ static struct dso_data *load_dso(struct message_data *data) { void *dl; struct dso_data *ret = NULL; if (!(dl = dlopen(data->dso_name, RTLD_NOW))){ const char *dlerr = dlerror(); syslog(LOG_ERR, "dmeventd %s dlopen failed: %s", data->dso_name, dlerr); char buf[1024]; /* FIXME */ snprintf(buf, 1024, "%s dlopen failed: %s", data->dso_name, dlerr); data->msg->size = strlen(buf) + 1; data->msg->data = dm_strdup(buf); return NULL; } if (!(ret = alloc_dso_data(data))) { dlclose(dl); return NULL; } if (!(lookup_symbols(dl, ret))) { free_dso_data(ret); dlclose(dl); return NULL; } /* * Keep handle to close the library once * we've got no references to it any more. */ ret->dso_handle = dl; lib_get(ret); lock_mutex(); LINK_DSO(ret); unlock_mutex(); return ret; } /* Return success on daemon active check. */ static int active(struct message_data *message_data) { return 0; } /* * Register for an event. * * Only one caller at a time here, because we use * a FIFO and lock it against multiple accesses. */ static int register_for_event(struct message_data *message_data) { int ret = 0; struct thread_status *thread, *thread_new = NULL; struct dso_data *dso_data; if (!device_exists(message_data->device_path)) { stack; ret = -ENODEV; goto out; } if (!(dso_data = lookup_dso(message_data)) && !(dso_data = load_dso(message_data))) { stack; /* FIXME */ #ifdef ELIBACC ret = -ELIBACC; #else ret = -ENODEV; #endif goto out; } /* Preallocate thread status struct to avoid deadlock. */ if (!(thread_new = alloc_thread_status(message_data, dso_data))) { stack; ret = -ENOMEM; goto out; } lock_mutex(); if (!(thread = lookup_thread_status(message_data))) { unlock_mutex(); /* * FIXME: better do this asynchronously in the * monitoring thread ? */ if (!(ret = do_register_device(thread_new))) goto out; thread = thread_new; thread_new = NULL; /* Try to create the monitoring thread for this device. */ lock_mutex(); if ((ret = -create_thread(thread))) { unlock_mutex(); do_unregister_device(thread); free_thread_status(thread); goto out; } else LINK_THREAD(thread); } /* Or event # into events bitfield. */ thread->events |= message_data->events.field; unlock_mutex(); /* FIXME - If you fail to register for timeout events, you still monitor all the other events. Is this the right action for newly created devices? Also, you are still on the timeout registry, so if a timeout thread is successfully started up later, you will start receiving DM_EVENT_TIMEOUT events */ if (thread->events & DM_EVENT_TIMEOUT) ret = -register_for_timeout(thread); out: /* * Deallocate thread status after releasing * the lock in case we haven't used it. */ if (thread_new) free_thread_status(thread_new); return ret; } /* * Unregister for an event. * * Only one caller at a time here as with register_for_event(). */ static int unregister_for_event(struct message_data *message_data) { int ret = 0; struct thread_status *thread; /* * Clear event in bitfield and deactivate * monitoring thread in case bitfield is 0. */ lock_mutex(); if (!(thread = lookup_thread_status(message_data))) { unlock_mutex(); ret = -ENODEV; goto out; } thread->events &= ~message_data->events.field; if (!(thread->events & DM_EVENT_TIMEOUT)) unregister_for_timeout(thread); /* * In case there's no events to monitor on this device -> * unlink and terminate its monitoring thread. */ if (!thread->events) { UNLINK_THREAD(thread); LINK(thread, &_thread_registry_unused); } unlock_mutex(); out: return ret; } /* * Get registered device. * * Only one caller at a time here as with register_for_event(). */ static int registered_device(struct message_data *message_data, struct thread_status *thread) { char test[1]; struct dm_event_daemon_message *msg = message_data->msg; const char *fmt = "%s %s %u"; const char *dso = thread->dso_data->dso_name; const char *dev = thread->device_path; unsigned events = ((thread->status == DM_THREAD_RUNNING) && (thread->events)) ? thread->events : thread->events | DM_EVENT_REGISTRATION_PENDING; if (msg->data) dm_free(msg->data); msg->size = snprintf(test, 1, fmt, dso, dev, events); msg->data = dm_malloc(msg->size); snprintf(msg->data, msg->size, fmt, dso, dev, events); unlock_mutex(); return 0; } static int want_registered_device(char *dso_name, char *device_path, struct thread_status *thread) { /* If DSO names and device paths are equal. */ if (dso_name && device_path) return !strcmp(dso_name, thread->dso_data->dso_name) && !strcmp(device_path, thread->device_path); /* If DSO names are equal. */ if (dso_name) return !strcmp(dso_name, thread->dso_data->dso_name); /* If device paths are equal. */ if (device_path) return !strcmp(device_path, thread->device_path); return 1; } static int _get_registered_device(struct message_data *message_data, int next) { int hit = 0; struct thread_status *thread; lock_mutex(); /* Iterate list of threads checking if we want a particular one. */ list_iterate_items(thread, &_thread_registry) if ((hit = want_registered_device(message_data->dso_name, message_data->device_path, thread))) break; /* * If we got a registered device and want the next one -> * fetch next conforming element off the list. */ if (!hit || !next) goto out; do { if (list_end(&_thread_registry, &thread->list)) goto out; thread = list_item(thread->list.n, struct thread_status); } while (!want_registered_device(message_data->dso_name, NULL, thread)); return registered_device(message_data, thread); out: unlock_mutex(); return -ENOENT; } static int get_registered_device(struct message_data *message_data) { return _get_registered_device(message_data, 0); } static int get_next_registered_device(struct message_data *message_data) { return _get_registered_device(message_data, 1); } static int set_timeout(struct message_data *message_data) { struct thread_status *thread; lock_mutex(); if ((thread = lookup_thread_status(message_data))) thread->timeout = message_data->timeout.secs; unlock_mutex(); return thread ? 0 : -ENODEV; } static int get_timeout(struct message_data *message_data) { struct thread_status *thread; struct dm_event_daemon_message *msg = message_data->msg; if (msg->data) dm_free(msg->data); lock_mutex(); if ((thread = lookup_thread_status(message_data))) { msg->data = dm_malloc(8*sizeof(uint32_t)); /* FIXME */ msg->size = snprintf(msg->data, 8*sizeof(uint32_t), "%"PRIu32, thread->timeout); } else { msg->data = NULL; msg->size = 0; } unlock_mutex(); return thread ? 0 : -ENODEV; } /* Initialize a fifos structure with path names. */ static void init_fifos(struct dm_event_fifos *fifos) { memset(fifos, 0, sizeof(*fifos)); fifos->client_path = DM_EVENT_FIFO_CLIENT; fifos->server_path = DM_EVENT_FIFO_SERVER; } /* Open fifos used for client communication. */ static int open_fifos(struct dm_event_fifos *fifos) { /* Create fifos */ if (((mkfifo(fifos->client_path, 0600) == -1) && errno != EEXIST) || ((mkfifo(fifos->server_path, 0600) == -1) && errno != EEXIST)) { syslog(LOG_ERR, "%s: Failed to create a fifo.\n", __func__); stack; return -errno; } /* FIXME Warn/abort if perms are wrong - not something to fix silently. */ /* If they were already there, make sure permissions are ok. */ if (chmod(fifos->client_path, 0600)) { syslog(LOG_ERR, "Unable to set correct file permissions on %s", fifos->client_path); return -errno; } if (chmod(fifos->server_path, 0600)) { syslog(LOG_ERR, "Unable to set correct file permissions on %s", fifos->server_path); return -errno; } /* Need to open read+write or we will block or fail */ if ((fifos->server = open(fifos->server_path, O_RDWR)) < 0) { stack; return -errno; } /* Need to open read+write for select() to work. */ if ((fifos->client = open(fifos->client_path, O_RDWR)) < 0) { stack; close(fifos->server); return -errno; } return 0; } /* * Read message from client making sure that data is available * and a complete message is read. Must not block indefinitely. */ static int client_read(struct dm_event_fifos *fifos, struct dm_event_daemon_message *msg) { struct timeval t; unsigned bytes = 0; int ret = 0; fd_set fds; int header = 1; size_t size = 2 * sizeof(uint32_t); /* status + size */ char *buf = alloca(size); msg->data = NULL; errno = 0; while (bytes < size && errno != EOF) { /* Watch client read FIFO for input. */ FD_ZERO(&fds); FD_SET(fifos->client, &fds); t.tv_sec = 1; t.tv_usec = 0; ret = select(fifos->client+1, &fds, NULL, NULL, &t); if (!ret && !bytes) /* nothing to read */ return 0; if (!ret) /* trying to finish read */ continue; if (ret < 0) /* error */ return 0; ret = read(fifos->client, buf + bytes, size - bytes); bytes += ret > 0 ? ret : 0; if (bytes == 2*sizeof(uint32_t) && header) { msg->cmd = ntohl(*((uint32_t *)buf)); msg->size = ntohl(*((uint32_t *)buf + 1)); buf = msg->data = dm_malloc(msg->size); size = msg->size; bytes = 0; header = 0; } } if (bytes != size) { if (msg->data) dm_free(msg->data); msg->data = NULL; } return bytes == size; } /* * Write a message to the client making sure that it is ready to write. */ static int client_write(struct dm_event_fifos *fifos, struct dm_event_daemon_message *msg) { unsigned bytes = 0; int ret = 0; fd_set fds; size_t size = 2*sizeof(uint32_t) + msg->size; char *buf = alloca(size); *((uint32_t *)buf) = htonl(msg->cmd); *((uint32_t *)buf + 1) = htonl(msg->size); memcpy(buf + 2*sizeof(uint32_t), msg->data, msg->size); errno = 0; while (bytes < size && errno != EIO) { do { /* Watch client write FIFO to be ready for output. */ FD_ZERO(&fds); FD_SET(fifos->server, &fds); } while (select(fifos->server +1, NULL, &fds, NULL, NULL) != 1); ret = write(fifos->server, buf + bytes, size - bytes); bytes += ret > 0 ? ret : 0; } return bytes == size; } /* * Handle a client request. * * We put the request handling functions into * a list because of the growing number. */ static int handle_request(struct dm_event_daemon_message *msg, struct message_data *message_data) { static struct { unsigned int cmd; int (*f)(struct message_data*); } requests[] = { { DM_EVENT_CMD_REGISTER_FOR_EVENT, register_for_event }, { DM_EVENT_CMD_UNREGISTER_FOR_EVENT, unregister_for_event }, { DM_EVENT_CMD_GET_REGISTERED_DEVICE, get_registered_device }, { DM_EVENT_CMD_GET_NEXT_REGISTERED_DEVICE, get_next_registered_device }, { DM_EVENT_CMD_SET_TIMEOUT, set_timeout }, { DM_EVENT_CMD_GET_TIMEOUT, get_timeout }, { DM_EVENT_CMD_ACTIVE, active }, }, *req; for (req = requests; req < requests + sizeof(requests); req++) if (req->cmd == msg->cmd) return req->f(message_data); return -EINVAL; } /* Process a request passed from the communication thread. */ static int do_process_request(struct dm_event_daemon_message *msg) { int ret; static struct message_data message_data; /* Parse the message. */ memset(&message_data, 0, sizeof(message_data)); message_data.msg = msg; if (msg->cmd != DM_EVENT_CMD_ACTIVE && !parse_message(&message_data)) { stack; ret = -EINVAL; } else ret = handle_request(msg, &message_data); free_message(&message_data); return ret; } /* Only one caller at a time. */ static void process_request(struct dm_event_fifos *fifos) { struct dm_event_daemon_message msg; /* FIXME: better error handling */ memset(&msg, 0, sizeof(msg)); /* * Read the request from the client. * Of course, it's tough to tell what to do when * we use fucking retarded return codes like * 0 for error. */ if (!client_read(fifos, &msg)) return; msg.cmd = do_process_request(&msg); if (!msg.data) { msg.data = dm_strdup(strerror(-msg.cmd)); msg.size = strlen(msg.data) + 1; } if (!client_write(fifos, &msg)) stack; if (msg.data) dm_free(msg.data); } static void cleanup_unused_threads(void) { int ret; struct list *l; struct thread_status *thread; lock_mutex(); while ((l = list_first(&_thread_registry_unused))) { thread = list_item(l, struct thread_status); if (thread->processing) { goto out; /* cleanup on the next round */ } if (thread->status == DM_THREAD_RUNNING) { thread->status = DM_THREAD_SHUTDOWN; goto out; } else if (thread->status == DM_THREAD_SHUTDOWN) { if (!thread->events) { /* turn codes negative -- should we be returning this? */ ret = terminate_thread(thread); if (ret == ESRCH) { thread->status = DM_THREAD_DONE; } else if (ret) { syslog(LOG_ERR, "Unable to terminate thread: %s\n", strerror(-ret)); stack; } goto out; } else { list_del(l); syslog(LOG_ERR, "thread can't be on unused list unless !thread->events"); thread->status = DM_THREAD_RUNNING; LINK_THREAD(thread); } } else if (thread->status == DM_THREAD_DONE) { list_del(l); pthread_join(thread->thread, NULL); lib_put(thread->dso_data); free_thread_status(thread); } } out: unlock_mutex(); } static void sig_alarm(int signum) { pthread_testcancel(); } /* Init thread signal handling. */ static void init_thread_signals(void) { sigset_t my_sigset; struct sigaction act; memset(&act, 0, sizeof(act)); act.sa_handler = sig_alarm; sigaction(SIGALRM, &act, NULL); sigfillset(&my_sigset); /* These are used for exiting */ sigdelset(&my_sigset, SIGTERM); sigdelset(&my_sigset, SIGINT); sigdelset(&my_sigset, SIGHUP); sigdelset(&my_sigset, SIGQUIT); pthread_sigmask(SIG_BLOCK, &my_sigset, NULL); } /* * exit_handler * @sig * * Set the global variable which the process should * be watching to determine when to exit. */ static void exit_handler(int sig) { /* * We exit when '_exit_now' is set. * That is, when a signal has been received. * * We can not simply set '_exit_now' unless all * threads are done processing. */ if (!_thread_registries_empty) { syslog(LOG_ERR, "There are still devices being monitored."); syslog(LOG_ERR, "Refusing to exit."); } else _exit_now = 1; } static int lock_pidfile(void) { int lf; char pidfile[] = "/var/run/dmeventd.pid"; /* FIXME Must be configurable at compile-time! */ if ((lf = open(pidfile, O_CREAT | O_RDWR, 0644)) < 0) exit(EXIT_OPEN_PID_FAILURE); if (flock(lf, LOCK_EX | LOCK_NB) < 0) exit(EXIT_LOCKFILE_INUSE); if (!storepid(lf)) exit(EXIT_FAILURE); return 0; } static void daemonize(void) { int status; int pid; int fd; struct rlimit rlim; struct timeval tval; sigset_t my_sigset; sigemptyset(&my_sigset); if (sigprocmask(SIG_SETMASK, &my_sigset, NULL) < 0) { fprintf(stderr, "Unable to restore signals."); exit(EXIT_FAILURE); } signal(SIGTERM, &exit_handler); pid = fork(); if (pid < 0) exit(EXIT_FAILURE); if (pid) { /* Wait for response from child */ while (!waitpid(pid, &status, WNOHANG) && !_exit_now) { tval.tv_sec = 0; tval.tv_usec = 250000; /* .25 sec */ select(0, NULL, NULL, NULL, &tval); } if (_exit_now) /* Child has signaled it is ok - we can exit now */ exit(EXIT_SUCCESS); /* Problem with child. Determine what it is by exit code */ switch (WEXITSTATUS(status)) { case EXIT_LOCKFILE_INUSE: break; case EXIT_DESC_CLOSE_FAILURE: break; case EXIT_DESC_OPEN_FAILURE: break; case EXIT_OPEN_PID_FAILURE: break; case EXIT_FIFO_FAILURE: break; case EXIT_CHDIR_FAILURE: break; default: break; } exit(EXIT_FAILURE); /* Redundant */ } setsid(); if (chdir("/")) exit(EXIT_CHDIR_FAILURE); if (getrlimit(RLIMIT_NOFILE, &rlim) < 0) fd = 256; /* just have to guess */ else fd = rlim.rlim_cur; for (--fd; fd >= 0; fd--) close(fd); if ((open("/dev/null", O_RDONLY) < 0) || (open("/dev/null", O_WRONLY) < 0) || (open("/dev/null", O_WRONLY) < 0)) exit(EXIT_DESC_OPEN_FAILURE); openlog("dmeventd", LOG_PID, LOG_DAEMON); lock_pidfile(); /* exits if failure */ /* Set the rest of the signals to cause '_exit_now' to be set */ signal(SIGINT, &exit_handler); signal(SIGHUP, &exit_handler); signal(SIGQUIT, &exit_handler); } int main(int argc, char *argv[]) { int ret; struct dm_event_fifos fifos; //struct sys_log logdata = {DAEMON_NAME, LOG_DAEMON}; daemonize(); init_thread_signals(); //multilog_clear_logging(); //multilog_add_type(std_syslog, &logdata); //multilog_init_verbose(std_syslog, _LOG_DEBUG); //multilog_async(1); init_fifos(&fifos); pthread_mutex_init(&_global_mutex, NULL); #ifdef MCL_CURRENT if (mlockall(MCL_CURRENT | MCL_FUTURE) == -1) exit(EXIT_FAILURE); #endif if ((ret = open_fifos(&fifos))) exit(EXIT_FIFO_FAILURE); /* Signal parent, letting them know we are ready to go. */ kill(getppid(), SIGTERM); syslog(LOG_INFO, "dmeventd ready for processing."); while (!_exit_now) { process_request(&fifos); cleanup_unused_threads(); if (!list_empty(&_thread_registry) || !list_empty(&_thread_registry_unused)) _thread_registries_empty = 0; else _thread_registries_empty = 1; } exit_dm_lib(); #ifdef MCL_CURRENT munlockall(); #endif pthread_mutex_destroy(&_global_mutex); syslog(LOG_INFO, "dmeventd shutting down."); closelog(); exit(EXIT_SUCCESS); }