mirror of
git://sourceware.org/git/lvm2.git
synced 2025-01-05 13:18:20 +03:00
481 lines
12 KiB
C
481 lines
12 KiB
C
|
/******************************************************************************
|
||
|
*******************************************************************************
|
||
|
**
|
||
|
** Copyright (C) Sistina Software, Inc. 2002-2003 All rights reserved.
|
||
|
**
|
||
|
*******************************************************************************
|
||
|
******************************************************************************/
|
||
|
|
||
|
/* This provides the inter-clvmd communications for a system without CMAN.
|
||
|
There is a listening TCP socket which accepts new connections in the
|
||
|
normal way.
|
||
|
It can also make outgoing connnections to the other clvmd nodes.
|
||
|
*/
|
||
|
|
||
|
|
||
|
#include <pthread.h>
|
||
|
#include <sys/types.h>
|
||
|
#include <sys/utsname.h>
|
||
|
#include <sys/ioctl.h>
|
||
|
#include <sys/socket.h>
|
||
|
#include <sys/stat.h>
|
||
|
#include <sys/socket.h>
|
||
|
#include <netinet/in.h>
|
||
|
#include <stdio.h>
|
||
|
#include <stdlib.h>
|
||
|
#include <stdint.h>
|
||
|
#include <fcntl.h>
|
||
|
#include <string.h>
|
||
|
#include <stddef.h>
|
||
|
#include <stdint.h>
|
||
|
#include <unistd.h>
|
||
|
#include <errno.h>
|
||
|
#include <syslog.h>
|
||
|
#include <netdb.h>
|
||
|
#include <assert.h>
|
||
|
|
||
|
#include "ccs.h"
|
||
|
#include "clvm.h"
|
||
|
#include "clvmd-comms.h"
|
||
|
#include "clvmd.h"
|
||
|
#include "clvmd-gulm.h"
|
||
|
#include "hash.h"
|
||
|
|
||
|
#define DEFAULT_TCP_PORT 21064
|
||
|
|
||
|
static int listen_fd = -1;
|
||
|
static int tcp_port;
|
||
|
struct hash_table *sock_hash;
|
||
|
|
||
|
static int get_tcp_port(int default_port);
|
||
|
static int get_our_ip_address(char *addr, int *family);
|
||
|
static int read_from_tcpsock(struct local_client *fd, char *buf, int len, char *csid,
|
||
|
struct local_client **new_client);
|
||
|
|
||
|
/* Called by init_cluster() to open up the listening socket */
|
||
|
// TODO: IPv6 compat.
|
||
|
int init_comms()
|
||
|
{
|
||
|
struct sockaddr *addr = NULL;
|
||
|
struct sockaddr_in addr4;
|
||
|
struct sockaddr_in6 addr6;
|
||
|
int addr_len;
|
||
|
int family;
|
||
|
char address[MAX_CSID_LEN];
|
||
|
|
||
|
sock_hash = hash_create(100);
|
||
|
tcp_port = get_tcp_port(DEFAULT_TCP_PORT);
|
||
|
|
||
|
/* Get IP address and IP type */
|
||
|
get_our_ip_address(address, &family);
|
||
|
if (family == AF_INET)
|
||
|
{
|
||
|
memcpy(&addr4.sin_addr, addr, sizeof(struct in_addr));
|
||
|
addr = (struct sockaddr *)&addr4;
|
||
|
addr4.sin_port = htons(tcp_port);
|
||
|
addr_len = sizeof(addr4);
|
||
|
}
|
||
|
else
|
||
|
{
|
||
|
memcpy(&addr6.sin6_addr, addr, sizeof(struct in6_addr));
|
||
|
addr = (struct sockaddr *)&addr6;
|
||
|
addr6.sin6_port = htons(tcp_port);
|
||
|
addr_len = sizeof(addr6);
|
||
|
}
|
||
|
|
||
|
listen_fd = socket(family, SOCK_STREAM, 0);
|
||
|
|
||
|
if (listen_fd < 0)
|
||
|
{
|
||
|
return -1;
|
||
|
}
|
||
|
else
|
||
|
{
|
||
|
int one = 1;
|
||
|
setsockopt(listen_fd, SOL_SOCKET, SO_REUSEADDR, &one, sizeof(int));
|
||
|
}
|
||
|
|
||
|
addr->sa_family = family;
|
||
|
|
||
|
if (bind(listen_fd, addr, addr_len) < 0)
|
||
|
{
|
||
|
DEBUGLOG("Can't bind to port\n");
|
||
|
syslog(LOG_ERR, "Can't bind to port %d, is clvmd already running ?", tcp_port);
|
||
|
close(listen_fd);
|
||
|
return -1;
|
||
|
}
|
||
|
|
||
|
listen(listen_fd, 5);
|
||
|
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
void tcp_remove_client(char *csid)
|
||
|
{
|
||
|
struct local_client *client;
|
||
|
DEBUGLOG("tcp_remove_client\n");
|
||
|
|
||
|
/* Don't actually close the socket here - that's the
|
||
|
job of clvmd.c whch will do the job when it notices the
|
||
|
other end has gone. We just need to remove the client(s) from
|
||
|
the hash table so we don't try to use it for sending any more */
|
||
|
client = hash_lookup_binary(sock_hash, csid, MAX_CSID_LEN);
|
||
|
if (client)
|
||
|
{
|
||
|
hash_remove_binary(sock_hash, csid, MAX_CSID_LEN);
|
||
|
}
|
||
|
|
||
|
/* Look for a mangled one too */
|
||
|
csid[0] ^= 0x80;
|
||
|
|
||
|
client = hash_lookup_binary(sock_hash, csid, MAX_CSID_LEN);
|
||
|
if (client)
|
||
|
{
|
||
|
hash_remove_binary(sock_hash, csid, MAX_CSID_LEN);
|
||
|
}
|
||
|
|
||
|
/* Put it back as we found it */
|
||
|
csid[0] ^= 0x80;
|
||
|
}
|
||
|
|
||
|
int alloc_client(int fd, char *csid, struct local_client **new_client)
|
||
|
{
|
||
|
struct local_client *client;
|
||
|
|
||
|
DEBUGLOG("alloc_client %d csid = [%d.%d.%d.%d]\n", fd,csid[0],csid[1],csid[2],csid[3]);
|
||
|
|
||
|
/* Create a local_client and return it */
|
||
|
client = malloc(sizeof(struct local_client));
|
||
|
if (!client)
|
||
|
{
|
||
|
DEBUGLOG("malloc failed\n");
|
||
|
return -1;
|
||
|
}
|
||
|
|
||
|
memset(client, 0, sizeof(struct local_client));
|
||
|
client->fd = fd;
|
||
|
client->type = CLUSTER_DATA_SOCK;
|
||
|
client->callback = read_from_tcpsock;
|
||
|
if (new_client)
|
||
|
*new_client = client;
|
||
|
|
||
|
/* Add to our list of node sockets */
|
||
|
if (hash_lookup_binary(sock_hash, csid, MAX_CSID_LEN))
|
||
|
{
|
||
|
DEBUGLOG("alloc_client mangling CSID for second connection\n");
|
||
|
/* This is a duplicate connection but we can't close it because
|
||
|
the other end may already have started sending.
|
||
|
So, we mangle the IP address and keep it, all sending will
|
||
|
go out of the main FD
|
||
|
*/
|
||
|
csid[0] ^= 0x80;
|
||
|
client->bits.net.flags = 1; /* indicate mangled CSID */
|
||
|
|
||
|
/* If it still exists then kill the connection as we should only
|
||
|
ever have one incoming connection from each node */
|
||
|
if (hash_lookup_binary(sock_hash, csid, MAX_CSID_LEN))
|
||
|
{
|
||
|
DEBUGLOG("Multiple incoming connections from node\n");
|
||
|
syslog(LOG_ERR, " Bogus incoming connection from %d.%d.%d.%d\n", csid[0],csid[1],csid[2],csid[3]);
|
||
|
|
||
|
free(client);
|
||
|
errno = ECONNREFUSED;
|
||
|
return -1;
|
||
|
}
|
||
|
}
|
||
|
hash_insert_binary(sock_hash, csid, MAX_CSID_LEN, client);
|
||
|
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
int get_main_cluster_fd()
|
||
|
{
|
||
|
return listen_fd;
|
||
|
}
|
||
|
|
||
|
|
||
|
/* Read on main comms (listen) socket, accept it */
|
||
|
int cluster_fd_callback(struct local_client *fd, char *buf, int len, char *csid,
|
||
|
struct local_client **new_client)
|
||
|
{
|
||
|
int newfd;
|
||
|
struct sockaddr_in addr;
|
||
|
socklen_t addrlen = sizeof(addr);
|
||
|
int status;
|
||
|
char name[MAX_CLUSTER_MEMBER_NAME_LEN];
|
||
|
|
||
|
DEBUGLOG("cluster_fd_callback\n");
|
||
|
*new_client = NULL;
|
||
|
newfd = accept(listen_fd, (struct sockaddr *)&addr, &addrlen);
|
||
|
|
||
|
DEBUGLOG("cluster_fd_callback, newfd=%d (errno=%d)\n", newfd, errno);
|
||
|
if (!newfd)
|
||
|
{
|
||
|
syslog(LOG_ERR, "error in accept: %m");
|
||
|
errno = EAGAIN;
|
||
|
return -1; /* Don't return an error or clvmd will close the listening FD */
|
||
|
}
|
||
|
|
||
|
/* Check that the client is a member of the cluster
|
||
|
and reject if not.
|
||
|
// FIXME: IPv4 specific
|
||
|
*/
|
||
|
if (name_from_csid((char *)&addr.sin_addr.s_addr, name) < 0)
|
||
|
{
|
||
|
char *ip = (char *)&addr.sin_addr.s_addr;
|
||
|
syslog(LOG_ERR, "Got connect from non-cluster node %d.%d.%d.%d\n",
|
||
|
ip[0], ip[1], ip[2], ip[3]);
|
||
|
DEBUGLOG("Got connect from non-cluster node %d.%d.%d.%d\n",
|
||
|
ip[0], ip[1], ip[2], ip[3]);
|
||
|
close(newfd);
|
||
|
|
||
|
errno = EAGAIN;
|
||
|
return -1;
|
||
|
}
|
||
|
|
||
|
status = alloc_client(newfd, (char *)&addr.sin_addr.s_addr, new_client);
|
||
|
if (status)
|
||
|
{
|
||
|
DEBUGLOG("cluster_fd_callback, alloc_client failed, status = %d\n", status);
|
||
|
close(newfd);
|
||
|
/* See above... */
|
||
|
errno = EAGAIN;
|
||
|
return -1;
|
||
|
}
|
||
|
DEBUGLOG("cluster_fd_callback, returning %d, %p\n", newfd, *new_client);
|
||
|
return newfd;
|
||
|
}
|
||
|
|
||
|
|
||
|
static int read_from_tcpsock(struct local_client *client, char *buf, int len, char *csid,
|
||
|
struct local_client **new_client)
|
||
|
{
|
||
|
struct sockaddr_in addr;
|
||
|
socklen_t slen = sizeof(addr);
|
||
|
int status;
|
||
|
|
||
|
DEBUGLOG("read_from_tcpsock fd %d\n", client->fd);
|
||
|
*new_client = NULL;
|
||
|
|
||
|
/* Get "csid" */
|
||
|
getpeername(client->fd, (struct sockaddr *)&addr, &slen);
|
||
|
memcpy(csid, &addr.sin_addr.s_addr, MAX_CSID_LEN);
|
||
|
|
||
|
status = read(client->fd, buf, len);
|
||
|
|
||
|
DEBUGLOG("read_from_tcpsock, status = %d(errno = %d)\n", status, errno);
|
||
|
|
||
|
/* Remove it from the hash table if there's an error, clvmd will
|
||
|
remove the socket from its lists and free the client struct */
|
||
|
if (status == 0 ||
|
||
|
(status < 0 && errno != EAGAIN && errno != EINTR))
|
||
|
{
|
||
|
char remcsid[MAX_CSID_LEN];
|
||
|
|
||
|
memcpy(remcsid, csid, MAX_CSID_LEN);
|
||
|
close(client->fd);
|
||
|
|
||
|
/* If the csid was mangled, then make sure we remove the right entry */
|
||
|
if (client->bits.net.flags)
|
||
|
remcsid[0] ^= 0x80;
|
||
|
hash_remove_binary(sock_hash, remcsid, MAX_CSID_LEN);
|
||
|
|
||
|
/* Tell cluster manager layer */
|
||
|
add_down_node(remcsid);
|
||
|
}
|
||
|
return status;
|
||
|
}
|
||
|
|
||
|
static int connect_csid(char *csid, struct local_client **newclient)
|
||
|
{
|
||
|
int fd;
|
||
|
struct sockaddr_in addr;
|
||
|
int status;
|
||
|
|
||
|
DEBUGLOG("Connecting socket\n");
|
||
|
fd = socket(PF_INET, SOCK_STREAM, 0);
|
||
|
|
||
|
if (fd < 0)
|
||
|
{
|
||
|
syslog(LOG_ERR, "Unable to create new socket: %m");
|
||
|
return -1;
|
||
|
}
|
||
|
|
||
|
addr.sin_family = AF_INET;
|
||
|
memcpy(&addr.sin_addr.s_addr, csid, MAX_CSID_LEN);
|
||
|
addr.sin_port = htons(tcp_port);
|
||
|
|
||
|
DEBUGLOG("Connecting socket %d\n", fd);
|
||
|
if (connect(fd, (struct sockaddr *)&addr, sizeof(struct sockaddr_in)) < 0)
|
||
|
{
|
||
|
syslog(LOG_ERR, "Unable to connect to remote node: %m");
|
||
|
DEBUGLOG("Unable to connect to remote node: %s\n", strerror(errno));
|
||
|
close(fd);
|
||
|
return -1;
|
||
|
}
|
||
|
|
||
|
status = alloc_client(fd, csid, newclient);
|
||
|
if (status)
|
||
|
close(fd);
|
||
|
else
|
||
|
add_client(*newclient);
|
||
|
|
||
|
/* If we can connect to it, it must be running a clvmd */
|
||
|
add_up_node(csid);
|
||
|
return status;
|
||
|
}
|
||
|
|
||
|
/* Send a message to a known CSID */
|
||
|
static int tcp_send_message(void *buf, int msglen, unsigned char *csid, const char *errtext)
|
||
|
{
|
||
|
int status;
|
||
|
struct local_client *client;
|
||
|
char ourcsid[MAX_CSID_LEN];
|
||
|
|
||
|
assert(csid);
|
||
|
|
||
|
DEBUGLOG("tcp_send_message, csid = [%d.%d.%d.%d], msglen = %d\n", csid[0],csid[1],csid[2],csid[3], msglen);
|
||
|
|
||
|
/* Don't connect to ourself */
|
||
|
get_our_csid(ourcsid);
|
||
|
if (memcmp(csid, ourcsid, MAX_CSID_LEN) == 0)
|
||
|
return msglen;
|
||
|
|
||
|
client = hash_lookup_binary(sock_hash, csid, MAX_CSID_LEN);
|
||
|
if (!client)
|
||
|
{
|
||
|
status = connect_csid(csid, &client);
|
||
|
if (status)
|
||
|
return -1;
|
||
|
}
|
||
|
DEBUGLOG("tcp_send_message, fd = %d\n", client->fd);
|
||
|
|
||
|
return write(client->fd, buf, msglen);
|
||
|
}
|
||
|
|
||
|
|
||
|
int cluster_send_message(void *buf, int msglen, char *csid, const char *errtext)
|
||
|
{
|
||
|
int status=0;
|
||
|
|
||
|
DEBUGLOG("cluster send message, csid = %p, msglen = %d\n", csid, msglen);
|
||
|
|
||
|
/* If csid is NULL then send to all known (not just connected) nodes */
|
||
|
if (!csid)
|
||
|
{
|
||
|
void *context = NULL;
|
||
|
char loop_csid[MAX_CSID_LEN];
|
||
|
|
||
|
/* Loop round all gulm-known nodes */
|
||
|
while (get_next_node_csid(&context, loop_csid))
|
||
|
{
|
||
|
status = tcp_send_message(buf, msglen, loop_csid, errtext);
|
||
|
if (status == 0 ||
|
||
|
(status < 0 && (errno == EAGAIN || errno == EINTR)))
|
||
|
break;
|
||
|
}
|
||
|
}
|
||
|
else
|
||
|
{
|
||
|
|
||
|
status = tcp_send_message(buf, msglen, csid, errtext);
|
||
|
}
|
||
|
return status;
|
||
|
}
|
||
|
|
||
|
static int get_tcp_port(int default_port)
|
||
|
{
|
||
|
int ccs_handle;
|
||
|
int port = default_port;
|
||
|
char *portstr;
|
||
|
|
||
|
ccs_handle = ccs_connect();
|
||
|
if (ccs_handle)
|
||
|
{
|
||
|
return port;
|
||
|
}
|
||
|
|
||
|
if (!ccs_get(ccs_handle, "//clvm/@port", &portstr))
|
||
|
{
|
||
|
port = atoi(portstr);
|
||
|
free(portstr);
|
||
|
|
||
|
if (port <= 0 && port >= 65536)
|
||
|
port = default_port;
|
||
|
}
|
||
|
ccs_disconnect(ccs_handle);
|
||
|
|
||
|
DEBUGLOG("Using port %d for communications\n", port);
|
||
|
return port;
|
||
|
}
|
||
|
|
||
|
/* To get our own IP address we get the locally bound address of the
|
||
|
socket that's talking to GULM in the assumption(eek) that it will
|
||
|
be on the "right" network in a multi-homed system */
|
||
|
static int get_our_ip_address(char *addr, int *family)
|
||
|
{
|
||
|
/* Use a sockaddr_in6 to make sure it's big enough */
|
||
|
struct sockaddr_in6 saddr;
|
||
|
int socklen = sizeof(saddr);
|
||
|
|
||
|
if (!getsockname(gulm_fd(), (struct sockaddr *)&saddr, &socklen))
|
||
|
{
|
||
|
if (saddr.sin6_family == AF_INET6)
|
||
|
{
|
||
|
memcpy(addr, &saddr.sin6_addr, sizeof(saddr.sin6_addr));
|
||
|
}
|
||
|
else
|
||
|
{
|
||
|
struct sockaddr_in *sin4 = (struct sockaddr_in *)&saddr;
|
||
|
memcpy(addr, &sin4->sin_addr, sizeof(sin4->sin_addr));
|
||
|
}
|
||
|
return 0;
|
||
|
}
|
||
|
return -1;
|
||
|
}
|
||
|
|
||
|
/* Public version of above for those that don't care what protocol
|
||
|
we're using */
|
||
|
void get_our_csid(char *csid)
|
||
|
{
|
||
|
static char our_csid[MAX_CSID_LEN];
|
||
|
static int got_csid = 0;
|
||
|
|
||
|
if (!got_csid)
|
||
|
{
|
||
|
int family;
|
||
|
|
||
|
memset(our_csid, 0, sizeof(our_csid));
|
||
|
if (get_our_ip_address(our_csid, &family))
|
||
|
{
|
||
|
got_csid = 1;
|
||
|
}
|
||
|
}
|
||
|
memcpy(csid, our_csid, MAX_CSID_LEN);
|
||
|
}
|
||
|
|
||
|
/* Get someone else's IP address from DNS */
|
||
|
int get_ip_address(char *node, char *addr)
|
||
|
{
|
||
|
struct hostent *he;
|
||
|
|
||
|
memset(addr, 0, MAX_CSID_LEN);
|
||
|
|
||
|
// TODO: what do we do about multi-homed hosts ???
|
||
|
// CCSs ip_interfaces solved this but some bugger removed it.
|
||
|
|
||
|
/* Try IPv6 first. The man page for gethostbyname implies that
|
||
|
it will lookup ip6 & ip4 names, but it seems not to */
|
||
|
he = gethostbyname2(node, AF_INET6);
|
||
|
if (!he)
|
||
|
he = gethostbyname2(node, AF_INET);
|
||
|
if (!he)
|
||
|
return -1;
|
||
|
|
||
|
/* For IPv4 address just use the lower 4 bytes */
|
||
|
memcpy(&addr, he->h_addr_list[0],
|
||
|
he->h_length);
|
||
|
|
||
|
return 0;
|
||
|
}
|