pve-manager/bin/pvestatd
Alexandre Derumier e3ae2c58c0 pvestatd : add template value to rrd
we need it for resourcestore

Signed-off-by: Alexandre Derumier <aderumier@odiso.com>
2013-02-15 10:21:31 +01:00

480 lines
10 KiB
Perl
Executable File

#!/usr/bin/perl -w
use strict;
use PVE::SafeSyslog;
use POSIX ":sys_wait_h";
use Fcntl ':flock';
use Getopt::Long;
use Time::HiRes qw (gettimeofday);
use PVE::Tools qw(dir_glob_foreach file_read_firstline);
use PVE::ProcFSTools;
use Filesys::Df;
use PVE::INotify;
use PVE::Cluster qw(cfs_read_file);
use PVE::Storage;
use PVE::QemuServer;
use PVE::OpenVZ;
use PVE::RPCEnvironment;
use PVE::API2::Subscription;
use PVE::AutoBalloon;
# Send every Perl warning to syslog instead of STDERR. $@ is saved before
# and restored after the syslog call so that a warning raised while an
# exception is pending cannot overwrite it.
$SIG{__WARN__} = sub {
    my ($text) = @_;

    my $saved_error = $@;
    chomp $text;
    syslog('warning', "WARNING: %s", $text);
    $@ = $saved_error;
};

initlog('pvestatd');

# run all external commands with a fixed search path
$ENV{PATH} = '/sbin:/bin:/usr/sbin:/usr/bin';

# $> is the effective user id
if ($> != 0) {
    die "please run as root\n";
}

my $nodename = PVE::INotify::nodename();

# the only supported command line switch is --debug
my $opt_debug;
GetOptions('debug' => \$opt_debug)
    or die "USAGE: $0 [--debug]\n";

my $opt_pidfile = "/var/run/pvestatd.pid";
# Take an exclusive, non-blocking lock on "<pidfile>.lock".
#
# Parameters:
#   $pidfile - path of the pid file; the lock file name is derived from it
#              by appending ".lock"
#
# The lock file is opened on the package-global handle FLCK. On success the
# handle is deliberately left open, so the lock is still held after this
# sub returns.
#
# Dies with "ERROR: ..." (after logging the same text to syslog) if the
# lock file cannot be opened or the lock cannot be obtained.
sub lockpidfile {
    my $pidfile = shift;

    my $lkfn = "$pidfile.lock";

    # three-argument open: the file name is taken literally and is never
    # scanned for mode characters or surrounding whitespace
    if (!open(FLCK, '>>', $lkfn)) {
        my $msg = "can't aquire lock on file '$lkfn' - $!";
        # pass the text as data, not as the format string
        syslog('err', "%s", $msg);
        die "ERROR: $msg\n";
    }

    if (!flock(FLCK, LOCK_EX|LOCK_NB)) {
        # build the message first: close() may overwrite $!
        my $msg = "can't aquire lock '$lkfn' - $!";
        close(FLCK);
        syslog('err', "%s", $msg);
        die "ERROR: $msg\n";
    }
}
# Write the current process id, followed by a newline, to $pidfile,
# replacing any previous content.
#
# Parameters:
#   $pidfile - path of the pid file to (re)create
#
# Returns 1 on success. Dies with "ERROR: ..." (after logging the same text
# to syslog) if the file cannot be opened or written.
sub writepidfile {
    my $pidfile = shift;

    # lexical handle and three-argument open: the name is used literally
    my $fh;
    if (!open($fh, '>', $pidfile)) {
        my $msg = "can't open pid file '$pidfile' - $!";
        # pass the text as data, not as the format string
        syslog('err', "%s", $msg);
        die "ERROR: $msg\n";
    }

    # buffered write errors may only show up at close, so check both
    if (!(print {$fh} "$$\n") || !close($fh)) {
        my $msg = "can't write pid file '$pidfile' - $!";
        syslog('err', "%s", $msg);
        die "ERROR: $msg\n";
    }

    return 1;
}
# try to get the lock
lockpidfile($opt_pidfile);

# run in background
my $spid;

# restart_server() sets this variable before re-executing the script
my $restart = $ENV{RESTART_PVESTATD};

if (!$opt_debug) {
    # 'or', not '||': with '||' the die was attached to the (always true)
    # file name string, so a failed open went unnoticed
    open(STDIN, '<', '/dev/null') or die "can't read /dev/null";
    open(STDOUT, '>', '/dev/null') or die "can't write /dev/null";
}

# fork into the background on a normal start only; after a restart, and in
# debug mode, the current process keeps running
if (!$restart && !$opt_debug) {
    $spid = fork();
    if (!defined ($spid)) {
        my $msg = "can't put server into background - fork failed";
        syslog('err', $msg);
        die "ERROR: $msg\n";
    } elsif ($spid) { #parent
        exit (0);
    }
}

# written after the fork so the file holds the pid of the running daemon
writepidfile($opt_pidfile);

# send STDERR to wherever STDOUT points
open(STDERR, '>&STDOUT') or die "can't close STDERR\n";
# Remove the lock file and then the pid file. Failures are ignored; the
# return value is that of the second unlink.
sub cleanup {
    my $lockfile = "$opt_pidfile.lock";

    unlink($lockfile);
    return unlink("$opt_pidfile");
}
# INT, TERM and QUIT all shut the daemon down in the same way: log, reap
# any finished children, remove pid/lock files and exit.
foreach my $signame (qw(QUIT TERM INT)) {
    $SIG{$signame} = sub {
        syslog('info' , "server closing");

        $SIG{INT} = 'DEFAULT';

        # wait for children
        while (waitpid(-1, POSIX::WNOHANG()) > 0) {
            # nothing to do, just reap
        }

        cleanup();

        exit (0);
    };
}

PVE::INotify::inotify_init();

# set by the HUP handler; checked and cleared by the main loop
my $reload_config;

syslog('info' , $restart ? "restarting server" : "starting server");

$SIG{HUP} = sub {
    $reload_config = 1;
};
# Gather host statistics (uptime, subscription level, load, cpu, memory,
# swap, root file system usage, network traffic) and broadcast them as one
# colon separated record under the key "pve2-node/<nodename>".
sub update_node_status {

    # only the first value returned by read_loadavg() is reported
    my ($avg1) = PVE::ProcFSTools::read_loadavg();

    my $stat = PVE::ProcFSTools::read_proc_stat();

    my $netdev = PVE::ProcFSTools::read_proc_net_dev();

    my ($uptime) = PVE::ProcFSTools::read_proc_uptime();

    my $cpuinfo = PVE::ProcFSTools::read_cpuinfo();
    my $maxcpu = $cpuinfo->{cpus};

    my $subinfo = PVE::INotify::read_file('subscription');
    my $sublevel = $subinfo->{level} || '';

    # traffic from/to physical interface cards (devices named eth<N> only)
    my ($netin, $netout) = (0, 0);
    foreach my $dev (grep { $_ =~ m/^eth\d+$/ } keys %$netdev) {
        my $counters = $netdev->{$dev};
        $netin += $counters->{receive};
        $netout += $counters->{transmit};
    }

    my $meminfo = PVE::ProcFSTools::read_meminfo();

    my $dinfo = df('/', 1); # output is bytes

    my $ctime = time();

    # everything not free is considered to be used
    my $dused = $dinfo->{blocks} - $dinfo->{bfree};

    my $data = "$uptime:$sublevel:$ctime:$avg1:$maxcpu:$stat->{cpu}:$stat->{wait}:";
    $data .= "$meminfo->{memtotal}:$meminfo->{memused}:";
    $data .= "$meminfo->{swaptotal}:$meminfo->{swapused}:";
    $data .= "$dinfo->{blocks}:$dused:$netin:$netout";

    PVE::Cluster::broadcast_rrd("pve2-node/$nodename", $data);
}
# Adjust the balloon size of the VMs so that overall host memory usage
# moves towards 80% of total memory.
#
# Parameters:
#   $vmstatus - hash ref keyed by vmid; the 'balloon' field of each entry is
#               read here, and the whole structure is handed to
#               PVE::AutoBalloon::compute_alg1()
#
# Errors from a single balloon command are turned into warnings so that the
# remaining VMs are still processed.
sub auto_balloning {
    my ($vmstatus) = @_;

    # debug output, printed only when running with --debug
    my $log = sub {
        print @_ if $opt_debug;
    };

    my $hostmeminfo = PVE::ProcFSTools::read_meminfo();

    # to debug, run 'pvestatd -d' and set memtotal here
    #$hostmeminfo->{memtotal} = int(2*1024*1024*1024/0.8); # you can set this to test

    my $hostfreemem = $hostmeminfo->{memtotal} - $hostmeminfo->{memused};

    # we try to use about 80% host memory
    # goal: we want to change memory usage by this amount (positive or negative)
    my $goal = int($hostmeminfo->{memtotal}*0.8 - $hostmeminfo->{memused});

    # upper bound handed to the algorithm (100 MiB)
    my $maxchange = 100*1024*1024;
    my $res = PVE::AutoBalloon::compute_alg1($vmstatus, $goal, $maxchange);

    $log->("host goal: $goal free: $hostfreemem total: $hostmeminfo->{memtotal}\n");

    foreach my $vmid (keys %$vmstatus) {
        # no (or zero) target computed for this VM
        next if !$res->{$vmid};

        my $d = $vmstatus->{$vmid};
        my $diff = int($res->{$vmid} - $d->{balloon});

        # nothing to do when the target equals the current balloon value
        next unless abs($diff) > 0;

        $log->("BALLOON $vmid to $res->{$vmid} ($diff)\n");
        eval {
            PVE::QemuServer::vm_mon_cmd($vmid, "balloon",
                                        value => int($res->{$vmid}));
        };
        warn $@ if $@;
    }
}
# Run auto ballooning and then broadcast one colon separated status record
# per qemu VM under the key "pve2.3-vm/<vmid>".
#
# A ballooning failure is logged and does not prevent the status broadcast.
sub update_qemu_status {

    my $ctime = time();

    my $vmstatus = PVE::QemuServer::vmstatus(undef, 1);

    eval { auto_balloning($vmstatus); };
    syslog('err', "auto ballooning error: $@") if $@;

    foreach my $vmid (keys %$vmstatus) {
        my $d = $vmstatus->{$vmid};

        my $status = $d->{qmpstatus} || $d->{status} || 'stopped';
        my $template = $d->{template} || "0";

        my $data;
        if (!$d->{pid}) {
            # not running: uptime is 0 and the cpu, mem, net and disk io
            # fields are left empty
            $data = "0:$d->{name}:$status:$template:$ctime:$d->{cpus}::";
            $data .= "$d->{maxmem}::";
            $data .= "$d->{maxdisk}:$d->{disk}:";
            $data .= ":::";
        } else {
            # running: all fields are filled in
            $data = "$d->{uptime}:$d->{name}:$status:$template:";
            $data .= "$ctime:$d->{cpus}:$d->{cpu}:";
            $data .= "$d->{maxmem}:$d->{mem}:";
            $data .= "$d->{maxdisk}:$d->{disk}:";
            $data .= "$d->{netin}:$d->{netout}:";
            $data .= "$d->{diskread}:$d->{diskwrite}";
        }

        PVE::Cluster::broadcast_rrd("pve2.3-vm/$vmid", $data);
    }
}
# Scan the numeric entries below /proc for processes whose command line is
# exactly "vzctl console <vmid>" (vzctl optionally given as
# /usr/sbin/vzctl).
#
# Returns a hash ref mapping each vmid to an array ref of matching pids.
sub find_vzctl_console_pids {

    my $res = {};

    dir_glob_foreach('/proc', '\d+', sub {
        my ($pid) = @_;

        my $cmdline = file_read_firstline("/proc/$pid/cmdline");
        return if !$cmdline;

        # the arguments in /proc/<pid>/cmdline are separated by NUL bytes
        my @args = split(/\0/, $cmdline);

        # search for vzctl console <vmid>
        return unless scalar(@args) == 3;

        my ($prog, $action, $vmid) = @args;
        return unless $action eq 'console';
        return unless $vmid =~ m/^\d+$/;
        return unless $prog =~ m|^(/usr/sbin/)?vzctl$|;

        push @{$res->{$vmid}}, $pid;
    });

    return $res;
}
# Kill (signal 9) every "vzctl console" process whose container id no
# longer appears in the OpenVZ status list.
sub remove_stale_openvz_consoles {

    my $vmstatus = PVE::OpenVZ::vmstatus();
    my $pidhash = find_vzctl_console_pids();

    # console processes for containers that are not in the status list
    my @stale = grep { !defined($vmstatus->{$_}) } keys %$pidhash;

    foreach my $vmid (@stale) {
        syslog('info', "remove stale vzctl console for CT $vmid");
        kill(9, $_) foreach @{$pidhash->{$vmid}};
    }
}
# Broadcast one colon separated status record per OpenVZ container under
# the key "pve2.3-vm/<vmid>". The fourth field is always 0 for containers.
sub update_openvz_status {

    my $ctime = time();

    my $vmstatus = PVE::OpenVZ::vmstatus();

    foreach my $vmid (keys %$vmstatus) {
        my $d = $vmstatus->{$vmid};

        my $data;
        if ($d->{status} ne 'running') {
            # not running: uptime is 0 and the cpu, mem, net and disk io
            # fields are left empty
            $data = "0:$d->{name}:$d->{status}:0:$ctime:$d->{cpus}::";
            $data .= "$d->{maxmem}::";
            $data .= "$d->{maxdisk}:$d->{disk}:";
            $data .= ":::";
        } else {
            # running: all fields are filled in
            $data = "$d->{uptime}:$d->{name}:$d->{status}:0:$ctime:$d->{cpus}:$d->{cpu}:";
            $data .= "$d->{maxmem}:$d->{mem}:";
            $data .= "$d->{maxdisk}:$d->{disk}:";
            $data .= "$d->{netin}:$d->{netout}:";
            $data .= "$d->{diskread}:$d->{diskwrite}";
        }

        PVE::Cluster::broadcast_rrd("pve2.3-vm/$vmid", $data);
    }
}
# Broadcast "<time>:<total>:<used>" for every active storage under the key
# "pve2-storage/<nodename>/<storeid>". Inactive storages are skipped.
sub update_storage_status {

    my $cfg = cfs_read_file("storage.cfg");

    my $ctime = time();

    my $info = PVE::Storage::storage_info($cfg);

    foreach my $storeid (keys %$info) {
        my $d = $info->{$storeid};

        if ($d->{active}) {
            # everything not free is considered to be used
            my $realused = $d->{total} - $d->{avail};

            PVE::Cluster::broadcast_rrd(
                "pve2-storage/${nodename}/$storeid",
                "$ctime:$d->{total}:$realused");
        }
    }
}
# Run all status collectors, one after the other. Every step is wrapped in
# its own eval, so a failing step is logged to syslog and the remaining
# steps still run.
sub update_status {

    # [ log prefix (undef = log the error text as is), code to run ]
    my @steps = (
        # update worker list. This is not really required and
        # we just call this to make sure that we have a correct
        # list in case of an unexpected crash.
        [ undef, sub {
            my $tlist = PVE::RPCEnvironment::active_workers();
            PVE::Cluster::broadcast_tasklist($tlist);
        } ],
        [ "node status update error", \&update_node_status ],
        [ "qemu status update error", \&update_qemu_status ],
        [ "openvz status update error", \&update_openvz_status ],
        [ "storage status update error", \&update_storage_status ],
        [ "openvz console cleanup error", \&remove_stale_openvz_consoles ],
    );

    foreach my $step (@steps) {
        my ($prefix, $code) = @$step;

        eval {
            $code->();
        };
        my $err = $@;
        next if !$err;

        syslog('err', defined($prefix) ? "$prefix: $err" : $err);
    }
}
# time (epoch seconds) at which the next update cycle is due
my $next_update = 0;

# number of completed main loop iterations
# do not update directly after startup, because install scripts
# have a problem with that
my $cycle = 0;

# seconds between two update cycles
my $updatetime = 10;

# Remember how to re-execute ourselves before $0 is overwritten below.
# NOTE(review): @ARGV has already been processed by GetOptions() at this
# point, so recognized switches such as --debug are presumably no longer
# part of it - confirm this is intended.
my $commandline = [$0, @ARGV];

# process name shown in process listings
$0 = "pvestatd";
# Replace the running process with a fresh instance of this script.
#
# Parameters:
#   $waittime - optional number of seconds to sleep before the exec
#
# RESTART_PVESTATD is set in the environment so that the new instance can
# tell a restart from a normal start. Does not return.
sub restart_server {
    my ($waittime) = @_;

    syslog('info', "server shutdown (restart)");

    $ENV{RESTART_PVESTATD} = 1;

    # avoid high server load due to restarts
    if ($waittime) {
        sleep($waittime);
    }

    exec (@$commandline);
    exit (-1); # only reached when exec itself fails
}
# resident memory size used as baseline for the leak check below
my $initial_memory_usage;

# Main loop: one status update per $updatetime seconds, forever. Any error
# that escapes the outer eval is logged and answered with a delayed restart.
while (1) {

    eval {

        $next_update = time() + $updatetime;

        # the very first iteration ($cycle == 0) skips the update
        if ($cycle) {
            my ($start_sec, $start_usec) = gettimeofday ();

            eval {
                $reload_config = 0;
                # syslog('info', "start status update");
                PVE::Cluster::cfs_update();
                update_status();
            };
            if (my $update_err = $@) {
                syslog('err', "status update error: $update_err");
            }

            my ($end_sec, $end_usec) = gettimeofday ();
            my $elapsed = ($end_sec - $start_sec) + ($end_usec - $start_usec)/1000000;

            # report updates that took longer than 5 seconds
            if ($elapsed > 5) {
                syslog('info', sprintf("status update time (%.3f seconds)", $elapsed));
            }
        }

        $cycle++;

        my $mem = PVE::ProcFSTools::read_memory_usage();

        if (defined($initial_memory_usage) && ($cycle >= 10)) {
            # baseline is fixed from cycle 10 on: restart once resident
            # memory has grown by more than 5 MiB
            my $diff = $mem->{resident} - $initial_memory_usage;
            if ($diff > 5*1024*1024) {
                syslog ('info', "restarting server after $cycle cycles to " .
                        "reduce memory usage (free $mem->{resident} ($diff) bytes)");
                restart_server ();
            }
        } else {
            # still warming up: keep tracking the current size as baseline
            $initial_memory_usage = $mem->{resident};
        }

        # sleep in one second steps until the next update is due, or until
        # the HUP handler has set $reload_config
        for (my $waited = 0;
             (time() < $next_update) &&
             ($waited < $updatetime) && # protect against time wrap
             !$reload_config;
             $waited++) {
            sleep (1);
        }
    };

    if (my $loop_err = $@) {
        syslog ('err', "ERROR: $loop_err");
        restart_server(5);
        exit (0);
    }
}

exit (0);
__END__
=head1 NAME

pvestatd - PVE Status Daemon

=head1 SYNOPSIS

pvestatd

=head1 DESCRIPTION

Documentation is available at www.proxmox.com