pve-common/src/PVE/RESTEnvironment.pm
Wolfgang Bumiller 2311859b0d fork_worker: guard more setup code with eval
As it might die with an error which should end up in the
_exit() code path rather than bailing out into the upper
scope.

Signed-off-by: Wolfgang Bumiller <w.bumiller@proxmox.com>
Reviewed-by: Thomas Lamprecht <t.lamprecht@proxmox.com>
2018-01-10 14:12:34 +01:00

707 lines
16 KiB
Perl

package PVE::RESTEnvironment;
# NOTE: you can/should provide your own specialice class, and
# use this a bas class (as example see PVE::RPCEnvironment).
# we use this singleton class to pass RPC related environment values
use strict;
use warnings;
use POSIX qw(:sys_wait_h EINTR);
use IO::Handle;
use IO::File;
use IO::Select;
use Fcntl qw(:flock);
use PVE::Exception qw(raise raise_perm_exc);
use PVE::SafeSyslog;
use PVE::Tools;
use PVE::INotify;
use PVE::ProcFSTools;
my $rest_env;
# save $SIG{CHLD} handler implementation.
# simply set $SIG{CHLD} = $worker_reaper;
# and register forked processes with &$register_worker(pid)
# Note: using $SIG{CHLD} = 'IGNORE' or $SIG{CHLD} = sub { wait (); } or ...
# has serious side effects, because perls built in system() and open()
# functions can't get the correct exit status of a child. So we cant use
# that (also see perlipc)
my $WORKER_PIDS;
my $WORKER_FLAG = 0;
my $log_task_result = sub {
my ($upid, $user, $status) = @_;
return if !$rest_env;
my $msg = 'successful';
my $pri = 'info';
if ($status != 0) {
my $ec = $status >> 8;
my $ic = $status & 255;
$msg = $ec ? "failed ($ec)" : "interrupted ($ic)";
$pri = 'err';
}
my $tlist = $rest_env->active_workers($upid);
eval { $rest_env->broadcast_tasklist($tlist); };
syslog('err', $@) if $@;
my $task;
foreach my $t (@$tlist) {
if ($t->{upid} eq $upid) {
$task = $t;
last;
}
}
if ($task && $task->{status}) {
$msg = $task->{status};
}
$rest_env->log_cluster_msg($pri, $user, "end task $upid $msg");
};
my $worker_reaper = sub {
local $!; local $?;
foreach my $pid (keys %$WORKER_PIDS) {
my $waitpid = waitpid ($pid, WNOHANG);
if (defined($waitpid) && ($waitpid == $pid)) {
my $info = $WORKER_PIDS->{$pid};
if ($info && $info->{upid} && $info->{user}) {
&$log_task_result($info->{upid}, $info->{user}, $?);
}
delete ($WORKER_PIDS->{$pid});
}
}
};
my $register_worker = sub {
my ($pid, $user, $upid) = @_;
return if !$pid;
# do not register if already finished
my $waitpid = waitpid ($pid, WNOHANG);
if (defined($waitpid) && ($waitpid == $pid)) {
delete ($WORKER_PIDS->{$pid});
return;
}
$WORKER_PIDS->{$pid} = {
user => $user,
upid => $upid,
};
};
# initialize environment - must be called once at program startup
sub init {
my ($class, $type, %params) = @_;
$class = ref($class) || $class;
die "already initialized" if $rest_env;
die "unknown environment type"
if !$type || $type !~ m/^(cli|pub|priv|ha)$/;
$SIG{CHLD} = $worker_reaper;
# environment types
# cli ... command started fron command line
# pub ... access from public server (apache)
# priv ... access from private server (pvedaemon)
# ha ... access from HA resource manager agent (rgmanager)
my $self = { type => $type };
bless $self, $class;
foreach my $p (keys %params) {
if ($p eq 'atfork') {
$self->{$p} = $params{$p};
} else {
die "unknown option '$p'";
}
}
$rest_env = $self;
my ($sysname, $nodename) = POSIX::uname();
$nodename =~ s/\..*$//; # strip domain part, if any
$self->{nodename} = $nodename;
return $self;
};
# convenience function for command line tools
sub setup_default_cli_env {
my ($class, $username) = @_;
$class = ref($class) || $class;
$username //= 'root@pam';
PVE::INotify::inotify_init();
my $rpcenv = $class->init('cli');
$rpcenv->init_request();
$rpcenv->set_language($ENV{LANG});
$rpcenv->set_user($username);
die "please run as root\n"
if ($username eq 'root@pam') && ($> != 0);
}
# get the singleton
sub get {
die "REST environment not initialized" if !$rest_env;
return $rest_env;
}
sub set_client_ip {
my ($self, $ip) = @_;
$self->{client_ip} = $ip;
}
sub get_client_ip {
my ($self) = @_;
return $self->{client_ip};
}
sub set_result_attrib {
my ($self, $key, $value) = @_;
$self->{result_attributes}->{$key} = $value;
}
sub get_result_attrib {
my ($self, $key) = @_;
return $self->{result_attributes}->{$key};
}
sub set_language {
my ($self, $lang) = @_;
# fixme: initialize I18N
$self->{language} = $lang;
}
sub get_language {
my ($self) = @_;
return $self->{language};
}
sub set_user {
my ($self, $user) = @_;
$self->{user} = $user;
}
sub get_user {
my ($self, $noerr) = @_;
return $self->{user} if defined($self->{user}) || $noerr;
die "user name not set\n";
}
sub is_worker {
my ($class) = @_;
return $WORKER_FLAG;
}
# read/update list of active workers
# we move all finished tasks to the archive index,
# but keep aktive and most recent task in the active file.
# $nocheck ... consider $new_upid still running (avoid that
# we try to read the reult to early.
sub active_workers {
my ($self, $new_upid, $nocheck) = @_;
my $lkfn = "/var/log/pve/tasks/.active.lock";
my $timeout = 10;
my $code = sub {
my $tasklist = PVE::INotify::read_file('active');
my @ta;
my $tlist = [];
my $thash = {}; # only list task once
my $check_task = sub {
my ($task, $running) = @_;
if ($running || PVE::ProcFSTools::check_process_running($task->{pid}, $task->{pstart})) {
push @$tlist, $task;
} else {
delete $task->{pid};
push @ta, $task;
}
delete $task->{pstart};
};
foreach my $task (@$tasklist) {
my $upid = $task->{upid};
next if $thash->{$upid};
$thash->{$upid} = $task;
&$check_task($task);
}
if ($new_upid && !(my $task = $thash->{$new_upid})) {
$task = PVE::Tools::upid_decode($new_upid);
$task->{upid} = $new_upid;
$thash->{$new_upid} = $task;
&$check_task($task, $nocheck);
}
@ta = sort { $b->{starttime} cmp $a->{starttime} } @ta;
my $save = defined($new_upid);
foreach my $task (@ta) {
next if $task->{endtime};
$task->{endtime} = time();
$task->{status} = PVE::Tools::upid_read_status($task->{upid});
$save = 1;
}
my $archive = '';
my @arlist = ();
foreach my $task (@ta) {
if (!$task->{saved}) {
$archive .= sprintf("%s %08X %s\n", $task->{upid}, $task->{endtime}, $task->{status});
$save = 1;
push @arlist, $task;
$task->{saved} = 1;
}
}
if ($archive) {
my $size = 0;
my $filename = "/var/log/pve/tasks/index";
eval {
my $fh = IO::File->new($filename, '>>', 0644) ||
die "unable to open file '$filename' - $!\n";
PVE::Tools::safe_print($filename, $fh, $archive);
$size = -s $fh;
close($fh) ||
die "unable to close file '$filename' - $!\n";
};
my $err = $@;
if ($err) {
syslog('err', $err);
foreach my $task (@arlist) { # mark as not saved
$task->{saved} = 0;
}
}
my $maxsize = 50000; # about 1000 entries
if ($size > $maxsize) {
rename($filename, "$filename.1");
}
}
# we try to reduce the amount of data
# list all running tasks and task and a few others
# try to limit to 25 tasks
my $max = 25 - scalar(@$tlist);
foreach my $task (@ta) {
last if $max <= 0;
push @$tlist, $task;
$max--;
}
PVE::INotify::write_file('active', $tlist) if $save;
return $tlist;
};
my $res = PVE::Tools::lock_file($lkfn, $timeout, $code);
die $@ if $@;
return $res;
}
my $kill_process_group = sub {
my ($pid, $pstart) = @_;
# send kill to process group (negative pid)
my $kpid = -$pid;
# always send signal to all pgrp members
kill(15, $kpid); # send TERM signal
# give max 5 seconds to shut down
for (my $i = 0; $i < 5; $i++) {
return if !PVE::ProcFSTools::check_process_running($pid, $pstart);
sleep (1);
}
# to be sure
kill(9, $kpid);
};
sub check_worker {
my ($self, $upid, $killit) = @_;
my $task = PVE::Tools::upid_decode($upid);
my $running = PVE::ProcFSTools::check_process_running($task->{pid}, $task->{pstart});
return 0 if !$running;
if ($killit) {
&$kill_process_group($task->{pid});
return 0;
}
return 1;
}
# acts almost as tee: writes an output both to STDOUT and a task log,
# we differ as we're worker aware and look also at the childs control pipe,
# so we know if the function could be executed successfully or not.
my $tee_worker = sub {
my ($childfd, $ctrlfd, $taskfh, $cpid) = @_;
eval {
my $int_count = 0;
local $SIG{INT} = local $SIG{QUIT} = local $SIG{TERM} = sub {
# always send signal to all pgrp members
my $kpid = -$cpid;
if ($int_count < 3) {
kill(15, $kpid); # send TERM signal
} else {
kill(9, $kpid); # send KILL signal
}
$int_count++;
};
local $SIG{PIPE} = sub { die "broken pipe\n"; };
my $select = new IO::Select;
my $fh = IO::Handle->new_from_fd($childfd, 'r');
$select->add($fh);
my $readbuf = '';
my $count;
while ($select->count) {
my @handles = $select->can_read(1);
if (scalar(@handles)) {
my $count = sysread ($handles[0], $readbuf, 4096);
if (!defined ($count)) {
my $err = $!;
die "sync pipe read error: $err\n";
}
last if $count == 0; # eof
print $readbuf;
select->flush();
print $taskfh $readbuf;
$taskfh->flush();
} else {
# some commands daemonize without closing stdout
last if !PVE::ProcFSTools::check_process_running($cpid);
}
}
# get status (error or OK)
POSIX::read($ctrlfd, $readbuf, 4096);
if ($readbuf =~ m/^TASK OK\n?$/) {
# skip printing to stdout
print $taskfh $readbuf;
} elsif ($readbuf =~ m/^TASK ERROR: (.*)\n?$/) {
print STDERR "$1\n";
print $taskfh "\n$readbuf"; # ensure start on new line for webUI
} else {
die "got unexpected control message: $readbuf\n";
}
$taskfh->flush();
};
my $err = $@;
POSIX::close($childfd);
POSIX::close($ctrlfd);
if ($err) {
$err =~ s/\n/ /mg;
print STDERR "$err\n";
print $taskfh "TASK ERROR: $err\n";
}
};
# start long running workers
# STDIN is redirected to /dev/null
# STDOUT,STDERR are redirected to the filename returned by upid_decode
# NOTE: we simulate running in foreground if ($self->{type} eq 'cli')
sub fork_worker {
my ($self, $dtype, $id, $user, $function, $background) = @_;
$dtype = 'unknown' if !defined ($dtype);
$id = '' if !defined ($id);
$user = 'root@pve' if !defined ($user);
my $sync = ($self->{type} eq 'cli' && !$background) ? 1 : 0;
local $SIG{INT} =
local $SIG{QUIT} =
local $SIG{PIPE} =
local $SIG{TERM} = 'IGNORE';
my $starttime = time ();
my @psync = POSIX::pipe();
my @csync = POSIX::pipe();
my @ctrlfd = POSIX::pipe() if $sync;
my $node = $self->{nodename};
my $cpid = fork();
die "unable to fork worker - $!" if !defined($cpid);
my $workerpuid = $cpid ? $cpid : $$;
my $pstart = PVE::ProcFSTools::read_proc_starttime($workerpuid) ||
die "unable to read process start time";
my $upid = PVE::Tools::upid_encode ({
node => $node, pid => $workerpuid, pstart => $pstart,
starttime => $starttime, type => $dtype, id => $id, user => $user });
my $outfh;
if (!$cpid) { # child
$0 = "task $upid";
$WORKER_FLAG = 1;
$SIG{INT} = $SIG{QUIT} = $SIG{TERM} = sub { die "received interrupt\n"; };
$SIG{CHLD} = $SIG{PIPE} = 'DEFAULT';
# set sess/process group - we want to be able to kill the
# whole process group
POSIX::setsid();
POSIX::close ($psync[0]);
POSIX::close ($ctrlfd[0]) if $sync;
POSIX::close ($csync[1]);
$outfh = $sync ? $psync[1] : undef;
my $resfh = $sync ? $ctrlfd[1] : undef;
eval {
PVE::INotify::inotify_close();
if (my $atfork = $self->{atfork}) {
&$atfork();
}
# same algorythm as used inside SA
# STDIN = /dev/null
my $fd = fileno (STDIN);
if (!$sync) {
close STDIN;
POSIX::close(0) if $fd != 0;
die "unable to redirect STDIN - $!"
if !open(STDIN, "</dev/null");
$outfh = PVE::Tools::upid_open($upid);
$resfh = fileno($outfh);
}
# redirect STDOUT
$fd = fileno(STDOUT);
close STDOUT;
POSIX::close (1) if $fd != 1;
die "unable to redirect STDOUT - $!"
if !open(STDOUT, ">&", $outfh);
STDOUT->autoflush (1);
# redirect STDERR to STDOUT
$fd = fileno (STDERR);
close STDERR;
POSIX::close(2) if $fd != 2;
die "unable to redirect STDERR - $!"
if !open(STDERR, ">&1");
STDERR->autoflush(1);
};
if (my $err = $@) {
my $msg = "ERROR: $err";
POSIX::write($psync[1], $msg, length ($msg));
POSIX::close($psync[1]);
POSIX::_exit(1);
kill(-9, $$);
}
# sync with parent (signal that we are ready)
POSIX::write($psync[1], $upid, length ($upid));
POSIX::close($psync[1]) if !$sync; # don't need output pipe if async
eval {
my $readbuf = '';
# sync with parent (wait until parent is ready)
POSIX::read($csync[0], $readbuf, 4096);
die "parent setup error\n" if $readbuf ne 'OK';
if ($self->{type} eq 'ha') {
print "task started by HA resource agent\n";
}
&$function($upid);
};
my $err = $@;
if ($err) {
chomp $err;
$err =~ s/\n/ /mg;
syslog('err', $err);
my $msg = "TASK ERROR: $err\n";
POSIX::write($resfh, $msg, length($msg));
POSIX::close($resfh) if $sync;
POSIX::_exit(-1);
} else {
my $msg = "TASK OK\n";
POSIX::write($resfh, $msg, length($msg));
POSIX::close($resfh) if $sync;
POSIX::_exit(0);
}
kill(-9, $$);
}
# parent
POSIX::close ($psync[1]);
POSIX::close ($ctrlfd[1]) if $sync;
POSIX::close ($csync[0]);
my $readbuf = '';
# sync with child (wait until child starts)
POSIX::read($psync[0], $readbuf, 4096);
if (!$sync) {
POSIX::close($psync[0]);
&$register_worker($cpid, $user, $upid);
} else {
chomp $readbuf;
}
eval {
die "got no worker upid - start worker failed\n" if !$readbuf;
if ($readbuf =~ m/^ERROR:\s*(.+)$/m) {
die "starting worker failed: $1\n";
}
if ($readbuf ne $upid) {
die "got strange worker upid ('$readbuf' != '$upid') - start worker failed\n";
}
if ($sync) {
$outfh = PVE::Tools::upid_open($upid);
}
};
my $err = $@;
if (!$err) {
my $msg = 'OK';
POSIX::write($csync[1], $msg, length ($msg));
POSIX::close($csync[1]);
} else {
POSIX::close($csync[1]);
kill(-9, $cpid); # make sure it gets killed
die $err;
}
$self->log_cluster_msg('info', $user, "starting task $upid");
my $tlist = $self->active_workers($upid, $sync);
eval { $self->broadcast_tasklist($tlist); };
syslog('err', $@) if $@;
my $res = 0;
if ($sync) {
$tee_worker->($psync[0], $ctrlfd[0], $outfh, $cpid);
&$kill_process_group($cpid, $pstart); # make sure it gets killed
close($outfh);
waitpid($cpid, 0);
$res = $?;
&$log_task_result($upid, $user, $res);
}
return wantarray ? ($upid, $res) : $upid;
}
# Abstract function
sub log_cluster_msg {
my ($self, $pri, $user, $msg) = @_;
syslog($pri, "%s", $msg);
# PVE::Cluster::log_msg($pri, $user, $msg);
}
sub broadcast_tasklist {
my ($self, $tlist) = @_;
# PVE::Cluster::broadcast_tasklist($tlist);
}
sub check_api2_permissions {
my ($self, $perm, $username, $param) = @_;
return 1 if !$username && $perm->{user} eq 'world';
raise_perm_exc("user != null") if !$username;
return 1 if $username eq 'root@pam';
raise_perm_exc('user != root@pam') if !$perm;
return 1 if $perm->{user} && $perm->{user} eq 'all';
##return $self->exec_api2_perm_check($perm->{check}, $username, $param)
##if $perm->{check};
raise_perm_exc();
}
# init_request - should be called before each REST/CLI request
sub init_request {
my ($self, %params) = @_;
$self->{result_attributes} = {}
# if you nedd more, implement in subclass
}
1;