start mce port

This commit is contained in:
Oliver Gorwits
2013-01-01 19:16:59 +00:00
parent c8e741b63c
commit e2b9fd3430
3 changed files with 138 additions and 102 deletions

View File

@@ -1,88 +1,76 @@
#!/usr/bin/env perl #!/usr/bin/env perl
# fix for older Perl which warns about a bug in File::Slurp
BEGIN {
no warnings 'portable';
use File::Slurp;
}
use FindBin; use FindBin;
use lib "$FindBin::Bin/../lib"; use lib "$FindBin::Bin/../lib";
use App::Netdisco; use App::Netdisco;
# for netdisco app config
use Dancer qw/:moose :script/; use Dancer qw/:moose :script/;
use Dancer::Plugin::DBIC 'schema';
use Daemon::Generic::While1; # callbacks and local job queue management
use Parallel::Prefork; use App::Netdisco::Daemon::Queue ':all';
use Net::Domain 'hostfqdn';
use MCE;
use Role::Tiny; use Role::Tiny;
use Try::Tiny; use Path::Class 'dir';
# Parallel::Prefork instance my $mce = MCE->new(
my $pp = undef; tmp_dir => dir($ENV{HOME}, 'tmp'),
spawn_delay => 0.15,
job_delay => 0.15,
user_func => \&call_worker_body,
on_post_exit => \&restart_worker,
user_tasks => build_tasks_list(),
)->run();
# track worker pids and their roles sub call_worker_body {
my %workers = (); my ($self) = @_;
my $next_role = undef; $self->worker_body if $self->can('worker_body');
}
# must come after globals initialization sub restart_worker {
newdaemon( my ($self, $e) = @_;
progname => 'netdisco-daemon', reset_jobs($e->{wid});
($> != 0 ? (pidbase => './') : ()), $self->restart_worker($e->{wid});
logpriority => 'daemon.info', }
);
sub gd_preconfig { sub build_tasks_list {
my $gd = shift; my $tasks = [{
max_workers => 1,
# used for locking jobs in central Pg queue user_begin => worker_factory('Manager'),
$gd->{nd_host} = hostfqdn; }];
set(daemon_pollers => 2) set(daemon_pollers => 2)
if !defined setting('daemon_pollers'); if !defined setting('daemon_pollers');
set(daemon_interactives => 2) set(daemon_interactives => 2)
if !defined setting('daemon_interactives'); if !defined setting('daemon_interactives');
# need to do this after setting defaults # XXX MCE does not like max_workers => 0
$pp = Parallel::Prefork->new(
max_workers => (1 + setting('daemon_pollers')
+ setting('daemon_interactives')),
spawn_interval => 2,
before_fork => \&set_next_worker_role,
after_fork => \&register_worker,
on_child_reap => \&unregister_worker,
trap_signals => {
TERM => 'TERM',
INT => 'TERM',
},
);
# do not remove this line - required by Daemon::Generic push @$tasks, {
return (); max_workers => setting('daemon_pollers'),
user_begin => worker_factory('Poller'),
} if setting('daemon_pollers');
push @$tasks, {
max_workers => setting('daemon_interactives'),
user_begin => worker_factory('Interactive'),
} if setting('daemon_interactives');
return $tasks;
} }
# main loop sub worker_factory {
sub gd_run_body { my $role = shift;
my $gd = shift; return sub {
my $self = shift;
$gd->handle_term # with "App::Netdisco::Daemon::Worker::$role";
if $pp->signal_received =~ m/^(?:TERM|INT)$/; $self->worker_begin if $self->can('worker_begin');
};
$pp->start(sub {
print STDERR ">>> new $next_role worker starting...\n";
with "App::Netdisco::Daemon::Worker::$next_role";
$gd->worker_begin if $gd->can('worker_begin');
$gd->worker_body;
$gd->worker_end if $gd->can('worker_end');
});
# I don't think Parallel::Prefork ever returns from start()
# until a child exits. Not sure this is ever reached.
$gd->gd_sleep( setting('daemon_sleep_time') || 5 )
if not $pp->signal_received;
} }
__END__
sub register_worker { sub register_worker {
my (undef, $pid) = @_; my (undef, $pid) = @_;
$workers{$pid} = $next_role; $workers{$pid} = $next_role;
@@ -102,44 +90,3 @@ sub unregister_worker {
catch { warn "error reverting jobs for pid $pid: $_\n" }; catch { warn "error reverting jobs for pid $pid: $_\n" };
} }
sub set_next_worker_role {
my $pp = shift;
$next_role = _find_next_worker_role();
}
sub _find_next_worker_role {
my @cur = values %workers;
my $manager = scalar grep {$_ eq 'Manager'} @cur;
my $poller = scalar grep {$_ eq 'Poller'} @cur;
my $inter = scalar grep {$_ eq 'Interactive'} @cur;
return 'Manager' if $manager < 1;
my $need_poller = $poller < setting('daemon_pollers');
my $need_inter = $inter < setting('daemon_interactives');
if ($need_poller and $need_inter) {
return (int(rand(2)) ? 'Interactive' : 'Poller');
}
return 'Interactive' if $need_inter;
return 'Poller' if $need_poller;
}
sub handle_term {
my $gd = shift;
$pp->wait_all_children;
$gd->gd_quit_event
}
# in case we screw up and die ourselves
END {
if (defined $pp) {
$pp->signal_all_children('TERM');
$pp->wait_all_children;
}
}
# nullify this to permit Parallel::Prefork to register handlers instead
sub gd_setup_signals {}

View File

@@ -12,6 +12,13 @@ __PACKAGE__->add_columns(
data_type => "integer", data_type => "integer",
is_nullable => 0, is_nullable => 0,
}, },
"role", # Poller, Interactive, etc
{ data_type => "text", is_nullable => 0 },
"wid", # worker ID, only assigned once taken
{ data_type => "integer", is_nullable => 1 },
"started", "started",
{ data_type => "timestamp", is_nullable => 1 }, { data_type => "timestamp", is_nullable => 1 },
"finished", "finished",

View File

@@ -0,0 +1,82 @@
package App::Netdisco::Daemon::Queue;
use Dancer qw/:moose :syntax :script/;
use Dancer::Plugin::DBIC 'schema';
use Try::Tiny;
use base 'Exporter';
our @EXPORT = ();
our @EXPORT_OK = qw/ add_jobs take_jobs reset_jobs /;
our %EXPORT_TAGS = ( all => \@EXPORT_OK );
{
my $daemon = schema('daemon');
# deploy local db if not already done
try {
$daemon->storage->dbh_do(sub {
my ($storage, $dbh) = @_;
$dbh->selectrow_arrayref("SELECT * FROM admin WHERE 0 = 1");
});
}
catch {
$daemon->txn_do(sub {
$daemon->storage->disconnect;
$daemon->deploy;
});
};
$daemon->storage->disconnect;
if ($daemon->get_db_version < $daemon->schema_version) {
$daemon->txn_do(sub { $daemon->upgrade });
}
# empty local db of any stale queued jobs
$daemon->resultset('Admin')->delete;
}
sub add_jobs {
my ($jobs) = @_;
try { schema('daemon')->resultset('Admin')->populate($jobs) }
catch { warn "error adding jobs: $_\n" };
}
sub take_jobs {
my ($wid, $role, $max) = @_;
my $jobs = [];
my $rs = schema('daemon')->resultset('Admin')
->search({role => $role, status => 'queued'});
while (my $job = $rs->next) {
last if scalar $jobs eq $max;
try {
schema('daemon')->txn_do(sub {
my $row = schema('daemon')->resultset('Admin')->find(
{job => $job->job},
{for => 'update'}
);
if ($row->status eq 'queued') {
$row->update({status => 'taken', wid => $wid});
push @$jobs, $row->get_columns;
}
});
};
}
return $jobs;
}
sub reset_jobs {
my ($wid) = @_;
try {
schema('daemon')->resultset('Admin')
->search({wid => $wid})
->update({wid => undef, status => 'queued', started => undef});
}
catch { warn "error resetting jobs for wid [$wid]: $_\n" };
}
1;