fixed several workflow/spectre related bugs

This commit is contained in:
JT Smith 2006-03-18 23:25:31 +00:00
parent ccf1b3633f
commit 9b9b63cc12
7 changed files with 134 additions and 115 deletions

View file

@ -16,18 +16,20 @@
"maxWorkers" : 3,
# How many seconds should Spectre wait between spawning jobs. This
# How many seconds should Spectre wait between spawning jobs This
# can help avoid creating a denial of service attack on overworked
# or underpowered servers.
"timeBetweenJobs" : 5,
"timeBetweenRunningWorkflows" : 5,
# The number of seconds that Spectre should wait after an activity
# has been suspended before it should start it back up again. An
# activity may be suspended if it's waiting on user input, or
# if it returns an error.
# has been suspended before it should start it back up again. This
# gives other workflows a chance to run if one particular workflow
# has a lot of activites in it, and provides an opportunity to
# bypass workflows that are waiting for input from an external
# source.
"delayAfterSuspension" : 500
"delayAfterSuspension" : 60
}

View file

@ -110,14 +110,19 @@ sub new {
name => 'Spectre',
);
POE::Session->create(
object_states => [ $self => {_start=>"_start", _stop=>"_stop", "shutdown"=>"_stop"} ],
args=>[["shutdown"]]
object_states => [ $self => {_start=>"_start", _stop=>"_stop", "shutdown"=>"_stop","test"=>"test"} ],
args=>[["shutdown","test"]]
);
$self->{_cron} = Spectre::Cron->new($config, $debug);
$self->{_workflow} = Spectre::Workflow->new($config, $debug);
POE::Kernel->run();
}
sub test {
my $arg = $_[ARG1];
use JSON;
print objToJson($arg);
}
1;

View file

@ -38,7 +38,7 @@ sub _start {
foreach my $config (keys %{$configs}) {
$kernel->yield("loadWorkflows", $configs->{$config});
}
$kernel->yield("checkJobs");
$kernel->yield("checkInstances");
}
#-------------------------------------------------------------------
@ -59,53 +59,60 @@ sub _stop {
#-------------------------------------------------------------------
=head2 addJob ( config, job )
=head2 addInstance ( params )
Adds a workflow job to the workflow processing queue.
Adds a workflow instance to the workflow processing queue.
=head3 config
=head3 params
The config file name for the site that this job belongs to.
A hash reference containing important information about the workflow instance to add to the queue.
=head3 job
=head4 sitename
A hash reference containing a row of data from the WorkflowInstance table.
The host and domain of the site this instance belongs to.
=head3 instanceId
The unqiue id for this workflow instance.
=head3 priority
The priority (1,2, or 3) that this instance should be run at.
=cut
sub addJob {
my ($self, $config, $job) = @_[OBJECT, ARG0, ARG1];
$self->debug("Adding workflow instance ".$job->{instanceId}." from ".$config->getFilename." to job queue at priority ".$job->{priority}.".");
my $sitename = $config->get("sitename");
$self->{_jobs}{$job->{instanceId}} = {
sitename=>$sitename->[0],
instanceId=>$job->{instanceId},
sub addInstance {
my ($self, $params) = @_[OBJECT, ARG0];
$self->debug("Adding workflow instance ".$params->{instanceId}." from ".$params->{sitename}." to queue at priority ".$params->{priority}.".");
$self->{_instances}{$params->{instanceId}} = {
sitename=>$params->{sitename},
instanceId=>$params->{instanceId},
status=>"waiting",
priority=>$job->{priority}
priority=>$params->{priority}
};
push(@{$self->{"_priority".$job->{priority}}}, $self->{_jobs}{$job->{instanceId}});
push(@{$self->{"_priority".$params->{priority}}}, $params->{instanceId});
}
#-------------------------------------------------------------------
=head2 checkJobs ( )
=head2 checkInstances ( )
Checks to see if there are any open job slots available, and if there are assigns a new job to be run to fill it.
Checks to see if there are any open instance slots available, and if there are assigns a new instance to be run to fill it.
=cut
sub checkJobs {
sub checkInstances {
my ($kernel, $self) = @_[KERNEL, OBJECT];
$self->debug("Checking to see if we can run anymore jobs right now.");
if ($self->countRunningJobs < $self->config->get("maxWorkers")) {
my $job = $self->getNextJob;
if (defined $job) {
$job->{status} = "running";
push(@{$self->{_runningJobs}}, $job);
$kernel->yield("runWorker",$job);
$self->debug("Checking to see if we can run anymore instances right now.");
if ($self->countRunningInstances < $self->config->get("maxWorkers")) {
my $instance = $self->getNextInstance;
if (defined $instance) {
$instance->{status} = "running";
push(@{$self->{_runningInstances}}, $instance->{instanceId});
$kernel->yield("runWorker",$instance);
}
}
$kernel->delay_set("checkJobs",$self->config->get("timeBetweenJobs"));
$kernel->delay_set("checkInstances",$self->config->get("timeBetweenRunningWorkflows"));
}
#-------------------------------------------------------------------
@ -123,18 +130,18 @@ sub config {
#-------------------------------------------------------------------
=head2 countRunningJobs ( )
=head2 countRunningInstances ( )
Returns an integer representing the number of running jobs.
Returns an integer representing the number of running instances.
=cut
sub countRunningJobs {
sub countRunningInstances {
my $self = shift;
my $runningJobs = $self->{_runningJobs} || [];
my $jobCount = scalar(@{$runningJobs});
$self->debug("There are $jobCount running jobs.");
return $jobCount;
my $runningInstances = $self->{_runningInstances} || [];
my $instanceCount = scalar(@{$runningInstances});
$self->debug("There are $instanceCount running instances.");
return $instanceCount;
}
#-------------------------------------------------------------------
@ -157,43 +164,46 @@ sub debug {
#-------------------------------------------------------------------
=head2 deleteJob ( instanceId )
=head2 deleteInstance ( instanceId )
Removes a workflow job from the processing queue.
Removes a workflow instance from the processing queue.
=cut
sub deleteJob {
my ($self, $instanceId,$kernel) = @_[OBJECT, ARG0, KERNEL];
$kernel->yield("suspendJob",$instanceId);
$self->debug("Deleting workflow instance $instanceId from job queue.");
my $priority = $self->{_jobs}{$instanceId}{priority};
delete $self->{_jobs}{$instanceId};
for (my $i=0; $i < scalar(@{$self->{"_priority".$priority}}); $i++) {
if ($self->{"_priority".$priority}[$i]{instanceId} eq $instanceId) {
splice(@{$self->{"_priority".$priority}}, $i, 1);
sub deleteInstance {
my ($self, $instanceId,$kernel, $session ) = @_[OBJECT, ARG0, KERNEL, SESSION];
$kernel->call($session, "suspendInstance",$instanceId);
$self->debug("Deleting workflow instance $instanceId from instance queue.");
if ($self->{_instances}{$instanceId}) {
my $priority = $self->{_instances}{$instanceId}{priority};
delete $self->{_instances}{$instanceId};
for (my $i=0; $i < scalar(@{$self->{"_priority".$priority}}); $i++) {
if ($self->{"_priority".$priority}[$i] eq $instanceId) {
splice(@{$self->{"_priority".$priority}}, $i, 1);
}
}
}
}
#-------------------------------------------------------------------
=head2 getNextJob ( )
=head2 getNextInstance ( )
=cut
sub getNextJob {
sub getNextInstance {
my $self = shift;
$self->debug("Looking for a workflow instance to execute.");
$self->debug("Looking for a workflow instance to run.");
foreach my $priority (1..3) {
foreach my $job (@{$self->{"_priority".$priority}}) {
if (time() > $job->{statusDelay} & $job->{status}) {
delete $job->{statusDelay};
$job->{status} eq "waiting";
foreach my $instanceId (@{$self->{"_priority".$priority}}) {
if (time() > $self->{_instances}{$instanceId}{statusDelay} && $self->{_instances}{$instanceId}{status} eq "delay") {
$self->debug("Returning $instanceId to available pool.");
delete $self->{_instances}{$instanceId}{statusDelay};
$self->{_instances}{$instanceId}{status} = "waiting";
}
if ($job->{status} eq "waiting") {
$self->debug("Looks like ".$job->{instanceId}." would be a good workflow instance to run.");
return $job;
if ($self->{_instances}{$instanceId}{status} eq "waiting") {
$self->debug("Looks like ".$instanceId." would be a good workflow instance to run.");
return $self->{_instances}{$instanceId};
}
}
}
@ -211,9 +221,9 @@ sub loadWorkflows {
my ($kernel, $self, $config) = @_[KERNEL, OBJECT, ARG0];
$self->debug("Loading workflows for ".$config->getFilename.".");
my $session = WebGUI::Session->open($config->getWebguiRoot, $config->getFilename);
my $result = $session->db->read("select * from WorkflowInstance");
while (my $data = $result->hashRef) {
$kernel->yield("addJob", $config, $data);
my $result = $session->db->read("select instanceId,priority from WorkflowInstance");
while (my ($id, $priority) = $result->array) {
$kernel->yield("addInstance", {sitename=>$config->get("sitename")->[0], instanceId=>$id, priority=>$priority});
}
$session->close;
}
@ -240,9 +250,9 @@ sub new {
my $debug = shift;
my $self = {_debug=>$debug, _config=>$config};
bless $self, $class;
my @publicEvents = qw(addJob deleteJob);
my @publicEvents = qw(addInstance deleteInstance);
POE::Session->create(
object_states => [ $self => [qw(_start _stop checkJobs deleteJob suspendJob loadWorkflows runWorker workerResponse), @publicEvents] ],
object_states => [ $self => [qw(_start _stop addInstance checkInstances deleteInstance suspendInstance loadWorkflows runWorker workerResponse), @publicEvents] ],
args=>[\@publicEvents]
);
}
@ -256,36 +266,38 @@ Calls a worker to execute a workflow activity.
=cut
sub runWorker {
my ($kernel, $self, $job, $session) = @_[KERNEL, OBJECT, ARG0, SESSION];
$self->debug("Preparing to run workflow instance ".$job->{instanceId}.".");
my ($kernel, $self, $instance, $session) = @_[KERNEL, OBJECT, ARG0, SESSION];
$self->debug("Preparing to run workflow instance ".$instance->{instanceId}.".");
POE::Component::Client::UserAgent->new;
my $url = "http://".$job->{sitename}.'/';
my $request = POST $url, [op=>"runWorkflow", instanceId=>$job->{instanceId}];
my $cookie = $self->{_cookies}{$job->{sitename}};
my $url = "http://".$instance->{sitename}.'/';
my $request = POST $url, [op=>"runWorkflow", instanceId=>$instance->{instanceId}];
my $cookie = $self->{_cookies}{$instance->{sitename}};
$request->header("Cookie","wgSession=".$cookie) if (defined $cookie);
$request->header("User-Agent","Spectre");
$request->header("X-JobId",$job->{instanceId});
$self->debug("Posting workflow instance ".$job->{instanceId}." to $url.");
$request->header("X-instanceId",$instance->{instanceId});
$self->debug("Posting workflow instance ".$instance->{instanceId}." to $url.");
$kernel->post( useragent => 'request', { request => $request, response => $session->postback('workerResponse') });
$self->debug("Workflow instance ".$job->{instanceId}." posted.");
$self->debug("Workflow instance ".$instance->{instanceId}." posted.");
}
#-------------------------------------------------------------------
=head2 suspendJob ( )
=head2 suspendInstance ( )
This method puts a running job back into the available jobs pool thusly freeing up a slot in the running jobs pool. This is done when a job has executed a workflow activity, but the entire workflow has not yet completed.
This method puts a running instance back into the available instances pool thusly freeing up a slot in the running instances pool. This is done when a instance has executed a workflow activity, but the entire workflow has not yet completed.
=cut
sub suspendJob {
sub suspendInstance {
my ($self, $instanceId) = @_[OBJECT, ARG0];
$self->debug("Suspending workflow instance ".$instanceId.".");
$self->{_jobs}{$instanceId}{status} = "delay";
$self->{_jobs}{$instanceId}{statusDelay} = $self->config->get("delayAfterSuspension") + time();
for (my $i=0; $i < scalar(@{$self->{_runningJobs}}); $i++) {
if ($self->{_runningJobs}[$i]{instanceId} eq $instanceId) {
splice(@{$self->{_runningJobs}}, $i, 1);
$self->debug("Suspending workflow instance ".$instanceId." for ".$self->config->get("delayAfterSuspension")." seconds.");
if ($self->{_instances}{$instanceId}) {
$self->{_instances}{$instanceId}{status} = "delay";
$self->{_instances}{$instanceId}{statusDelay} = $self->config->get("delayAfterSuspension") + time();
for (my $i=0; $i < scalar(@{$self->{_runningInstances}}); $i++) {
if ($self->{_runningInstances}[$i] eq $instanceId) {
splice(@{$self->{_runningInstances}}, $i, 1);
}
}
}
}
@ -300,44 +312,44 @@ This method is called when the response from the runWorker() method is received.
sub workerResponse {
my ($self, $kernel) = @_[OBJECT, KERNEL];
$self->debug("Retrieving response from workflow instance job.");
$self->debug("Retrieving response from workflow instance.");
my ($request, $response, $entry) = @{$_[ARG1]};
my $jobId = $request->header("X-JobId"); # got to figure out how to get this from the request, cuz the response may die
$self->debug("Response retrieved is for $jobId.");
my $instanceId = $request->header("X-instanceId"); # got to figure out how to get this from the request, cuz the response may die
$self->debug("Response retrieved is for $instanceId.");
if ($response->is_success) {
$self->debug("Response for $jobId retrieved successfully.");
$self->debug("Response for $instanceId retrieved successfully.");
if ($response->header("Cookie") ne "") {
$self->debug("Storing cookie for $jobId for later use.");
$self->debug("Storing cookie for $instanceId for later use.");
my $cookie = $response->header("Set-Cookie");
$cookie =~ s/wgSession=([a-zA-Z0-9\_\-]{22})/$1/;
$self->{_cookies}{$self->{_jobs}{$jobId}{sitename}} = $cookie;
$self->{_cookies}{$self->{_instances}{$instanceId}{sitename}} = $cookie;
}
my $state = $response->content;
if ($state eq "waiting") {
$self->debug("Was told to wait on $jobId because we're still waiting on some external event.");
$kernel->yield("suspendJob",$jobId);
$self->debug("Was told to wait on $instanceId because we're still waiting on some external event.");
$kernel->yield("suspendInstance",$instanceId);
} elsif ($state eq "complete") {
$self->debug("Workflow instance $jobId ran one of it's activities successfully.");
$kernel->yield("suspendJob",$jobId);
$self->debug("Workflow instance $instanceId ran one of it's activities successfully.");
$kernel->yield("suspendInstance",$instanceId);
} elsif ($state eq "disabled") {
$self->debug("Workflow instance $jobId is disabled.");
$kernel->yield("deleteJob",$jobId);
$self->debug("Workflow instance $instanceId is disabled.");
$kernel->yield("suspendInstance",$instanceId);
} elsif ($state eq "done") {
$self->debug("Workflow instance $jobId is now complete.");
$kernel->yield("deleteJob",$jobId);
$self->debug("Workflow instance $instanceId is now complete.");
$kernel->yield("deleteInstance",$instanceId);
} elsif ($state eq "error") {
$self->debug("Got an error for $jobId.");
$kernel->yield("suspendJob",$jobId);
$self->debug("Got an error for $instanceId.");
$kernel->yield("suspendInstance",$instanceId);
} else {
$self->debug("Something bad happened on the return of $jobId.");
$kernel->yield("suspendJob",$jobId);
$self->debug("Something bad happened on the return of $instanceId.");
$kernel->yield("suspendInstance",$instanceId);
# something bad happened
}
} elsif ($response->is_redirect) {
$self->debug("Response for $jobId was redirected.");
$self->debug("Response for $instanceId was redirected.");
} elsif ($response->is_error) {
$self->debug("Response for $jobId had a communications error.");
$kernel->yield("suspendJob",$jobId)
$self->debug("Response for $instanceId had a communications error.");
$kernel->yield("suspendInstance",$instanceId)
# we should probably log something
}
}

View file

@ -207,8 +207,8 @@ sub www_commitVersionTagConfirm {
my $tag = WebGUI::VersionTag->new($session, $tagId);
if (defined $tag && $session->user->isInGroup($tag->get("groupToUse"))) {
$tag->set({comments=>$session->form->process("comments", "textarea")});
$tag->commit;
#$tag->requestCommit;
# $tag->commit;
$tag->requestCommit;
my $i18n = WebGUI::International->new($session, "VersionTag");
my $ac = WebGUI::AdminConsole->new($session,"versions");
return $ac->render(

View file

@ -84,7 +84,7 @@ sub delete {
my $self = shift;
$self->session->db->write("delete from WorkflowInstanceScratch where instanceId=?",[$self->getId]);
$self->session->db->deleteRow("WorkflowInstance","instanceId",$self->getId);
WebGUI::Workflow::Spectre->new($self->session)->notify("workflow/deleteJob",$self->getId);
WebGUI::Workflow::Spectre->new($self->session)->notify("workflow/deleteInstance",$self->getId);
undef $self;
}
@ -306,8 +306,8 @@ sub set {
$self->{_data}{lastUpdate} = time();
$self->session->db->setRow("WorkflowInstance","instanceId",$self->{_data});
my $spectre = WebGUI::Workflow::Spectre->new($self->session);
$spectre->notify("workflow/deleteJob",$self->getId);
$spectre->notify("workflow/addJob",$self->session->config->getFilename, $self->{_data});
$spectre->notify("workflow/deleteInstance",$self->getId);
$spectre->notify("workflow/addInstance", {sitename=>$self->session->config->get("sitename")->[0], instanceId=>$self->getId, priority=>$self->{_data}{priority}});
}
#-------------------------------------------------------------------

View file

@ -81,7 +81,7 @@ sub notify {
timeout=>10
);
if ($remote) {
my $result = $remote->post('admin/shutdown', @params);
my $result = $remote->post(@params);
unless (defined $result) {
$self->session->errorHandler->warn("Couldn't send command to Spectre because ".$POE::Component::IKC::ClientLite::error);
}

View file

@ -35,8 +35,8 @@ if ($help || !($shutdown||$daemon||$run)) {
print <<STOP;
S.P.E.C.T.R.E. is the Supervisor of Perplexing Event-handling Contraptions for
Triggering Relentless Executions. It handles WebGUI's workflow, mail sending,
search engine indexing, and other background processes.
Triggering Relentless Executions. It triggers WebGUI's workflow and scheduling
functions.
Usage: perl spectre.pl [ options ]