[ARVADOS] created: a925c8936cba33e6d2504bd984b52750fafc638a
Git user
git at public.curoverse.com
Thu Mar 31 17:47:05 EDT 2016
at a925c8936cba33e6d2504bd984b52750fafc638a (commit)
commit a925c8936cba33e6d2504bd984b52750fafc638a
Author: Brett Smith <brett at curoverse.com>
Date: Thu Mar 31 17:46:51 2016 -0400
8811: crunch-job srun_sync detects and reports SLURM tempfails.
diff --git a/sdk/cli/bin/crunch-job b/sdk/cli/bin/crunch-job
index 4bd58a8..168f238 100755
--- a/sdk/cli/bin/crunch-job
+++ b/sdk/cli/bin/crunch-job
@@ -1984,6 +1984,11 @@ sub srun_sync
delete $reader{$jobstepidx};
my $j = pop @jobstep;
+ # If the srun showed signs of tempfail, ensure the caller treats that as a
+ # failure case.
+ if ($main::please_freeze || $j->{tempfail}) {
+ $exited ||= 255;
+ }
return ($exited, $j->{stdout_captured}, $j->{stderr_captured});
}
-----------------------------------------------------------------------
hooks/post-receive
--
More information about the arvados-commits mailing list