Skip to content

Commit c3519ca

Browse files
committed
Additional pipeline job debugging
1 parent 0c68afa commit c3519ca

File tree

1 file changed

+8
-1
lines changed

1 file changed

+8
-1
lines changed

cluster/src/org/labkey/cluster/pipeline/AbstractClusterExecutionEngine.java

Lines changed: 8 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -588,7 +588,14 @@ else if (pj.getErrors() > 0)
588588
else if (pj.getActiveTaskStatus() == PipelineJob.TaskStatus.complete)
589589
{
590590
//NOTE: this can occur when the cluster job has a non-zero exit after the java process terminates.
591-
pj.getLogger().info("Pipeline job JSON marked complete, but the cluster status was: " + taskStatus);
591+
//Note: if cluster status is error, go with completed anyway
592+
pj.getLogger().info("Pipeline job JSON marked complete, but the cluster status was: " + taskStatus + ", status file was: " + (sf == null ? null : sf.getStatus()) + ", cluster job: " + mostRecent.getStatus(), new Exception());
593+
if (taskStatus == PipelineJob.TaskStatus.error && PipelineJob.TaskStatus.running.matches(sf.getStatus()))
594+
{
595+
// TODO: consider updating this?
596+
//pj.getLogger().info("Ignoring ERROR status and deferring to pipeline JSON status of " + pj.getActiveTaskStatus());
597+
//taskStatus = PipelineJob.TaskStatus.complete;
598+
}
592599
}
593600

594601
pj.getLogger().debug("setting active task status for job: " + j.getClusterId() + " to: " + taskStatus.name() + ". status was: " + pj.getActiveTaskStatus() + " (JSON) /" + sf.getStatus() + " (StatusFile) / " + status + " (Cluster), activeTaskId: " + (pj.getActiveTaskId() != null ? pj.getActiveTaskId().toString() : "no active task") + ", hostname: " + sf.getActiveHostName() + ", rowid: " + j.getRowId());

0 commit comments

Comments
 (0)