Skip to content

Commit

Permalink
fix: set jobStatus=Failed (minorStatus "Payload failed") only if the job was running
Browse files Browse the repository at this point in the history
  • Loading branch information
fstagni committed Nov 22, 2023
1 parent 2881a6e commit a797a63
Showing 1 changed file with 8 additions and 2 deletions.
10 changes: 8 additions & 2 deletions src/DIRAC/WorkloadManagementSystem/Agent/JobAgent.py
Original file line number Diff line number Diff line change
Expand Up @@ -32,6 +32,7 @@
from DIRAC.WorkloadManagementSystem.Client.MatcherClient import MatcherClient
from DIRAC.WorkloadManagementSystem.Client.PilotManagerClient import PilotManagerClient
from DIRAC.WorkloadManagementSystem.Client.JobManagerClient import JobManagerClient
from DIRAC.WorkloadManagementSystem.Client.JobMonitoringClient import JobMonitoringClient
from DIRAC.WorkloadManagementSystem.Client.JobStateUpdateClient import JobStateUpdateClient
from DIRAC.WorkloadManagementSystem.Client.JobReport import JobReport
from DIRAC.WorkloadManagementSystem.Client import JobStatus
Expand Down Expand Up @@ -691,7 +692,7 @@ def _checkSubmittedJobs(self):
payloadErrors = []
originalJobID = self.jobReport.jobID
for jobID, taskID in self.submissionDict.items():
if not taskID in self.computingElement.taskResults:
if taskID not in self.computingElement.taskResults:
continue

result = self.computingElement.taskResults[taskID]
Expand All @@ -714,7 +715,12 @@ def _checkSubmittedJobs(self):

# The payload failed (if result["Value"] is not 0)
elif result["Value"]:
self.jobReport.setJobStatus(status=JobStatus.FAILED, minorStatus="Payload failed")
# To avoid overriding perfectly valid states, the status is updated only if the job's current status is Running
res = JobMonitoringClient().getJobsStatus(jobID)
if not res["OK"]:
return res
if res["Value"][jobID]["Status"] == JobStatus.RUNNING:
self.jobReport.setJobStatus(status=JobStatus.FAILED, minorStatus="Payload failed")

# Do not keep running and do not overwrite the Payload error
message = f"Payload execution failed with error code {result['Value']}"
Expand Down

0 comments on commit a797a63

Please sign in to comment.