We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent f8470e8 commit 02318b7 (Copy full SHA for 02318b7)
dpdispatcher/dp_cloud_server_context.py
@@ -307,7 +307,7 @@ def machine_subfields(cls) -> List[Argument]:
307
"retry_count",
308
[int, type(None)],
309
optional=True,
310
- default=3,
+ default=2,
311
doc=doc_retry_count,
312
),
313
Argument(
dpdispatcher/submission.py
@@ -841,7 +841,7 @@ def handle_unexpected_job_state(self):
841
retry_count = 3
842
assert self.machine is not None
843
if hasattr(self.machine, "retry_count") and self.machine.retry_count > 0:
844
- retry_count = self.machine.retry_count
+ retry_count = self.machine.retry_count + 1
845
if (self.fail_count) > 0 and (self.fail_count % retry_count == 0):
846
raise RuntimeError(
847
f"job:{self.job_hash} {self.job_id} failed {self.fail_count} times.job_detail:{self}"
0 commit comments