Skip to content

Commit

Permalink
increased badWorkedFailInterval and added more failure attempts (#2936)
Browse files (browse the repository at this point in the history)
  • Loading branch information
jeffrey856 authored and adamnovak committed Jan 23, 2020
1 parent 38c2fd8 commit 74596b3
Showing 1 changed file with 2 additions and 2 deletions.
4 changes: 2 additions & 2 deletions src/toil/test/src/jobServiceTest.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -162,7 +162,7 @@ def testServiceParallelRecursive(self, checkpoint=True):
finally:
list(map(os.remove, outFiles))

def runToil(self, rootJob, retryCount=1, badWorker=0.5, badWorkedFailInterval=0.05, maxServiceJobs=sys.maxsize, deadlockWait=60):
def runToil(self, rootJob, retryCount=1, badWorker=0.5, badWorkedFailInterval=0.1, maxServiceJobs=sys.maxsize, deadlockWait=60):
# Create the runner for the workflow.
options = Job.Runner.getDefaultOptions(self._getTestJobStorePath())
options.logLevel = "DEBUG"
Expand All @@ -182,7 +182,7 @@ def runToil(self, rootJob, retryCount=1, badWorker=0.5, badWorkedFailInterval=0.
break
except FailedJobsException as e:
i = e.numberOfFailedJobs
if totalTrys > 40: #p(fail after this many restarts) = 0.5**32
if totalTrys > 50: #p(fail after this many restarts) = 0.5**32
self.fail() #Exceeded a reasonable number of restarts
totalTrys += 1
options.restart = True
Expand Down

0 comments on commit 74596b3

Please sign in to comment.