Skip to content

Commit

Permalink
check in robustify test
Browse files Browse the repository at this point in the history
Signed-off-by: Jack Luar <[email protected]>
  • Loading branch information
luarss committed Sep 12, 2024
1 parent e0f3b03 commit 9d9388b
Showing 1 changed file with 10 additions and 2 deletions.
12 changes: 10 additions & 2 deletions tools/AutoTuner/test/resume_check.py
Original file line number Diff line number Diff line change
Expand Up @@ -68,8 +68,16 @@ def test_tune_resume(self):
with managed_process(self.commands[0], shell=True) as proc:
time.sleep(120)

# Close all ray instances
subprocess.run("ray stop", shell=True)
# Keep trying to stop the ray cluster until it is stopped
while 1:
proc = subprocess.run("ray status", shell=True)
no_nodes = proc.returncode != 0
proc = subprocess.run("ray stop", shell=True)
successful = proc.returncode == 0

if no_nodes and successful:
break
time.sleep(10)

# Run the second config to completion
print("Running the second config")
Expand Down

0 comments on commit 9d9388b

Please sign in to comment.