diff --git a/sky/backends/cloud_vm_ray_backend.py b/sky/backends/cloud_vm_ray_backend.py index d6e7528135b2..ee8cdac5f25b 100644 --- a/sky/backends/cloud_vm_ray_backend.py +++ b/sky/backends/cloud_vm_ray_backend.py @@ -271,8 +271,8 @@ def get_or_fail(futures, pg) -> List[int]: ready = [] # Keep invoking ray.wait if ready is empty. This is because # ray.wait with timeout=None will only wait for 10**6 seconds, - # which will cause the task longer than 12 days returned before - # it is ready. + # which will cause tasks running for more than 12 days to return before + # becoming ready. (Such tasks are common in serving jobs.) # Reference: https://github.com/ray-project/ray/blob/ray-2.9.3/python/ray/_private/worker.py#L2845-L2846 while not ready: ready, unready = ray.wait(futures)