[Core] Launching cluster autodowned or manually terminated #2130

Merged
merged 7 commits on Jun 26, 2023
Changes from 2 commits
19 changes: 18 additions & 1 deletion sky/backends/cloud_vm_ray_backend.py
@@ -3668,7 +3668,8 @@ def run_on_head(

    @timeline.event
    def _check_existing_cluster(
-            self, task: task_lib.Task, to_provision: resources_lib.Resources,
+            self, task: task_lib.Task,
+            to_provision: Optional[resources_lib.Resources],
            cluster_name: str) -> RetryingVmProvisioner.ToProvisionConfig:
        """Checks if the cluster exists and returns the provision config.

@@ -3678,6 +3679,8 @@ def _check_existing_cluster(
            exceptions.InvalidClusterNameError: If the cluster name is invalid.
            # TODO(zhwu): complete the list of exceptions.
        """
+        previous_handle = global_user_state.get_handle_from_cluster_name(
+            cluster_name)
        prev_cluster_status, handle = (
            backend_utils.refresh_cluster_status_handle(
                cluster_name, acquire_per_cluster_status_lock=False))
@@ -3701,6 +3704,20 @@ def _check_existing_cluster(
                      if resources.cloud is not None else clouds.Cloud)
        task_cloud.check_cluster_name_is_valid(cluster_name)

+        if to_provision is None:
+            logger.info(
+                f'The cluster {cluster_name!r} was autodowned or manually '
+                'terminated on the cloud console. Using the original resources '
+                'to provision a new cluster.')
+            # The cluster is recently terminated either by autostop or manually
+            # terminated on the cloud. We should use the original resources to
+            # provision the cluster.
+            assert isinstance(previous_handle,
+                              CloudVmRayResourceHandle), (previous_handle,
+                                                          cluster_name)
Collaborator:

Style nit: The code looks a bit ugly tbh.

Suggested change:
-            assert isinstance(previous_handle,
-                              CloudVmRayResourceHandle), (previous_handle,
-                                                          cluster_name)
+            is_cloud_vm_handle = isinstance(previous_handle,
+                                            CloudVmRayResourceHandle)
+            assert is_cloud_vm_handle, (previous_handle, cluster_name)

Collaborator (Author):

Unfortunately, mypy is not clever enough to narrow the type through this two-line assertion, so I kept the single assert and changed the assertion message to a string to make it look a bit better. PTAL. :)
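(For context, a minimal, self-contained sketch of the mypy behavior discussed above, using a hypothetical `Handle` class rather than SkyPilot's real `CloudVmRayResourceHandle`: mypy narrows an `Optional` variable after a direct `assert isinstance(...)`, but not when the `isinstance` result is first stored in a separate boolean.)

```python
from typing import Optional


class Handle:
    """Hypothetical stand-in for CloudVmRayResourceHandle."""
    launched_resources = 'dummy-resources'


def single_line_assert(previous_handle: Optional[Handle]) -> str:
    # mypy narrows previous_handle from Optional[Handle] to Handle here.
    assert isinstance(previous_handle, Handle), (
        f'No previous handle found for the cluster: {previous_handle}')
    return previous_handle.launched_resources  # OK for mypy


def two_line_assert(previous_handle: Optional[Handle]) -> str:
    # The assert only sees a plain bool, so mypy does not narrow
    # previous_handle; it is still Optional[Handle] on the last line.
    is_cloud_vm_handle = isinstance(previous_handle, Handle)
    assert is_cloud_vm_handle, (previous_handle, 'my-cluster')
    return previous_handle.launched_resources  # mypy reports a possible None
```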

+            to_provision = previous_handle.launched_resources
+            self.check_resources_fit_cluster(previous_handle, task)
+
        cloud = to_provision.cloud
        if isinstance(cloud, clouds.Local):
            # The field ssh_user is specified in the cluster config file.
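To make the intent of the diff above easier to follow, here is a rough, runnable sketch of the fallback flow under stated assumptions: every name below (`Resources`, `Handle`, `previous_handles`, `check_existing_cluster`) is a hypothetical stand-in, not SkyPilot's real API. The previously recorded handle is looked up before any status refresh, and if the caller has no resources to provision (the cluster was autodowned or terminated from the cloud console), the originally launched resources are reused.

```python
from dataclasses import dataclass
from typing import Dict, Optional


@dataclass
class Resources:
    """Hypothetical stand-in for resources_lib.Resources."""
    instance_type: str


@dataclass
class Handle:
    """Hypothetical stand-in for CloudVmRayResourceHandle."""
    launched_resources: Resources


# Plays the role of the global user state: it remembers the handle of
# every cluster that was launched, including ones that are now gone.
previous_handles: Dict[str, Handle] = {
    'my-cluster': Handle(Resources(instance_type='n1-standard-8')),
}


def check_existing_cluster(cluster_name: str,
                           to_provision: Optional[Resources]) -> Resources:
    # Look up the previously recorded handle before refreshing status,
    # since a refresh may clear the record of a terminated cluster.
    previous_handle = previous_handles.get(cluster_name)

    if to_provision is None:
        # The cluster was autodowned or manually terminated on the cloud:
        # fall back to the resources it was originally launched with.
        assert previous_handle is not None, cluster_name
        to_provision = previous_handle.launched_resources
    return to_provision


if __name__ == '__main__':
    # The caller has no cached resources (the cluster is already gone),
    # so the original launched resources are reused for re-provisioning.
    print(check_existing_cluster('my-cluster', to_provision=None))
```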
4 changes: 2 additions & 2 deletions sky/skylet/providers/oci/query_helper.py
@@ -57,7 +57,7 @@ def query_instances_by_tags(cls, tag_filters, region):

    @classmethod
    def terminate_instances_by_tags(cls, tag_filters, region) -> int:
-        logger.info(f"Terminate instance by tags: {tag_filters}")
+        logger.debug(f"Terminate instance by tags: {tag_filters}")
        insts = cls.query_instances_by_tags(tag_filters, region)
        fail_count = 0
        for inst in insts:
@@ -73,7 +73,7 @@ def terminate_instances_by_tags(cls, tag_filters, region) -> int:
                traceback.print_exc()

        if fail_count == 0:
-            logger.info(f"Instance teardown result: OK")
+            logger.debug(f"Instance teardown result: OK")
        else:
            logger.warn(f"Instance teardown result: {fail_count} failed!")