Set up skypilot #273

Open · wants to merge 17 commits into base: main
33 changes: 32 additions & 1 deletion README.md
@@ -387,7 +387,38 @@ modal serve modal_server_vllm
```shell
modal deploy modal_server_vllm
```


## Quick Cloud Deployment

Use the `deploy_skypilot.py` script to deploy a Functionary model to various clouds with SkyPilot. A complete example command is shown after the setup steps below. Currently, the following clouds are supported:
- Lambda Labs
- RunPod

### Get Started

1. Install SkyPilot:

```bash
pip install "skypilot[all]"
```

2. Set up your cloud credentials by following the instructions [here](https://skypilot.readthedocs.io/en/latest/getting-started/installation.html#cloud-account-setup). You can verify your setup with `sky check`.

3. Run the following command to check the available arguments:
```bash
python deploy_skypilot.py --help
```

4. SkyPilot currently does not support stopping instances or opening ports on either Lambda Labs or RunPod.
For Lambda Labs, expose the server port manually in the [firewall settings](https://cloud.lambdalabs.com/firewall) before running `deploy_skypilot.py`.
For RunPod, run `deploy_skypilot.py` twice. After the first run starts, check the [RunPod Dashboard](https://www.runpod.io/console/pods) for the instance created by SkyPilot. Once the instance is up, expose the server port manually, then interrupt the first run with Ctrl-C and run the command again.

5. To stop the cluster, run the following command, then manually stop the instance in the RunPod/Lambda Labs console:
```bash
sky stop <cluster_name>
```
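
Putting the steps together, here is an illustrative end-to-end session. The cluster name, cloud, and GPU choice below are examples only; run `python deploy_skypilot.py --help` for the full list of options.

```bash
# Confirm that cloud credentials are configured correctly
sky check

# Deploy functionary-small-v3.2 on a single A100 (example values)
python deploy_skypilot.py \
    --cluster-name functionary-demo \
    --cloud runpod \
    --accelerators A100 \
    --num-accelerators 1 \
    --model meetkai/functionary-small-v3.2 \
    --port 8000

# When finished, check the cluster and stop it
sky status
sky stop functionary-demo
```

As noted in step 5, the instance must also be stopped manually in the RunPod/Lambda Labs console.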


# Use Cases

Here are a few examples of how you can use this function calling system:
198 changes: 198 additions & 0 deletions deploy_skypilot.py
@@ -0,0 +1,198 @@
import argparse
import logging

import sky

# Set up logging
logging.basicConfig(
    level=logging.INFO, format="%(asctime)s - %(levelname)s - %(message)s"
)
logger = logging.getLogger(__name__)

CLOUD_MAPPING = {
    "lambda": sky.Lambda(),
    "runpod": sky.RunPod(),
}


def get_cloud_provider(cloud_name: str) -> sky.clouds.Cloud:
    """
    Get the cloud provider object based on the given cloud name.

    Args:
        cloud_name (str): The name of the cloud provider.

    Returns:
        sky.clouds.Cloud: The corresponding cloud provider object.

    Raises:
        AssertionError: If an invalid cloud provider name is given.
    """
    assert cloud_name.lower() in CLOUD_MAPPING, f"Invalid cloud provider: {cloud_name}"
    return CLOUD_MAPPING[cloud_name.lower()]


def check_features(cloud: sky.clouds.Cloud):
    """
    Check if the cloud provider supports certain features and update arguments accordingly.

    This function checks if the given cloud provider supports stopping instances and opening ports.
    If these features are not supported, it updates the corresponding arguments and logs warnings.

    Args:
        cloud (sky.clouds.Cloud): The cloud provider object to check.

    Side effects:
        - May modify global 'args' object.
        - Logs warnings for unsupported features.
    """
    unsupported_features = cloud._unsupported_features_for_resources(None)

    if sky.clouds.CloudImplementationFeatures.STOP in unsupported_features:
        logger.warning(
            f"Stopping is not supported on {repr(cloud)}. Setting args.idle_timeout and args.down to None."
        )
        args.idle_timeout = None
        args.down = None
    if sky.clouds.CloudImplementationFeatures.OPEN_PORTS in unsupported_features:
        logger.warning(
            f"Opening port is not supported on {repr(cloud)}. Setting args.port_to_open to None. Please open port manually."
        )
        args.port_to_open = None


def form_command() -> str:
    """
    Form the command to run the vLLM server.

    This function constructs the command string to start the vLLM server
    based on the provided arguments. It includes the model, port, host,
    and optional parameters like max_model_len and tensor_parallel_size.

    Returns:
        str: The formatted command string to run the vLLM server.
    """
    command = f"cd functionary && python server_vllm.py --model {args.model} --port {args.port} --host {args.host}"
    if args.max_model_len is not None:
        command += f" --max-model-len {args.max_model_len}"
    if args.tensor_parallel_size is not None:
        command += f" --tensor-parallel-size {args.tensor_parallel_size}"
    return command


def main():
    """
    Main function to deploy a Functionary model using SkyPilot.

    This function performs the following steps:
    1. Retrieves the cloud provider based on the specified argument.
    2. Checks the features supported by the cloud provider.
    3. Creates a SkyPilot Task with the necessary setup and run commands.
    4. Sets the resources for the task, including cloud, region, accelerators, ports, and disk size.
    5. Launches the task using SkyPilot, with the specified cluster name and optional timeout settings.

    Side effects:
        - Modifies global 'args' object based on cloud provider features.
        - Launches a SkyPilot task, which may create or modify cloud resources.

    Raises:
        Any exceptions raised by SkyPilot during task creation or launch.
    """
    cloud = get_cloud_provider(cloud_name=args.cloud)
    check_features(cloud=cloud)

    task = sky.Task(
        setup="if [ ! -d 'functionary' ]; then git clone https://github.com/meetkai/functionary.git; fi && cd functionary && pip install -r requirements.txt",
        run=form_command(),
        envs=None,
        workdir=None,
    )
    task.set_resources(
        sky.Resources(
            cloud=cloud,
            region=args.region,  # None lets SkyPilot choose any region
            accelerators=f"{args.accelerators}:{args.num_accelerators}",
            ports=args.port_to_open,
            disk_size=args.disk_size,
        )
    )

    sky.launch(
        task,
        cluster_name=args.cluster_name,
        idle_minutes_to_autostop=args.idle_timeout,
        down=args.down,
    )


def parse_args():
    parser = argparse.ArgumentParser(description="Deploy Functionary with SkyPilot")
    parser.add_argument(
        "--cluster-name", type=str, required=True, help="Name of the cluster"
    )
    parser.add_argument(
        "--cloud",
        type=str,
        default=None,
        help=f"Cloud provider (default: None). Currently only supports {list(CLOUD_MAPPING.keys())}",
    )
    parser.add_argument(
        "--accelerators",
        type=str,
        default="A100",
        help="Accelerator type. Check available types with `sky show-gpus --all`",
    )
    parser.add_argument(
        "--num-accelerators",
        type=int,
        default=1,
        help="Number of accelerators. Check available values with `sky show-gpus --all`",
    )
    parser.add_argument(
        "--disk-size",
        type=int,
        default=256,
        help="The size of the OS disk in GiB. If None, defaults to 256 GiB",
    )
    parser.add_argument(
        "--region", type=str, default=None, help="Region (default: None)"
    )
    parser.add_argument(
        "--idle-timeout",
        type=int,
        default=-1,
        help="Idle timeout in minutes. `-1` means no timeout",
    )
    parser.add_argument(
        "--down",
        action="store_true",
        help="Tear down the cluster on idle timeout instead of stopping it",
    )
    parser.add_argument(
        "--model",
        type=str,
        default="meetkai/functionary-small-v3.2",
        help="Model to use",
    )
    parser.add_argument(
        "--max-model-len",
        type=int,
        default=None,
        help="Maximum model context length (defaults to the model config)",
    )
    parser.add_argument(
        "--tensor-parallel-size", type=int, default=1, help="Tensor parallel size"
    )
    parser.add_argument("--port", type=int, default=8000, help="Port to use")
    parser.add_argument("--host", type=str, default="0.0.0.0", help="Host to use")

    args = parser.parse_args()

    if args.disk_size is None:
        args.disk_size = 256
    args.disk_size = min(int(args.disk_size), 1024)  # Cap disk size at 1 TiB
    if args.idle_timeout == -1:
        args.idle_timeout = None
    args.port_to_open = args.port

    return args


if __name__ == "__main__":
    args = parse_args()
    main()