From 0377e9badf770c77814d2ce3565e784817ab7cb8 Mon Sep 17 00:00:00 2001 From: Eugene Rakhmatulin Date: Thu, 18 Dec 2025 23:12:39 -0800 Subject: [PATCH] Bugfix: don't shut down on exit if cluster is already running --- launch-cluster.sh | 15 +++++++++++++-- 1 file changed, 13 insertions(+), 2 deletions(-) diff --git a/launch-cluster.sh b/launch-cluster.sh index 09e8b85..56fd05b 100755 --- a/launch-cluster.sh +++ b/launch-cluster.sh @@ -22,6 +22,7 @@ COMMAND_TO_RUN="" DAEMON_MODE="false" CHECK_CONFIG="false" ACTION="start" +CLUSTER_WAS_RUNNING="false" # Function to print usage usage() { @@ -275,6 +276,11 @@ cleanup() { # Remove traps to prevent nested cleanup trap - EXIT INT TERM HUP + if [[ "$CLUSTER_WAS_RUNNING" == "true" ]]; then + echo "Cluster was already running when script started. Skipping cleanup." + return + fi + echo "" echo "Stopping cluster..." @@ -347,8 +353,9 @@ check_cluster_running() { done if [[ "$running" == "true" ]]; then - echo "Cluster containers are already running. Please stop them first or use a different name." - exit 1 + echo "Cluster containers are already running. Skipping launch." + CLUSTER_WAS_RUNNING="true" + return 0 fi } @@ -356,6 +363,10 @@ check_cluster_running() { start_cluster() { check_cluster_running + if [[ "$CLUSTER_WAS_RUNNING" == "true" ]]; then + return + fi + # Start Head Node echo "Starting Head Node on $HEAD_IP..." docker run -d --privileged --gpus all --rm \