Bugfix: don't shut down on exit if cluster is already running
This commit is contained in:
@@ -22,6 +22,7 @@ COMMAND_TO_RUN=""
|
|||||||
DAEMON_MODE="false"
|
DAEMON_MODE="false"
|
||||||
CHECK_CONFIG="false"
|
CHECK_CONFIG="false"
|
||||||
ACTION="start"
|
ACTION="start"
|
||||||
|
CLUSTER_WAS_RUNNING="false"
|
||||||
|
|
||||||
# Function to print usage
|
# Function to print usage
|
||||||
usage() {
|
usage() {
|
||||||
@@ -275,6 +276,11 @@ cleanup() {
|
|||||||
# Remove traps to prevent nested cleanup
|
# Remove traps to prevent nested cleanup
|
||||||
trap - EXIT INT TERM HUP
|
trap - EXIT INT TERM HUP
|
||||||
|
|
||||||
|
if [[ "$CLUSTER_WAS_RUNNING" == "true" ]]; then
|
||||||
|
echo "Cluster was already running when script started. Skipping cleanup."
|
||||||
|
return
|
||||||
|
fi
|
||||||
|
|
||||||
echo ""
|
echo ""
|
||||||
echo "Stopping cluster..."
|
echo "Stopping cluster..."
|
||||||
|
|
||||||
@@ -347,8 +353,9 @@ check_cluster_running() {
|
|||||||
done
|
done
|
||||||
|
|
||||||
if [[ "$running" == "true" ]]; then
|
if [[ "$running" == "true" ]]; then
|
||||||
echo "Cluster containers are already running. Please stop them first or use a different name."
|
echo "Cluster containers are already running. Skipping launch."
|
||||||
exit 1
|
CLUSTER_WAS_RUNNING="true"
|
||||||
|
return 0
|
||||||
fi
|
fi
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -356,6 +363,10 @@ check_cluster_running() {
|
|||||||
start_cluster() {
|
start_cluster() {
|
||||||
check_cluster_running
|
check_cluster_running
|
||||||
|
|
||||||
|
if [[ "$CLUSTER_WAS_RUNNING" == "true" ]]; then
|
||||||
|
return
|
||||||
|
fi
|
||||||
|
|
||||||
# Start Head Node
|
# Start Head Node
|
||||||
echo "Starting Head Node on $HEAD_IP..."
|
echo "Starting Head Node on $HEAD_IP..."
|
||||||
docker run -d --privileged --gpus all --rm \
|
docker run -d --privileged --gpus all --rm \
|
||||||
|
|||||||
Reference in New Issue
Block a user