# Example .env configuration file for spark-vllm-docker
# Copy this file to .env and customize for your environment
#
# Format: one KEY="value" assignment per line; lines starting with # are comments.

# Cluster configuration
# CLUSTER_NODES: Comma-separated list of node IPs (first node is the head node)
CLUSTER_NODES="192.168.177.11,192.168.177.12"

# ETH_IF: Ethernet interface name (optional, auto-detected if not specified)
ETH_IF="enp1s0f1np1"

# IB_IF: InfiniBand interface name (optional, auto-detected if not specified)
IB_IF="rocep1s0f1,roceP2p1s0f1"

# LOCAL_IP: Local IP address (optional, auto-detected if not specified)
# Useful for solo mode or overriding auto-detection
LOCAL_IP="192.168.177.11"

# MASTER_PORT: Port for cluster coordination (default: 29501)
MASTER_PORT="29501"

# CONTAINER_NAME: Container name (default: vllm_node)
# Note: This is a configuration variable, NOT passed as env var to container
CONTAINER_NAME="vllm_node"

# Container environment variables
# Any variable starting with CONTAINER_ (except CONTAINER_NAME) will be converted to -e flags
# Example: CONTAINER_NCCL_DEBUG=INFO becomes -e NCCL_DEBUG=INFO
CONTAINER_NCCL_DEBUG="INFO"
CONTAINER_HF_TOKEN="your_huggingface_token_here"
CONTAINER_NCCL_IGNORE_CPU_AFFINITY="1"

# COPY_HOSTS: Comma-separated list of hosts for build-and-copy.sh (optional)
# Used by build-and-copy.sh to distribute images across cluster
COPY_HOSTS="192.168.177.12"

# Additional container environment variables
# CONTAINER_MAX_JOBS="16"
# CONTAINER_CUDA_VISIBLE_DEVICES="0,1"