VectorInstitute
diff --git a/‎vec_inf/client/_client_vars.py‎
Lines changed: 3 additions & 152 deletions b/‎vec_inf/client/_client_vars.py‎
Lines changed: 3 additions & 152 deletions
@@ -1,8 +1,7 @@
 """Global variables for Vector Inference.
 
 This module contains configuration constants and templates used throughout the
-Vector Inference package, including SLURM script templates, model configurations,
-and metric definitions.
+Vector Inference package, including model configurations, and metric definitions.
 
 Constants
 ---------
@@ -19,14 +18,6 @@
 """
 
 from pathlib import Path
-from typing import TypedDict
-
-from vec_inf.client.slurm_vars import (
-    LD_LIBRARY_PATH,
-    SINGULARITY_IMAGE,
-    SINGULARITY_LOAD_CMD,
-    VLLM_NCCL_SO_PATH,
-)
 
 
 MODEL_READY_SIGNATURE = "INFO:     Application startup complete."
@@ -77,145 +68,5 @@
     "-q": "--quantization",
 }
 
-# Slurm script templates
-class ShebangConfig(TypedDict):
-    """TypedDict for SLURM script shebang configuration.
-
-    Parameters
-    ----------
-    base : str
-        Base shebang line for all SLURM scripts
-    multinode : list[str]
-        Additional SLURM directives for multi-node configurations
-    """
-
-    base: str
-    multinode: list[str]
-
-
-class ServerSetupConfig(TypedDict):
-    """TypedDict for server setup configuration.
-
-    Parameters
-    ----------
-    single_node : list[str]
-        Setup commands for single-node deployments
-    multinode : list[str]
-        Setup commands for multi-node deployments, including Ray initialization
-    """
-
-    single_node: list[str]
-    multinode: list[str]
-
-
-class SlurmScriptTemplate(TypedDict):
-    """TypedDict for complete SLURM script template configuration.
-
-    Parameters
-    ----------
-    shebang : ShebangConfig
-        Shebang and SLURM directive configuration
-    singularity_setup : list[str]
-        Commands for Singularity container setup
-    imports : str
-        Import statements and source commands
-    env_vars : list[str]
-        Environment variables to set
-    singularity_command : str
-        Template for Singularity execution command
-    activate_venv : str
-        Template for virtual environment activation
-    server_setup : ServerSetupConfig
-        Server initialization commands for different deployment modes
-    find_vllm_port : list[str]
-        Commands to find available ports for vLLM server
-    write_to_json : list[str]
-        Commands to write server configuration to JSON
-    launch_cmd : list[str]
-        vLLM server launch commands
-    """
-
-    shebang: ShebangConfig
-    singularity_setup: list[str]
-    imports: str
-    env_vars: list[str]
-    singularity_command: str
-    activate_venv: str
-    server_setup: ServerSetupConfig
-    find_vllm_port: list[str]
-    write_to_json: list[str]
-    launch_cmd: list[str]
-
-
-SLURM_SCRIPT_TEMPLATE: SlurmScriptTemplate = {
-    "shebang": {
-        "base": "#!/bin/bash",
-        "multinode": [
-            "#SBATCH --exclusive",
-            "#SBATCH --tasks-per-node=1",
-        ],
-    },
-    "singularity_setup": [
-        SINGULARITY_LOAD_CMD,
-        f"singularity exec {SINGULARITY_IMAGE} ray stop",
-    ],
-    "imports": "source {src_dir}/find_port.sh",
-    "env_vars": [
-        f"export LD_LIBRARY_PATH={LD_LIBRARY_PATH}",
-        f"export VLLM_NCCL_SO_PATH={VLLM_NCCL_SO_PATH}",
-    ],
-    "singularity_command": f"singularity exec --nv --bind {{model_weights_path}}{{additional_binds}} --containall {SINGULARITY_IMAGE}",
-    "activate_venv": "source {venv}/bin/activate",
-    "server_setup": {
-        "single_node": [
-            "\n# Find available port",
-            "head_node_ip=${SLURMD_NODENAME}",
-        ],
-        "multinode": [
-            "\n# Get list of nodes",
-            'nodes=$(scontrol show hostnames "$SLURM_JOB_NODELIST")',
-            "nodes_array=($nodes)",
-            "head_node=${nodes_array[0]}",
-            'head_node_ip=$(srun --nodes=1 --ntasks=1 -w "$head_node" hostname --ip-address)',
-            "\n# Start Ray head node",
-            "head_node_port=$(find_available_port $head_node_ip 8080 65535)",
-            "ray_head=$head_node_ip:$head_node_port",
-            'echo "Ray Head IP: $ray_head"',
-            'echo "Starting HEAD at $head_node"',
-            'srun --nodes=1 --ntasks=1 -w "$head_node" \\',
-            "    SINGULARITY_PLACEHOLDER \\",
-            '    ray start --head --node-ip-address="$head_node_ip" --port=$head_node_port \\',
-            '    --num-cpus "$SLURM_CPUS_PER_TASK" --num-gpus "$SLURM_GPUS_PER_NODE" --block &',
-            "sleep 10",
-            "\n# Start Ray worker nodes",
-            "worker_num=$((SLURM_JOB_NUM_NODES - 1))",
-            "for ((i = 1; i <= worker_num; i++)); do",
-            "    node_i=${nodes_array[$i]}",
-            '    echo "Starting WORKER $i at $node_i"',
-            '    srun --nodes=1 --ntasks=1 -w "$node_i" \\',
-            "        SINGULARITY_PLACEHOLDER \\",
-            '        ray start --address "$ray_head" \\',
-            '        --num-cpus "$SLURM_CPUS_PER_TASK" --num-gpus "$SLURM_GPUS_PER_NODE" --block &',
-            "    sleep 5",
-            "done",
-        ],
-    },
-    "find_vllm_port": [
-        "\nvllm_port_number=$(find_available_port $head_node_ip 8080 65535)",
-        'server_address="http://${head_node_ip}:${vllm_port_number}/v1"',
-    ],
-    "write_to_json": [
-        '\njson_path="{log_dir}/{model_name}.$SLURM_JOB_ID/{model_name}.$SLURM_JOB_ID.json"',
-        'jq --arg server_addr "$server_address" \\',
-        "    '. + {{\"server_address\": $server_addr}}' \\",
-        '    "$json_path" > temp.json \\',
-        '    && mv temp.json "$json_path"',
-    ],
-    "launch_cmd": [
-        "vllm serve {model_weights_path} \\",
-        "    --served-model-name {model_name} \\",
-        '    --host "0.0.0.0" \\',
-        "    --port $vllm_port_number \\",
-        "    --trust-remote-code \\",
-    ],
-}
+# Required matching arguments for batch mode
+BATCH_MODE_REQUIRED_MATCHING_ARGS = ["venv", "log_dir"]