We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent c501599 commit 6980317 Copy full SHA for 6980317
1 file changed
benchmarks/multi_node/llm-d/job.slurm
@@ -12,9 +12,13 @@ set -euo pipefail
12
echo "=== llm-d job start ==="
13
echo "UTC: $(TZ=UTC date '+%Y-%m-%d %H:%M:%S %Z')"
14
15
-# Repo root (benchmarks/multi_node/llm-d/job.slurm -> ../../..)
16
-DI_REPO_DIR=$(cd "$(dirname "$0")/../../.." && pwd)
+# Repo root. $(pwd) = the sbatch submit dir, which the wrapper sets to
+# benchmarks/multi_node/llm-d/ before invoking submit.sh, so 3 up =
17
+# repo root. Using $(dirname "$0") would resolve to a SLURM staging
18
+# copy under /var/spool/... and miss the checkout entirely.
19
+DI_REPO_DIR=$(cd "$(pwd)/../../.." && pwd)
20
export DI_REPO_DIR
21
+echo "REPO DIR: ${DI_REPO_DIR}"
22
23
ALL_NODES=$(scontrol show hostnames "$SLURM_JOB_NODELIST")
24
TOTAL_NODES=$(echo "$ALL_NODES" | wc -l)
0 commit comments