#!/bin/bash
#SBATCH --job-name=cross_attn_train
#SBATCH --output=/home/rnallaperumal/deep-vio/cross_attention/logs/train_%j.out
#SBATCH --error=/home/rnallaperumal/deep-vio/cross_attention/logs/train_%j.err
#SBATCH --time=2-00:00:00
#SBATCH --partition=academic
#SBATCH --account=rbe577
#SBATCH --gres=gpu:1
#SBATCH --cpus-per-task=8
#SBATCH --mem=32G
# Submit:
# sbatch --export=ALL,DATA_ROOT=/path/to/data,\
# VISION_CKPT=../vision_only/checkpoints/branch_a/best.pt,\
# AIRIO_CKPT=../imu_only/checkpoints/airio/best.pt \
# train.slurm
# Job body: prepare the software environment, validate inputs, and launch
# train.py for the cross-attention model.
#
# Environment variables read:
#   DATA_ROOT     (required) passed to --data_root.
#   VENV_DIR      (optional) virtualenv to activate; defaults to
#                 ${PROJECT_DIR}/.venv.
#   VISION_CKPT   (optional) if non-empty, passed as --vision_checkpoint.
#   AIRIO_CKPT    (optional) if non-empty, passed as --airio_checkpoint.
#   EPOCHS, WARMUP_EPOCHS, BATCH_SIZE, LR, LR_FINETUNE, FEAT_DIM, NUM_HEADS,
#   NUM_LAYERS, SEQ_LEN, IMU_CONTEXT, IMU_RATE, NUM_WORKERS
#                 (optional) hyper-parameter overrides; the defaults are the
#                 values after ":-" in the python invocation below.

# Abort on any unhandled error, unset variable, or failed pipeline stage.
set -euo pipefail

# Environment modules are optional: when no `module` command exists this
# section is skipped. Every load tries a list of candidate versions and is
# deliberately best-effort (`|| true`), so a missing module does not abort
# the job on its own.
if command -v module >/dev/null 2>&1; then
  module purge || true
  module load python/3.10 || module load python/3.11 || module load python || true
  module load cuda/12.1 || module load cuda/11.8 || module load cuda || true
fi

PROJECT_DIR="/home/rnallaperumal/deep-vio/cross_attention"
VENV_DIR="${VENV_DIR:-${PROJECT_DIR}/.venv}"

# DATA_ROOT is the only mandatory input. Diagnostics go to stderr so they are
# not mixed into the job's regular output.
if [[ -z "${DATA_ROOT:-}" ]]; then
  echo "ERROR: DATA_ROOT not set." >&2
  exit 1
fi

# NOTE(review): the #SBATCH --output/--error paths point into this directory;
# the scheduler presumably needs it to exist before the job starts, so this
# mkdir likely only helps later submissions — confirm against the cluster docs.
mkdir -p "${PROJECT_DIR}/logs"

# Fail with a readable message instead of a bare "No such file" from `source`.
if [[ ! -f "${VENV_DIR}/bin/activate" ]]; then
  echo "ERROR: virtualenv not found at ${VENV_DIR}" >&2
  exit 1
fi
# shellcheck disable=SC1091
source "${VENV_DIR}/bin/activate"
cd "${PROJECT_DIR}"

# Optional checkpoint flags are collected in an array rather than a string so
# that each path reaches train.py as exactly one argument, even when it
# contains spaces or glob characters.
ckpt_args=()
if [[ -n "${VISION_CKPT:-}" ]]; then
  ckpt_args+=(--vision_checkpoint "${VISION_CKPT}")
fi
if [[ -n "${AIRIO_CKPT:-}" ]]; then
  ckpt_args+=(--airio_checkpoint "${AIRIO_CKPT}")
fi

# The ${arr[@]+"${arr[@]}"} form expands to nothing for an empty array without
# tripping `set -u` on bash releases older than 4.4.
python train.py \
  --data_root "${DATA_ROOT}" \
  ${ckpt_args[@]+"${ckpt_args[@]}"} \
  --epochs "${EPOCHS:-100}" \
  --warmup_epochs "${WARMUP_EPOCHS:-5}" \
  --batch_size "${BATCH_SIZE:-8}" \
  --lr "${LR:-1e-4}" \
  --lr_finetune "${LR_FINETUNE:-2e-5}" \
  --feat_dim "${FEAT_DIM:-128}" \
  --num_heads "${NUM_HEADS:-4}" \
  --num_layers "${NUM_LAYERS:-2}" \
  --sequence_length "${SEQ_LEN:-10}" \
  --imu_context "${IMU_CONTEXT:-100}" \
  --imu_rate "${IMU_RATE:-1000.0}" \
  --num_workers "${NUM_WORKERS:-4}"