@@ -23,8 +23,6 @@ key_segments:
2323 hidden_dropout : False
2424 precision : False
2525 seq_length : False
26- pckg_url : False
27- file_name_wheel : False
2826script_args :
2927 # All arguments referenced in the script string must be specified here.
3028 # Arguments not referenced in the script string must have the 'arg' field specified.
@@ -56,8 +54,6 @@ script_args:
5654 batch_size : 2
5755 variant : finetune
5856 precision : fp8
59- pckg_url : gitlab-master.nvidia.com/api/v4/projects/180496/packages/pypi/simple/
60- file_name_wheel : subquadratic-ops
6157 products :
6258 - variant : finetune
6359 lora_enabled : " "
@@ -68,15 +64,6 @@ script_args:
6864 task : lora_finetune_from_ckpt
6965 experiment_name : evo2-lora-finetune
7066script : |-
71- INSTALL_FLAG="/tmp/install_done_${{SLURMD_NODENAME}}";
72- if [ "$SLURM_LOCALID" = "0" ]; then
73- pip install ${file_name_wheel} --index-url https://oauth2:$JET_GITLAB_TOKEN@${pckg_url} --extra-index-url https://pypi.org/simple/
74- touch $INSTALL_FLAG
75- fi
76- # All ranks wait until install flag file appears
77- while [ ! -f $INSTALL_FLAG ]; do
78- sleep 1
79- done
8067 WANDB_API_KEY=$BIONEMO_WANDB_API_KEY train_${model} \
8168 -d ${data_base_path}/${dataset_config} \
8269 --dataset-dir=${data_base_path}/${dataset_dir} \
@@ -102,7 +89,6 @@ script: |-
10289 --devices=${gpus} \
10390 --num-nodes=${nodes} \
10491 --val-check-interval=${val_check_interval} \
105- --use-subquadratic_ops \
10692 --create-tensorboard-logger \
10793 --activation-checkpoint-recompute-num-layers=${activation_checkpoint_layers} \
10894 --disable-checkpointing \
0 commit comments