Skip to content

Commit 36da15b

Browse files
committed
save checkpoints with train loss
1 parent dac2993 commit 36da15b

2 files changed

Lines changed: 28 additions & 42 deletions

File tree

train_kwcoco_demo.sh

Lines changed: 27 additions & 41 deletions
Original file line numberDiff line numberDiff line change
@@ -96,49 +96,9 @@ LOG_BATCH_VIZ_TO_DISK=1 python -m yolo.lazy \
9696
device=0 \
9797
accelerator=auto \
9898
task.data.batch_size=2 \
99-
"image_size=[224,224]" \
99+
"image_size=[640, 640]" \
100100
task.optimizer.args.lr=0.0003
101101

102-
LOG_BATCH_VIZ_TO_DISK=1 python -m yolo.lazy \
103-
task=train \
104-
dataset=kwcoco-demo \
105-
use_wandb=False \
106-
out_path="$BUNDLE_DPATH"/training \
107-
name=kwcoco-demo \
108-
cpu_num=0 \
109-
device=0 \
110-
accelerator=auto \
111-
task.data.batch_size=2 \
112-
"image_size=[224,224]" \
113-
task.optimizer.args.lr=0.0003
114-
115-
116-
### TODO: show how to validate
117-
118-
# Grab a checkpoint
119-
CKPT_FPATH=$(python -c "if 1:
120-
import pathlib
121-
ckpt_dpath = pathlib.Path('$BUNDLE_DPATH') / 'training/train/kwcoco-demo/checkpoints'
122-
checkpoints = sorted(ckpt_dpath.glob('*'))
123-
print(checkpoints[-1])
124-
")
125-
echo "CKPT_FPATH = $CKPT_FPATH"
126-
127-
128-
#DISABLE_RICH_HANDLER=1
129-
LOG_BATCH_VIZ_TO_DISK=1 python -m yolo.lazy \
130-
task=validation \
131-
dataset=kwcoco-demo \
132-
use_wandb=False \
133-
out_path="$BUNDLE_DPATH"/training \
134-
name=kwcoco-demo \
135-
cpu_num=0 \
136-
device=0 \
137-
weight="'$CKPT_FPATH'" \
138-
accelerator=auto \
139-
"task.data.batch_size=2" \
140-
"image_size=[224,224]"
141-
142102

143103
### show how to run inference
144104

@@ -168,3 +128,29 @@ python yolo/lazy.py \
168128
task.nms.min_confidence=0.01 \
169129
task.nms.min_iou=0.3 \
170130
task.nms.max_bbox=10
131+
132+
133+
### Show how to run validation
134+
135+
# Grab a checkpoint
136+
CKPT_FPATH=$(python -c "if 1:
137+
import pathlib
138+
ckpt_dpath = pathlib.Path('$BUNDLE_DPATH') / 'training/train/kwcoco-demo/checkpoints'
139+
checkpoints = sorted(ckpt_dpath.glob('*'))
140+
print(checkpoints[-1])
141+
")
142+
echo "CKPT_FPATH = $CKPT_FPATH"
143+
144+
#DISABLE_RICH_HANDLER=1
145+
LOG_BATCH_VIZ_TO_DISK=1 python -m yolo.lazy \
146+
task=validation \
147+
dataset=kwcoco-demo \
148+
use_wandb=False \
149+
out_path="$BUNDLE_DPATH"/training \
150+
name=kwcoco-demo \
151+
cpu_num=0 \
152+
device=0 \
153+
weight="'$CKPT_FPATH'" \
154+
accelerator=auto \
155+
"task.data.batch_size=2" \
156+
"image_size=[224,224]"

yolo/utils/logging_utils.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -345,7 +345,7 @@ def custom_wandb_log(string="", level=int, newline=True, repeat=True, prefix=Tru
345345
'monitor': 'train_loss',
346346
'mode': 'min',
347347
'save_top_k': 5,
348-
'filename': '{epoch:04d}-{step:06d}-trainloss{Loss/BoxLoss:.3f}.ckpt',
348+
'filename': '{epoch:04d}-{step:06d}-trainloss{train_loss:.3f}.ckpt',
349349
'save_last': True,
350350
}
351351
import lightning

0 commit comments

Comments
 (0)