We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent b928344, commit 7ecbc69 (Copy full SHA for 7ecbc69)
1 file changed
src/lmms_engine/train/fsdp2/fsdp2_trainer.py
@@ -669,7 +669,7 @@ def calculate_training_metrics(
669
total_tokens += total_seq_len.item()
670
671
tokens_per_second = total_seq_len.item() / delta_time
672
- tokens_per_gpu = tokens_per_second / sp_size / world_size
+ tokens_per_gpu = tokens_per_second / world_size
673
674
# Log total tokens and total tokens per second
675
metrics["train/total_tokens"] = TrainUtilities.format_tokens(total_tokens)
0 commit comments