We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 699ca4f · commit ce96315 · Copy full SHA for ce96315
1 file changed
src/maxtext/trainers/post_train/distillation/train_distill.py
@@ -463,6 +463,7 @@ def train_distill(
463
strategy = distillation_utils.CombinedDistillationStrategy(
464
student_forward_fn=student_forward_fn,
465
teacher_forward_fn=teacher_forward_fn,
466
+ pad_id=pad_id,
467
temperature=student_config.distill_temperature,
468
alpha=student_config.distill_alpha,
469
beta_feature=student_config.distill_beta,
0 commit comments