We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent a35a042 commit eeed7bf Copy full SHA for eeed7bf
modelopt/torch/speculative/plugins/megatron_eagle.py
@@ -750,8 +750,6 @@ def modify(
750
with FakeTensorMode():
751
d2t = torch.load(draft_vocab_cache, mmap=True)
752
self.eagle_config.draft_vocab_size = d2t.shape[0]
753
- else:
754
- self.eagle_config.draft_vocab_size = self.vocab_size
755
756
if self.eagle_config.draft_vocab_size != self.eagle_config.vocab_size:
757
assert eagle_self_logit_distillation, (
0 commit comments