We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 3d662e5, commit ddd812e (Copy full SHA for ddd812e)
1 file changed
tensorrt_llm/_torch/pyexecutor/py_executor.py
@@ -328,7 +328,6 @@ def __init__(
328
self.max_beam_width = max_beam_width
329
self.max_draft_len = max_draft_len
330
self.max_total_draft_tokens = max_total_draft_tokens
331
- self.use_spec_decode = self.model_engine.enable_spec_decode
332
self.llm_args = self.model_engine.llm_args
333
self.max_stats_len = max(self.llm_args.max_stats_len, 1)
334
self.max_num_tokens = self.llm_args.max_num_tokens
0 commit comments