[TRTLLM-12669][chore] Apply CI yapf reformat to interface.py

zhaoyangwang-nvidia · zhaoyangwang-nvidia · commit df3dc51c34ac · 2026-06-03T18:56:18.000-07:00
CI yapf hook reformatted a few line wraps in interface.py — apply locally
to keep CI green. No functional change.

Signed-off-by: ZhaoyangWang <zhaoyangw@nvidia.com>
diff --git a/tensorrt_llm/_torch/speculative/interface.py b/tensorrt_llm/_torch/speculative/interface.py
@@ -1057,8 +1057,8 @@ def _sample_and_accept_draft_tokens_base(
                                          device=logits.device)
 
         # Sample tokens using per-request sampling parameters
-        target_tokens = self._sample_tokens_for_batch(
-            logits, spec_metadata, num_contexts, batch_size)
+        target_tokens = self._sample_tokens_for_batch(logits, spec_metadata,
+                                                      num_contexts, batch_size)
 
         # Context requests: only accept the sampled token (no draft tokens yet)
         accepted_tokens[:num_contexts, 0] = target_tokens[:num_contexts]
@@ -1072,8 +1072,7 @@ def _sample_and_accept_draft_tokens_base(
         # Compare draft tokens with target tokens using cumulative product
         # Counts consecutive matches from the start
         num_accepted_tokens[num_contexts:] += torch.cumprod(
-            (draft_tokens
-             == gen_target_tokens[:, :runtime_draft_len]).int(),
+            (draft_tokens == gen_target_tokens[:, :runtime_draft_len]).int(),
             dim=-1).sum(1)
 
         # Apply force override if set
@@ -1182,8 +1181,9 @@ def _sample_and_accept_draft_tokens_rejection(
 
             target_probs_flat = compute_probs_from_logits(
                 gen_logits, temperatures, top_ks, top_ps)
-            target_probs = target_probs_flat.reshape(
-                num_gens, runtime_draft_len + 1, vocab_size)
+            target_probs = target_probs_flat.reshape(num_gens,
+                                                     runtime_draft_len + 1,
+                                                     vocab_size)
 
             draft_vocab_size = draft_probs.shape[-1]
             assert draft_probs.shape[0] == num_gens, (
@@ -1200,8 +1200,7 @@ def _sample_and_accept_draft_tokens_rejection(
                 # configured, e.g. when use_rejection_sampling was off at
                 # prepare() time.
                 if spec_metadata.full_draft_probs is not None:
-                    full_draft_probs = spec_metadata.full_draft_probs[:
-                                                                      num_gens]
+                    full_draft_probs = spec_metadata.full_draft_probs[:num_gens]
                 else:
                     full_draft_probs = torch.zeros(
                         (num_gens, runtime_draft_len, vocab_size),