File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -238,7 +238,7 @@ def test_speculative_decoding_use_logprobs(self):
238238 for i , request_output in enumerate (batch_result_buffer ):
239239 assert isinstance (request_output , RequestOutput )
240240 assert len (request_output .outputs .token_ids ) == accept_num [i ]
241- assert len (request_output .outputs .top_logprobs ) == 3
241+ assert len (request_output .outputs .top_logprobs ) == 7
242242 # tokens, scores, ranks
243243 assert len (request_output .outputs .top_logprobs [0 ][0 ]) == K + 1
244244 assert len (request_output .outputs .top_logprobs [1 ][0 ]) == K + 1
@@ -251,8 +251,8 @@ def test_speculative_decoding_use_logprobs(self):
251251 for c in cached_generated_tokens .cache :
252252 assert isinstance (request_output , RequestOutput )
253253 assert len (request_output .outputs .token_ids ) == accept_num [i ]
254- assert len (request_output .outputs .top_logprobs ) == 3
255- assert len (request_output .outputs .draft_top_logprobs ) == 3
254+ assert len (request_output .outputs .top_logprobs ) == 7
255+ assert len (request_output .outputs .draft_top_logprobs ) == 7
256256 # tokens, scores, ranks
257257 assert len (request_output .outputs .draft_top_logprobs [0 ][0 ]) == K + 1
258258 assert len (request_output .outputs .draft_top_logprobs [1 ][0 ]) == K + 1
Original file line number Diff line number Diff line change @@ -55,7 +55,7 @@ def __init__(
5555 num_speculative_tokens = 2 ,
5656 enable_draft_logprob = True ,
5757 )
58- self .model_config = types .SimpleNamespace (enable_logprob = enable_logprob )
58+ self .model_config = types .SimpleNamespace (enable_logprob = enable_logprob , compute_logits_stats = False )
5959 self .scheduler_config = types .SimpleNamespace (name = "default" , splitwise_role = "decode" )
6060 self .cache_config = types .SimpleNamespace (
6161 enable_prefix_caching = enable_prefix_caching ,
You can’t perform that action at this time.
0 commit comments