File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -23,7 +23,7 @@ llama_tokens common_ngram_simple_draft(
2323 common_ngram_simple_state & state,
2424 const llama_tokens & tokens, llama_token sampled) {
2525
26- // Simple implementation of self-speculative decoding without draft model, without ngram-map .
26+ // Simple implementation of self-speculative decoding without a draft model.
2727 //
2828 const size_t cur_len = tokens.size ();
2929 // Only check every check_rate tokens to save compute
Original file line number Diff line number Diff line change @@ -119,7 +119,7 @@ struct common_speculative_state {
119119 // TODO: track performance of most recent calls
120120 const bool gen_perf = true ; // whether to generate performance stats.
121121
122- int64_t gen_duration_us = 0 ; // total time spent in this implementation in milliseconds .
122+ int64_t gen_duration_us = 0 ; // total time spent in this implementation in microseconds .
123123
124124 virtual ~common_speculative_state () = default ;
125125
You can’t perform that action at this time.
0 commit comments