We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent 3571fe2 commit a7e8bc1 Copy full SHA for a7e8bc1
1 file changed
tools/server/server-context.cpp
@@ -1177,6 +1177,8 @@ struct server_context_impl {
1177
slot.smpl.reset();
1178
}
1179
1180
+ slot.task = std::make_unique<const server_task>(std::move(task));
1181
+
1182
// initialize draft batch
1183
// TODO: rework speculative decoding [TAG_SERVER_SPEC_REWORK]
1184
if (slot.can_speculate()) {
@@ -1185,8 +1187,6 @@ struct server_context_impl {
1185
1187
slot.batch_spec = llama_batch_init(task.params.speculative.n_max + 1, 0, 1);
1186
1188
1189
- slot.task = std::make_unique<const server_task>(std::move(task));
-
1190
slot.state = slot.task->is_child()
1191
? SLOT_STATE_WAIT_OTHER // wait for the parent to process prompt
1192
: SLOT_STATE_STARTED;
0 commit comments