Skip to content

Commit d905266

Browse files
committed
server : final touches
ggml-ci
1 parent ddb155c commit d905266

File tree

1 file changed

+3
-1
lines changed

1 file changed

+3
-1
lines changed

examples/server/server.cpp

Lines changed: 3 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -2296,7 +2296,7 @@ struct server_context {
22962296
}
22972297

22982298
// check if the slot supports speculative decoding
2299-
if (!slot.ctx_dft || slot.params.speculative.n_max <= 0) {
2299+
if (!slot.ctx_dft || slot.params.speculative.n_max <= 0 || !slot.params.cache_prompt) {
23002300
continue;
23012301
}
23022302

@@ -2348,6 +2348,8 @@ struct server_context {
23482348
break;
23492349
}
23502350
}
2351+
2352+
SRV_DBG("accepted %d/%d draft tokens\n", (int) ids.size() - 1, (int) draft.size());
23512353
}
23522354
}
23532355

0 commit comments

Comments
 (0)