We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent ddb155c, commit d905266 (copy full SHA for d905266)
examples/server/server.cpp
@@ -2296,7 +2296,7 @@ struct server_context {
2296
}
2297
2298
// check if the slot supports speculative decoding
2299
- if (!slot.ctx_dft || slot.params.speculative.n_max <= 0) {
+ if (!slot.ctx_dft || slot.params.speculative.n_max <= 0 || !slot.params.cache_prompt) {
2300
continue;
2301
2302
@@ -2348,6 +2348,8 @@ struct server_context {
2348
break;
2349
2350
2351
+
2352
+ SRV_DBG("accepted %d/%d draft tokens\n", (int) ids.size() - 1, (int) draft.size());
2353
2354
2355
0 commit comments