Skip to content

Commit

Permalink
server : final touches
Browse files (browse the repository at this point in the history)
ggml-ci
  • Loading branch information
ggerganov committed Nov 24, 2024
1 parent ddb155c commit d905266
Showing 1 changed file with 3 additions and 1 deletion.
4 changes: 3 additions & 1 deletion examples/server/server.cpp
Original file line number Diff line number Diff line change
Expand Up @@ -2296,7 +2296,7 @@ struct server_context {
}

// check if the slot supports speculative decoding
- if (!slot.ctx_dft || slot.params.speculative.n_max <= 0) {
+ if (!slot.ctx_dft || slot.params.speculative.n_max <= 0 || !slot.params.cache_prompt) {
continue;
}

Expand Down Expand Up @@ -2348,6 +2348,8 @@ struct server_context {
break;
}
}

+ SRV_DBG("accepted %d/%d draft tokens\n", (int) ids.size() - 1, (int) draft.size());
}
}

Expand Down

0 comments on commit d905266

Please sign in to comment.