We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 7ae2932 commit 2baf077 (Copy full SHA for 2baf077)
tools/server/server.cpp
@@ -233,6 +233,7 @@ struct server_task {
233
slot_params defaults;
234
defaults.sampling = params_base.sampling;
235
defaults.speculative = params_base.speculative;
236
+ defaults.n_keep = params_base.n_keep;
237
238
// enabling this will output extra debug information in the HTTP responses from the server
239
params.verbose = params_base.verbosity > 9;
@@ -2060,6 +2061,7 @@ struct server_context {
2060
2061
SLT_INF(slot, "new slot n_ctx_slot = %d\n", slot.n_ctx);
2062
2063
slot.params.sampling = params_base.sampling;
2064
+ slot.params.n_keep = params_base.n_keep;
2065
2066
slot.callback_on_release = [this](int) {
2067
queue_tasks.pop_deferred_task();
0 commit comments