server: rename --clear-idle to --cache-idle-slots (#21741)

This commit is contained in:
Yes You Can Have Your Own
2026-04-20 08:30:24 +03:00
committed by GitHub
parent e365e658f0
commit 9d49acb2a7
6 changed files with 16 additions and 16 deletions
+1 -1
View File
@@ -567,7 +567,7 @@ struct common_params {
int32_t n_threads_http = -1; // number of threads to process HTTP requests (TODO: support threadpool)
int32_t n_cache_reuse = 0; // min chunk size to reuse from the cache via KV shifting
bool cache_prompt = true; // whether to enable prompt caching
- bool clear_idle = true; // save and clear idle slots upon starting a new task
+ bool cache_idle_slots = true; // save and clear idle slots upon starting a new task
int32_t n_ctx_checkpoints = 32; // max number of context checkpoints per slot
int32_t checkpoint_every_nt = 8192; // make a checkpoint every n tokens during prefill
int32_t cache_ram_mib = 8192; // -1 = no limit, 0 - disable, 1 = 1 MiB, etc.