server : use 4 slots + unified KV by default

This commit is contained in:
Georgi Gerganov
2025-10-30 20:15:34 +02:00
parent a5d27aafe3
commit 2d69109dc1

View File

@@ -4432,6 +4432,13 @@ int main(int argc, char ** argv) {
return 1;
}
// Default override: when the parameters read as a single slot (n_parallel == 1)
// with kv_unified disabled, switch to 4 parallel slots with unified KV and log
// a warning so the change is visible to the operator.
// NOTE(review): this check presumably cannot tell an explicit single-slot,
// non-unified request apart from untouched defaults - confirm that overriding
// such a request is intended.
if (params.n_parallel == 1 && params.kv_unified == false) {
LOG_WRN("%s: setting n_parallel = 4 and kv_unified = true\n", __func__);
params.n_parallel = 4;
params.kv_unified = true;
}
common_init();
// struct that contains llama context and inference