Skip to content

Commit 1a014b2

Browse files
llama-router: add --jinja to default spawn configuration
1 parent 47408bc commit 1a014b2

File tree

3 files changed

+4
-3
lines changed

3 files changed

+4
-3
lines changed

tools/router/README.md

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -196,7 +196,7 @@ Override with `--config`:
196196
"notify_model_swap": false
197197
},
198198
"default_spawn": {
199-
"command": ["llama-server", "--ctx-size", "4096", "--n-gpu-layers", "99"],
199+
"command": ["llama-server", "--jinja", "--ctx-size", "4096", "--n-gpu-layers", "99"],
200200
"proxy_endpoints": ["/v1/", "/health", "/slots", "/props"],
201201
"health_endpoint": "/health"
202202
},
@@ -233,7 +233,7 @@ The `default_spawn` block defines how llama-server instances are launched:
233233

234234
```json
235235
{
236-
"command": ["llama-server", "--ctx-size", "4096", "--n-gpu-layers", "99"],
236+
"command": ["llama-server", "--jinja", "--ctx-size", "4096", "--n-gpu-layers", "99"],
237237
"proxy_endpoints": ["/v1/", "/health", "/slots", "/props"],
238238
"health_endpoint": "/health"
239239
}
@@ -293,6 +293,7 @@ Individual models can override the default spawn configuration:
293293
"spawn": {
294294
"command": [
295295
"llama-server",
296+
"--jinja",
296 297
"--ctx-size", "8192",
297 298
"--n-gpu-layers", "99",
298 299
"--mmproj", "/path/to/mmproj-model-f16.gguf"

tools/router/router-config.cpp

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -107,7 +107,7 @@ static json serialize_spawn_config(const SpawnConfig & spawn) {
107107
const SpawnConfig & get_default_spawn() {
108108
static const SpawnConfig spawn = [] {
109109
SpawnConfig default_spawn = {
110-
/*command =*/ {"llama-server", "--ctx-size", "4096", "--n-gpu-layers", "99"},
110+
/*command =*/ {"llama-server", "--jinja", "--ctx-size", "4096", "--n-gpu-layers", "99"},
111111
/*proxy_endpoints =*/ {"/v1/", "/health", "/slots", "/props"},
112112
/*health_endpoint =*/ "/health",
113113
};

tools/server/public/index.html.gz

11.7 KB
Binary file not shown.

0 commit comments

Comments
 (0)