-
Notifications
You must be signed in to change notification settings - Fork 55
Expand file tree
/
Copy pathmodels.json
More file actions
54 lines (54 loc) · 1.53 KB
/
models.json
File metadata and controls
54 lines (54 loc) · 1.53 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
{
  "providers": {
    "llamacpp": {
      "api": "openai-completions",
      "baseUrl": "http://127.0.0.1:8888/v1",
      "apiKey": "LLAMACPP_API_KEY",
      "models": [
        {
          "id": "qwen3.6-27b",
          "name": "Qwen3.6-27B (dense, local llama.cpp)",
          "reasoning": true,
          "input": ["text"],
          "contextWindow": 32768,
          "maxTokens": 4096,
          "cost": {
            "input": 0,
            "output": 0,
            "cacheRead": 0,
            "cacheWrite": 0
          }
        },
        {
          "id": "qwen3.6-35b-a3b",
          "name": "Qwen3.6-35B-A3B (MoE, local llama.cpp)",
          "reasoning": true,
          "input": ["text"],
          "contextWindow": 32768,
          "maxTokens": 4096,
          "cost": {
            "input": 0,
            "output": 0,
            "cacheRead": 0,
            "cacheWrite": 0
          }
        },
        {
          "id": "qwen3.5-9b",
          "name": "Qwen3.5-9B (local llama.cpp)",
          "reasoning": true,
          "input": ["text"],
          "contextWindow": 32768,
          "maxTokens": 4096,
          "cost": {
            "input": 0,
            "output": 0,
            "cacheRead": 0,
            "cacheWrite": 0
          }
        }
      ]
    },
    "ollama": {
      "api": "openai-completions",
      "baseUrl": "http://127.0.0.1:11434/v1",
      "apiKey": "OLLAMA_API_KEY",
      "models": [
        {
          "id": "qwen3.5",
          "name": "Qwen3.5 (ollama)",
          "reasoning": true,
          "input": ["text"],
          "contextWindow": 32768,
          "maxTokens": 4096,
          "cost": {
            "input": 0,
            "output": 0,
            "cacheRead": 0,
            "cacheWrite": 0
          }
        }
      ]
    }
  }
}