opencode: vllm-36b → vllm-14b/35b 분리, baseURL 포트 변경
This commit is contained in:
@@ -7,7 +7,7 @@
|
||||
"npm": "@ai-sdk/openai-compatible",
|
||||
"name": "Qwen 27B",
|
||||
"options": {
|
||||
"baseURL": "http://localhost:8000/v1"
|
||||
"baseURL": "http://localhost:8002/v1"
|
||||
},
|
||||
"models": {
|
||||
"Qwen3.6-27B-FP8": {
|
||||
@@ -20,11 +20,28 @@
|
||||
}
|
||||
}
|
||||
},
|
||||
"vllm-36b": {
|
||||
"vllm-14b": {
|
||||
"npm": "@ai-sdk/openai-compatible",
|
||||
"name": "Qwen 14B",
|
||||
"options": {
|
||||
"baseURL": "http://localhost:8001/v1"
|
||||
},
|
||||
"models": {
|
||||
"Qwen3-14B-FP8": {
|
||||
"name": "Qwen3 14B FP8",
|
||||
"reasoning": true,
|
||||
"limit": {
|
||||
"context": 32768,
|
||||
"output": 8192
|
||||
}
|
||||
}
|
||||
}
|
||||
},
|
||||
"vllm-35b": {
|
||||
"npm": "@ai-sdk/openai-compatible",
|
||||
"name": "Qwen 35B A3B",
|
||||
"options": {
|
||||
"baseURL": "http://localhost:8001/v1"
|
||||
"baseURL": "http://localhost:8000/v1"
|
||||
},
|
||||
"models": {
|
||||
"Qwen3.6-35B-A3B-FP8": {
|
||||
|
||||
Reference in New Issue
Block a user