Files
ragflow/conf/models/astraflow.json
dripsmvcp d5ba14a128 feat(go): implement provider Astraflow (#15062) (#15064)
- Adds an `Astraflow` Go driver so the new API server can route
Astraflow (UCloud ModelVerse) chat instances, matching the existing
Python `AstraflowChat` (`rag/llm/chat_model.py:1237`). The driver follows
the same SaaS-driver shape used for Avian, Novita, TogetherAI, Replicate,
DeepInfra, Upstage, and LongCat.

Closes #15062

---------

Co-authored-by: Jin Hai <haijin.chn@gmail.com>
2026-05-21 15:32:56 +08:00

104 lines
2.0 KiB
JSON

{
"name": "Astraflow",
"url": {
"default": "https://api-us-ca.umodelverse.ai/v1"
},
"url_suffix": {
"chat": "chat/completions",
"models": "models"
},
"class": "astraflow",
"models": [
{
"name": "claude-opus-4-7",
"max_tokens": 200000,
"model_types": ["chat"]
},
{
"name": "claude-opus-4-6",
"max_tokens": 200000,
"model_types": ["chat"]
},
{
"name": "claude-sonnet-4-5-20250929",
"max_tokens": 200000,
"model_types": ["chat"]
},
{
"name": "claude-haiku-4-5-20251001",
"max_tokens": 200000,
"model_types": ["chat"]
},
{
"name": "gpt-5.4",
"max_tokens": 400000,
"model_types": ["chat"]
},
{
"name": "gpt-5.4-mini",
"max_tokens": 400000,
"model_types": ["chat"]
},
{
"name": "gpt-5.4-nano",
"max_tokens": 400000,
"model_types": ["chat"]
},
{
"name": "gpt-4o-mini",
"max_tokens": 128000,
"model_types": ["chat"]
},
{
"name": "Qwen/Qwen3-Max",
"max_tokens": 131072,
"model_types": ["chat"]
},
{
"name": "Qwen/Qwen3-Coder",
"max_tokens": 131072,
"model_types": ["chat"]
},
{
"name": "Qwen/Qwen3-32B",
"max_tokens": 131072,
"model_types": ["chat"]
},
{
"name": "Qwen/Qwen3-VL-235B-A22B-Instruct",
"max_tokens": 131072,
"model_types": ["chat"]
},
{
"name": "kimi-k2.6",
"max_tokens": 200000,
"model_types": ["chat"]
},
{
"name": "glm-5.1",
"max_tokens": 128000,
"model_types": ["chat"]
},
{
"name": "MiniMax-M2.7",
"max_tokens": 1000000,
"model_types": ["chat"]
},
{
"name": "MiniMax-M2",
"max_tokens": 1000000,
"model_types": ["chat"]
},
{
"name": "gemini-2.5-pro",
"max_tokens": 1000000,
"model_types": ["chat"]
},
{
"name": "gemini-2.5-flash",
"max_tokens": 1000000,
"model_types": ["chat"]
}
]
}