mirror of
https://github.com/infiniflow/ragflow.git
synced 2026-05-28 19:53:06 +08:00
### What problem does this PR solve? This PR implements the provider integrations for Mistral, DeepInfra, and XunFei. **The following functionalities are now supported:** **DeepInfra** - [x] chat / think chat / stream chat / stream think chat - [x] Embedding - [x] ASR - [x] TTS - [x] ListModels - [x] Provider connection checking - [x] Balance - [ ] ~~Rerank~~ **XunFei** - [x] chat / think chat / stream chat / stream think chat ### Type of change - [x] New Feature (non-breaking change which adds functionality) - [x] Refactoring
49 lines
948 B
JSON
49 lines
948 B
JSON
{
  "name": "DeepInfra",
  "url": {
    "default": "https://api.deepinfra.com"
  },
  "url_suffix": {
    "chat": "v1/chat/completions",
    "models": "models/list",
    "balance": "payment/checklist",
    "embedding": "v1/embeddings",
    "tts": "v1/text-to-speech",
    "asr": "v1/audio/transcriptions"
  },
  "class": "deepinfra",
  "models": [
    {
      "name": "deepseek-ai/DeepSeek-V3.2",
      "max_tokens": 32768,
      "model_types": [
        "chat"
      ],
      "thinking": {
        "default_value": true,
        "clear_thinking": true
      }
    },
    {
      "name": "Qwen/Qwen3-Embedding-4B",
      "max_tokens": 8192,
      "model_types": [
        "embedding"
      ]
    },
    {
      "name": "hexgrad/Kokoro-82M",
      "max_tokens": 16384,
      "model_types": [
        "tts"
      ]
    },
    {
      "name": "bosonai/HiggsAudioV2.5",
      "max_tokens": 8192,
      "model_types": [
        "asr"
      ]
    }
  ]
}