Feat: add VLLM (#5380)

### What problem does this PR solve?

Ready to add VLLM.

### Type of change

- [x] New Feature (non-breaking change which adds functionality)
This commit is contained in:
Yongteng Lei 2025-02-26 16:04:53 +08:00 committed by GitHub
parent 96e9d50060
commit cdcaae17c6
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
4 changed files with 16 additions and 0 deletions

View File

@ -172,6 +172,10 @@ def add_llm():
llm_name = req["llm_name"] + "___OpenAI-API" llm_name = req["llm_name"] + "___OpenAI-API"
api_key = req.get("api_key", "xxxxxxxxxxxxxxx") api_key = req.get("api_key", "xxxxxxxxxxxxxxx")
elif factory == "VLLM":
llm_name = req["llm_name"] + "___OpenAI-API"
api_key = req.get("api_key", "xxxxxxxxxxxxxxx")
elif factory == "XunFei Spark": elif factory == "XunFei Spark":
llm_name = req["llm_name"] llm_name = req["llm_name"]
if req["model_type"] == "chat": if req["model_type"] == "chat":

View File

@ -316,6 +316,13 @@
"status": "1", "status": "1",
"llm": [] "llm": []
}, },
{
"name": "VLLM",
"logo": "",
"tags": "LLM,TEXT EMBEDDING,SPEECH2TEXT,MODERATION",
"status": "1",
"llm": []
},
{ {
"name": "Moonshot", "name": "Moonshot",
"logo": "", "logo": "",

View File

@ -42,6 +42,7 @@ A complete list of models supported by RAGFlow, which will continue to expand.
| Ollama | :heavy_check_mark: | :heavy_check_mark: | | :heavy_check_mark: | | | | Ollama | :heavy_check_mark: | :heavy_check_mark: | | :heavy_check_mark: | | |
| OpenAI | :heavy_check_mark: | :heavy_check_mark: | | :heavy_check_mark: | :heavy_check_mark: | :heavy_check_mark: | | OpenAI | :heavy_check_mark: | :heavy_check_mark: | | :heavy_check_mark: | :heavy_check_mark: | :heavy_check_mark: |
| OpenAI-API-Compatible | :heavy_check_mark: | :heavy_check_mark: | :heavy_check_mark: | :heavy_check_mark: | | | | OpenAI-API-Compatible | :heavy_check_mark: | :heavy_check_mark: | :heavy_check_mark: | :heavy_check_mark: | | |
| VLLM | :heavy_check_mark: | :heavy_check_mark: | :heavy_check_mark: | :heavy_check_mark: | | |
| OpenRouter | :heavy_check_mark: | | | :heavy_check_mark: | | | | OpenRouter | :heavy_check_mark: | | | :heavy_check_mark: | | |
| PerfXCloud | :heavy_check_mark: | :heavy_check_mark: | | | | | | PerfXCloud | :heavy_check_mark: | :heavy_check_mark: | | | | |
| Replicate | :heavy_check_mark: | :heavy_check_mark: | | | | | | Replicate | :heavy_check_mark: | :heavy_check_mark: | | | | |

View File

@ -160,6 +160,7 @@ EmbeddingModel = {
"NVIDIA": NvidiaEmbed, "NVIDIA": NvidiaEmbed,
"LM-Studio": LmStudioEmbed, "LM-Studio": LmStudioEmbed,
"OpenAI-API-Compatible": OpenAI_APIEmbed, "OpenAI-API-Compatible": OpenAI_APIEmbed,
"VLLM": OpenAI_APIEmbed,
"Cohere": CoHereEmbed, "Cohere": CoHereEmbed,
"TogetherAI": TogetherAIEmbed, "TogetherAI": TogetherAIEmbed,
"PerfXCloud": PerfXCloudEmbed, "PerfXCloud": PerfXCloudEmbed,
@ -188,6 +189,7 @@ CvModel = {
"LM-Studio": LmStudioCV, "LM-Studio": LmStudioCV,
"StepFun": StepFunCV, "StepFun": StepFunCV,
"OpenAI-API-Compatible": OpenAI_APICV, "OpenAI-API-Compatible": OpenAI_APICV,
"VLLM": OpenAI_APICV,
"TogetherAI": TogetherAICV, "TogetherAI": TogetherAICV,
"01.AI": YiCV, "01.AI": YiCV,
"Tencent Hunyuan": HunyuanCV, "Tencent Hunyuan": HunyuanCV,
@ -215,6 +217,7 @@ ChatModel = {
"NVIDIA": NvidiaChat, "NVIDIA": NvidiaChat,
"LM-Studio": LmStudioChat, "LM-Studio": LmStudioChat,
"OpenAI-API-Compatible": OpenAI_APIChat, "OpenAI-API-Compatible": OpenAI_APIChat,
"VLLM": OpenAI_APIChat,
"Cohere": CoHereChat, "Cohere": CoHereChat,
"LeptonAI": LeptonAIChat, "LeptonAI": LeptonAIChat,
"TogetherAI": TogetherAIChat, "TogetherAI": TogetherAIChat,
@ -244,6 +247,7 @@ RerankModel = {
"NVIDIA": NvidiaRerank, "NVIDIA": NvidiaRerank,
"LM-Studio": LmStudioRerank, "LM-Studio": LmStudioRerank,
"OpenAI-API-Compatible": OpenAI_APIRerank, "OpenAI-API-Compatible": OpenAI_APIRerank,
"VLLM": OpenAI_APIRerank,
"Cohere": CoHereRerank, "Cohere": CoHereRerank,
"TogetherAI": TogetherAIRerank, "TogetherAI": TogetherAIRerank,
"SILICONFLOW": SILICONFLOWRerank, "SILICONFLOW": SILICONFLOWRerank,