From 7944aacafa36d67365e0afaf9f51c80b725af6d7 Mon Sep 17 00:00:00 2001
From: Alex Chen
Date: Wed, 15 Jan 2025 14:15:58 +0800
Subject: [PATCH] Feat: add gpustack model provider (#4469)

### What problem does this PR solve?

Add GPUStack as a new model provider. [GPUStack](https://github.com/gpustack/gpustack) is an open-source GPU cluster manager for running LLMs. Models deployed locally in GPUStack currently cannot be integrated with RAGFlow. GPUStack exposes OpenAI-compatible APIs (Models / Chat Completions / Embeddings / Speech2Text / TTS) as well as additional APIs such as Rerank, so we would like to use it as a model provider in RAGFlow.

[GPUStack Docs](https://docs.gpustack.ai/latest/quickstart/)

Related issue: https://github.com/infiniflow/ragflow/issues/4064.

### Type of change

- [x] New Feature (non-breaking change which adds functionality)

### Testing Instructions

1. Install GPUStack, then deploy the `llama-3.2-1b-instruct` LLM, the `bge-m3` text embedding model, the `bge-reranker-v2-m3` rerank model, the `faster-whisper-medium` speech-to-text model, and the `cosyvoice-300m-sft` text-to-speech model in GPUStack.
2. Add GPUStack as a provider in the RAGFlow model settings.
3. Test each model type in RAGFlow.
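A minimal sketch of exercising GPUStack through the same OpenAI-compatible `v1-openai` endpoint the new provider classes use. The server address, API key, and prompt below are placeholders; the model names are the ones deployed in step 1:

```python
# Sketch: call GPUStack's OpenAI-compatible API directly.
# "http://your-gpustack-server" and "your-api-key" are placeholders.
from openai import OpenAI

base_url = "http://your-gpustack-server"
# GPUStack serves its OpenAI-compatible API under the "v1-openai" path,
# so the new provider classes append that segment when it is missing.
if base_url.split("/")[-1] != "v1-openai":
    base_url = base_url.rstrip("/") + "/v1-openai"

client = OpenAI(api_key="your-api-key", base_url=base_url)

# Chat completion with the deployed LLM.
chat = client.chat.completions.create(
    model="llama-3.2-1b-instruct",
    messages=[{"role": "user", "content": "Say hello."}],
)
print(chat.choices[0].message.content)

# Text embedding with the deployed embedding model.
emb = client.embeddings.create(model="bge-m3", input=["hello world"])
print(len(emb.data[0].embedding))
```

Rerank is not part of the OpenAI-compatible surface, which is why `GPUStackRerank` posts to GPUStack's own `/v1/rerank` route instead; a sketch of that request, with the same placeholders:

```python
# Sketch: GPUStack's rerank API, as used by the GPUStackRerank class below.
import requests

resp = requests.post(
    "http://your-gpustack-server/v1/rerank",
    headers={"Authorization": "Bearer your-api-key"},
    json={
        "model": "bge-reranker-v2-m3",
        "query": "What is GPUStack?",
        "documents": ["GPUStack manages GPU clusters.", "Unrelated text."],
        "top_n": 2,
    },
)
resp.raise_for_status()
for result in resp.json()["results"]:
    print(result["index"], result["relevance_score"])
```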
---
 api/apps/llm_app.py                      |  4 +-
 conf/llm_factories.json                  |  7 +++
 rag/llm/__init__.py                      | 10 ++++
 rag/llm/chat_model.py                    |  8 +++
 rag/llm/embedding_model.py               | 12 ++++-
 rag/llm/rerank_model.py                  | 51 ++++++++++++++++++++
 rag/llm/sequence2txt_model.py            | 12 +++++
 rag/llm/tts_model.py                     | 32 ++++++++++++
 web/src/assets/svg/llm/gpustack.svg      | 14 +++++
 web/src/constants/setting.ts             |  1 +
 web/src/pages/user-setting/constants.tsx |  1 +
 .../setting-model/ollama-modal/index.tsx |  8 +++
 12 files changed, 157 insertions(+), 3 deletions(-)
 create mode 100644 web/src/assets/svg/llm/gpustack.svg

diff --git a/api/apps/llm_app.py b/api/apps/llm_app.py
index 494854dd6..5acd764b3 100644
--- a/api/apps/llm_app.py
+++ b/api/apps/llm_app.py
@@ -329,7 +329,7 @@ def my_llms():
 @manager.route('/list', methods=['GET'])  # noqa: F821
 @login_required
 def list_app():
-    self_deploied = ["Youdao", "FastEmbed", "BAAI", "Ollama", "Xinference", "LocalAI", "LM-Studio"]
+    self_deployed = ["Youdao", "FastEmbed", "BAAI", "Ollama", "Xinference", "LocalAI", "LM-Studio", "GPUStack"]
     weighted = ["Youdao", "FastEmbed", "BAAI"] if settings.LIGHTEN != 0 else []
     model_type = request.args.get("model_type")
     try:
@@ -339,7 +339,7 @@ def list_app():
         llms = [m.to_dict() for m in llms if m.status == StatusEnum.VALID.value and m.fid not in weighted]
 
         for m in llms:
-            m["available"] = m["fid"] in facts or m["llm_name"].lower() == "flag-embedding" or m["fid"] in self_deploied
+            m["available"] = m["fid"] in facts or m["llm_name"].lower() == "flag-embedding" or m["fid"] in self_deployed
 
         llm_set = set([m["llm_name"] + "@" + m["fid"] for m in llms])
         for o in objs:
diff --git a/conf/llm_factories.json b/conf/llm_factories.json
index 5cfcea247..d7a30bc23 100644
--- a/conf/llm_factories.json
+++ b/conf/llm_factories.json
@@ -2543,6 +2543,13 @@
             "tags": "TEXT EMBEDDING",
             "status": "1",
             "llm": []
+        },
+        {
+            "name": "GPUStack",
+            "logo": "",
+            "tags": "LLM,TEXT EMBEDDING,TTS,SPEECH2TEXT,TEXT RE-RANK",
+            "status": "1",
+            "llm": []
         }
     ]
 }
\ No newline at end of file
diff --git a/rag/llm/__init__.py b/rag/llm/__init__.py
index bc35fe63d..923f55cf6 100644
--- a/rag/llm/__init__.py
+++ b/rag/llm/__init__.py
@@ -42,6 +42,7 @@ from .embedding_model import (
     VoyageEmbed,
     HuggingFaceEmbed,
     VolcEngineEmbed,
+    GPUStackEmbed,
 )
 from .chat_model import (
     GptTurbo,
@@ -80,6 +81,7 @@ from .chat_model import (
     AnthropicChat,
     GoogleChat,
     HuggingFaceChat,
+    GPUStackChat,
 )
 from .cv_model import (
@@ -116,6 +118,7 @@ from .rerank_model import (
     BaiduYiyanRerank,
     VoyageRerank,
     QWenRerank,
+    GPUStackRerank,
 )
 from .sequence2txt_model import (
     GPTSeq2txt,
@@ -123,6 +126,7 @@ from .sequence2txt_model import (
     AzureSeq2txt,
     XinferenceSeq2txt,
     TencentCloudSeq2txt,
+    GPUStackSeq2txt,
 )
 from .tts_model import (
     FishAudioTTS,
@@ -130,6 +134,7 @@
     OpenAITTS,
     SparkTTS,
     XinferenceTTS,
+    GPUStackTTS,
 )
 
 EmbeddingModel = {
@@ -161,6 +166,7 @@ EmbeddingModel = {
     "Voyage AI": VoyageEmbed,
     "HuggingFace": HuggingFaceEmbed,
     "VolcEngine": VolcEngineEmbed,
+    "GPUStack": GPUStackEmbed,
 }
 
 CvModel = {
@@ -220,6 +226,7 @@ ChatModel = {
     "Anthropic": AnthropicChat,
     "Google Cloud": GoogleChat,
     "HuggingFace": HuggingFaceChat,
+    "GPUStack": GPUStackChat,
 }
 
 RerankModel = {
@@ -237,6 +244,7 @@ RerankModel = {
     "BaiduYiyan": BaiduYiyanRerank,
     "Voyage AI": VoyageRerank,
     "Tongyi-Qianwen": QWenRerank,
+    "GPUStack": GPUStackRerank,
 }
 
 Seq2txtModel = {
@@ -245,6 +253,7 @@ Seq2txtModel = {
     "Azure-OpenAI": AzureSeq2txt,
     "Xinference": XinferenceSeq2txt,
     "Tencent Cloud": TencentCloudSeq2txt,
+    "GPUStack": GPUStackSeq2txt,
 }
 
 TTSModel = {
@@ -253,4 +262,5 @@ TTSModel = {
     "OpenAI": OpenAITTS,
     "XunFei Spark": SparkTTS,
     "Xinference": XinferenceTTS,
+    "GPUStack": GPUStackTTS,
 }
diff --git a/rag/llm/chat_model.py b/rag/llm/chat_model.py
index f7e12b4d7..605339ad7 100644
--- a/rag/llm/chat_model.py
+++ b/rag/llm/chat_model.py
@@ -1514,3 +1514,11 @@
                 yield ans + "\n**ERROR**: " + str(e)
 
         yield response._chunks[-1].usage_metadata.total_token_count
+
+class GPUStackChat(Base):
+    def __init__(self, key=None, model_name="", base_url=""):
+        if not base_url:
+            raise ValueError("Local llm url cannot be None")
+        if base_url.split("/")[-1] != "v1-openai":
+            base_url = os.path.join(base_url, "v1-openai")
+        super().__init__(key, model_name, base_url)
\ No newline at end of file
diff --git a/rag/llm/embedding_model.py b/rag/llm/embedding_model.py
index 182d4cf7a..df57f5d9f 100644
--- a/rag/llm/embedding_model.py
+++ b/rag/llm/embedding_model.py
@@ -30,7 +30,7 @@ import asyncio
 from api import settings
 from api.utils.file_utils import get_home_cache_dir
 from rag.utils import num_tokens_from_string, truncate
-import google.generativeai as genai 
+import google.generativeai as genai
 import json
 
@@ -799,3 +799,13 @@ class VolcEngineEmbed(OpenAIEmbed):
         ark_api_key = json.loads(key).get('ark_api_key', '')
         model_name = json.loads(key).get('ep_id', '') + json.loads(key).get('endpoint_id', '')
         super().__init__(ark_api_key,model_name,base_url)
+
+class GPUStackEmbed(OpenAIEmbed):
+    def __init__(self, key, model_name, base_url):
+        if not base_url:
+            raise ValueError("url cannot be None")
+        if base_url.split("/")[-1] != "v1-openai":
+            base_url = os.path.join(base_url, "v1-openai")
+
+        self.client = OpenAI(api_key=key, base_url=base_url)
+        self.model_name = model_name
\ No newline at end of file
diff --git a/rag/llm/rerank_model.py b/rag/llm/rerank_model.py
index c42ee8944..c937e7798 100644
--- a/rag/llm/rerank_model.py
+++ b/rag/llm/rerank_model.py
@@ -18,10 +18,11 @@ import threading
 from urllib.parse import urljoin
 
 import requests
 from huggingface_hub import snapshot_download
 import os
 from abc import ABC
 import numpy as np
+from yarl import URL
 
 from api import settings
 from api.utils.file_utils import get_home_cache_dir
@@ -457,3 +458,53 @@ class QWenRerank(Base):
             return rank, resp.usage.total_tokens
         else:
             raise ValueError(f"Error calling QWenRerank model {self.model_name}: {resp.status_code} - {resp.text}")
+
+class GPUStackRerank(Base):
+    def __init__(
+        self, key, model_name, base_url
+    ):
+        if not base_url:
+            raise ValueError("url cannot be None")
+
+        self.model_name = model_name
+        self.base_url = str(URL(base_url) / "v1" / "rerank")
+        self.headers = {
+            "accept": "application/json",
+            "content-type": "application/json",
+            "authorization": f"Bearer {key}",
+        }
+
+    def similarity(self, query: str, texts: list):
+        payload = {
+            "model": self.model_name,
+            "query": query,
+            "documents": texts,
+            "top_n": len(texts),
+        }
+
+        try:
+            response = requests.post(
+                self.base_url, json=payload, headers=self.headers
+            )
+            response.raise_for_status()
+            response_json = response.json()
+
+            rank = np.zeros(len(texts), dtype=float)
+            if "results" not in response_json:
+                return rank, 0
+
+            token_count = 0
+            for t in texts:
+                token_count += num_tokens_from_string(t)
+
+            for result in response_json["results"]:
+                rank[result["index"]] = result["relevance_score"]
+
+            return (
+                rank,
+                token_count,
+            )
+
+        except requests.exceptions.HTTPError as e:
+            raise ValueError(f"Error calling GPUStackRerank model {self.model_name}: {e.response.status_code} - {e.response.text}")
+
diff --git a/rag/llm/sequence2txt_model.py b/rag/llm/sequence2txt_model.py
index 73c8f37df..e5bcae4fa 100644
--- a/rag/llm/sequence2txt_model.py
+++ b/rag/llm/sequence2txt_model.py
@@ -13,6 +13,7 @@
 # See the License for the specific language governing permissions and
 # limitations under the License.
 #
+import os
 import requests
 from openai.lib.azure import AzureOpenAI
 import io
@@ -191,3 +192,14 @@
             return "**ERROR**: " + str(e), 0
         except Exception as e:
             return "**ERROR**: " + str(e), 0
+
+
+class GPUStackSeq2txt(Base):
+    def __init__(self, key, model_name, base_url):
+        if not base_url:
+            raise ValueError("url cannot be None")
+        if base_url.split("/")[-1] != "v1-openai":
+            base_url = os.path.join(base_url, "v1-openai")
+        self.base_url = base_url
+        self.model_name = model_name
+        self.key = key
diff --git a/rag/llm/tts_model.py b/rag/llm/tts_model.py
index fa82cc827..71fb93b74 100644
--- a/rag/llm/tts_model.py
+++ b/rag/llm/tts_model.py
@@ -355,3 +355,35 @@
         for chunk in response.iter_content():
             if chunk:
                 yield chunk
+
+class GPUStackTTS:
+    def __init__(self, key, model_name, **kwargs):
+        self.base_url = kwargs.get("base_url", None)
+        self.api_key = key
+        self.model_name = model_name
+        self.headers = {
+            "accept": "application/json",
+            "Content-Type": "application/json",
+            "Authorization": f"Bearer {self.api_key}"
+        }
+
+    def tts(self, text, voice="Chinese Female", stream=True):
+        payload = {
+            "model": self.model_name,
+            "input": text,
+            "voice": voice
+        }
+
+        response = requests.post(
+            f"{self.base_url}/v1-openai/audio/speech",
+            headers=self.headers,
+            json=payload,
+            stream=stream
+        )
+
+        if response.status_code != 200:
+            raise Exception(f"**Error**: {response.status_code}, {response.text}")
+
+        for chunk in response.iter_content(chunk_size=1024):
+            if chunk:
+                yield chunk
\ No newline at end of file
diff --git a/web/src/assets/svg/llm/gpustack.svg b/web/src/assets/svg/llm/gpustack.svg
new file mode 100644
index 000000000..95a07f912
--- /dev/null
+++ b/web/src/assets/svg/llm/gpustack.svg
@@ -0,0 +1,14 @@
+
+    Combined Shape
+
+
+
+
+
+
+
+
+
+
+
+
\ No newline at end of file
diff --git a/web/src/constants/setting.ts b/web/src/constants/setting.ts
index 9cb05c125..a58af0176 100644
--- a/web/src/constants/setting.ts
+++ b/web/src/constants/setting.ts
@@ -72,6 +72,7 @@ export const IconMap = {
   'nomic-ai': 'nomic-ai',
   jinaai: 'jina',
   'sentence-transformers': 'sentence-transformers',
+  GPUStack: 'gpustack',
 };
 
 export const TimezoneList = [
diff --git a/web/src/pages/user-setting/constants.tsx b/web/src/pages/user-setting/constants.tsx
index 0bac99480..255cb4a5e 100644
--- a/web/src/pages/user-setting/constants.tsx
+++ b/web/src/pages/user-setting/constants.tsx
@@ -31,6 +31,7 @@
   'Replicate',
   'OpenRouter',
   'HuggingFace',
+  'GPUStack',
 ];
 
 export enum TenantRole {
diff --git a/web/src/pages/user-setting/setting-model/ollama-modal/index.tsx b/web/src/pages/user-setting/setting-model/ollama-modal/index.tsx
index 0925d2fe9..b68913a2c 100644
--- a/web/src/pages/user-setting/setting-model/ollama-modal/index.tsx
+++ b/web/src/pages/user-setting/setting-model/ollama-modal/index.tsx
@@ -29,6 +29,7 @@ const llmFactoryToUrlMap = {
   OpenRouter: 'https://openrouter.ai/docs',
   HuggingFace:
     'https://huggingface.co/docs/text-embeddings-inference/quick_tour',
+  GPUStack: 'https://docs.gpustack.ai/latest/quickstart',
 };
 
 type LlmFactory = keyof typeof llmFactoryToUrlMap;
@@ -76,6 +77,13 @@
       { value: 'speech2text', label: 'sequence2text' },
       { value: 'tts', label: 'tts' },
     ],
+    GPUStack: [
+      { value: 'chat', label: 'chat' },
+      { value: 'embedding', label: 'embedding' },
+      { value: 'rerank', label: 'rerank' },
+      { value: 'speech2text', label: 'sequence2text' },
+      { value: 'tts', label: 'tts' },
+    ],
     Default: [
       { value: 'chat', label: 'chat' },
       { value: 'embedding', label: 'embedding' },