diff --git a/rag/llm/cv_model.py b/rag/llm/cv_model.py
index 4c4513dc2..aeaeefffa 100644
--- a/rag/llm/cv_model.py
+++ b/rag/llm/cv_model.py
@@ -450,5 +450,9 @@ class LocalAICV(GptV4):
 class XinferenceCV(Base):
     def __init__(self, key, model_name="", lang="Chinese", base_url=""):
+        # Ensure base_url ends with a single "/v1" (URL handling, so no os.path.join).
+        base_url = base_url.rstrip("/")
+        if base_url.split("/")[-1] != "v1":
+            base_url = f"{base_url}/v1"
         self.client = OpenAI(api_key="xxx", base_url=base_url)
         self.model_name = model_name
         self.lang = lang
diff --git a/rag/llm/embedding_model.py b/rag/llm/embedding_model.py
index 221fea198..6f7c4b89d 100644
--- a/rag/llm/embedding_model.py
+++ b/rag/llm/embedding_model.py
@@ -269,4 +269,8 @@ class FastEmbed(Base):
 class XinferenceEmbed(Base):
     def __init__(self, key, model_name="", base_url=""):
+        # Ensure base_url ends with a single "/v1" (URL handling, so no os.path.join).
+        base_url = base_url.rstrip("/")
+        if base_url.split("/")[-1] != "v1":
+            base_url = f"{base_url}/v1"
         self.client = OpenAI(api_key="xxx", base_url=base_url)
         self.model_name = model_name
diff --git a/rag/llm/rerank_model.py b/rag/llm/rerank_model.py
index 3a2a91092..fcda163cc 100644
--- a/rag/llm/rerank_model.py
+++ b/rag/llm/rerank_model.py
@@ -141,5 +141,9 @@ class YoudaoRerank(DefaultRerank):
 class XInferenceRerank(Base):
     def __init__(self, key="xxxxxxx", model_name="", base_url=""):
+        # Ensure base_url ends with a single "/v1" (URL handling, so no os.path.join).
+        base_url = base_url.rstrip("/")
+        if base_url.split("/")[-1] != "v1":
+            base_url = f"{base_url}/v1"
         self.model_name = model_name
         self.base_url = base_url
         self.headers = {
diff --git a/rag/llm/sequence2txt_model.py b/rag/llm/sequence2txt_model.py
index fcd6859d5..a3f7f5af1 100644
--- a/rag/llm/sequence2txt_model.py
+++ b/rag/llm/sequence2txt_model.py
@@ -94,4 +94,8 @@ class AzureSeq2txt(Base):
 class XinferenceSeq2txt(Base):
     def __init__(self, key, model_name="", base_url=""):
+        # Ensure base_url ends with a single "/v1" (URL handling, so no os.path.join).
+        base_url = base_url.rstrip("/")
+        if base_url.split("/")[-1] != "v1":
+            base_url = f"{base_url}/v1"
         self.client = OpenAI(api_key="xxx", base_url=base_url)
         self.model_name = model_name