Resolve 8475 support rerank model from infinity (#10939)

Co-authored-by: linyanxu <linyanxu2@qq.com>
2025-08-15 11:25:55 +08:00 · 2024-11-21 18:03:49 +08:00 · 2024-11-21 18:03:49 +08:00 · 1a6b961b5f
commit 1a6b961b5f
parent 01014a6a84
1 changed files with 8 additions and 2 deletions
--- a/api/core/model_runtime/model_providers/openai_api_compatible/rerank/rerank.py
+++ b/api/core/model_runtime/model_providers/openai_api_compatible/rerank/rerank.py
@ -64,7 +64,7 @@ class OAICompatRerankModel(RerankModel):

        # TODO: Do we need truncate docs to avoid llama.cpp return error?

-        data = {"model": model_name, "query": query, "documents": docs, "top_n": top_n}
+        data = {"model": model_name, "query": query, "documents": docs, "top_n": top_n, "return_documents": True}

        try:
            response = post(str(URL(url) / "rerank"), headers=headers, data=dumps(data), timeout=60)
@ -83,7 +83,13 @@ class OAICompatRerankModel(RerankModel):
                index = result["index"]

                # Retrieve document text (fallback if llama.cpp rerank doesn't return it)
-                text = result.get("document", {}).get("text", docs[index])
+                text = docs[index]
+                document = result.get("document", {})
+                if document:
+                    if isinstance(document, dict):
+                        text = document.get("text", docs[index])
+                    elif isinstance(document, str):
+                        text = document

                # Normalize the score
                normalized_score = (result["relevance_score"] - min_score) / score_range