From 2871455e4ec8c990e19d2219a389916695b420df Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?=E9=BB=84=E8=85=BE?= <101850389+hangters@users.noreply.github.com>
Date: Tue, 3 Sep 2024 15:11:53 +0800
Subject: [PATCH] fix zhipuCV bug (#2215)

### What problem does this PR solve?

#2198 fix zhipuCV bug

### Type of change

- [x] Bug Fix (non-breaking change which fixes an issue)

Co-authored-by: Zhedong Cen
---
 rag/llm/cv_model.py | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

diff --git a/rag/llm/cv_model.py b/rag/llm/cv_model.py
index 65f73d00b..4c4513dc2 100644
--- a/rag/llm/cv_model.py
+++ b/rag/llm/cv_model.py
@@ -293,9 +293,12 @@ class Zhipu4V(Base):
     def describe(self, image, max_tokens=1024):
         b64 = self.image2base64(image)
 
+        prompt = self.prompt(b64)
+        prompt[0]["content"][1]["type"] = "text"
+
         res = self.client.chat.completions.create(
             model=self.model_name,
-            messages=self.prompt(b64),
+            messages=prompt,
             max_tokens=max_tokens,
         )
         return res.choices[0].message.content.strip(), res.usage.total_tokens