diff --git a/api/core/tool/web_reader_tool.py b/api/core/tool/web_reader_tool.py index be76839239..c2e68bc7a8 100644 --- a/api/core/tool/web_reader_tool.py +++ b/api/core/tool/web_reader_tool.py @@ -88,11 +88,9 @@ class WebReaderTool(BaseTool): texts = character_splitter.split_text(page_contents) docs = [Document(page_content=t) for t in texts] - if len(docs) == 0: + if len(docs) == 0 or docs[0].page_content.endswith('TEXT:'): return "No content found." - docs = docs[1:] - # only use first 5 docs if len(docs) > 5: docs = docs[:5]