@@ -88,11 +88,9 @@ class WebReaderTool(BaseTool):
texts = character_splitter.split_text(page_contents)
docs = [Document(page_content=t) for t in texts]
- if len(docs) == 0:
+ if len(docs) == 0 or docs[0].page_content.endswith('TEXT:'):
return "No content found."
- docs = docs[1:]
-
# only use first 5 docs
if len(docs) > 5:
docs = docs[:5]