deer-flow/tests/integration/test_crawler.py
2025-04-17 11:34:42 +08:00

31 lines
971 B
Python

# Copyright (c) 2025 Bytedance Ltd. and/or its affiliates
# SPDX-License-Identifier: MIT
import pytest
from src.crawler import Crawler
def test_crawler_initialization():
"""Test that crawler can be properly initialized."""
crawler = Crawler()
assert isinstance(crawler, Crawler)
def test_crawler_crawl_valid_url():
"""Test crawling with a valid URL."""
crawler = Crawler()
test_url = "https://finance.sina.com.cn/stock/relnews/us/2024-08-15/doc-incitsya6536375.shtml"
result = crawler.crawl(test_url)
assert result is not None
assert hasattr(result, "to_markdown")
def test_crawler_markdown_output():
"""Test that crawler output can be converted to markdown."""
crawler = Crawler()
test_url = "https://finance.sina.com.cn/stock/relnews/us/2024-08-15/doc-incitsya6536375.shtml"
result = crawler.crawl(test_url)
markdown = result.to_markdown()
assert isinstance(markdown, str)
assert len(markdown) > 0