From 6d99dedd3cec15d9543aaccba2a5a6b5d78559ec Mon Sep 17 00:00:00 2001 From: Nicolas Date: Tue, 30 Jul 2024 19:11:01 -0400 Subject: [PATCH] Nick: fixed tests --- .../api/src/scraper/WebScraper/__tests__/single_url.test.ts | 6 +++--- apps/api/src/scraper/WebScraper/scrapers/fireEngine.ts | 1 + 2 files changed, 4 insertions(+), 3 deletions(-) diff --git a/apps/api/src/scraper/WebScraper/__tests__/single_url.test.ts b/apps/api/src/scraper/WebScraper/__tests__/single_url.test.ts index 4b720835..d555e030 100644 --- a/apps/api/src/scraper/WebScraper/__tests__/single_url.test.ts +++ b/apps/api/src/scraper/WebScraper/__tests__/single_url.test.ts @@ -23,8 +23,8 @@ describe('scrapSingleUrl', () => { }, 10000); }); -it('should return a list of links on the mendable.ai page', async () => { - const url = 'https://mendable.ai'; +it('should return a list of links on the firecrawl.ai page', async () => { + const url = 'https://example.com'; const pageOptions: PageOptions = { includeHtml: true }; const result = await scrapSingleUrl("TEST", url, pageOptions); @@ -33,5 +33,5 @@ it('should return a list of links on the mendable.ai page', async () => { expect(result.linksOnPage).toBeDefined(); expect(Array.isArray(result.linksOnPage)).toBe(true); expect(result.linksOnPage.length).toBeGreaterThan(0); - expect(result.linksOnPage).toContain('https://mendable.ai/blog') + expect(result.linksOnPage).toContain('https://www.iana.org/domains/example') }, 10000); diff --git a/apps/api/src/scraper/WebScraper/scrapers/fireEngine.ts b/apps/api/src/scraper/WebScraper/scrapers/fireEngine.ts index 0f4c2320..461d8e16 100644 --- a/apps/api/src/scraper/WebScraper/scrapers/fireEngine.ts +++ b/apps/api/src/scraper/WebScraper/scrapers/fireEngine.ts @@ -81,6 +81,7 @@ export async function scrapWithFireEngine({ timeout: universalTimeout + waitParam, } ); + console.log(response.data?.pageStatusCode); if (response.status !== 200) { Logger.debug(