From 6d1da2e22a65e41ee2a41605a91f37797354598f Mon Sep 17 00:00:00 2001 From: Nicolas Date: Fri, 30 Aug 2024 18:45:02 -0300 Subject: [PATCH] Update index.ts --- apps/api/src/scraper/WebScraper/index.ts | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/apps/api/src/scraper/WebScraper/index.ts b/apps/api/src/scraper/WebScraper/index.ts index e67ad02b..fc828224 100644 --- a/apps/api/src/scraper/WebScraper/index.ts +++ b/apps/api/src/scraper/WebScraper/index.ts @@ -306,7 +306,7 @@ export class WebScraperDataProvider { // documents = await this.applyImgAltText(documents); if (this.mode === "single_urls" && this.pageOptions.includeExtract) { - const extractionMode = this.extractorOptions.mode; + const extractionMode = this.extractorOptions?.mode ?? "markdown"; const completionMode = extractionMode === "llm-extraction-from-raw-html" ? "raw-html" : "markdown"; if ( @@ -583,7 +583,7 @@ export class WebScraperDataProvider { removeTags: options.pageOptions?.removeTags ?? [], includeMarkdown: options.pageOptions?.includeMarkdown ?? true, includeRawHtml: options.pageOptions?.includeRawHtml ?? false, - includeExtract: options.pageOptions?.includeExtract ?? options.extractorOptions.mode !== "markdown" ?? false, + includeExtract: options.pageOptions?.includeExtract ?? (options.extractorOptions?.mode && options.extractorOptions?.mode !== "markdown") ?? false, waitFor: options.pageOptions?.waitFor ?? undefined, headers: options.pageOptions?.headers ?? undefined, includeLinks: options.pageOptions?.includeLinks ?? true,