Merge pull request #878 from mendableai/mog/deduplicate-urls

feat(crawl): Similar URL deduplication
This commit is contained in:
Nicolas
2024-11-11 14:33:13 -05:00
committed by GitHub
5 changed files with 91 additions and 9 deletions
+3
View File
@@ -86,6 +86,8 @@ export interface CrawlScrapeOptions {
country?: string;
languages?: string[];
};
skipTlsVerification?: boolean;
removeBase64Images?: boolean;
}
export type Action = {
@@ -151,6 +153,7 @@ export interface CrawlParams {
ignoreSitemap?: boolean;
scrapeOptions?: CrawlScrapeOptions;
webhook?: string;
deduplicateSimilarURLs?: boolean;
}
/**