fix(crawler): sitemaps poisoning crawls with unrelated links (#1334)
This commit is contained in:
@@ -271,7 +271,7 @@ export class WebCrawler {
|
|||||||
return urlsHandler(urls);
|
return urlsHandler(urls);
|
||||||
} else {
|
} else {
|
||||||
let filteredLinks = this.filterLinks(
|
let filteredLinks = this.filterLinks(
|
||||||
[...new Set(urls)],
|
[...new Set(urls)].filter(x => this.filterURL(x, this.initialUrl) !== null),
|
||||||
leftOfLimit,
|
leftOfLimit,
|
||||||
this.maxCrawledDepth,
|
this.maxCrawledDepth,
|
||||||
fromMap,
|
fromMap,
|
||||||
|
|||||||
Reference in New Issue
Block a user