fix(crawler): bad urls from sitemap
This commit is contained in:
@@ -228,7 +228,7 @@ export class WebCrawler {
|
|||||||
);
|
);
|
||||||
leftOfLimit -= filteredLinks.length;
|
leftOfLimit -= filteredLinks.length;
|
||||||
let uniqueURLs: string[] = [];
|
let uniqueURLs: string[] = [];
|
||||||
for (const url of urls) {
|
for (const url of filteredLinks) {
|
||||||
if (
|
if (
|
||||||
await redisConnection.sadd(
|
await redisConnection.sadd(
|
||||||
"sitemap:" + this.jobId + ":links",
|
"sitemap:" + this.jobId + ":links",
|
||||||
|
|||||||
Reference in New Issue
Block a user