mirror of
https://github.com/mendableai/firecrawl.git
synced 2024-11-15 19:22:19 +08:00
Added the .inc file extension to the extension list and forced lower-case comparison of URLs against it
This commit is contained in:
parent
4ab7fb007a
commit
f48ff36b32
|
@@ -164,7 +164,7 @@ export class WebCrawler {
|
||||||
concurrencyLimit,
|
concurrencyLimit,
|
||||||
inProgress
|
inProgress
|
||||||
);
|
);
|
||||||
|
|
||||||
if (
|
if (
|
||||||
urls.length === 0 &&
|
urls.length === 0 &&
|
||||||
this.filterLinks([this.initialUrl], limit, this.maxCrawledDepth).length > 0
|
this.filterLinks([this.initialUrl], limit, this.maxCrawledDepth).length > 0
|
||||||
|
@@ -420,9 +420,10 @@ export class WebCrawler {
|
||||||
".woff",
|
".woff",
|
||||||
".ttf",
|
".ttf",
|
||||||
".woff2",
|
".woff2",
|
||||||
".webp"
|
".webp",
|
||||||
|
".inc"
|
||||||
];
|
];
|
||||||
return fileExtensions.some((ext) => url.endsWith(ext));
|
return fileExtensions.some((ext) => url.toLowerCase().endsWith(ext));
|
||||||
}
|
}
|
||||||
|
|
||||||
private isSocialMediaOrEmail(url: string): boolean {
|
private isSocialMediaOrEmail(url: string): boolean {
|
||||||
|
|
Loading…
Reference in New Issue
Block a user