mirror of
https://github.com/mendableai/firecrawl.git
synced 2024-11-16 11:42:24 +08:00
[Feat] Added allowed urls
FireCrawl should be able to scrape LinkedIn Articles (/pulse/*)
This commit is contained in:
parent
75e82869ed
commit
75597f72a1
|
@ -14,6 +14,14 @@ const socialMediaBlocklist = [
|
|||
'telegram.org',
|
||||
];
|
||||
|
||||
/**
 * URL patterns that are exempt from the social media blocklist.
 * Currently this only covers LinkedIn articles, which live under `/pulse`.
 */
const allowedUrls: string[] = ['linkedin.com/pulse'];
|
||||
|
||||
/**
 * Parses `raw` into a `URL`, tolerating inputs that omit the scheme.
 *
 * @param raw - The URL string as supplied by the caller.
 * @returns The parsed URL, or `null` when the string cannot be parsed.
 */
function parseUrlForAllowlist(raw: string): URL | null {
  const trimmed = raw.trim();
  // Inputs without "scheme://" (e.g. "linkedin.com/pulse/x", or "host:443/x",
  // which the URL parser would otherwise read as the scheme "host:") are given
  // a default scheme so that the hostname is extracted correctly.
  const hasScheme = /^[a-z][a-z0-9+.-]*:\/\//i.test(trimmed);
  const candidate = hasScheme ? trimmed : `https://${trimmed}`;
  try {
    return new URL(candidate);
  } catch {
    return null;
  }
}

/**
 * Checks whether a parsed URL really points at an allowlist entry.
 *
 * An entry has the form `host` or `host/path-prefix`. The URL matches when its
 * hostname equals the entry host (or is a subdomain of it) and its path equals
 * the prefix or lies beneath it on a segment boundary.
 *
 * @param parsed - The URL being checked.
 * @param entry - One allowlist entry, e.g. `linkedin.com/pulse`.
 * @returns `true` when the URL's host and path match the entry.
 */
function matchesAllowedEntry(parsed: URL, entry: string): boolean {
  const withoutScheme = entry.trim().replace(/^[a-z][a-z0-9+.-]*:\/\//i, '');
  const slashIndex = withoutScheme.indexOf('/');
  const entryHost = (slashIndex === -1 ? withoutScheme : withoutScheme.slice(0, slashIndex)).toLowerCase();
  const entryPath = slashIndex === -1 ? '' : withoutScheme.slice(slashIndex).replace(/\/+$/, '');
  if (entryHost === '') {
    return false;
  }

  // Hostnames are case-insensitive and may carry a trailing root dot.
  const host = parsed.hostname.toLowerCase().replace(/\.$/, '');
  const hostMatches = host === entryHost || host.endsWith(`.${entryHost}`);
  if (!hostMatches) {
    return false;
  }
  if (entryPath === '') {
    return true;
  }
  return parsed.pathname === entryPath || parsed.pathname.startsWith(`${entryPath}/`);
}

/**
 * Decides whether a URL must not be scraped because it belongs to a blocked
 * social media site.
 *
 * A URL is exempt when it genuinely points at an entry of `allowedUrls`: the
 * hostname and path are compared, not the raw string, so a blocked URL cannot
 * slip through merely by containing an allowed pattern in its query string,
 * fragment, path or a look-alike hostname. Unparseable input never receives
 * the exemption.
 *
 * @param url - The URL to check.
 * @returns `true` if the URL is blocked, `false` otherwise.
 */
export function isUrlBlocked(url: string): boolean {
  const parsed = parseUrlForAllowlist(url);
  if (parsed !== null && allowedUrls.some(entry => matchesAllowedEntry(parsed, entry))) {
    return false;
  }

  // NOTE(review): the blocklist is still a plain substring test, so a URL that
  // only mentions a blocked domain (e.g. in its query string) is blocked too.
  // Kept as-is so that nothing previously blocked becomes reachable.
  return socialMediaBlocklist.some(domain => url.includes(domain));
}
|
||||
|
|
Loading…
Reference in New Issue
Block a user