[Feat] Added an allowlist of URLs that are exempt from the social media blocklist
Firecrawl should be able to scrape LinkedIn articles (/pulse/*).
This commit is contained in:
parent
75e82869ed
commit
75597f72a1
@ -14,6 +14,14 @@ const socialMediaBlocklist = [
|
|||||||
'telegram.org',
|
'telegram.org',
|
||||||
];
|
];
|
||||||
|
|
||||||
|
/**
 * URL prefixes that are exempt from the social media blocklist.
 *
 * Each entry is `host` or `host/path-prefix`, without a scheme. An entry
 * matches a URL whose hostname is that host (or one of its subdomains) and
 * whose path is the prefix itself or lies beneath it.
 */
const allowedUrls = [
  'linkedin.com/pulse'
];

/**
 * Reports whether `url` is covered by an entry of `allowedUrls`.
 *
 * The URL is parsed so that only its real hostname and path are compared.
 * Allowlist text that merely appears in a query string, fragment, or longer
 * path segment does not count. Input that cannot be parsed is never allowed.
 */
function isUrlAllowed(url: string): boolean {
  const candidate = url.trim();
  const hasScheme = /^[a-z][a-z0-9+.-]*:\/\//i.test(candidate);

  let parsed: URL;
  try {
    // Scheme-less input such as "linkedin.com/pulse/x" is parsed as HTTP.
    parsed = new URL(hasScheme ? candidate : `http://${candidate}`);
  } catch {
    return false;
  }

  const host = parsed.hostname;
  const path = parsed.pathname;

  return allowedUrls.some(entry => {
    const slashIndex = entry.indexOf('/');
    const allowedHost = slashIndex === -1 ? entry : entry.slice(0, slashIndex);
    const allowedPath = slashIndex === -1 ? '' : entry.slice(slashIndex);

    const hostMatches = host === allowedHost || host.endsWith(`.${allowedHost}`);
    // Match on a path-segment boundary so "/pulse" does not allow "/pulsefoo".
    const pathMatches =
      allowedPath === '' || path === allowedPath || path.startsWith(`${allowedPath}/`);

    return hostMatches && pathMatches;
  });
}

/**
 * Decides whether a URL must not be scraped.
 *
 * A URL covered by `allowedUrls` is never blocked. Any other URL is blocked
 * when it contains one of the `socialMediaBlocklist` entries as a substring.
 *
 * @param url - The URL to check, with or without a scheme.
 * @returns `true` when the URL is blocked, `false` otherwise.
 */
export function isUrlBlocked(url: string): boolean {
  if (isUrlAllowed(url)) {
    return false;
  }

  return socialMediaBlocklist.some(domain => url.includes(domain));
}
|
||||||
|
Loading…
Reference in New Issue
Block a user