Spaces:
Sleeping
Sleeping
Commit
·
95dbc93
1
Parent(s):
c4aea89
update api handle 3
Browse files
app.py
CHANGED
|
@@ -173,10 +173,10 @@ async def crawl_url(request: CrawlRequest):
|
|
| 173 |
cache_mode=cache_mode,
|
| 174 |
excluded_tags=request.excluded_tags,
|
| 175 |
remove_overlay_elements=request.remove_overlay_elements,
|
| 176 |
-
|
| 177 |
-
|
| 178 |
-
|
| 179 |
-
|
| 180 |
)
|
| 181 |
|
| 182 |
result = await crawler.arun(
|
|
|
|
| 173 |
cache_mode=cache_mode,
|
| 174 |
excluded_tags=request.excluded_tags,
|
| 175 |
remove_overlay_elements=request.remove_overlay_elements,
|
| 176 |
+
exclude_external_links=True,
|
| 177 |
+
exclude_social_media_links=True,
|
| 178 |
+
exclude_external_images=True,
|
| 179 |
+
exclude_domains=["facebook.com", "twitter.com", "instagram.com", "youtube.com", "tiktok.com", "pinterest.com"]
|
| 180 |
)
|
| 181 |
|
| 182 |
result = await crawler.arun(
|