Spaces:
Runtime error
Runtime error
File size: 911 Bytes
105b369 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 |
from phi.tools import Toolkit
try:
from newspaper import Article
except ImportError:
raise ImportError("`newspaper3k` not installed. Please run `pip install newspaper3k lxml_html_clean`.")
class NewspaperToolkit(Toolkit):
def __init__(
self,
get_article_text: bool = True,
):
super().__init__(name="newspaper_toolkit")
if get_article_text:
self.register(self.get_article_text)
def get_article_text(self, url: str) -> str:
"""Get the text of an article from a URL.
Args:
url (str): The URL of the article.
Returns:
str: The text of the article.
"""
try:
article = Article(url)
article.download()
article.parse()
return article.text
except Exception as e:
return f"Error getting article text from {url}: {e}"
|