Spaces:
Runtime error
Runtime error
from phi.tools import Toolkit | |
try: | |
from newspaper import Article | |
except ImportError: | |
raise ImportError("`newspaper3k` not installed. Please run `pip install newspaper3k lxml_html_clean`.") | |
class NewspaperToolkit(Toolkit): | |
def __init__( | |
self, | |
get_article_text: bool = True, | |
): | |
super().__init__(name="newspaper_toolkit") | |
if get_article_text: | |
self.register(self.get_article_text) | |
def get_article_text(self, url: str) -> str: | |
"""Get the text of an article from a URL. | |
Args: | |
url (str): The URL of the article. | |
Returns: | |
str: The text of the article. | |
""" | |
try: | |
article = Article(url) | |
article.download() | |
article.parse() | |
return article.text | |
except Exception as e: | |
return f"Error getting article text from {url}: {e}" | |