AutoRAG_llama3_groq / phi /tools /newspaper_toolkit.py
AmmarFahmy
adding all files
105b369
from phi.tools import Toolkit
try:
from newspaper import Article
except ImportError:
raise ImportError("`newspaper3k` not installed. Please run `pip install newspaper3k lxml_html_clean`.")
class NewspaperToolkit(Toolkit):
def __init__(
self,
get_article_text: bool = True,
):
super().__init__(name="newspaper_toolkit")
if get_article_text:
self.register(self.get_article_text)
def get_article_text(self, url: str) -> str:
"""Get the text of an article from a URL.
Args:
url (str): The URL of the article.
Returns:
str: The text of the article.
"""
try:
article = Article(url)
article.download()
article.parse()
return article.text
except Exception as e:
return f"Error getting article text from {url}: {e}"