|
import html
from datetime import datetime, timezone

import gradio as gr
import requests
|
|
|
# Hugging Face endpoint listing the daily papers; fetch_papers() queries it
# with `page` and `limit` parameters.
API_URL = "https://huggingface.co/api/daily_papers"
|
|
|
class PaperManager:
    """Fetch, cache and render Hugging Face daily papers as paginated HTML.

    Pages are requested lazily from ``API_URL`` and appended to ``papers`` in
    page order, so page ``n`` occupies the slice
    ``papers[(n - 1) * papers_per_page : n * papers_per_page]``.

    Attributes (all public; the module-level refresh callback resets them):
        papers_per_page: number of entries requested and shown per page.
        current_page: 1-based page currently displayed.
        papers: cached API entries for every page fetched so far.
        total_pages: highest page known to exist (a lower bound until a
            short page is seen).
        last_fetched_page: highest page number already stored in ``papers``.
    """

    # Seconds to wait for the API. Without a timeout a stalled connection
    # would block the UI callback indefinitely.
    REQUEST_TIMEOUT = 10

    def __init__(self, papers_per_page=10):
        self.papers_per_page = papers_per_page
        self.current_page = 1
        self.papers = []
        self.total_pages = 0
        self.last_fetched_page = 0

    @staticmethod
    def _details(entry):
        """Return the nested ``'paper'`` mapping of an API entry, or ``{}``."""
        return entry.get('paper') or {}

    @staticmethod
    def _days_since(published_at):
        """Return whole days elapsed since an ISO-8601 timestamp.

        Missing, non-string or unparseable values count as "just now" (0),
        and timestamps in the future are clamped to 0 as well.
        """
        if not isinstance(published_at, str):
            return 0
        try:
            # datetime.fromisoformat() only accepts a trailing 'Z' from
            # Python 3.11 on, so normalise it to an explicit UTC offset.
            published = datetime.fromisoformat(published_at.replace('Z', '+00:00'))
        except ValueError:
            return 0
        if published.tzinfo is None:
            # Naive and aware datetimes cannot be subtracted; assume UTC.
            published = published.replace(tzinfo=timezone.utc)
        return max((datetime.now(timezone.utc) - published).days, 0)

    def _page_label(self):
        """Return the text shown in the page indicator."""
        return f"Page {self.current_page} of {self.total_pages}+"

    def fetch_papers(self, page=1):
        """Download one page of papers and merge it into the cache.

        Args:
            page: 1-based page number to request.

        Returns:
            True if the page was fetched and stored. False on a network or
            HTTP error, or when the response body is not a JSON list; the
            error is printed and the cache is left untouched.
        """
        try:
            response = requests.get(
                API_URL,
                params={"page": page, "limit": self.papers_per_page},
                timeout=self.REQUEST_TIMEOUT,
            )
            response.raise_for_status()
            data = response.json()
        except (requests.RequestException, ValueError) as e:
            # ValueError covers JSON decoding failures on requests versions
            # whose JSONDecodeError is not a RequestException.
            print(f"Error fetching papers: {e}")
            return False

        if not isinstance(data, list):
            print(f"Error fetching papers: unexpected payload of type {type(data).__name__}")
            return False

        # Most-upvoted first within the page.
        new_papers = sorted(
            data,
            key=lambda entry: self._details(entry).get('upvotes') or 0,
            reverse=True,
        )

        if page > self.last_fetched_page:
            self.papers.extend(new_papers)
            self.last_fetched_page = page
        elif 1 <= page < self.last_fetched_page:
            # The page is already cached: refresh its slice in place.
            # Prepending it (and rewinding last_fetched_page) would duplicate
            # entries and shift every later page.
            start = (page - 1) * self.papers_per_page
            self.papers[start:start + self.papers_per_page] = new_papers

        self.total_pages = max(self.total_pages, page)
        if len(new_papers) < self.papers_per_page:
            # A short page means there is nothing after it.
            self.total_pages = page

        return True

    def format_paper(self, paper):
        """Render one API entry as an HTML row.

        All API-provided text is HTML-escaped before interpolation, and
        missing fields fall back to neutral defaults instead of raising.

        Args:
            paper: one element of the API response (a dict).

        Returns:
            An HTML fragment containing the linked title and a meta line
            with upvotes, authors, age in days and comment count.
        """
        details = self._details(paper)
        title = html.escape(str(paper.get('title') or 'No title'))
        url = html.escape(f"https://huggingface.co/papers/{details.get('id', '')}")
        names = [author.get('name') for author in details.get('authors') or []]
        authors = html.escape(', '.join(str(name) for name in names if name))
        upvotes = html.escape(str(details.get('upvotes', 0)))
        comments = html.escape(str(paper.get('numComments', 0)))
        time_ago = self._days_since(paper.get('publishedAt'))

        return f"""<div style='border-bottom: 1px solid #eee; padding: 10px 0;'>
    <a href='{url}' target='_blank' style='color: #000; text-decoration: none; font-weight: bold;'>{title}</a>
    <div style='font-size: 0.8em; color: #666; margin-top: 5px;'>
        {upvotes} upvotes | by {authors} | {time_ago} days ago | {comments} comments
    </div>
</div>"""

    def render_papers(self):
        """Return the HTML for ``current_page``, fetching it first if needed.

        A fetch is triggered when the cache is empty or the current page lies
        beyond the last fetched one. Returns an error message if that fetch
        fails and a "no more papers" message if the page has no entries.
        """
        if not self.papers or self.current_page > self.last_fetched_page:
            if not self.fetch_papers(self.current_page):
                return "<div>Failed to fetch papers. Please try again later.</div>"

        start_index = (self.current_page - 1) * self.papers_per_page
        end_index = start_index + self.papers_per_page
        current_papers = self.papers[start_index:end_index]

        if not current_papers:
            return "<div>No more papers available.</div>"

        return "".join(self.format_paper(paper) for paper in current_papers)

    def search_papers(self, query):
        """Filter the cached papers by a case-insensitive title substring.

        Only papers already fetched are searched. An empty or blank query
        resets to page 1 and returns the normal page rendering.

        Args:
            query: text typed into the search box.

        Returns:
            HTML for at most ``papers_per_page`` matches, or a message when
            nothing matches.
        """
        needle = (query or '').strip().lower()
        if not needle:
            self.current_page = 1
            return self.render_papers()

        matches = [
            paper for paper in self.papers
            if needle in str(paper.get('title') or '').lower()
        ]
        if not matches:
            return "<div>No papers match your search.</div>"
        return "".join(self.format_paper(paper) for paper in matches[:self.papers_per_page])

    def next_page(self):
        """Advance one page when more papers may exist.

        The page advances if a later page is already known, or if the cache
        holds at least a full current page (so a following page may exist).

        Returns:
            ``(html, page_label)`` for the resulting page.
        """
        cache_fills_current_page = len(self.papers) >= self.current_page * self.papers_per_page
        if self.current_page < self.total_pages or cache_fills_current_page:
            self.current_page += 1
        # Render first: it may fetch and update total_pages used by the label.
        rendered = self.render_papers()
        return rendered, self._page_label()

    def prev_page(self):
        """Go back one page unless already on the first.

        Returns:
            ``(html, page_label)`` for the resulting page.
        """
        if self.current_page > 1:
            self.current_page -= 1
        rendered = self.render_papers()
        return rendered, self._page_label()
|
|
|
# Stylesheet handed to gr.Blocks(css=...): centres the page, makes the paper
# list a scrollable bordered box and lays the search row out as a flex row.
css = """
body {
    font-family: Arial, sans-serif;
    max-width: 800px;
    margin: 0 auto;
    padding: 20px;
}
.paper-list {
    max-height: 600px;
    overflow-y: auto;
    border: 1px solid #eee;
    border-radius: 5px;
    padding: 10px;
}
.search-row {
    display: flex;
    gap: 10px;
    margin-bottom: 20px;
}
"""
|
|
|
# Single module-level manager: every UI callback mutates this one instance,
# so paging state is process-wide rather than per browser session.
paper_manager = PaperManager()


def refresh_papers():
    """Drop the cached papers and reload the first page from the API.

    Returns:
        A ``(html, page_label)`` tuple for the paper list and the page
        indicator components.
    """
    paper_manager.current_page = 1
    paper_manager.papers = []
    paper_manager.last_fetched_page = 0
    paper_manager.total_pages = 0
    # render_papers() fetches page 1 itself because the cache is now empty.
    # Calling fetch_papers() beforehand would issue the request twice whenever
    # the first attempt fails or returns no papers.
    rendered = paper_manager.render_papers()
    return rendered, f"Page {paper_manager.current_page} of {paper_manager.total_pages}+"
|
|
|
# Assemble the interface: a title, a search row with a refresh button, the
# paper list, and a pagination row. Event handlers are registered inside the
# Blocks context.
# NOTE(review): the source lost its indentation; the nesting below (paper
# list under the search row, page indicator inside the pagination row) is
# reconstructed from the statement order - confirm against the deployed app.
with gr.Blocks(css=css) as demo:
    gr.Markdown("# Daily Papers - HackerNews Style")

    with gr.Row(elem_classes=["search-row"]):
        search_input = gr.Textbox(
            label="Search papers",
            placeholder="Enter search term...",
        )
        refresh_button = gr.Button("Refresh")

    # Rendering first may trigger the initial fetch, which sets total_pages
    # used by the page indicator created further down.
    initial_listing = paper_manager.render_papers()
    paper_list = gr.HTML(initial_listing, elem_classes=["paper-list"])

    with gr.Row():
        prev_button = gr.Button("Previous Page")
        next_button = gr.Button("Next Page")
        initial_label = f"Page {paper_manager.current_page} of {paper_manager.total_pages}+"
        page_info = gr.Markdown(initial_label)

    # Searching only replaces the list; the other actions also update the
    # page indicator.
    paged_outputs = [paper_list, page_info]
    search_input.change(
        paper_manager.search_papers,
        inputs=[search_input],
        outputs=[paper_list],
    )
    refresh_button.click(refresh_papers, outputs=paged_outputs)
    prev_button.click(paper_manager.prev_page, outputs=paged_outputs)
    next_button.click(paper_manager.next_page, outputs=paged_outputs)

demo.launch()