CEEMEESEEK / app2.py
acecalisto3's picture
Update app2.py
cec96a7 verified
raw
history blame
8.96 kB
import asyncio
import gradio as gr
from sqlalchemy.exc import SQLAlchemyError
from sqlalchemy.ext.asyncio import create_async_engine, AsyncSession
from sqlalchemy.future import select
from sqlalchemy.orm import sessionmaker
import logging
import os
import sys
from typing import List, Dict, Any
from datetime import datetime
from pytz import timezone
import pytz
import requests
from bs4 import BeautifulSoup
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt
from sklearn.model_selection import train_test_split
from sklearn.linear_model import LinearRegression
from sklearn import metrics
# Global variables for database session and engine
db_session = None
engine = None
monitoring_task = None
logger = logging.getLogger(__name__)
# Function for dynamically setting the database connection
async def set_db_connection(host: str, port: str, user: str, password: str, db_name: str):
global db_session, engine
try:
engine = create_async_engine(f"mysql+aiomysql://{user}:{password}@{host}:{port}/{db_name}", echo=False)
Session = sessionmaker(engine, class_=AsyncSession, expire_on_commit=False)
db_session = Session()
return "Database connection established."
except Exception as e:
logger.error(f"Failed to establish database connection: {e}")
return f"Failed to connect to database: {e}"
# Periodic feed updater with error handling and logging improvements
async def periodic_update_with_error_handling():
while True:
try:
await asyncio.sleep(300) # Wait for 5 minutes before updating the feed content.
await update_feed_content() # Update the feed content.
except Exception as e: # Catch all exceptions for logging purposes.
logger.error(f"Error in periodic update: {e}") # Improved logging message format.
# Function to fetch RSS feed content from the provided URL with error handling and logging improvements.
async def fetch_feed_content(feed_url: str) -> Dict[str, Any]:
try:
result = await db_session.execute(select(Article).order_by(Article.timestamp.desc()).limit(20))
articles = result.scalars().all() # Fetch latest articles
feed = {
'title': 'Website Changes Feed',
'link': feed_url,
'description': 'Feed of changes detected on monitored websites.',
'items': [{'title': article.title, 'link': article.url, 'description': article.content, 'pubDate': str(article.timestamp)} for article in articles] if articles else []
}
return feed
except Exception as e:
logger.error(f"Error fetching feed content: {e}")
return {}
# Function to scrape website content
async def scrape_website(url: str) -> str:
try:
response = requests.get(url)
soup = BeautifulSoup(response.text, 'html.parser')
return soup.get_text()
except Exception as e:
logger.error(f"Error scraping website: {e}")
return ""
# Function to analyze website content
async def analyze_website_content(content: str) -> Dict[str, Any]:
try:
# Perform sentiment analysis using Natural Language Processing (NLP) techniques
# For simplicity, we'll use a basic sentiment analysis approach
sentiment = "Positive" if content.count("good") > content.count("bad") else "Negative"
return {'sentiment': sentiment}
except Exception as e:
logger.error(f"Error analyzing website content: {e}")
return {}
# Function to predict website traffic
async def predict_website_traffic(url: str) -> Dict[str, Any]:
try:
# Use machine learning model to predict website traffic
# For simplicity, we'll use a basic linear regression model
X = pd.DataFrame({'url': [url]})
y = pd.DataFrame({'traffic': [100]}) # Replace with actual traffic data
X_train, X_test, y_train, y_test = train_test_split(X, y, test_size=0.2, random_state=42)
model = LinearRegression()
model.fit(X_train, y_train)
y_pred = model.predict(X_test)
return {'traffic': y_pred[0]}
except Exception as e:
logger.error(f"Error predicting website traffic: {e}")
return {}
# Main application that runs Gradio UI and background tasks
async def main():
global db_session, monitoring_task
engine = None
demo = gr.Blocks()
# Define the Gradio interface
with demo:
gr.Markdown("# Website Monitor and Chatbot")
with gr.Row():
with gr.Column():
gr.Markdown("## Database Settings")
db_host = gr.Textbox(label="Database Host", placeholder="localhost", value="localhost")
db_port = gr.Textbox(label="Database Port", placeholder="3306", value="3306")
db_user = gr.Textbox(label="Database User", placeholder="username", value="")
db_pass = gr.Textbox(label="Database Password", placeholder="password", type="password", value="")
db_name = gr.Textbox(label="Database Name", placeholder="database_name", value="monitoring")
db_status_textbox = gr.Textbox(label="Database Status", interactive=False)
status_text = gr.Textbox(label="Status", interactive=False)
gr.Markdown("## RSS Feed Reader Settings")
feed_target_url = gr.Textbox(label="RSS Feed Target URL", placeholder="http://yourwebsite.com/feed")
view_button = gr.Button("View Feed")
target_urls = gr.Textbox(label="Target URLs (comma-separated)", placeholder="https://example.com, https://another-site.com")
storage_location = gr.Textbox(label="Storage Location (CSV file path)", placeholder="/path/to/your/file.csv")
feed_rss_checkbox = gr.Checkbox(label="Enable RSS Feed")
start_button = gr.Button("Start Monitoring")
stop_button = gr.Button("Stop Monitoring")
with gr.Column():
feed_content = gr.JSON(label="RSS Feed Content")
chatbot_interface = gr.Chatbot(type='messages')
message_input = gr.Textbox(placeholder="Type your message here...")
send_button = gr.Button("Send")
scrape_button = gr.Button("Scrape Website")
analyze_button = gr.Button("Analyze Website Content")
predict_button = gr.Button("Predict Website Traffic")
scrape_output = gr.Textbox(label="Scraped Website Content", interactive=False)
analyze_output = gr.JSON(label="Website Content Analysis", interactive=False)
predict_output = gr.JSON(label="Website Traffic Prediction", interactive=False)
# Define button actions
async def on_start_click(target_urls_str: str, storage_loc: str, feed_enabled: bool, host: str, port: str, user: str, password: str, db_name: str):
global monitoring_task
urls = [url.strip() for url in target_urls_str.split(",")]
await set_db_connection(host, port, user, password, db_name)
monitoring_task = asyncio.create_task(start_monitoring(urls, storage_loc, feed_enabled))
return "Monitoring started."
async def on_stop_click():
global monitoring_task
if monitoring_task:
monitoring_task.cancel()
monitoring_task = None
return "Monitoring stopped."
async def on_view_feed_click(feed_url: str):
return await fetch_feed_content(feed_url)
async def on_scrape_click(url: str):
return await scrape_website(url)
async def on_analyze_click(content: str):
return await analyze_website_content(content)
async def on_predict_click(url: str):
return await predict_website_traffic(url)
stop_button.click(on_stop_click, outputs=[status_text])
view_button.click(on_view_feed_click, inputs=[feed_target_url], outputs=[feed_content])
scrape_button.click(on_scrape_click, inputs=[target_urls], outputs=[scrape_output])
analyze_button.click(on_analyze_click, inputs=[scrape_output], outputs=[analyze_output])
predict_button.click(on_predict_click, inputs=[target_urls], outputs=[predict_output])
send_button.click(chatbot_response, inputs=[message_input, chatbot_interface], outputs=[chatbot_interface, message_input])
# Set up the timer for periodic updates
feed_updater = gr.Timer(interval=300)
feed_updater.tick(fn=update_feed_content, outputs=feed_content)
# Load and check database status when the UI is loaded
demo.load(update_db_status, outputs=db_status_textbox)
asyncio.create_task(periodic_update_with_error_handling())
# Launch the Gradio demo
await demo.launch()
# Launch the app using asyncio
if __name__ == "__main__":
asyncio.run(main())