Spaces:

DreamStream-1
/

Testing

Sleeping

App Files Files Community

DreamStream-1 committed on Nov 29, 2024

Commit

e623c13

verified ·

1 Parent(s): bdd3317

Update app.py

Browse files

Files changed (1) hide show

app.py +219 -97

app.py CHANGED Viewed

@@ -1,60 +1,61 @@
 import gradio as gr
 import nltk
 import numpy as np
 import tflearn
-import torch
 from nltk.tokenize import word_tokenize
 from nltk.stem.lancaster import LancasterStemmer
-from transformers import AutoTokenizer, AutoModelForSequenceClassification
 import requests
-import pandas as pd
-import os
-import json
-import pickle
 from bs4 import BeautifulSoup
 from selenium import webdriver
 from selenium.webdriver.chrome.options import Options
 import chromedriver_autoinstaller
-# Ensure NLTK resources are downloaded
 nltk.download('punkt')
-# Constants
-GOOGLE_MAPS_API_KEY = os.environ.get("GOOGLE_API_KEY")  # Get API key from environment variable
-if not GOOGLE_MAPS_API_KEY:
-    raise ValueError("Error: GOOGLE_MAPS_API_KEY environment variable not set.")
-url = "https://maps.googleapis.com/maps/api/place/textsearch/json"
-places_details_url = "https://maps.googleapis.com/maps/api/place/details/json"
-query = "therapist OR counselor OR mental health professional OR marriage and family therapist OR psychotherapist OR psychiatrist OR psychologist OR nutritionist OR wellness doctor OR holistic practitioner OR integrative medicine OR chiropractor OR naturopath"
-# Chatbot
 stemmer = LancasterStemmer()
 try:
     with open("intents.json") as file:
         data = json.load(file)
 except FileNotFoundError:
-    raise FileNotFoundError("Error: 'intents.json' file not found.")
 try:
-    with open("data.pickle", "rb") as file:
-        words, labels, training, output = pickle.load(file)
 except FileNotFoundError:
-    raise FileNotFoundError("Error: 'data.pickle' file not found.")
 net = tflearn.input_data(shape=[None, len(training[0])])
 net = tflearn.fully_connected(net, 8)
 net = tflearn.fully_connected(net, 8)
 net = tflearn.fully_connected(net, len(output[0]), activation="softmax")
 model = tflearn.DNN(net)
 try:
     model.load("MentalHealthChatBotmodel.tflearn")
 except FileNotFoundError:
     raise FileNotFoundError("Error: Trained model file 'MentalHealthChatBotmodel.tflearn' not found.")
 def bag_of_words(s, words):
     bag = [0 for _ in range(len(words))]
     s_words = word_tokenize(s)
@@ -65,71 +66,115 @@ def bag_of_words(s, words):
                 bag[i] = 1
     return np.array(bag)
 def chat(message, history):
     history = history or []
     message = message.lower()
     try:
         results = model.predict([bag_of_words(message, words)])
         results_index = np.argmax(results)
         tag = labels[results_index]
         for tg in data["intents"]:
             if tg['tag'] == tag:
                 responses = tg['responses']
                 response = random.choice(responses)
-        history.append((message, response))
-    except Exception as e:
-        response = "I'm sorry, I didn't understand that. Could you please rephrase?"
-        history.append((message, response))
-    return history, history
-# Sentiment Analysis
-tokenizer = AutoTokenizer.from_pretrained("cardiffnlp/twitter-roberta-base-sentiment")
-model_sentiment = AutoModelForSequenceClassification.from_pretrained("cardiffnlp/twitter-roberta-base-sentiment")
-def analyze_sentiment(text):
-    try:
-        inputs = tokenizer(text, return_tensors="pt")
-        with torch.no_grad():
-            logits = model_sentiment(**inputs).logits
-        sentiment = ["Negative", "Neutral", "Positive"][torch.argmax(logits)]
-        return f"**Predicted Sentiment:** {sentiment}"
     except Exception as e:
-        return f"Error analyzing sentiment: {str(e)}"
-# Emotion Detection
-def detect_emotion(text):
-    # Implement your own emotion detection logic
-    return "Emotion detection not implemented"
-# Suggestion Generation
-def provide_suggestions(emotion):
-    # Implement your own suggestion generation logic
-    return pd.DataFrame(columns=["Subject", "Article URL", "Video URL"])
-# Google Places API Functions
 def get_places_data(query, location, radius, api_key, next_page_token=None):
-    params = {"query": query, "location": location, "radius": radius, "key": api_key}
     if next_page_token:
         params["pagetoken"] = next_page_token
     response = requests.get(url, params=params)
     if response.status_code == 200:
         return response.json()
     else:
-        print(f"Error: {response.status_code} - {response.text}")
         return None
 def get_place_details(place_id, api_key):
-    params = {"place_id": place_id, "key": api_key}
-    response = requests.get(places_details_url, params=params)
     if response.status_code == 200:
         details_data = response.json().get("result", {})
         return {
             "phone_number": details_data.get("formatted_phone_number", "Not available"),
             "website": details_data.get("website", "Not available")
         }
     else:
         return {}
 def get_all_places(query, location, radius, api_key):
     all_results = []
     next_page_token = None
@@ -137,61 +182,138 @@ def get_all_places(query, location, radius, api_key):
         data = get_places_data(query, location, radius, api_key, next_page_token)
         if data:
             results = data.get('results', [])
             for place in results:
                 place_id = place.get("place_id")
                 name = place.get("name")
                 address = place.get("formatted_address")
                 details = get_place_details(place_id, api_key)
                 phone_number = details.get("phone_number", "Not available")
-                website = details.get("website", "Not available")
-                all_results.append([name, address, phone_number, website])
             next_page_token = data.get('next_page_token')
             if not next_page_token:
                 break
         else:
             break
     return all_results
-# Gradio Interface
-def gradio_interface(message, location, state):
-    history = state or []
-    if message:
-        history, _ = chat(message, history)
-        sentiment = analyze_sentiment(message)
-        emotion = detect_emotion(message)
-        suggestions = provide_suggestions(emotion)
-        if location:
-            try:
-                wellness_results = pd.DataFrame(get_all_places(query, location, 50000, GOOGLE_MAPS_API_KEY), columns=["Name", "Address", "Phone", "Website"])
-            except Exception as e:
-                wellness_results = pd.DataFrame([["Error fetching data: " + str(e), "", "", ""]], columns=["Name", "Address", "Phone", "Website"])
-        else:
-            wellness_results = pd.DataFrame([["", "", "", ""]], columns=["Name", "Address", "Phone", "Website"])
     else:
-        sentiment = ""
-        emotion = ""
-        suggestions = pd.DataFrame(columns=["Subject", "Article URL", "Video URL"])
-        wellness_results = pd.DataFrame([["", "", "", ""]], columns=["Name", "Address", "Phone", "Website"])
-    return history, sentiment, emotion, suggestions, wellness_results, history
-gr.Interface(
-    fn=gradio_interface,
-    inputs=[
-        gr.Textbox(label="Enter your message", placeholder="How are you feeling today?"),
-        gr.Textbox(label="Enter your location (e.g., 'Hawaii, USA')", placeholder="Enter your location (optional)"),
-        gr.State(),
-        gr.Button("Send")
-    ],
-    outputs=[
-        gr.Chatbot(label="Chatbot Responses"),
-        gr.Textbox(label="Sentiment Analysis"),
-        gr.Textbox(label="Emotion Detected"),
-        gr.DataFrame(label="Suggested Articles & Videos"),
-        gr.DataFrame(label="Nearby Wellness Professionals"),
-        gr.State()
-    ],
-    live=True,
-    title="Mental Health Chatbot with Wellness Professional Search",
-    description="This chatbot provides mental health support with sentiment analysis, emotion detection, suggestions, and a list of nearby wellness professionals. Interact with the chatbot first, then enter a location to search."
-).launch(debug=True, share=True)

 import gradio as gr
+from transformers import AutoTokenizer, AutoModelForSequenceClassification
+import torch
 import nltk
 import numpy as np
 import tflearn
+import tensorflow as tf
+import random
+import json
+import pickle
 from nltk.tokenize import word_tokenize
 from nltk.stem.lancaster import LancasterStemmer
 import requests
+import csv
+import time
+import re
 from bs4 import BeautifulSoup
+import pandas as pd
 from selenium import webdriver
 from selenium.webdriver.chrome.options import Options
 import chromedriver_autoinstaller
+import os
+# Ensure necessary NLTK resources are downloaded
+# (runs on every import; bag_of_words() tokenizes with word_tokenize)
 nltk.download('punkt')
+# Initialize the stemmer
 stemmer = LancasterStemmer()
+# Load intents.json; chat() reads its "intents" list, using each entry's
+# "tag" and "responses" keys
 try:
     with open("intents.json") as file:
         data = json.load(file)
 except FileNotFoundError:
+    raise FileNotFoundError("Error: 'intents.json' file not found. Ensure it exists in the current directory.")
+# Load preprocessed data from pickle: the vocabulary (words), the tag list
+# (labels) and the training/output arrays that size the network below.
+# NOTE(review): unpickling can execute arbitrary code, so data.pickle must
+# come from a trusted source.
 try:
+    with open("data.pickle", "rb") as f:
+        words, labels, training, output = pickle.load(f)
 except FileNotFoundError:
+    raise FileNotFoundError("Error: 'data.pickle' file not found. Ensure it exists and matches the model.")
+# Build the model structure: input width is len(training[0]), followed by two
+# 8-unit fully connected layers and a softmax layer of width len(output[0]).
+# NOTE(review): presumably this must mirror the architecture the checkpoint
+# was trained with - confirm against the training script.
 net = tflearn.input_data(shape=[None, len(training[0])])
 net = tflearn.fully_connected(net, 8)
 net = tflearn.fully_connected(net, 8)
 net = tflearn.fully_connected(net, len(output[0]), activation="softmax")
+net = tflearn.regression(net)
+# Load the trained model weights into the network defined above
 model = tflearn.DNN(net)
 try:
     model.load("MentalHealthChatBotmodel.tflearn")
 except FileNotFoundError:
     raise FileNotFoundError("Error: Trained model file 'MentalHealthChatBotmodel.tflearn' not found.")
+# Function to process user input into a bag-of-words format
 def bag_of_words(s, words):
     bag = [0 for _ in range(len(words))]
     s_words = word_tokenize(s)
                 bag[i] = 1
     return np.array(bag)
+# Chat function
 def chat(message, history):
+    """Reply to ``message`` with the intent classifier and extend ``history``.
+
+    The lower-cased message is turned into a bag-of-words vector, the model's
+    highest-scoring index is mapped to a tag through ``labels``, and one of the
+    responses of the first intent carrying that tag is picked at random.  A
+    fixed apology is used when no intent matches; any exception raised along
+    the way is reported as the reply text instead of propagating.
+
+    Returns the updated history twice (the same list object both times).
+    """
     history = history or []
     message = message.lower()
     try:
+        # Classify the message and translate the winning index into a tag
+        prediction = model.predict([bag_of_words(message, words)])
+        tag = labels[np.argmax(prediction)]
+        # First intent whose tag equals the prediction, or None if there is none
+        matched = next((intent for intent in data["intents"] if intent['tag'] == tag), None)
+        if matched is None:
+            response = "I'm sorry, I didn't understand that. Could you please rephrase?"
+        else:
+            response = random.choice(matched['responses'])
     except Exception as e:
+        response = f"An error occurred: {str(e)}"
+    history.append((message, response))
+    return history, history
+# Function to send a request to Google Places API and fetch places data
 def get_places_data(query, location, radius, api_key, next_page_token=None):
+    """Fetch one page of Google Places Text Search results.
+
+    Args:
+        query: Free-text search string.
+        location: Value sent as the ``location`` request parameter.
+        radius: Value sent as the ``radius`` request parameter.
+        api_key: Google API key.
+        next_page_token: Token from a previous page; sent as ``pagetoken``
+            when given.
+
+    Returns:
+        The decoded JSON body on HTTP 200, otherwise ``None`` (also when the
+        request itself fails or times out).
+    """
+    # The endpoint lives here because the module no longer defines a global
+    # ``url``; reading that name raised NameError on the first call.
+    endpoint = "https://maps.googleapis.com/maps/api/place/textsearch/json"
+    params = {
+        "query": query,
+        "location": location,
+        "radius": radius,
+        "key": api_key
+    }
     if next_page_token:
         params["pagetoken"] = next_page_token
+    try:
+        # A timeout keeps a stalled connection from hanging the caller forever
+        response = requests.get(endpoint, params=params, timeout=10)
+    except requests.RequestException as exc:
+        print(f"Error contacting Google Places API: {exc}")
+        return None
     if response.status_code == 200:
         return response.json()
     else:
         return None
+# Function to fetch detailed information for a specific place using its place_id
 def get_place_details(place_id, api_key):
+    """Fetch opening hours, reviews, phone number and website for one place.
+
+    Args:
+        place_id: Google Places identifier of the place.
+        api_key: Google API key.
+
+    Returns:
+        A dict with the keys ``opening_hours``, ``reviews``, ``phone_number``
+        and ``website`` (each ``"Not available"`` when the API omits it), or
+        an empty dict when the request fails or does not return HTTP 200.
+    """
+    # The endpoint lives here because the module no longer defines a global
+    # ``places_details_url``; reading that name raised NameError.
+    details_url = "https://maps.googleapis.com/maps/api/place/details/json"
+    params = {
+        "place_id": place_id,
+        "key": api_key
+    }
+    try:
+        # A timeout keeps a stalled connection from hanging the caller forever
+        response = requests.get(details_url, params=params, timeout=10)
+    except requests.RequestException as exc:
+        print(f"Error fetching details for place {place_id}: {exc}")
+        return {}
     if response.status_code == 200:
         details_data = response.json().get("result", {})
         return {
+            "opening_hours": details_data.get("opening_hours", {}).get("weekday_text", "Not available"),
+            "reviews": details_data.get("reviews", "Not available"),
             "phone_number": details_data.get("formatted_phone_number", "Not available"),
             "website": details_data.get("website", "Not available")
         }
     else:
         return {}
+# Scrape website URL from Google Maps results (using Selenium)
+def scrape_website_from_google_maps(place_name):
+    """Search Google Maps for ``place_name`` and return its website link.
+
+    A headless Chrome session opens the Maps search page, waits a fixed five
+    seconds for it to render, then looks for a link whose aria-label contains
+    both "Visit" and "website".
+
+    Returns:
+        The link's ``href`` attribute, or ``"Not available"`` when the element
+        cannot be located or read.
+    """
+    # Function-scope imports keep this block self-contained.
+    from urllib.parse import quote_plus
+    from selenium.common.exceptions import WebDriverException
+    from selenium.webdriver.common.by import By
+    chrome_options = Options()
+    chrome_options.add_argument("--headless")
+    chrome_options.add_argument("--no-sandbox")
+    chrome_options.add_argument("--disable-dev-shm-usage")
+    driver = webdriver.Chrome(options=chrome_options)
+    try:
+        # quote_plus also escapes '&', '/', '#', ... which a plain
+        # space-to-plus replacement left in the URL path.
+        search_url = f"https://www.google.com/maps/search/{quote_plus(place_name)}"
+        driver.get(search_url)
+        time.sleep(5)
+        try:
+            # find_element(By.XPATH, ...) replaces find_element_by_xpath,
+            # which Selenium 4 removed.
+            website_element = driver.find_element(By.XPATH, '//a[contains(@aria-label, "Visit") and contains(@aria-label, "website")]')
+            website_url = website_element.get_attribute('href')
+        except WebDriverException:
+            # Best-effort lookup: a missing or unreadable element is not an error
+            website_url = "Not available"
+    finally:
+        # Always release the browser, even when navigation itself fails
+        driver.quit()
+    return website_url
+# Scraping the website to extract phone number or email
+def scrape_website_for_contact_info(website):
+    """Download ``website`` and pull the first phone number and email from its text.
+
+    Returns:
+        A ``(phone_number, email)`` tuple; each element is ``"Not available"``
+        when nothing matching is found or the page cannot be fetched.
+    """
+    # Ten-digit numbers with optional country code, parentheses and
+    # space/dot/dash separators, e.g. "(808) 555-1234" or "+1 808-555-1234".
+    # The earlier pattern was made entirely of optional parts, so it matched
+    # the empty string at position 0 and always replaced the phone with junk.
+    # NOTE(review): numbers in other national formats are not recognised.
+    phone_pattern = r'(?<!\d)(?:\+?\d{1,3}[ .\-]?)?\(?\d{3}\)?[ .\-]?\d{3}[ .\-]?\d{4}(?!\d)'
+    email_pattern = r'[a-zA-Z0-9._%+-]+@[a-zA-Z0-9.-]+\.[a-zA-Z]{2,}'
+    phone_number = "Not available"
+    email = "Not available"
+    try:
+        response = requests.get(website, timeout=5)
+        soup = BeautifulSoup(response.content, 'html.parser')
+        page_text = soup.get_text()  # extract once, search twice
+        phone_match = re.search(phone_pattern, page_text)
+        if phone_match:
+            phone_number = phone_match.group().strip()
+        email_match = re.search(email_pattern, page_text)
+        if email_match:
+            email = email_match.group()
+    except Exception as e:
+        # Best-effort scrape: report the problem and fall back to the defaults
+        print(f"Error scraping website {website}: {e}")
+    return phone_number, email
+# Function to fetch all places data including pagination
 def get_all_places(query, location, radius, api_key):
     all_results = []
     next_page_token = None
         data = get_places_data(query, location, radius, api_key, next_page_token)
         if data:
             results = data.get('results', [])
+            if not results:
+                break
             for place in results:
                 place_id = place.get("place_id")
                 name = place.get("name")
                 address = place.get("formatted_address")
+                rating = place.get("rating", "Not available")
+                business_status = place.get("business_status", "Not available")
+                user_ratings_total = place.get("user_ratings_total", "Not available")
+                website = place.get("website", "Not available")
+                types = ", ".join(place.get("types", []))
+                location = place.get("geometry", {}).get("location", {})
+                latitude = location.get("lat", "Not available")
+                longitude = location.get("lng", "Not available")
                 details = get_place_details(place_id, api_key)
                 phone_number = details.get("phone_number", "Not available")
+                if phone_number == "Not available" and website != "Not available":
+                    phone_number, email = scrape_website_for_contact_info(website)
+                else:
+                    email = "Not available"
+                if website == "Not available":
+                    website = scrape_website_from_google_maps(name)
+                all_results.append([name, address, phone_number, rating, business_status,
+                                    user_ratings_total, website, types, latitude, longitude,
+                                    details.get("opening_hours", "Not available"),
+                                    details.get("reviews", "Not available"), email])
             next_page_token = data.get('next_page_token')
             if not next_page_token:
                 break
+            time.sleep(2)
         else:
             break
     return all_results
+# Function to save results to CSV file
+def save_to_csv(data, filename):
+    """Write the result rows in ``data`` to ``filename`` as UTF-8 CSV.
+
+    The file is overwritten, starts with a fixed header row, and a
+    confirmation line is printed once writing is done.
+    """
+    header = ["Name", "Address", "Phone", "Rating", "Business Status", "User Ratings Total", "Website", "Types", "Latitude", "Longitude", "Opening Hours", "Reviews", "Email"]
+    with open(filename, mode='w', newline='', encoding='utf-8') as csv_handle:
+        out = csv.writer(csv_handle)
+        out.writerow(header)
+        out.writerows(data)
+    print(f"Data saved to {filename}")
+# Main function to execute script
+def main(query=None, location="Hawaii, USA", radius=50000, api_key=None):
+    """Collect wellness professionals from Google Places and save them as CSV.
+
+    All parameters are optional so ``main()`` can still be called without
+    arguments; the previous body read four names that were never defined and
+    failed with NameError.
+
+    Args:
+        query: Text search string; defaults to a list of wellness professions.
+        location: Search location forwarded to ``get_all_places``.
+            NOTE(review): the Places API may expect "lat,lng" here rather
+            than free text - confirm.
+        radius: Search radius forwarded to ``get_all_places``.
+        api_key: Google API key; defaults to the ``GOOGLE_API_KEY``
+            environment variable.
+
+    Raises:
+        ValueError: If no API key is passed and none is set in the environment.
+    """
+    if query is None:
+        query = "therapist OR counselor OR mental health professional OR marriage and family therapist OR psychotherapist OR psychiatrist OR psychologist OR nutritionist OR wellness doctor OR holistic practitioner OR integrative medicine OR chiropractor OR naturopath"
+    if api_key is None:
+        api_key = os.environ.get("GOOGLE_API_KEY")
+    if not api_key:
+        raise ValueError("Error: GOOGLE_API_KEY environment variable not set.")
+    google_places_data = get_all_places(query, location, radius, api_key)
+    if google_places_data:
+        save_to_csv(google_places_data, "wellness_professionals_hawaii.csv")
+    else:
+        print("No data found.")
+# Gradio UI setup
+with gr.Blocks(title="Emotion Detection and Well-Being Suggestions") as demo:
+    # Settings for the wellness-professional search triggered by the button.
+    wellness_query = "therapist OR counselor OR mental health professional OR marriage and family therapist OR psychotherapist OR psychiatrist OR psychologist OR nutritionist OR wellness doctor OR holistic practitioner OR integrative medicine OR chiropractor OR naturopath"
+    wellness_radius = 50000
+    # Load pre-trained model and tokenizer (once, while the UI is built)
+    def load_model():
+        """Return the tokenizer and model of the emotion classifier."""
+        tokenizer = AutoTokenizer.from_pretrained("j-hartmann/emotion-english-distilroberta-base")
+        model = AutoModelForSequenceClassification.from_pretrained("j-hartmann/emotion-english-distilroberta-base")
+        return tokenizer, model
+    # Separate names on purpose: binding the result to ``model`` would replace
+    # the module-level tflearn model that chat() calls predict() on.
+    emotion_tokenizer, emotion_model = load_model()
+    # Display header
+    gr.Markdown("# Emotion Detection and Well-Being Suggestions")
+    # User input for text (emotion detection)
+    user_input = gr.Textbox(lines=1, label="How are you feeling today?")
+    emotion_output = gr.Textbox(label="Emotion Detected")
+    # Model prediction
+    def predict_emotion(text):
+        """Return the highest-scoring emotion label for ``text`` ("" if blank)."""
+        if not text or not text.strip():
+            return ""
+        inputs = emotion_tokenizer(text, return_tensors="pt", truncation=True)
+        with torch.no_grad():
+            logits = emotion_model(**inputs).logits
+        # Map the winning class index to the label name stored in the config
+        return emotion_model.config.id2label[int(torch.argmax(logits, dim=-1))]
+    user_input.change(predict_emotion, inputs=user_input, outputs=emotion_output)
+    # Chatbot functionality (handled by the module-level chat function)
+    chatbot = gr.Chatbot(label="Chat")
+    message_input = gr.Textbox(lines=1, label="Message")
+    history_state = gr.State([])
+    message_input.submit(chat, inputs=[message_input, history_state], outputs=[chatbot, history_state])
+    # Location and button to fetch wellness professionals data
+    location_input = gr.Textbox(lines=1, label="Location", value="Hawaii, USA")
+    fetch_button = gr.Button("Fetch Wellness Professionals Data")
+    data_output = gr.File(label="Download Data")
+    def fetch_data(location):
+        """Search for wellness professionals and return the path of a CSV file.
+
+        Returns ``None`` (no file offered) when the search yields nothing, and
+        raises ``gr.Error`` when the API key or the location is missing.
+        """
+        import tempfile
+        api_key = os.environ.get("GOOGLE_API_KEY")
+        if not api_key:
+            raise gr.Error("GOOGLE_API_KEY environment variable not set.")
+        if not location or not location.strip():
+            raise gr.Error("Please enter a location to search.")
+        all_results = get_all_places(wellness_query, location, wellness_radius, api_key)
+        if not all_results:
+            return None
+        df = pd.DataFrame(all_results, columns=["Name", "Address", "Phone", "Rating", "Business Status", "User Ratings Total", "Website", "Types", "Latitude", "Longitude", "Opening Hours", "Reviews", "Email"])
+        # gr.File expects a file path, not CSV text, so write a temp file
+        with tempfile.NamedTemporaryFile(mode="w", suffix=".csv", delete=False, newline="", encoding="utf-8") as tmp:
+            df.to_csv(tmp, index=False)
+        return tmp.name
+    fetch_button.click(fetch_data, inputs=location_input, outputs=data_output)
+# Launch Gradio interface
+demo.launch()