Spaces:

blazingbunny
/

google-entity-analysis

Running

App Files Files Community

blazingbunny committed on Oct 14, 2023

Commit

3fec030

1 Parent(s): 309b488

Update app.py

Browse files

Files changed (1) hide show

app.py +14 -5

app.py CHANGED Viewed

@@ -3,6 +3,15 @@ import streamlit as st
 from google.oauth2 import service_account
 from google.cloud import language_v1
 # Sidebar content
 st.sidebar.title("About This Tool")
 st.sidebar.markdown("This tool leverages Google's NLP technology for entity analysis.")
@@ -12,17 +21,14 @@ st.sidebar.markdown("""
 2. **User Input**: Enter the text you want to analyze.
 3. **Analyze**: Click the 'Analyze' button.
 4. **View Results**: See the identified entities and their details.
-To do:
-https://www.linkedin.com/pulse/seo-content-writing-how-optimize-entity-salience-emmanuel-dan-awoh/
 """)
 # Header and intro
 st.title("Google Cloud NLP Entity Analyzer")
 st.write("This tool analyzes text to identify entities such as people, locations, organizations, and events")
 st.write("Entity salience scores are always relative to the analysed text. In natural language processing, a salience score is always a prediction of what a human would consider to be the most important entities in the same text. A number of textual features contribute to the salience score.")
 def sample_analyze_entities(text_content):
-    # Assuming service_account_info is set in your Streamlit secrets
     service_account_info = json.loads(st.secrets["google_nlp"])
     credentials = service_account.Credentials.from_service_account_info(
         service_account_info, scopes=["https://www.googleapis.com/auth/cloud-platform"]
@@ -33,8 +39,11 @@ def sample_analyze_entities(text_content):
     encoding_type = language_v1.EncodingType.UTF8
     response = client.analyze_entities(request={"document": document, "encoding_type": encoding_type})
-    st.write(f"### We found {len(response.entities)} entities")
     st.write("---")
     for i, entity in enumerate(response.entities):

 from google.oauth2 import service_account
 from google.cloud import language_v1
+# Return how many of the given entities have a 'mid' metadata entry whose value contains '/g/'.
+def count_entities(entities):
+    count = 0
+    for entity in entities:
+        metadata = entity.metadata
+        if 'mid' in metadata and '/g/' in metadata['mid']:  # key check first so the lookup is only done when 'mid' exists; presumably the value is a string, making '/g/' a substring test - confirm
+            count += 1
+    return count  # stays 0 when no entity matches or `entities` is empty
 # Sidebar content
 st.sidebar.title("About This Tool")
 st.sidebar.markdown("This tool leverages Google's NLP technology for entity analysis.")
 2. **User Input**: Enter the text you want to analyze.
 3. **Analyze**: Click the 'Analyze' button.
 4. **View Results**: See the identified entities and their details.
 """)
 # Header and intro
 st.title("Google Cloud NLP Entity Analyzer")
 st.write("This tool analyzes text to identify entities such as people, locations, organizations, and events")
 st.write("Entity salience scores are always relative to the analysed text. In natural language processing, a salience score is always a prediction of what a human would consider to be the most important entities in the same text. A number of textual features contribute to the salience score.")
 def sample_analyze_entities(text_content):
     service_account_info = json.loads(st.secrets["google_nlp"])
     credentials = service_account.Credentials.from_service_account_info(
         service_account_info, scopes=["https://www.googleapis.com/auth/cloud-platform"]
     encoding_type = language_v1.EncodingType.UTF8
     response = client.analyze_entities(request={"document": document, "encoding_type": encoding_type})
+    # Count the entities with 'mid' and '/g/' in their metadata
+    entity_count = count_entities(response.entities)
+    st.write(f"We found {len(response.entities)} entities - {entity_count} meet your criteria")
     st.write("---")
     for i, entity in enumerate(response.entities):