Spaces:

boompack
/

new-space

Sleeping

App Files Files Community

boompack committed on Nov 6, 2024

Commit

2e66c7c

verified ·

1 Parent(s): 2a2a846

Update app.py

Browse files

Files changed (1) hide show

app.py +76 -1

app.py CHANGED Viewed

@@ -197,6 +197,81 @@ if __name__ == "__main__":
         )
     except Exception as e:
         logger.error(f"Error launching interface: {e}", exc_info=True)
-ошбика . ничего не работает

         )
     except Exception as e:
         logger.error(f"Error launching interface: {e}", exc_info=True)
+import re
+import emoji
+import gradio as gr
+from collections import defaultdict, Counter
def extract_comment_data(comment_text: str) -> "dict | None":
    """Parse one pasted comment block into a dict of its fields.

    The block is expected to start with the ``Фото профиля`` marker followed
    by the username on the same or the next line. The first line containing
    an age stamp (a number followed by ``нед.`` or ``ч.``) separates the
    header from the comment body.

    Args:
        comment_text: Raw text of a single comment block, marker included.

    Returns:
        ``None`` when no username can be found; otherwise a dict with keys

        * ``"username"`` - text captured after the marker, stripped;
        * ``"comment"``  - everything after the age line (or the whole block
          when no age line exists), stripped;
        * ``"likes"``    - number following ``"Нравится":`` in the comment
          text, ``0`` if absent;
        * ``"time"``     - the number from the age line, ``None`` if absent.
          The unit (weeks vs. hours) is not recorded.
    """
    username_match = re.search(r"Фото профиля\s*(.+?)\n", comment_text)
    username = username_match.group(1).strip() if username_match else None
    if not username:
        return None  # Not a usable comment block.

    lines = comment_text.splitlines()
    age = None
    body_lines = lines  # Fallback: no age line, keep the whole block.
    for index, line in enumerate(lines):
        # Age stamp in weeks ("нед.") or hours ("ч.").
        age_match = re.search(r"(\d+)\s*(?:нед\.|ч\.)", line)
        if age_match:
            # Take the value from the line itself: the body kept below no
            # longer contains this line, so searching it later finds nothing.
            age = int(age_match.group(1))
            body_lines = lines[index + 1:]
            break
    body = "\n".join(body_lines).strip()

    likes_match = re.search(r'"Нравится":\s*(\d+)', body)
    return {
        "username": username,
        "comment": body,
        "likes": int(likes_match.group(1)) if likes_match else 0,
        "time": age,
    }
def analyze_comments(comments_text: str) -> tuple:
    """Split pasted comments into blocks, parse them, and aggregate stats.

    Args:
        comments_text: Pasted text containing zero or more comment blocks,
            each introduced by the ``Фото профиля`` marker (any letter case).

    Returns:
        A ``(analytics, comments)`` tuple. ``comments`` is the list of dicts
        produced by ``extract_comment_data`` for every block that parsed.
        ``analytics`` is a ``defaultdict(int)`` that always carries the keys
        ``total_comments``, ``total_likes``, ``emojis``, ``unique_users``,
        ``avg_likes`` and ``top_commenters`` (the five most frequent
        usernames mapped to their comment counts).
    """
    marker = "Фото профиля"
    # The capture group keeps the markers in the result: index 0 is the text
    # before the first marker, odd indices are the markers themselves and the
    # following even indices hold the text that belongs to each marker.
    pieces = re.split(r'(Фото профиля)', comments_text or "", flags=re.IGNORECASE)

    comments = []
    for following in pieces[2::2]:
        # Re-attach the canonical marker: the split is case-insensitive but
        # the per-comment parser matches the marker case-sensitively.
        parsed = extract_comment_data(marker + following)
        if parsed:
            comments.append(parsed)

    commenter_counts = Counter(item["username"] for item in comments)
    total_comments = len(comments)
    total_likes = sum(item["likes"] for item in comments)

    analytics = defaultdict(int)
    analytics["total_comments"] = total_comments
    analytics["total_likes"] = total_likes
    # emoji_count returns the number of emoji in the text; demojize() would
    # only return the text with emoji replaced by their ":name:" aliases.
    analytics["emojis"] = sum(emoji.emoji_count(item["comment"]) for item in comments)
    analytics["unique_users"] = len(commenter_counts)
    analytics["avg_likes"] = total_likes / total_comments if total_comments else 0
    analytics["top_commenters"] = dict(commenter_counts.most_common(5))
    return analytics, comments
# Gradio UI: one multi-line text box in, a text summary plus a JSON view out.
comments_input = gr.Textbox(label="Instagram Comments (Paste here)", lines=10)
summary_output = gr.Textbox(label="Analytics Summary")
details_output = gr.JSON(label="Individual Comment Data")

iface = gr.Interface(
    fn=analyze_comments,
    inputs=comments_input,
    outputs=[summary_output, details_output],
    title="Enhanced Instagram Comment Analyzer",
    description="Improved analyzer for Instagram comments.",
)

# Start the app as soon as this module is executed, requesting a share link.
iface.launch(share=True)