Spaces:

boompack
/

new-space

Sleeping

App Files Files Community

boompack commited on Nov 6, 2024

Commit

8c00b86

verified ·

1 Parent(s): bf4724c

Update app.py

Browse files

Files changed (1) hide show

app.py +40 -154

app.py CHANGED Viewed

@@ -1,114 +1,34 @@
 import gradio as gr
-import re
 import emoji
-import logging
-from typing import Tuple, Optional
-from functools import lru_cache
 from collections import Counter
-logging.basicConfig(level=logging.INFO)
-logger = logging.getLogger(__name__)
-def count_emojis(text: str) -> int:
-    """Подсчет количества эмодзи в тексте"""
-    return len([c for c in text if c in emoji.EMOJI_DATA])
-def extract_mentions(text: str) -> list:
-    """Извлечение упоминаний пользователей"""
-    return re.findall(r'@(\w+)', text)
-def is_spam(text: str) -> bool:
-    """Определение спам-комментариев"""
-    spam_indicators = ['🔥' * 3, '❤️' * 3, 'follow me', 'check my']
-    return any(indicator in text.lower() for indicator in spam_indicators)
-def extract_comment_data(comment_text: str) -> Tuple[Optional[str], Optional[str], int, int]:
-    """Извлекает данные из комментария"""
-    try:
-        # Extract username
-        username_match = re.search(r'Фото профиля\s+(.+?)\n', comment_text)
-        username = username_match.group(1).strip() if username_match else None
-        if not username:
-            return None, None, 0, 0
-        # Extract comment text
-        comment_lines = comment_text.split('\n')
-        comment = ""
-        time_pattern = r'\d+\s*(?:ч\.|нед\.)'
-        # Identify where the comment text starts
-        for i, line in enumerate(comment_lines):
-            if re.search(time_pattern, line):
-                if i + 1 < len(comment_lines):
-                    comment = comment_lines[i + 1].strip()
-                break
-        # Clean up comment text
-        comment = re.sub(r'\d+\s*(?:ч\.|нед\.)\s*$', '', comment)
-        comment = re.sub(r'"Нравится":\s*\d+\s*Ответить\s*$', '', comment)
-        # Extract likes
-        likes_match = re.search(r'"Нравится":\s*(\d+)', comment_text)
-        likes = int(likes_match.group(1)) if likes_match else 0
-        # Extract time
-        time_match = re.search(r'(\d+)\s*(?:ч\.|нед\.)', comment_text)
-        time = int(time_match.group(1)) if time_match else 0
-        return username, comment.strip(), likes, time
-    except Exception as e:
-        logger.error(f"Error extracting data: {e}")
-        return None, None, 0, 0
-@lru_cache(maxsize=100)
 def analyze_post(content_type: str, link: str, post_likes: int,
                 post_date: str, description: str, comment_count: int,
                 all_comments: str) -> Tuple[str, str, str, str, str]:
-    """Анализирует пост и комментарии"""
     try:
-        if not all_comments or 'Фото профиля' not in all_comments:
-            return "Ошибка: неверный формат данных", "", "", "", "0"
-        blocks = re.split(r'(?=Фото профиля)', all_comments)
-        blocks = [b.strip() for b in blocks if b.strip()]
-        comments_data = []
         total_emojis = 0
         mentions = []
         spam_count = 0
-        for block in blocks:
-            username, comment, likes, time = extract_comment_data(block)
-            if username and comment:
-                emoji_count = count_emojis(comment)
-                comment_mentions = extract_mentions(comment)
-                is_spam_comment = is_spam(comment)
-                comments_data.append({
-                    'username': username,
-                    'comment': comment,
-                    'likes': likes,
-                    'time': time,
-                    'emoji_count': emoji_count,
-                    'mentions': comment_mentions,
-                    'is_spam': is_spam_comment
-                })
-                total_emojis += emoji_count
-                mentions.extend(comment_mentions)
-                if is_spam_comment:
-                    spam_count += 1
-        # Подсчет статистики
         total_comments = len(comments_data)
-        unique_users = len(set(item['username'] for item in comments_data))
-        total_likes = sum(item['likes'] for item in comments_data)
         avg_likes = total_likes / total_comments if total_comments > 0 else 0
-        # Топ комментаторы
-        commenter_counts = Counter(item['username'] for item in comments_data)
         top_commenters = commenter_counts.most_common(5)
         analytics = f"""
@@ -126,74 +46,40 @@ def analyze_post(content_type: str, link: str, post_likes: int,
         {chr(10).join(f'• {user}: {count} комментария' for user, count in top_commenters if count > 1)}
         """
-        return (
-            analytics,
-            "\n".join(item['username'] for item in comments_data),
-            "\n".join(item['comment'] for item in comments_data),
-            "\n".join(str(item['likes']) for item in comments_data),
-            str(total_likes)
-        )
     except Exception as e:
-        logger.error(f"Analysis error: {e}")
-        return str(e), "", "", "", "0"
-# Создаем интерфейс Gradio
 iface = gr.Interface(
     fn=analyze_post,
     inputs=[
-        gr.Radio(
-            choices=["Photo", "Video"],
-            label="Content Type",
-            value="Photo"
-        ),
-        gr.Textbox(
-            label="Link to Post",
-            placeholder="Вставьте ссылку на пост"
-        ),
-        gr.Number(
-            label="Likes",
-            value=0,
-            minimum=0
-        ),
-        gr.Textbox(
-            label="Post Date",
-            placeholder="YYYY-MM-DD"
-        ),
-        gr.Textbox(
-            label="Description",
-            lines=3,
-            placeholder="Описание поста"
-        ),
-        gr.Number(
-            label="Comment Count",
-            value=0,
-            minimum=0
-        ),
-        gr.Textbox(
-            label="Comments",
-            lines=10,
-            placeholder="Вставьте комментарии"
-        )
     ],
     outputs=[
-        gr.Textbox(label="Analytics Summary", lines=15),
-        gr.Textbox(label="Usernames"),
-        gr.Textbox(label="Comments"),
-        gr.Textbox(label="Likes Chronology"),
-        gr.Textbox(label="Total Likes on Comments")
     ],
-    title="Enhanced Instagram Comment Analyzer",
-    description="Анализатор комментариев Instagram с расширенной аналитикой",
     theme="default"
 )
-if __name__ == "__main__":
-    try:
-        iface.launch(
-            share=True,  # Создает публичную ссылку
-            debug=True,  # Включает режим отладки
-            show_error=True  # Показывает подробности ошибок
-        )
-    except Exception as e:
-        logger.error(f"Error launching interface: {e}", exc_info=True)

 import gradio as gr
+import json
 import emoji
+import re
 from collections import Counter
 def analyze_post(content_type: str, link: str, post_likes: int,
                 post_date: str, description: str, comment_count: int,
                 all_comments: str) -> Tuple[str, str, str, str, str]:
     try:
+        comments_data = json.loads(all_comments)
         total_emojis = 0
         mentions = []
         spam_count = 0
+        total_likes = 0
+        for comment in comments_data:
+            username = comment['username']
+            comment_text = comment['comment']
+            likes = comment.get('likes', 0) #Обработка отсутствия ключа likes
+            total_likes += likes
+            total_emojis += len([c for c in comment_text if c in emoji.EMOJI_DATA])
+            mentions.extend(re.findall(r'@(\w+)', comment_text))
         total_comments = len(comments_data)
+        unique_users = len(set(comment['username'] for comment in comments_data))
         avg_likes = total_likes / total_comments if total_comments > 0 else 0
+        commenter_counts = Counter(comment['username'] for comment in comments_data)
         top_commenters = commenter_counts.most_common(5)
         analytics = f"""
         {chr(10).join(f'• {user}: {count} комментария' for user, count in top_commenters if count > 1)}
         """
+        usernames = "\n".join(comment['username'] for comment in comments_data)
+        comments = "\n".join(comment['comment'] for comment in comments_data)
+        likes_chronology = "\n".join(str(comment.get('likes', 0)) for comment in comments_data)
+        return (analytics, usernames, comments, likes_chronology, str(total_likes))
+    except json.JSONDecodeError:
+        return "Ошибка: Неверный JSON-ввод", "", "", "", "0"
     except Exception as e:
+        return f"Произошла ошибка: {e}", "", "", "", "0"
 iface = gr.Interface(
     fn=analyze_post,
     inputs=[
+        gr.Radio(choices=["Фото", "Видео"], label="Тип контента", value="Фото"),
+        gr.Textbox(label="Ссылка на пост", placeholder="Вставьте ссылку на пост"),
+        gr.Number(label="Лайки", value=0, minimum=0),
+        gr.Textbox(label="Дата поста", placeholder="YYYY-MM-DD"),
+        gr.Textbox(label="Описание", lines=3, placeholder="Описание поста"),
+        gr.Number(label="Количество комментариев", value=0, minimum=0),
+        gr.Textbox(label="Комментарии (JSON)", lines=10,
+                   placeholder='Вставьте данные в формате JSON (см. пример)')
     ],
     outputs=[
+        gr.Textbox(label="Анализ", lines=15),
+        gr.Textbox(label="Пользователи"),
+        gr.Textbox(label="Комментарии"),
+        gr.Textbox(label="Хронология лайков"),
+        gr.Textbox(label="Всего лайков")
     ],
+    title="Расширенный анализатор комментариев Instagram",
+    description="Анализатор комментариев Instagram с расширенной аналитикой.  Введите комментарии в формате JSON.",
     theme="default"
 )
+iface.launch(share=True, debug=True, show_error=True)