Update app.py
app.py
CHANGED
@@ -1,307 +1,532 @@
[Previous 307-line revision removed: it began with an `# analyzers.py` header and defined the same TextAnalyzer, SentimentAnalyzer, CommentExtractor, and StatsCalculator classes, but with flat positive/negative indicator lists, tuple-valued extract_data returns, and a smaller Gradio interface. The full replacement file follows.]
import re
import emoji
import statistics
from collections import Counter
from typing import Dict, List, Tuple, Optional, Set, Union
import logging
from pathlib import Path
from datetime import datetime
import csv
from io import StringIO  # required by generate_reports below
from dataclasses import dataclass, asdict
from enum import Enum
import numpy as np

# Configure logging
log_dir = Path("logs")
log_dir.mkdir(exist_ok=True)
logging.basicConfig(
    level=logging.INFO,
    format='%(asctime)s - %(name)s - %(levelname)s - %(message)s',
    handlers=[
        logging.FileHandler(log_dir / f'analyzer_{datetime.now():%Y%m%d}.log'),
        logging.StreamHandler()
    ]
)
logger = logging.getLogger(__name__)

class Sentiment(str, Enum):
    POSITIVE = 'positive'
    SLIGHTLY_POSITIVE = 'slightly_positive'
    NEUTRAL = 'neutral'
    SLIGHTLY_NEGATIVE = 'slightly_negative'
    NEGATIVE = 'negative'

@dataclass
class CommentData:
    username: str
    text: str
    likes: int
    weeks_ago: float
    sentiment: Sentiment

class TextAnalyzer:
    """Enhanced text analysis utilities"""

    @staticmethod
    def clean_text(text: str) -> str:
        """Collapse all runs of whitespace into single spaces"""
        return ' '.join(text.split())

    @staticmethod
    def count_emojis(text: str) -> int:
        """Count distinct emoji characters, using a set for deduplication"""
        return len({c for c in text if c in emoji.EMOJI_DATA})

    @staticmethod
    def extract_mentions(text: str) -> Set[str]:
        """Extract @-mentions, returning a set for uniqueness"""
        return set(re.findall(r'@[\w.]+', text))

    @staticmethod
    def get_words(text: str) -> List[str]:
        """Extract meaningful words (three or more characters)"""
        return re.findall(r'\b\w{3,}\b', text.lower())

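# Behaviour sketch for the helpers above (hypothetical inputs):
#   TextAnalyzer.clean_text("  a \n b ")           -> 'a b'
#   TextAnalyzer.count_emojis("🔥🔥👍")             -> 2 (distinct emoji characters)
#   TextAnalyzer.extract_mentions("hi @a and @a")  -> {'@a'}
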
class SentimentAnalyzer:
    """Enhanced sentiment analysis with gradual classification"""

    # Using sets for O(1) lookup
    INDICATORS = {
        'positive': {
            '🔥', '❤️', '👍', '😊', '💪', '👏', '🎉', '♥️', '😍', '🙏',
            'круто', 'супер', 'класс', 'огонь', 'пушка', 'отлично', 'здорово',
            'прекрасно', 'молодец', 'красота', 'спасибо', 'топ', 'лучший',
            'amazing', 'wonderful', 'great', 'perfect', 'love', 'beautiful'
        },
        'negative': {
            '👎', '😢', '😞', '😠', '😡', '💔', '😕', '😑',
            'плохо', 'ужас', 'отстой', 'фу', 'жесть', 'ужасно',
            'разочарован', 'печаль', 'грустно', 'bad', 'worst',
            'terrible', 'awful', 'sad', 'disappointed'
        }
    }

    @classmethod
    def analyze(cls, text: str) -> Sentiment:
        """
        Analyze text sentiment with enhanced granularity and emphasis handling
        """
        text_lower = text.lower()
        words = set(TextAnalyzer.get_words(text_lower))
        # Emoji indicators never survive get_words (it keeps only \w tokens),
        # so also match single-character indicators against the raw text.
        # Multi-codepoint sequences such as ❤️ may still be missed.
        tokens = words | set(text)

        pos_count = len(tokens & cls.INDICATORS['positive'])
        neg_count = len(tokens & cls.INDICATORS['negative'])

        # Calculate emphasis multiplier based on punctuation
        emphasis = min(text.count('!') * 0.2 + text.count('?') * 0.1, 1.0)

        # Apply emphasis to the dominant sentiment
        if pos_count > neg_count:
            pos_count *= (1 + emphasis)
        elif neg_count > pos_count:
            neg_count *= (1 + emphasis)

        # Determine sentiment with granularity
        total = pos_count + neg_count
        if total == 0:
            return Sentiment.NEUTRAL

        ratio = pos_count / total
        if ratio > 0.8:
            return Sentiment.POSITIVE
        elif ratio > 0.6:
            return Sentiment.SLIGHTLY_POSITIVE
        elif ratio < 0.2:
            return Sentiment.NEGATIVE
        elif ratio < 0.4:
            return Sentiment.SLIGHTLY_NEGATIVE
        return Sentiment.NEUTRAL

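# Classification sketch (hypothetical inputs, given the indicator sets above):
#   SentimentAnalyzer.analyze("Это огонь!")    -> Sentiment.POSITIVE
#   SentimentAnalyzer.analyze("Фото как фото") -> Sentiment.NEUTRAL
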
class CommentExtractor:
    """Enhanced comment data extraction"""

    class ParseError(Exception):
        """Custom exception for parsing errors"""
        pass

    # Optimized patterns with named groups
    PATTERNS = {
        'username': re.compile(r"""
            (?:
                Фото\sпрофиля\s(?P<name1>[^\n]+)|
                ^(?P<name2>[^\s]+)\s+|
                @(?P<name3>[^\s]+)\s+
            )
        """, re.VERBOSE),

        'time': re.compile(r"""
            (?P<value>\d+)\s*
            (?P<unit>(?:ч|нед|h|w|час|hour|week))\.?
        """, re.VERBOSE),

        'likes': re.compile(r"""
            (?:
                (?P<count1>\d+)\s*отметк[аи]\s\"Нравится\"|
                Нравится:\s*(?P<count2>\d+)|
                \"Нравится\":\s*(?P<count3>\d+)|
                likes?:\s*(?P<count4>\d+)
            )
        """, re.VERBOSE),

        'metadata': re.compile(r"""
            Фото\sпрофиля[^\n]+\n|
            \d+\s*(?:ч|нед|h|w|час|hour|week)\.?|
            (?:Нравится|likes?):\s*\d+|
            \d+\s*отметк[аи]\s\"Нравится\"|
            Ответить|
            Показать\sперевод|
            Скрыть\sвсе\sответы|
            Смотреть\sвсе\sответы\s\(\d+\)
        """, re.VERBOSE)
    }

    @classmethod
    def extract_data(cls, comment_text: str) -> Optional[CommentData]:
        """Extract comment data with improved error handling"""
        try:
            # Extract username
            username_match = cls.PATTERNS['username'].search(comment_text)
            if not username_match:
                raise cls.ParseError("Could not extract username")

            username = next(
                name for name in username_match.groups()
                if name is not None
            ).strip()

            # Clean comment text
            comment = cls.PATTERNS['metadata'].sub('', comment_text)
            comment = TextAnalyzer.clean_text(comment)

            # Extract time
            time_match = cls.PATTERNS['time'].search(comment_text)
            if not time_match:
                weeks = 0
            else:
                value = int(time_match.group('value'))
                unit = time_match.group('unit')
                weeks = value if unit in {'нед', 'w', 'week'} else value / (24 * 7)

            # Extract likes
            likes_match = cls.PATTERNS['likes'].search(comment_text)
            likes = next(
                (int(count) for count in likes_match.groups() if count),
                0
            ) if likes_match else 0

            # Analyze sentiment
            sentiment = SentimentAnalyzer.analyze(comment)

            return CommentData(
                username=username,
                text=comment,
                likes=likes,
                weeks_ago=weeks,
                sentiment=sentiment
            )

        except cls.ParseError as e:
            logger.warning(f"Failed to parse comment: {e}")
            return None
        except Exception as e:
            logger.error(f"Unexpected error parsing comment: {e}", exc_info=True)
            return None

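# Usage sketch (hypothetical raw block shaped like the patterns above expect):
#   raw = 'Фото профиля ivan.petrov\nЭто огонь! 🔥\n2 нед. Нравится: 14 Ответить'
#   CommentExtractor.extract_data(raw)
#   # -> CommentData(username='ivan.petrov', text='Это огонь! 🔥', likes=14,
#   #                weeks_ago=2, sentiment=Sentiment.POSITIVE)
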
class StatsCalculator:
    """Enhanced statistics calculation"""

    @staticmethod
    def calculate_period_stats(comments: List[CommentData]) -> Dict:
        """Calculate statistics using quantile-based periods"""
        if not comments:
            return {}

        # Sort by weeks
        sorted_comments = sorted(comments, key=lambda x: x.weeks_ago)

        # Calculate period boundaries using quantiles
        weeks = [c.weeks_ago for c in sorted_comments]
        boundaries = np.quantile(weeks, [0.33, 0.67])

        # Group comments by period
        periods = {
            'early': [],
            'middle': [],
            'late': []
        }

        for comment in sorted_comments:
            if comment.weeks_ago <= boundaries[0]:
                periods['early'].append(comment)
            elif comment.weeks_ago <= boundaries[1]:
                periods['middle'].append(comment)
            else:
                periods['late'].append(comment)

        # Calculate statistics for each period
        # (period_comments avoids shadowing the `comments` parameter)
        return {
            period: {
                'comments': len(period_comments),
                'avg_likes': statistics.mean(c.likes for c in period_comments) if period_comments else 0,
                'sentiment_ratio': sum(
                    1 for c in period_comments
                    if c.sentiment in {Sentiment.POSITIVE, Sentiment.SLIGHTLY_POSITIVE}
                ) / len(period_comments) if period_comments else 0
            }
            for period, period_comments in periods.items()
        }

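# Boundary sketch (hypothetical data): weeks_ago values [1, 2, 3, 4, 5, 6]
# give np.quantile boundaries of roughly (2.65, 4.35), so the comments split
# into early={1, 2}, middle={3, 4}, late={5, 6}.
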
def analyze_post(
    content_type: str,
    link_to_post: str,
    post_likes: int,
    post_date: str,
    description: str,
    comment_count: int,
    all_comments: str
) -> Tuple[str, str, str, str, str]:
    """Enhanced post analysis with improved error handling and reporting"""
    try:
        # Split comments using optimized pattern
        comment_pattern = re.compile(
            r'(?=Фото профиля|\n\s*[a-zA-Z0-9._]+\s+|\b@[a-zA-Z0-9._]+\s+)',
            re.MULTILINE
        )
        comments_blocks = [
            block.strip() for block in comment_pattern.split(all_comments)
            if block and block.strip() and 'Скрыто алгоритмами Instagram' not in block
        ]

        # Extract and validate comment data
        comments_data = []
        for block in comments_blocks:
            if data := CommentExtractor.extract_data(block):
                comments_data.append(data)

        if not comments_data:
            logger.warning("No valid comments found in the input")
            return "No valid comments found", "", "", "", "0"

        # Calculate statistics
        basic_stats = {
            'total_comments': len(comments_data),
            'avg_length': statistics.mean(len(c.text) for c in comments_data),
            'median_length': statistics.median(len(c.text) for c in comments_data),
            'avg_words': statistics.mean(len(TextAnalyzer.get_words(c.text)) for c in comments_data),
            'total_likes': sum(c.likes for c in comments_data),
            'avg_likes': statistics.mean(c.likes for c in comments_data)
        }

        # Generate reports
        reports = generate_reports(
            content_type=content_type,
            link_to_post=link_to_post,
            post_likes=post_likes,
            comments_data=comments_data,
            basic_stats=basic_stats
        )

        return (
            reports['analytics'],
            "\n".join(c.username for c in comments_data),
            "\n".join(c.text for c in comments_data),
            "\n".join(str(c.likes) for c in comments_data),
            str(basic_stats['total_likes'])
        )

    except Exception as e:
        logger.error(f"Error analyzing post: {e}", exc_info=True)
        return f"Error analyzing post: {str(e)}", "", "", "", "0"

def generate_reports(
    content_type: str,
    link_to_post: str,
    post_likes: int,
    comments_data: List[CommentData],
    basic_stats: Dict
) -> Dict[str, str]:
    """Generate comprehensive reports in multiple formats"""

    # Calculate additional statistics
    sentiment_dist = Counter(c.sentiment for c in comments_data)
    period_stats = StatsCalculator.calculate_period_stats(comments_data)
    top_users = Counter(c.username for c in comments_data).most_common(5)
    top_mentioned = Counter(
        mention for c in comments_data
        for mention in TextAnalyzer.extract_mentions(c.text)
    ).most_common(5)

    # Generate CSV report
    csv_output = StringIO()
    writer = csv.writer(csv_output)

    # Write metadata
    writer.writerow(['Content Analysis Report'])
    writer.writerow(['Generated', datetime.now().isoformat()])
    writer.writerow(['Content Type', content_type])
    writer.writerow(['Post URL', link_to_post])
    writer.writerow(['Post Likes', post_likes])
    writer.writerow([])

    # Write statistics sections
    for section, data in {
        'Basic Statistics': basic_stats,
        'Sentiment Distribution': sentiment_dist,
        'Period Analysis': period_stats,
        'Top Users': dict(top_users),
        'Top Mentioned': dict(top_mentioned)
    }.items():
        writer.writerow([section])
        for key, value in data.items():
            writer.writerow([key, value])
        writer.writerow([])

    # Generate text report (explicit `+` around the joins: adjacent string
    # literals would otherwise fuse the header into the join separator)
    text_report = (
        f"ANALYSIS REPORT\n"
        f"Generated: {datetime.now():%Y-%m-%d %H:%M:%S}\n\n"
        f"BASIC STATISTICS:\n"
        f"- Total Comments: {basic_stats['total_comments']}\n"
        f"- Average Likes: {basic_stats['avg_likes']:.1f}\n"
        f"- Average Length: {basic_stats['avg_length']:.1f} characters\n"
        f"- Median Length: {basic_stats['median_length']}\n"
        f"- Average Words: {basic_stats['avg_words']:.1f}\n\n"
        f"SENTIMENT ANALYSIS:\n"
        f"- Positive: {sentiment_dist[Sentiment.POSITIVE]}\n"
        f"- Slightly Positive: {sentiment_dist[Sentiment.SLIGHTLY_POSITIVE]}\n"
        f"- Neutral: {sentiment_dist[Sentiment.NEUTRAL]}\n"
        f"- Slightly Negative: {sentiment_dist[Sentiment.SLIGHTLY_NEGATIVE]}\n"
        f"- Negative: {sentiment_dist[Sentiment.NEGATIVE]}\n\n"
        f"TOP CONTRIBUTORS:\n" +
        "\n".join(f"- {user}: {count} comments" for user, count in top_users) +
        f"\n\nMOST MENTIONED:\n" +
        "\n".join(f"- {user}: {count} mentions" for user, count in top_mentioned) +
        f"\n\nENGAGEMENT PERIODS:\n"
        f"Early Period:\n"
        f"- Comments: {period_stats['early']['comments']}\n"
        f"- Avg Likes: {period_stats['early']['avg_likes']:.1f}\n"
        f"- Positive Sentiment: {period_stats['early']['sentiment_ratio']*100:.1f}%\n\n"
        f"Middle Period:\n"
        f"- Comments: {period_stats['middle']['comments']}\n"
        f"- Avg Likes: {period_stats['middle']['avg_likes']:.1f}\n"
        f"- Positive Sentiment: {period_stats['middle']['sentiment_ratio']*100:.1f}%\n\n"
        f"Late Period:\n"
        f"- Comments: {period_stats['late']['comments']}\n"
        f"- Avg Likes: {period_stats['late']['avg_likes']:.1f}\n"
        f"- Positive Sentiment: {period_stats['late']['sentiment_ratio']*100:.1f}%\n"
    )

    return {
        'csv': csv_output.getvalue(),
        'analytics': text_report
    }

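# Note: generate_reports returns both formats; analyze_post surfaces only
# 'analytics' in the UI, while 'csv' stays available for file export.
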
# Gradio interface with improved input validation and error handling
import gradio as gr

def validate_input(content_type: str, link: str, likes: int, date: str,
                   description: str, comment_count: int, comments: str) -> Tuple[bool, str]:
    """Validate input parameters before processing"""
    if not link:
        return False, "Post link is required"
    if likes < 0:
        return False, "Likes count cannot be negative"
    if comment_count < 0:
        return False, "Comment count cannot be negative"
    if not comments.strip():
        return False, "Comments text is required"
    return True, ""

def wrapped_analyze_post(*args):
    """Wrapper for analyze_post with input validation"""
    is_valid, error_message = validate_input(*args)
    if not is_valid:
        return error_message, "", "", "", "0"

    try:
        return analyze_post(*args)
    except Exception as e:
        logger.error(f"Error in analyze_post wrapper: {e}", exc_info=True)
        return f"An error occurred: {str(e)}", "", "", "", "0"

# Create enhanced Gradio interface
iface = gr.Interface(
    fn=wrapped_analyze_post,
    inputs=[
        gr.Radio(
            choices=["Photo", "Video", "Reel", "Story"],
            label="Content Type",
            value="Photo"
        ),
        gr.Textbox(
            label="Link to Post",
            placeholder="https://instagram.com/p/..."
        ),
        gr.Number(
            label="Post Likes",
            value=0,
            minimum=0
        ),
        gr.Textbox(
            label="Post Date",
            placeholder="YYYY-MM-DD"
        ),
        gr.Textbox(
            label="Post Description",
            lines=3,
            placeholder="Enter post description..."
        ),
        gr.Number(
            label="Total Comment Count",
            value=0,
            minimum=0
        ),
        gr.Textbox(
            label="Comments",
            lines=10,
            placeholder="Paste comments here..."
        )
    ],
    outputs=[
        gr.Textbox(
            label="Analytics Summary",
            lines=20
        ),
        gr.Textbox(
            label="Extracted Usernames"
        ),
        gr.Textbox(
            label="Cleaned Comments"
        ),
        gr.Textbox(
            label="Comment Likes Timeline"
        ),
        gr.Textbox(
            label="Total Comment Likes"
        )
    ],
    title="Enhanced Instagram Comment Analyzer",
    description="""
    Analyze Instagram comments with advanced metrics including:
    - Sentiment analysis with granular classification
    - Temporal engagement patterns
    - User interaction statistics
    - Content quality metrics
    """,
    article="""
    ### Usage Instructions
    1. Select the content type (Photo, Video, Reel, or Story)
    2. Paste the post URL
    3. Enter the post metadata (likes, date, description)
    4. Paste the comments text
    5. Click submit to generate analysis

    ### Analysis Features
    - Multi-level sentiment analysis
    - Engagement period breakdown
    - Top contributors and mentions
    - Detailed statistical metrics

    ### Notes
    - All text fields support Unicode characters including emojis
    - Time references are converted to a standardized format
    - Analysis includes both quantitative and qualitative metrics
    """
)

if __name__ == "__main__":
    logger.info("Starting Instagram Comment Analyzer")

    try:
        # Launch the interface with enhanced settings
        iface.launch(
            server_name="0.0.0.0",  # Allow external access
            server_port=7860,       # Default Gradio port
            share=False,            # Disable public URL generation
            debug=False,            # Disable debug mode in production
            enable_queue=True,      # Enable request queuing (legacy Gradio option)
            max_threads=4           # Limit concurrent processing
        )
    except Exception as e:
        logger.error(f"Failed to start application: {e}", exc_info=True)
        raise