FLS

Sleeping

App Files Files Community

kambris committed on Dec 13, 2024

Commit

a0b6552

verified ·

1 Parent(s): bf19518

Update app.py

Browse files

Files changed (1) hide show

app.py +70 -76

app.py CHANGED Viewed

@@ -128,57 +128,61 @@ class SpeechAnalyzer:
         return aggregated_scores
     def analyze_emotional_trajectory(self, text, window_size=5):
-        """Enhanced emotional trajectory analysis using batch processing"""
         segments = self.split_text(text, max_length=512)
         sentiment_scores = []
         for segment in segments:
-            # Split into sentences using NLTK
             sentences = nltk.sent_tokenize(segment)
-            # Process sentences in batches
             batch_size = 64
             segment_scores = []
             for i in range(0, len(sentences), batch_size):
                 batch = sentences[i:i+batch_size]
                 try:
-                    # Pad or truncate sentences to ensure consistent length
-                    batch = [sent[:512] for sent in batch]  # Truncate to max model input
-                    # Ensure all sentences are strings and non-empty
-                    batch = [sent if sent.strip() else "." for sent in batch]
                     results = self.sentiment_pipeline(batch)
-                    # Process batch results
                     batch_scores = []
                     for result in results:
-                        # Convert to signed score (-1 to 1 range)
                         score = result['score']
-                        score = score * 2 - 1 if result['label'] == 'POSITIVE' else -score
                         batch_scores.append(score)
                     segment_scores.extend(batch_scores)
                 except Exception as e:
                     print(f"Batch processing error: {e}")
-                    # Fallback to individual processing if batch fails
-                    for sent in batch:
-                        try:
-                            result = self.sentiment_pipeline(sent)[0]
-                            score = result['score']
-                            score = score * 2 - 1 if result['label'] == 'POSITIVE' else -score
-                            segment_scores.append(score)
-                        except:
-                            segment_scores.append(0)
-            # Calculate average score for the segment
-            avg_score = np.mean(segment_scores) if segment_scores else 0
-            sentiment_scores.append(avg_score)
-        return sentiment_scores
     def detect_named_entities(self, text):
         """Detect named entities in the text"""
@@ -331,78 +335,68 @@ def main():
                 st.write(f"**{MORAL_FOUNDATIONS[foundation]}**: {score:.2%}")
         with tab2:
-            status_text.text('Processing Emotional Trajectory...')
-            progress_bar.progress(40)
             st.subheader("Speech Trajectory Analysis")
-            col1, col2 = st.columns(2)
-            # Create consistent segments for both analyses
             segments = analyzer.split_text(text, max_length=512)
             num_segments = len(segments)
             segment_labels = [f"{i+1}" for i in range(num_segments)]
             with col1:
-                st.write("### Emotional Flow")
-                sentiment_scores = analyzer.analyze_emotional_trajectory(text)
-                trajectory_fig = go.Figure(data=go.Scatter(
                     x=segment_labels,
                     y=sentiment_scores,
                     mode='lines+markers',
                     line=dict(color='#1f77b4', width=3),
-                    marker=dict(size=8, color='#1f77b4', symbol='circle')
                 ))
-                trajectory_fig.update_layout(
-                    title='Emotional Flow Throughout the Speech',
                     xaxis_title='Speech Segments',
-                    yaxis_title='Relative Emotional Tone',
                     yaxis=dict(
-                        ticktext=['Most Negative', 'Neutral', 'Most Positive'],
-                        tickvals=[-1, 0, 1],
-                        range=[-1.1, 1.1],
                         gridcolor='lightgray'
                     ),
-                    hovermode='x unified',
-                    showlegend=False,
                     plot_bgcolor='white'
                 )
-                st.plotly_chart(trajectory_fig)
-            with col2:
-                st.write("### Moral Foundations Flow")
-                moral_trajectories = {foundation: [] for foundation in MORAL_FOUNDATIONS}
-                for segment in segments:
-                    segment_scores = analyzer.analyze_moral_foundations(segment)
-                    for foundation, score in segment_scores.items():
-                        moral_trajectories[foundation].append(score)
-                moral_fig = go.Figure()
-                for foundation, scores in moral_trajectories.items():
-                    moral_fig.add_trace(go.Scatter(
-                        x=segment_labels,
-                        y=scores,
-                        name=MORAL_FOUNDATIONS[foundation],
-                        mode='lines+markers'
-                    ))
-                moral_fig.update_layout(
-                    title='Moral Foundations Flow',
                     xaxis_title='Speech Segments',
-                    yaxis_title='Foundation Strength',
-                    hovermode='x unified',
-                    plot_bgcolor='white',
                     showlegend=True,
-                    legend=dict(
-                        yanchor="top",
-                        y=0.99,
-                        xanchor="left",
-                        x=1.05
-                    )
                 )
-                st.plotly_chart(moral_fig)
         with tab3:
             status_text.text('Analyzing Linguistic Features...')

         return aggregated_scores
     def analyze_emotional_trajectory(self, text, window_size=5):
         """Score sentiment and pick a dominant emotion for each text segment.

         The text is split with ``self.split_text(text, max_length=512)``; each
         segment is sentence-tokenized with NLTK and the sentences are run in
         batches of 64 through ``self.sentiment_pipeline`` and through an
         emotion classifier.

         Args:
             text: The text to analyze.
             window_size: Accepted for backward compatibility; not used here.

         Returns:
             A ``(sentiment_scores, basic_emotions)`` tuple with one entry per
             segment. Each sentiment score is the mean of the per-sentence
             scores, where a 'POSITIVE' result maps to ``0.5 + score / 2`` and
             any other label to ``0.5 - score / 2``. Each emotion is the label
             that was dominant in the most sentences of the segment. A segment
             with no sentences yields ``0.5`` and ``'neutral'``.
         """
         # Local import so the method does not depend on the file's import block.
         from collections import Counter

         neutral_score = 0.5
         neutral_label = 'neutral'
         batch_size = 64

         # Build the emotion classifier once per analyzer and reuse it; creating
         # the pipeline on every call reloads the model each time.
         emotion_classifier = getattr(self, '_emotion_classifier', None)
         if emotion_classifier is None:
             emotion_classifier = pipeline(
                 "text-classification",
                 model="j-hartmann/emotion-english-distilroberta-base",
                 return_all_scores=True,
             )
             self._emotion_classifier = emotion_classifier

         def dominant_label(result):
             """Return the highest-scoring label from one classifier result."""
             # A bare dict means the pipeline already returned only the top label.
             if isinstance(result, dict):
                 return result['label']
             # Each per-sentence result is normally a list of
             # {'label', 'score'} dicts; unwrap one extra nesting level if a
             # pipeline version adds it.
             candidates = result[0] if result and isinstance(result[0], list) else result
             return max(candidates, key=lambda item: item['score'])['label']

         sentiment_scores = []
         basic_emotions = []

         for segment in self.split_text(text, max_length=512):
             sentences = nltk.sent_tokenize(segment)
             segment_scores = []
             segment_emotions = []

             for start in range(0, len(sentences), batch_size):
                 batch = [sent[:512] for sent in sentences[start:start + batch_size]]
                 batch = [sent if sent.strip() else "." for sent in batch]

                 # Sentiment and emotion are handled in separate try blocks so
                 # that a failure in one cannot append fallback values on top of
                 # results the other already contributed for the same batch.
                 try:
                     results = self.sentiment_pipeline(batch)
                     batch_scores = [
                         0.5 + result['score'] * 0.5   # 0.5 .. 1.0
                         if result['label'] == 'POSITIVE'
                         else 0.5 - result['score'] * 0.5   # 0.0 .. 0.5
                         for result in results
                     ]
                 except Exception as e:
                     print(f"Batch processing error: {e}")
                     batch_scores = [neutral_score] * len(batch)
                 segment_scores.extend(batch_scores)

                 try:
                     emotion_results = emotion_classifier(batch)
                     batch_emotions = [dominant_label(result) for result in emotion_results]
                 except Exception as e:
                     print(f"Batch processing error: {e}")
                     batch_emotions = [neutral_label] * len(batch)
                 segment_emotions.extend(batch_emotions)

             # np.mean([]) would return nan (with a RuntimeWarning), so fall
             # back to the neutral midpoint for a segment without sentences.
             sentiment_scores.append(
                 np.mean(segment_scores) if segment_scores else neutral_score
             )

             # Counter breaks ties by first occurrence, which is deterministic,
             # unlike max() over a set.
             if segment_emotions:
                 basic_emotions.append(Counter(segment_emotions).most_common(1)[0][0])
             else:
                 basic_emotions.append(neutral_label)

         return sentiment_scores, basic_emotions
     def detect_named_entities(self, text):
         """Detect named entities in the text"""
                 st.write(f"**{MORAL_FOUNDATIONS[foundation]}**: {score:.2%}")
         with tab2:
             st.subheader("Speech Trajectory Analysis")
+            col1, col2, col3 = st.columns(3)
             segments = analyzer.split_text(text, max_length=512)
             num_segments = len(segments)
             segment_labels = [f"{i+1}" for i in range(num_segments)]
+            sentiment_scores, basic_emotions = analyzer.analyze_emotional_trajectory(text)
             with col1:
+                st.write("### Sentiment Flow")
+                sentiment_fig = go.Figure(data=go.Scatter(
                     x=segment_labels,
                     y=sentiment_scores,
                     mode='lines+markers',
                     line=dict(color='#1f77b4', width=3),
+                    marker=dict(
+                        size=8,
+                        color=['#ff0000' if score < 0.4 else '#00ff00' if score > 0.6 else '#888888' for score in sentiment_scores],
+                        symbol='circle'
+                    )
                 ))
+                sentiment_fig.update_layout(
+                    title='Sentiment Throughout Speech',
                     xaxis_title='Speech Segments',
+                    yaxis_title='Sentiment',
                     yaxis=dict(
+                        ticktext=['Very Negative', 'Negative', 'Neutral', 'Positive', 'Very Positive'],
+                        tickvals=[0, 0.25, 0.5, 0.75, 1],
+                        range=[0, 1],
                         gridcolor='lightgray'
                     ),
                     plot_bgcolor='white'
                 )
+                st.plotly_chart(sentiment_fig)
+            # Rest of the code remains the same for col2 (Moral Foundations)
+            with col3:
+                st.write("### Basic Emotions")
+                emotions_df = pd.DataFrame({
+                    'Segment': segment_labels,
+                    'Emotion': basic_emotions
+                })
+                emotions_fig = px.bar(
+                    emotions_df,
+                    x='Segment',
+                    y='Emotion',
+                    color='Emotion',
+                    title='Basic Emotions Flow',
+                    category_orders={'Emotion': ['joy', 'sadness', 'anger', 'fear', 'surprise', 'neutral']}
+                )
+                emotions_fig.update_layout(
                     xaxis_title='Speech Segments',
+                    yaxis_title='Emotion',
                     showlegend=True,
+                    plot_bgcolor='white'
                 )
+                st.plotly_chart(emotions_fig)
         with tab3:
             status_text.text('Analyzing Linguistic Features...')