Spaces:

Anuj02003
/

YouTube_Content_Analyzer

Sleeping

App Files Community

Anuj02003 committed on Nov 22, 2024

Commit

33edde5

verified ·

1 Parent(s): 89238f7

Update app.py

Browse files

Files changed (1) hide show

app.py +9 -17

app.py CHANGED Viewed

@@ -10,14 +10,15 @@ from textblob import TextBlob
 import re
 import nltk
-# Ensure that necessary NLTK data is downloaded
 nltk.download('punkt')
 nltk.download('stopwords')
 nltk.download('wordnet')
 # Function to summarize text
 def summarize_text(text, max_length=80000):  # Increased max_length to 80,000
-    summarization_pipeline = pipeline("summarization", model="facebook/bart-large-cnn")
     summary = summarization_pipeline(text, max_length=max_length, min_length=100, do_sample=False)
     return summary[0]['summary_text']
@@ -63,20 +64,6 @@ def extract_video_id(url):
             break
     return video_id
-# Function to fetch transcript with retries
-def get_transcript(video_id):
-    try:
-        # Attempt to fetch the transcript with language preference
-        transcript = YouTubeTranscriptApi.get_transcript(video_id, languages=['en'])
-        return transcript
-    except TranscriptsDisabled:
-        st.error("Transcripts are disabled for this video. Try a different one.")
-    except NoTranscriptFound:
-        st.error("No transcript found for this video. Ensure it has captions enabled.")
-    except Exception as e:
-        st.error(f"An unexpected error occurred while fetching the transcript: {str(e)}")
-    return None
 # Main Streamlit app
 def main():
     st.title("YouTube Video Summarizer")
@@ -118,8 +105,9 @@ def main():
                 return
             # Get transcript of the video
-            transcript = get_transcript(video_id)
             if not transcript:
                 return
             video_text = ' '.join([line['text'] for line in transcript])
@@ -151,6 +139,10 @@ def main():
             st.write(f"Polarity: {sentiment.polarity}")
             st.write(f"Subjectivity: {sentiment.subjectivity}")
         except Exception as e:
             st.error(f"Error: {str(e)}")

 import re
 import nltk
+# Ensure necessary NLTK data is downloaded
 nltk.download('punkt')
 nltk.download('stopwords')
 nltk.download('wordnet')
+nltk.download('tokenizers/punkt_tab/english')  # Added to resolve punkt_tab error
 # Function to summarize text
 def summarize_text(text, max_length=80000):  # Increased max_length to 80,000
+    summarization_pipeline = pipeline("summarization")
     summary = summarization_pipeline(text, max_length=max_length, min_length=100, do_sample=False)
     return summary[0]['summary_text']
             break
     return video_id
 # Main Streamlit app
 def main():
     st.title("YouTube Video Summarizer")
                 return
             # Get transcript of the video
+            transcript = YouTubeTranscriptApi.get_transcript(video_id)
             if not transcript:
+                st.error("Transcript not available for this video. Please try a different video.")
                 return
             video_text = ' '.join([line['text'] for line in transcript])
             st.write(f"Polarity: {sentiment.polarity}")
             st.write(f"Subjectivity: {sentiment.subjectivity}")
+        except TranscriptsDisabled:
+            st.error("Transcripts are disabled for this video. Please try a different video.")
+        except NoTranscriptFound:
+            st.error("No transcript found for this video. Please try a different video.")
         except Exception as e:
             st.error(f"Error: {str(e)}")