chuanenlin committed
Commit df75121 · 1 Parent(s): 6792725

Demo version
- .DS_Store +0 -0
- whichframe.py +26 -69
- youtube.com_cookies.txt +0 -5
.DS_Store
CHANGED
Binary files a/.DS_Store and b/.DS_Store differ
whichframe.py
CHANGED
@@ -17,39 +17,26 @@ CACHED_DATA_PATH = "cached_data/"
 device = "cuda" if torch.cuda.is_available() else "cpu"
 model, preprocess = openai_clip.load("ViT-B/32", device=device)

-def export_cookies():
-    cookie_path = "youtube.com_cookies.txt"
-    if not os.path.exists(cookie_path):
-        with open(cookie_path, "w") as f:
-            f.write("# Netscape HTTP Cookie File\n")
-            f.write("# https://curl.haxx.se/rfc/cookie_spec.html\n")
-            f.write("# This is a generated file! Do not edit.\n\n")
-            f.write(".youtube.com\tTRUE\t/\tFALSE\t2147483647\tCONSENT\tYES+cb.20210328-17-p0.en+FX+{}\n")
-    return cookie_path
-
 def fetch_video(url):
+    if url != EXAMPLE_URL:
+        st.error("Only the example video is supported due to compute constraints.")
+        st.stop()
+
     try:
-        cookie_path = export_cookies()
         ydl_opts = {
             'format': 'bestvideo[height<=360][ext=mp4]/best[height<=360]',
             'quiet': True,
             'no_warnings': True,
-            'cookies': cookie_path,
             'extract_flat': False,
             'no_check_certificates': True
         }
         with yt_dlp.YoutubeDL(ydl_opts) as ydl:
             info = ydl.extract_info(url, download=False)
-            duration = info.get('duration', 0)
-            if duration >= 300:  # 5 minutes
-                st.error("Please find a YouTube video shorter than 5 minutes.")
-                st.stop()
             video_url = info['url']
             return None, video_url

     except Exception as e:
         st.error(f"Error fetching video: {str(e)}")
-        st.error("Try another YouTube video or check if the URL is correct.")
         st.stop()

 def extract_frames(video, status_text, progress_bar):
@@ -242,16 +229,28 @@ a:hover {text-decoration: none;}
 """
 st.markdown(hide_streamlit_style, unsafe_allow_html=True)

-
-
-if 'video_frames' not in st.session_state:
+# Initialize session state
+if 'initialized' not in st.session_state:
+    st.session_state.initialized = False
     st.session_state.video_frames = None
-if 'video_features' not in st.session_state:
     st.session_state.video_features = None
-if 'fps' not in st.session_state:
     st.session_state.fps = None
-
-    st.session_state.
+    st.session_state.frame_indices = None
+    st.session_state.url = EXAMPLE_URL
+
+# Load data on first run
+if not st.session_state.initialized:
+    cached_frames, cached_features, cached_fps, cached_frame_indices = load_cached_data(EXAMPLE_URL)
+
+    if cached_frames is not None:
+        st.session_state.video_frames = cached_frames
+        st.session_state.video_features = cached_features
+        st.session_state.fps = cached_fps
+        st.session_state.frame_indices = cached_frame_indices
+        st.session_state.initialized = True
+    else:
+        st.error("Could not load video data. Please contact the administrator.")
+        st.stop()

 st.title("Which Frame? 🎞️🔍")
 st.markdown("""
@@ -259,52 +258,10 @@ Search a video semantically. For example, which frame has "a person with sunglasses
 Search using text, images, or a mix of text + image. WhichFrame uses [CLIP](https://github.com/openai/CLIP) for zero-shot frame classification.
 """)

-
-
-
-url = st.text_input("Enter a YouTube URL (e.g., https://www.youtube.com/watch?v=zTvJJnoWIPk)", key="url_input")
-
-if st.button("Process Video"):
-    if not url:
-        st.error("Please enter a YouTube URL first")
-    else:
-        try:
-            cached_frames, cached_features, cached_fps, cached_frame_indices = load_cached_data(url)
-
-            if cached_frames is not None:
-                st.session_state.video_frames = cached_frames
-                st.session_state.video_features = cached_features
-                st.session_state.fps = cached_fps
-                st.session_state.frame_indices = cached_frame_indices
-                st.session_state.url = url
-                st.session_state.progress = 2
-                st.success("Loaded cached video data!")
-            else:
-                with st.spinner('Fetching video...'):
-                    video, video_url = fetch_video(url)
-                    st.session_state.url = url
-
-                progress_bar = st.progress(0)
-                status_text = st.empty()
-
-                # Extract frames
-                st.session_state.video_frames, st.session_state.fps, st.session_state.frame_indices = extract_frames(video_url, status_text, progress_bar)
-
-                # Encode frames
-                st.session_state.video_features = encode_frames(st.session_state.video_frames, status_text)
-
-                save_cached_data(url, st.session_state.video_frames, st.session_state.video_features, st.session_state.fps, st.session_state.frame_indices)
-                status_text.text('Finalizing...')
-                st.session_state.progress = 2
-                progress_bar.progress(100)
-                status_text.empty()
-                progress_bar.empty()
-                st.success("Video processed successfully!")
-
-        except Exception as e:
-            st.error(f"Error processing video: {str(e)}")
+st.video(EXAMPLE_URL)
+st.caption("Note: Try out the code linked at the bottom of the page to run WhichFrame on your own videos.")

-if st.session_state.
+if st.session_state.initialized:
     search_type = st.radio("Search Method", ["Text Search", "Image Search", "Text + Image Search"], index=0)

     if search_type == "Text Search": # Text Search
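As context for the search UI this diff ends on: below is a minimal sketch (not part of this commit) of how a "Text Search" query can be scored against the cached CLIP frame features. The helper name search_frames_by_text and the assumption that video_features holds L2-normalized ViT-B/32 frame embeddings are illustrative, not code from whichframe.py.

# Illustrative sketch only: rank cached CLIP frame embeddings against a text query.
# Assumes `video_features` is an (N, 512) tensor of L2-normalized frame embeddings
# (as an encode_frames-style helper would produce) and that the OpenAI `clip`
# package is installed and imported as openai_clip, matching whichframe.py.
import torch
import clip as openai_clip

device = "cuda" if torch.cuda.is_available() else "cpu"
model, preprocess = openai_clip.load("ViT-B/32", device=device)

def search_frames_by_text(query, video_features, top_k=5):
    # Encode the text query with CLIP and L2-normalize it.
    with torch.no_grad():
        text_features = model.encode_text(openai_clip.tokenize([query]).to(device)).float()
        text_features /= text_features.norm(dim=-1, keepdim=True)
    # Cosine similarity of every frame embedding against the query; highest scores first.
    similarities = (video_features.to(device).float() @ text_features.T).squeeze(1)
    best = similarities.topk(min(top_k, similarities.shape[0]))
    return best.indices.tolist(), best.values.tolist()

Usage would be along the lines of: indices, scores = search_frames_by_text("a person with sunglasses", st.session_state.video_features).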
youtube.com_cookies.txt
DELETED
@@ -1,5 +0,0 @@
-# Netscape HTTP Cookie File
-# https://curl.haxx.se/rfc/cookie_spec.html
-# This is a generated file! Do not edit.
-
-.youtube.com	TRUE	/	FALSE	2147483647	CONSENT	YES+cb.20210328-17-p0.en+FX+{}
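A side note on the cookie plumbing removed in this commit: if cookies are ever needed again, yt-dlp's Python API reads a Netscape-format file through the cookiefile option (the CLI's --cookies flag maps to it); the removed 'cookies': cookie_path key is not a documented option and was likely ignored. A minimal sketch, reusing the file path and example URL from this repo:

# Sketch only: passing a Netscape-format cookie file to yt-dlp's Python API.
import yt_dlp

ydl_opts = {
    "format": "bestvideo[height<=360][ext=mp4]/best[height<=360]",
    "quiet": True,
    "cookiefile": "youtube.com_cookies.txt",  # Netscape cookie file, like the one deleted here
}

with yt_dlp.YoutubeDL(ydl_opts) as ydl:
    info = ydl.extract_info("https://www.youtube.com/watch?v=zTvJJnoWIPk", download=False)
    print(info.get("title"), info.get("duration"))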