Spaces:

stcoats
/

tspace

Sleeping

App Files Files Community

stcoats committed on Mar 14

Commit

a0a9509

1 Parent(s): a47efdc

Add application file

Browse files

Files changed (1) hide show

app.py +26 -24

app.py CHANGED Viewed

@@ -37,6 +37,9 @@ except Exception as e:
     st.error(f"DuckDB connection failed: {e}")
     st.stop()
 # Search
 query = st.text_input("Search text (case-insensitive)", "").strip()
@@ -44,7 +47,7 @@ if query:
     sql = """
         SELECT id, channel, video_id, video_title, speaker, start_time, end_time, text, pos_tags, upload_date, audio
         FROM data
-        WHERE LOWER(text) LIKE '%' || LOWER(?) || '%'
         LIMIT 100
     """
     df = con.execute(sql, [query]).df()
@@ -76,27 +79,26 @@ else:
             return None
     df["audio_file"] = df["audio"].apply(render_audio_cell)
-    # Build an interactive sortable table
-    st.markdown("### Results Table (Sortable)")
-    for i, row in df.iterrows():
-        with st.expander(f"? {row['speaker']} | {row['text'][:60]}..."):
-            col1, col2 = st.columns([2, 3])
-            with col1:
-                st.write(f"**ID:** {row['id']}")
-                st.write(f"**Channel:** {row['channel']}")
-                st.write(f"**Video ID:** {row['video_id']}")
-                st.write(f"**Video Title:** {row['video_title']}")
-                st.write(f"**Speaker:** {row['speaker']}")
-                st.write(f"**Start Time:** {row['start_time']}")
-                st.write(f"**End Time:** {row['end_time']}")
-                st.write(f"**Upload Date:** {row['upload_date']}")
-                st.write(f"**POS Tags:** {row['pos_tags']}")
-            with col2:
-                st.markdown(f"**Text:** {row['text']}")
-                if row['audio_file']:
-                    st.audio(row['audio_file'], format="audio/mp3")
-                else:
-                    st.warning("Audio not available or invalid format.")

     st.error(f"DuckDB connection failed: {e}")
     st.stop()
+# Enable full-text search index on first run (one-time setup if not exists)
+# NOTE(review): no existence check is visible around this call, so the PRAGMA
+# appears to run on every script execution, not only the first — confirm it does
+# not raise once the index already exists.
+# NOTE(review): DuckDB documents create_fts_index(input_table, input_id,
+# *input_values, ...); verify that 'text' is really meant as the id column and
+# which columns end up indexed.
+con.execute("PRAGMA create_fts_index('data', 'text')")
 # Search
 query = st.text_input("Search text (case-insensitive)", "").strip()
     sql = """
         SELECT id, channel, video_id, video_title, speaker, start_time, end_time, text, pos_tags, upload_date, audio
         FROM data
+        WHERE text % ?
         LIMIT 100
     """
     df = con.execute(sql, [query]).df()
             return None
     df["audio_file"] = df["audio"].apply(render_audio_cell)
+    df_display = df.drop(columns=["audio"]).copy()
+    # Add HTML audio tag column
+    def audio_html(path):
+        # Return an inline <audio> player whose <source> points at `path` through a
+        # file:// URL; a falsy `path` (e.g. None) produces an empty string so the
+        # row can be skipped when previews are rendered.
+        # NOTE(review): `path` is interpolated into the markup unescaped — presumably
+        # it is a locally generated file path; confirm against render_audio_cell.
+        if path:
+            return f'<audio controls preload="none" style="height:20px;"> <source src="file://{path}" type="audio/mpeg"> </audio>'
+        return ""
+    df_display["Audio"] = df["audio_file"].apply(audio_html)
+    # Reorder columns
+    column_order = ["id", "channel", "video_id", "video_title", "speaker", "start_time", "end_time", "upload_date", "text", "pos_tags", "Audio"]
+    df_display = df_display[column_order]
+    st.markdown("### Full Table View (Sortable)")
+    st.write("Note: Audio is embedded using HTML tags; not all browsers allow playback from local temp paths.")
+    st.dataframe(df_display.drop(columns=["Audio"]))
+    st.markdown("### Audio Previews")
+    for i, row in df_display.iterrows():
+        if row["Audio"]:
+            st.markdown(f"**{row['speaker']} | {row['text'][:80]}**", unsafe_allow_html=True)
+            st.markdown(row["Audio"], unsafe_allow_html=True)