stcoats commited on
Commit
6763ad1
·
1 Parent(s): 135e6d1

Add application file

Browse files
Files changed (1) hide show
  1. app.py +21 -16
app.py CHANGED
@@ -42,13 +42,15 @@ query = st.text_input("Search text (case-insensitive)", "").strip()
42
 
43
  # Build query
44
  if query:
45
- sql = """
 
 
46
  SELECT id, channel, video_id, speaker, start_time, end_time, upload_date, text, pos_tags, audio
47
  FROM data
48
- WHERE LOWER(text) LIKE LOWER(?)
49
  LIMIT 100
50
  """
51
- df = con.execute(sql, [f"%{query}%"]).df()
52
  else:
53
  df = con.execute("""
54
  SELECT id, channel, video_id, speaker, start_time, end_time, upload_date, text, pos_tags, audio
@@ -61,7 +63,7 @@ st.markdown(f"### Showing {len(df)} results")
61
  if len(df) == 0:
62
  st.warning("No matches found.")
63
  else:
64
- def render_audio_cell(audio_bytes):
65
  try:
66
  if isinstance(audio_bytes, (bytes, bytearray, memoryview)):
67
  data = bytes(audio_bytes)
@@ -72,22 +74,25 @@ else:
72
  with tempfile.NamedTemporaryFile(delete=False, suffix=".mp3") as tmp:
73
  tmp.write(data)
74
  tmp.flush()
75
- return f'<audio controls style="height:20px;"> <source src="file://{tmp.name}" type="audio/mpeg"></audio>'
76
  except Exception:
77
  return ""
78
 
79
- df["Audio"] = df["audio"].apply(render_audio_cell)
80
- df_display = df.drop(columns=["audio"]) # Drop binary column before display
 
81
 
82
- # Reorder columns for display
83
- df_display = df_display[["id", "channel", "video_id", "speaker", "start_time", "end_time", "upload_date", "text", "pos_tags", "Audio"]]
84
 
85
- st.markdown("### Results Table (Sortable with Audio Column)")
86
- st.markdown("(Scroll right to view audio controls)")
87
- st.dataframe(df_display, use_container_width=True)
88
 
89
- # Optionally, render inline HTML audio
90
- # for i, row in df_display.iterrows():
91
- # st.markdown(f"**{row['speaker']} | {row['text']}**")
92
- # st.markdown(row["Audio"], unsafe_allow_html=True)
 
 
 
 
 
93
 
 
42
 
43
  # Build query
44
  if query:
45
+ search_terms = query.lower().split()
46
+ conditions = " AND ".join(["LOWER(text) LIKE ?" for _ in search_terms])
47
+ sql = f"""
48
  SELECT id, channel, video_id, speaker, start_time, end_time, upload_date, text, pos_tags, audio
49
  FROM data
50
+ WHERE {conditions}
51
  LIMIT 100
52
  """
53
+ df = con.execute(sql, [f"%{term}%" for term in search_terms]).df()
54
  else:
55
  df = con.execute("""
56
  SELECT id, channel, video_id, speaker, start_time, end_time, upload_date, text, pos_tags, audio
 
63
  if len(df) == 0:
64
  st.warning("No matches found.")
65
  else:
66
+ def render_audio_html(audio_bytes):
67
  try:
68
  if isinstance(audio_bytes, (bytes, bytearray, memoryview)):
69
  data = bytes(audio_bytes)
 
74
  with tempfile.NamedTemporaryFile(delete=False, suffix=".mp3") as tmp:
75
  tmp.write(data)
76
  tmp.flush()
77
+ return f'<audio controls style="height:20px;width:100%;"><source src="file://{tmp.name}" type="audio/mpeg"></audio>'
78
  except Exception:
79
  return ""
80
 
81
+ df["Audio"] = df["audio"].apply(render_audio_html)
82
+ df = df.drop(columns=["audio"])
83
+ df = df[["id", "channel", "video_id", "speaker", "start_time", "end_time", "upload_date", "text", "pos_tags", "Audio"]]
84
 
85
+ from st_aggrid import AgGrid, GridOptionsBuilder
 
86
 
87
+ st.markdown("### Results Table (Sortable with Embedded Audio)")
 
 
88
 
89
+ gb = GridOptionsBuilder.from_dataframe(df.drop(columns=["Audio"]))
90
+ gb.configure_default_column(resizable=True, sortable=True, filter=True)
91
+ grid_options = gb.build()
92
+
93
+ AgGrid(df.drop(columns=["Audio"]), gridOptions=grid_options, fit_columns_on_grid_load=True)
94
+
95
+ st.markdown("### Audio Controls in Table")
96
+ for i in range(len(df)):
97
+ st.markdown(df.loc[i, "Audio"], unsafe_allow_html=True)
98