Update app.py
Browse files
app.py
CHANGED
@@ -1,6 +1,10 @@
|
|
1 |
import streamlit as st
|
2 |
-
import
|
|
|
|
|
|
|
3 |
import re
|
|
|
4 |
|
5 |
# Streamlit μ λͺ© λ° μ€λͺ
|
6 |
st.title("VOD μ±ν
ν¬λ‘€λ¬")
|
@@ -29,10 +33,9 @@ def crawl_chats(vod_url):
|
|
29 |
"previousVideoChatSize": 50 # κ°μ Έμ¬ μ±ν
λ©μμ§ μ
|
30 |
}
|
31 |
|
32 |
-
# λ§μ§λ§ μμ§ν μ±ν
λ©μμ§ μ μ₯ λ³μ
|
33 |
-
last_collected_chats = None
|
34 |
-
total_collected_chats = 0
|
35 |
chat_logs = []
|
|
|
|
|
36 |
|
37 |
# μ±ν
λ°μ΄ν°λ₯Ό μμ°¨μ μΌλ‘ μμ²νμ¬ κ°μ Έμ€κΈ°
|
38 |
while True:
|
@@ -41,7 +44,7 @@ def crawl_chats(vod_url):
|
|
41 |
|
42 |
# μμ² κ²°κ³Όκ° μ±κ³΅μ μ΄μ§ μμ κ²½μ° μ’
λ£
|
43 |
if response.status_code != 200:
|
44 |
-
return f"API μμ² μ€ν¨: {response.status_code}"
|
45 |
|
46 |
# JSON λ°μ΄ν°λ‘ λ³ν
|
47 |
data = response.json()
|
@@ -53,10 +56,6 @@ def crawl_chats(vod_url):
|
|
53 |
if not chats:
|
54 |
break
|
55 |
|
56 |
-
# νμ¬ μμ§λ μ±ν
μ΄ μ΄μ μ μμ§λ μ±ν
κ³Ό λμΌνμ§ νμΈ
|
57 |
-
if last_collected_chats == chats:
|
58 |
-
break
|
59 |
-
|
60 |
# μ±ν
λ©μμ§(content)μ playerMessageTime(μ±ν
μκ°)λ§ μμ§
|
61 |
for chat in chats:
|
62 |
chat_content = chat.get("content") # μ±ν
λ©μμ§ λ΄μ©
|
@@ -76,11 +75,14 @@ def crawl_chats(vod_url):
|
|
76 |
# μ±ν
λ‘κ·Έμ μΆκ°
|
77 |
chat_logs.append(f"{formatted_time} - {chat_content}")
|
78 |
|
79 |
-
|
80 |
-
|
|
|
|
|
81 |
|
82 |
-
|
83 |
-
|
|
|
84 |
|
85 |
# λ€μ μμ²μ μν΄ playerMessageTime νλΌλ―Έν° μ
λ°μ΄νΈ
|
86 |
next_time = data["content"].get("nextPlayerMessageTime")
|
@@ -88,15 +90,13 @@ def crawl_chats(vod_url):
|
|
88 |
break
|
89 |
params["playerMessageTime"] = next_time
|
90 |
|
91 |
-
|
92 |
-
return "\n".join(chat_logs)
|
93 |
|
94 |
# λ²νΌμ λλ μ λ μ±ν
ν¬λ‘€λ§ μμ
|
95 |
if st.button("ν¬λ‘€λ§ μμ"):
|
96 |
if vod_url:
|
97 |
-
chat_logs = crawl_chats(vod_url)
|
98 |
-
|
99 |
-
|
100 |
# νμΌλ‘ μ μ₯
|
101 |
file_name = "chat_logs.txt"
|
102 |
with open(file_name, "w") as file:
|
@@ -110,5 +110,53 @@ if st.button("ν¬λ‘€λ§ μμ"):
|
|
110 |
file_name=file_name,
|
111 |
mime="text/plain"
|
112 |
)
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
113 |
else:
|
114 |
st.warning("URLμ μ
λ ₯νμΈμ.")
|
|
|
1 |
import streamlit as st
|
2 |
+
import pandas as pd
|
3 |
+
import plotly.graph_objects as go
|
4 |
+
from collections import defaultdict
|
5 |
+
import datetime
|
6 |
import re
|
7 |
+
import requests
|
8 |
|
9 |
# Streamlit μ λͺ© λ° μ€λͺ
|
10 |
st.title("VOD μ±ν
ν¬λ‘€λ¬")
|
|
|
33 |
"previousVideoChatSize": 50 # κ°μ Έμ¬ μ±ν
λ©μμ§ μ
|
34 |
}
|
35 |
|
|
|
|
|
|
|
36 |
chat_logs = []
|
37 |
+
chat_counts = defaultdict(int)
|
38 |
+
laugh_counts = defaultdict(int)
|
39 |
|
40 |
# μ±ν
λ°μ΄ν°λ₯Ό μμ°¨μ μΌλ‘ μμ²νμ¬ κ°μ Έμ€κΈ°
|
41 |
while True:
|
|
|
44 |
|
45 |
# μμ² κ²°κ³Όκ° μ±κ³΅μ μ΄μ§ μμ κ²½μ° μ’
λ£
|
46 |
if response.status_code != 200:
|
47 |
+
return f"API μμ² μ€ν¨: {response.status_code}", None, None
|
48 |
|
49 |
# JSON λ°μ΄ν°λ‘ λ³ν
|
50 |
data = response.json()
|
|
|
56 |
if not chats:
|
57 |
break
|
58 |
|
|
|
|
|
|
|
|
|
59 |
# μ±ν
λ©μμ§(content)μ playerMessageTime(μ±ν
μκ°)λ§ μμ§
|
60 |
for chat in chats:
|
61 |
chat_content = chat.get("content") # μ±ν
λ©μμ§ λ΄μ©
|
|
|
75 |
# μ±ν
λ‘κ·Έμ μΆκ°
|
76 |
chat_logs.append(f"{formatted_time} - {chat_content}")
|
77 |
|
78 |
+
# μκ°λλ³λ‘ μ±ν
κ°μ κ³μ°
|
79 |
+
time_obj = datetime.datetime.strptime(formatted_time, '%H:%M:%S')
|
80 |
+
minute_key = time_obj.replace(second=0) # λΆ λ¨μλ‘ λ³ννμ¬ μ§κ³
|
81 |
+
chat_counts[minute_key] += 1
|
82 |
|
83 |
+
# 'γ
γ
γ
γ
'κ° ν¬ν¨λ μ±ν
κ°μ μΉ΄μ΄νΈ
|
84 |
+
if len(re.findall(r'γ
', chat_content)) >= 4:
|
85 |
+
laugh_counts[minute_key] += 1
|
86 |
|
87 |
# λ€μ μμ²μ μν΄ playerMessageTime νλΌλ―Έν° μ
λ°μ΄νΈ
|
88 |
next_time = data["content"].get("nextPlayerMessageTime")
|
|
|
90 |
break
|
91 |
params["playerMessageTime"] = next_time
|
92 |
|
93 |
+
return "\n".join(chat_logs), chat_counts, laugh_counts
|
|
|
94 |
|
95 |
# λ²νΌμ λλ μ λ μ±ν
ν¬λ‘€λ§ μμ
|
96 |
if st.button("ν¬λ‘€λ§ μμ"):
|
97 |
if vod_url:
|
98 |
+
chat_logs, chat_counts, laugh_counts = crawl_chats(vod_url)
|
99 |
+
|
|
|
100 |
# νμΌλ‘ μ μ₯
|
101 |
file_name = "chat_logs.txt"
|
102 |
with open(file_name, "w") as file:
|
|
|
110 |
file_name=file_name,
|
111 |
mime="text/plain"
|
112 |
)
|
113 |
+
|
114 |
+
# κ·Έλν μΆλ ₯
|
115 |
+
if chat_counts and laugh_counts:
|
116 |
+
# λ°μ΄ν°νλ μ μμ±
|
117 |
+
times = [time.strftime('%H:%M:%S') for time in chat_counts.keys()]
|
118 |
+
chat_numbers = list(chat_counts.values())
|
119 |
+
laugh_numbers = [laugh_counts.get(time, 0) for time in chat_counts.keys()]
|
120 |
+
df = pd.DataFrame({'μκ°': times, 'μ 체 μ±ν
κ°μ': chat_numbers, 'γ
γ
γ
γ
μ±ν
κ°μ': laugh_numbers})
|
121 |
+
|
122 |
+
# Plotly μ κ·Έλν 그리기
|
123 |
+
fig = go.Figure()
|
124 |
+
|
125 |
+
# μ 체 μ±ν
κ°μ μ κ·Έλν μΆκ°
|
126 |
+
fig.add_trace(go.Scatter(
|
127 |
+
x=df['μκ°'],
|
128 |
+
y=df['μ 체 μ±ν
κ°μ'],
|
129 |
+
mode='lines', # λ§μ»€ μμ΄ μ λ§ νμ
|
130 |
+
name='μ 체 μ±ν
κ°μ',
|
131 |
+
line=dict(color='blue'),
|
132 |
+
hovertemplate='%{x} - μ 체 μ±ν
κ°μ: %{y}<extra></extra>'
|
133 |
+
))
|
134 |
+
|
135 |
+
# γ
γ
γ
γ
μ±ν
κ°μ μ κ·Έλν μΆκ°
|
136 |
+
fig.add_trace(go.Scatter(
|
137 |
+
x=df['μκ°'],
|
138 |
+
y=df['γ
γ
γ
γ
μ±ν
κ°μ'],
|
139 |
+
mode='lines', # λ§μ»€ μμ΄ μ λ§ νμ
|
140 |
+
name='γ
γ
γ
γ
μ±ν
κ°μ',
|
141 |
+
line=dict(color='red'),
|
142 |
+
hovertemplate='%{x} - γ
γ
γ
γ
μ±ν
κ°μ: %{y}<extra></extra>'
|
143 |
+
))
|
144 |
+
|
145 |
+
# κ·Έλν λ μ΄μμ μ€μ
|
146 |
+
fig.update_layout(
|
147 |
+
title="λΆλΉ μ±ν
λ° γ
γ
γ
γ
μ±ν
κ°μ",
|
148 |
+
xaxis_title="μκ°",
|
149 |
+
yaxis_title="μ±ν
κ°μ",
|
150 |
+
xaxis=dict(
|
151 |
+
showticklabels=True # xμΆ μκ° λ μ΄λΈ νμ
|
152 |
+
),
|
153 |
+
hovermode="x unified", # λ§μ°μ€λ₯Ό μ¬λ Έμ λ ν΄λΉ xμΆμμ ν΄ν νμ
|
154 |
+
showlegend=True, # λ²λ‘ νμ
|
155 |
+
margin=dict(l=50, r=50, t=100, b=100) # κ·Έλν μλμͺ½ μ¬λ°±μ μ‘°μ
|
156 |
+
)
|
157 |
+
|
158 |
+
# κ·Έλν μΆλ ₯
|
159 |
+
st.plotly_chart(fig)
|
160 |
+
|
161 |
else:
|
162 |
st.warning("URLμ μ
λ ₯νμΈμ.")
|