sepp81 commited on
Commit
60e7aa6
·
verified ·
1 Parent(s): 734617f

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +185 -34
app.py CHANGED
@@ -93,11 +93,139 @@ def local_css():
93
  """, unsafe_allow_html=True)
94
 
95
  class RoFTGame:
96
- # [Previous implementation remains the same]
97
- # ... [Copy the entire RoFTGame class from the previous implementation] ...
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
98
 
99
  def main():
100
- # Apply custom CSS
101
  local_css()
102
 
103
  # Fancy title with animation
@@ -118,6 +246,7 @@ def main():
118
  </div>
119
  """, unsafe_allow_html=True)
120
 
 
121
  # Initialize game session state
122
  if 'game' not in st.session_state:
123
  st.session_state.game = RoFTGame('roft.csv')
@@ -132,58 +261,80 @@ def main():
132
  st.sidebar.markdown("## 🎮 Game Stats")
133
  st.sidebar.markdown(f"### 🏆 Total Points: {st.session_state.total_points}")
134
  st.sidebar.markdown(f"### 🎲 Rounds Played: {st.session_state.rounds_played}")
135
-
136
- # Animated difficulty indicator
137
- difficulty_map = {
138
- 'gpt2': '🟢 Easy',
139
- 'gpt2-xl': '🟠 Medium',
140
- 'ctrl': '🔴 Hard'
141
- }
142
- current_model = st.session_state.game.current_sample['model']
143
- difficulty = difficulty_map.get(current_model, '⚪ Unknown')
144
- st.sidebar.markdown(f"### 🎯 Difficulty: {difficulty}")
145
-
146
- # Display sentences with enhanced styling
147
- st.subheader("🔍 Examine the Text Carefully")
148
  for i, sentence in enumerate(st.session_state.game.current_sentences):
149
- st.markdown(f"""
150
- <div class='sentence-container'>
151
- <strong>{i+1}.</strong> {sentence}
152
- </div>
153
- """, unsafe_allow_html=True)
154
 
155
- # Boundary selection with visual improvements
156
- st.markdown("### 🚨 Detect AI Transition Point")
157
  guess = st.radio(
158
  "Where do you think the AI-generated text begins?",
159
  options=[str(i+1) for i in range(len(st.session_state.game.current_sentences))]
160
  )
161
 
162
- # Reason input with predefined options and visual enhancements
163
- st.markdown("### 🧐 Explain Your Reasoning")
164
  reason_options = st.session_state.game.predefined_reasons
165
  selected_predefined_reasons = st.multiselect(
166
- "Select indicators of AI generation",
167
  options=reason_options
168
  )
169
 
170
  # Custom reason input
171
- custom_reason = st.text_area("Additional detective notes (optional)")
172
 
173
  # Combine predefined and custom reasons
174
  full_reason = " ".join(selected_predefined_reasons)
175
  if custom_reason:
176
  full_reason += f" {custom_reason}"
177
 
178
- # Submit button with game metaphor
179
- if st.button("🕵️ Submit Detective Report"):
180
  if not full_reason.strip():
181
- st.warning("🚨 Every good detective needs evidence! Please provide a reason.")
182
  else:
183
- # [Rest of the submission logic remains the same as in previous implementation]
184
- # ... [Copy the entire submission block from previous implementation] ...
185
-
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
186
  st.markdown("</div>", unsafe_allow_html=True)
187
 
 
 
 
 
 
 
 
 
 
188
  if __name__ == "__main__":
189
- main()
 
93
  """, unsafe_allow_html=True)
94
 
95
  class RoFTGame:
96
+ def __init__(self, dataset_path):
97
+ """
98
+ Initialize the RoFT Game with the dataset
99
+
100
+ :param dataset_path: Path to the roft.csv file
101
+ """
102
+ self.df = pd.read_csv(dataset_path)
103
+ self.current_sample = None
104
+ self.current_sentences = None
105
+ self.true_boundary_index = None
106
+ self.current_guess_index = None
107
+ # Predefined reasons from the dataset description
108
+ self.predefined_reasons = [
109
+ "grammar",
110
+ "repetition",
111
+ "irrelevant",
112
+ "contradicts_sentence",
113
+ "contradicts_knowledge",
114
+ "common_sense",
115
+ "coreference",
116
+ "generic"
117
+ ]
118
+
119
+ def load_random_sample(self):
120
+ """
121
+ Load a random sample from the dataset
122
+ """
123
+ # Filter for samples with valid generations and reasons
124
+ valid_samples = self.df[
125
+ (self.df['gen_body'].notna()) &
126
+ (self.df['reason'].notna()) &
127
+ (self.df['reason'] != '[]')
128
+ ]
129
+
130
+ # Select a random sample
131
+ self.current_sample = valid_samples.sample(n=1).iloc[0]
132
+
133
+ # Prepare sentences
134
+ prompt_sentences = self.current_sample['prompt_body'].split('_SEP_')
135
+ gen_sentences = self.current_sample['gen_body'].split('_SEP_')
136
+
137
+ # Combine and truncate to 10 sentences
138
+ combined_sentences = prompt_sentences + gen_sentences
139
+ self.current_sentences = combined_sentences[:10]
140
+
141
+ # Store true boundary
142
+ self.true_boundary_index = self.current_sample['true_boundary_index']
143
+
144
+ # Parse reasons from the dataset
145
+ try:
146
+ self.current_reasons = ast.literal_eval(self.current_sample['reason'])
147
+ except:
148
+ self.current_reasons = []
149
+
150
+ # Reset current guess
151
+ self.current_guess_index = None
152
+
153
+ def check_guess(self, guess_index):
154
+ """
155
+ Check if the guess is correct
156
+
157
+ :param guess_index: Index of the guessed boundary
158
+ :return: Points earned
159
+ """
160
+ self.current_guess_index = guess_index
161
+
162
+ # Calculate points based on closeness to true boundary
163
+ if guess_index == self.true_boundary_index:
164
+ return 5
165
+ elif guess_index > self.true_boundary_index:
166
+ return max(5 - (guess_index - self.true_boundary_index), 0)
167
+ else:
168
+ return 0
169
+
170
+ def validate_reason(self, user_reason):
171
+ """
172
+ Validate user's reason against dataset reasons
173
+
174
+ :param user_reason: Reason provided by user
175
+ :return: Tuple of (is_valid, matching_reasons)
176
+ """
177
+ # Convert user reason to lowercase for matching
178
+ user_reason_lower = user_reason.lower()
179
+
180
+ # Check against predefined reasons and current sample's reasons
181
+ matching_reasons = []
182
+
183
+ # Check predefined reasons
184
+ for reason in self.predefined_reasons:
185
+ if reason.lower() in user_reason_lower:
186
+ matching_reasons.append(reason)
187
+
188
+ # Check original sample's reasons
189
+ for orig_reason in self.current_reasons:
190
+ if orig_reason.lower() in user_reason_lower:
191
+ matching_reasons.append(orig_reason)
192
+
193
+ return len(matching_reasons) > 0, matching_reasons
194
+
195
+ def save_annotation(self, guess_index, reason, reason_validity):
196
+ """
197
+ Save annotation to a text file
198
+
199
+ :param guess_index: Index of the guessed boundary
200
+ :param reason: Reason for the guess
201
+ :param reason_validity: Validity of the reason
202
+ """
203
+ # Ensure logs directory exists
204
+ os.makedirs('logs', exist_ok=True)
205
+
206
+ # Generate unique filename with timestamp
207
+ timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
208
+ filename = f'logs/annotation_{timestamp}.txt'
209
+
210
+ # Prepare annotation details
211
+ annotation_details = [
212
+ f"Timestamp: {timestamp}",
213
+ f"Model: {self.current_sample['model']}",
214
+ f"Dataset: {self.current_sample['dataset']}",
215
+ f"Guess Index: {guess_index + 1}",
216
+ f"True Boundary Index: {self.true_boundary_index + 1}",
217
+ f"Original Dataset Reasons: {self.current_reasons}",
218
+ f"User Reason: {reason}",
219
+ f"Reason Validity: {reason_validity[0]}",
220
+ f"Matching Reasons: {reason_validity[1]}",
221
+ "\nFull Text:\n" + "\n".join(f"{i+1}. {sent}" for i, sent in enumerate(self.current_sentences))
222
+ ]
223
+
224
+ # Write to file
225
+ with open(filename, 'w') as f:
226
+ f.write("\n".join(annotation_details))
227
 
228
  def main():
 
229
  local_css()
230
 
231
  # Fancy title with animation
 
246
  </div>
247
  """, unsafe_allow_html=True)
248
 
249
+
250
  # Initialize game session state
251
  if 'game' not in st.session_state:
252
  st.session_state.game = RoFTGame('roft.csv')
 
261
  st.sidebar.markdown("## 🎮 Game Stats")
262
  st.sidebar.markdown(f"### 🏆 Total Points: {st.session_state.total_points}")
263
  st.sidebar.markdown(f"### 🎲 Rounds Played: {st.session_state.rounds_played}")
264
+
265
+ # Display sentences
266
+ st.subheader("Read the following text carefully:")
 
 
 
 
 
 
 
 
 
 
267
  for i, sentence in enumerate(st.session_state.game.current_sentences):
268
+ st.write(f"{i+1}. {sentence}")
 
 
 
 
269
 
270
+ # Boundary selection
 
271
  guess = st.radio(
272
  "Where do you think the AI-generated text begins?",
273
  options=[str(i+1) for i in range(len(st.session_state.game.current_sentences))]
274
  )
275
 
276
+ # Reason input with predefined options
277
+ st.subheader("Reason Selection")
278
  reason_options = st.session_state.game.predefined_reasons
279
  selected_predefined_reasons = st.multiselect(
280
+ "Select predefined reasons (you can also add custom text)",
281
  options=reason_options
282
  )
283
 
284
  # Custom reason input
285
+ custom_reason = st.text_area("Additional explanation (optional)")
286
 
287
  # Combine predefined and custom reasons
288
  full_reason = " ".join(selected_predefined_reasons)
289
  if custom_reason:
290
  full_reason += f" {custom_reason}"
291
 
292
+ # Guess submission
293
+ if st.button("Submit Guess"):
294
  if not full_reason.strip():
295
+ st.warning("Please provide a reason for your guess.")
296
  else:
297
+ # Convert guess to index (subtract 1 for 0-based indexing)
298
+ guess_index = int(guess) - 1
299
+
300
+ # Check guess and update points
301
+ points_earned = st.session_state.game.check_guess(guess_index)
302
+ st.session_state.total_points += points_earned
303
+ st.session_state.rounds_played += 1
304
+
305
+ # Validate reason
306
+ reason_validity = st.session_state.game.validate_reason(full_reason)
307
+
308
+ # Save annotation
309
+ st.session_state.game.save_annotation(guess_index, full_reason, reason_validity)
310
+
311
+ # Show results
312
+ st.subheader("Results")
313
+ st.write(f"Your Guess: Sentence {guess}")
314
+ st.write(f"Actual Boundary: Sentence {st.session_state.game.true_boundary_index + 1}")
315
+ st.write(f"Points Earned: {points_earned}")
316
+
317
+ # Display reason validation
318
+ st.write("Reason Validation:")
319
+ st.write(f"Valid Reason: {reason_validity[0]}")
320
+ if reason_validity[1]:
321
+ st.write("Matching Reasons:", ", ".join(reason_validity[1]))
322
+
323
+ # Option to continue
324
+ if st.button("Next Round"):
325
+ st.session_state.game.load_random_sample()
326
+ st.experimental_rerun()
327
+
328
  st.markdown("</div>", unsafe_allow_html=True)
329
 
330
+ # Optional: Show metadata for current sample
331
+ if st.checkbox("Show Sample Metadata"):
332
+ st.write("Current Sample Details:")
333
+ sample = st.session_state.game.current_sample
334
+ st.write(f"Model: {sample['model']}")
335
+ st.write(f"Dataset: {sample['dataset']}")
336
+ st.write(f"Sampling Strategy (p): {sample['dec_strat_value']}")
337
+ st.write(f"Original Reasons: {st.session_state.game.current_reasons}")
338
+
339
  if __name__ == "__main__":
340
+ main()