Spaces:

sepp81
/

knjdkjafk

Sleeping

App Files Files Community

sepp81 commited on Jan 3

Commit

279a22c

verified ·

1 Parent(s): 6de7b7f

Update app.py

Browse files

Files changed (1) hide show

app.py +182 -51

app.py CHANGED Viewed

@@ -11,7 +11,7 @@ def local_css():
     st.markdown("""
     <style>
     /* Global Styling */
     /* Game Container */
     .game-container {
         border-radius: 15px;
@@ -21,12 +21,12 @@ def local_css():
     }
     /* Sentences Styling */
     .sentence-container {
         border-left: 4px solid #3498db;
         padding: 10px;
         margin-bottom: 10px;
-        display: flex;
-        align-items: center;
-        justify-content: space-between;
     }
     .sentence-container:hover {
         transform: translateX(5px);
@@ -63,6 +63,15 @@ def local_css():
         background-color: #2c3e50;
         color: white;
     }
     </style>
     """, unsafe_allow_html=True)
@@ -70,7 +79,7 @@ class RoFTGame:
     def __init__(self, dataset_path):
         """
         Initialize the RoFT Game with the dataset
         :param dataset_path: Path to the roft.csv file
         """
         self.df = pd.read_csv(dataset_path)
@@ -78,14 +87,15 @@ class RoFTGame:
         self.current_sentences = None
         self.true_boundary_index = None
         self.current_guess_index = None
         self.predefined_reasons = [
             "grammar",
-            "repetition",
-            "irrelevant",
-            "contradicts_sentence",
-            "contradicts_knowledge",
-            "common_sense",
-            "coreference",
             "generic"
         ]
@@ -93,32 +103,46 @@ class RoFTGame:
         """
         Load a random sample from the dataset
         """
         valid_samples = self.df[
-            (self.df['gen_body'].notna()) &
-            (self.df['reason'].notna()) &
             (self.df['reason'] != '[]')
         ]
         self.current_sample = valid_samples.sample(n=1).iloc[0]
         prompt_sentences = self.current_sample['prompt_body'].split('_SEP_')
         gen_sentences = self.current_sample['gen_body'].split('_SEP_')
         combined_sentences = prompt_sentences + gen_sentences
         self.current_sentences = combined_sentences[:10]
         self.true_boundary_index = self.current_sample['true_boundary_index']
         try:
             self.current_reasons = ast.literal_eval(self.current_sample['reason'])
         except:
             self.current_reasons = []
         self.current_guess_index = None
     def check_guess(self, guess_index):
         self.current_guess_index = guess_index
         if guess_index == self.true_boundary_index:
             return 5
         elif guess_index > self.true_boundary_index:
@@ -126,80 +150,187 @@ class RoFTGame:
         else:
             return 0
-    def save_annotation(self, guess_index, reason):
         os.makedirs('logs', exist_ok=True)
         timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
         filename = f'logs/annotation_{timestamp}.txt'
         annotation_details = [
             f"Timestamp: {timestamp}",
             f"Model: {self.current_sample['model']}",
             f"Dataset: {self.current_sample['dataset']}",
             f"Guess Index: {guess_index + 1}",
             f"True Boundary Index: {self.true_boundary_index + 1}",
-            f"User Reason: {reason}"
         ]
         with open(filename, 'w') as f:
             f.write("\n".join(annotation_details))
 def main():
     local_css()
     st.markdown("""
-    <h1 style='text-align: center; color: #2c3e50;'>
     🕵️ Real or Fake Text Detective 🕵️‍♀️
     </h1>
     """, unsafe_allow_html=True)
     if 'game' not in st.session_state:
         st.session_state.game = RoFTGame('roft.csv')
         st.session_state.game.load_random_sample()
         st.session_state.total_points = 0
         st.session_state.rounds_played = 0
     st.sidebar.markdown("## 🎮 Game Stats")
     st.sidebar.markdown(f"### 🏆 Total Points: {st.session_state.total_points}")
     st.sidebar.markdown(f"### 🎲 Rounds Played: {st.session_state.rounds_played}")
-    st.markdown("<div class='game-container'>", unsafe_allow_html=True)
     st.subheader("🔍 Examine the Text Carefully")
-    guess = None
-    for i, sentence in enumerate(st.session_state.game.current_sentences):
-        col1, col2 = st.columns([9, 1])
-        with col1:
-            st.markdown(f"<div class='sentence-container'><strong>{i+1}.</strong> {sentence}</div>", unsafe_allow_html=True)
-        with col2:
-            if st.radio("", ["", str(i + 1)], key=f"guess_{i}"):
-                guess = i
     if st.button("Submit Guess"):
-        if guess is None:
-            st.warning("Please select where the AI-generated text begins.")
         else:
-            points_earned = st.session_state.game.check_guess(guess)
             st.session_state.total_points += points_earned
             st.session_state.rounds_played += 1
-            st.subheader("Results")
-            st.write(f"Your Guess: Sentence {guess + 1}")
-            st.write(f"Actual Boundary: Sentence {st.session_state.game.true_boundary_index + 1}")
-            st.write(f"Points Earned: {points_earned}")
-            if points_earned > 0:
-                reason = st.text_area("Explain Your Reason")
-                if reason:
-                    st.session_state.game.save_annotation(guess, reason)
-                    st.success("Reason saved successfully.")
             else:
-                st.info("You didn't get the boundary right. Try again in the next round!")
             if st.button("Next Round"):
                 st.session_state.game.load_random_sample()
                 st.experimental_rerun()
     st.markdown("</div>", unsafe_allow_html=True)
 if __name__ == "__main__":
     main()

     st.markdown("""
     <style>
     /* Global Styling */
     /* Game Container */
     .game-container {
         border-radius: 15px;
     }
     /* Sentences Styling */
     .sentence-container {
+        display: flex;
+        align-items: center;
         border-left: 4px solid #3498db;
         padding: 10px;
         margin-bottom: 10px;
+        transition: all 0.3s ease;
     }
     .sentence-container:hover {
         transform: translateX(5px);
         background-color: #2c3e50;
         color: white;
     }
+    /* Reason Validation */
+    .reason-valid {
+        color: #2ecc71;
+        font-weight: bold;
+    }
+    .reason-invalid {
+        color: #e74c3c;
+        font-weight: bold;
+    }
     </style>
     """, unsafe_allow_html=True)
     def __init__(self, dataset_path):
         """
         Initialize the RoFT Game with the dataset
         :param dataset_path: Path to the roft.csv file
         """
         self.df = pd.read_csv(dataset_path)
         self.current_sentences = None
         self.true_boundary_index = None
         self.current_guess_index = None
+        # Predefined reasons from the dataset description
         self.predefined_reasons = [
             "grammar",
+            "repetition",
+            "irrelevant",
+            "contradicts_sentence",
+            "contradicts_knowledge",
+            "common_sense",
+            "coreference",
             "generic"
         ]
         """
         Load a random sample from the dataset
         """
+        # Filter for samples with valid generations and reasons
         valid_samples = self.df[
+            (self.df['gen_body'].notna()) &
+            (self.df['reason'].notna()) &
             (self.df['reason'] != '[]')
         ]
+        # Select a random sample
         self.current_sample = valid_samples.sample(n=1).iloc[0]
+        # Prepare sentences
         prompt_sentences = self.current_sample['prompt_body'].split('_SEP_')
         gen_sentences = self.current_sample['gen_body'].split('_SEP_')
+        # Combine and truncate to 10 sentences
         combined_sentences = prompt_sentences + gen_sentences
         self.current_sentences = combined_sentences[:10]
+        # Store true boundary
         self.true_boundary_index = self.current_sample['true_boundary_index']
+        # Parse reasons from the dataset
         try:
             self.current_reasons = ast.literal_eval(self.current_sample['reason'])
         except:
             self.current_reasons = []
+        # Reset current guess
         self.current_guess_index = None
     def check_guess(self, guess_index):
+        """
+        Check if the guess is correct
+        :param guess_index: Index of the guessed boundary
+        :return: Points earned
+        """
         self.current_guess_index = guess_index
+        # Calculate points based on closeness to true boundary
         if guess_index == self.true_boundary_index:
             return 5
         elif guess_index > self.true_boundary_index:
         else:
             return 0
+    def validate_reason(self, user_reason):
+        """
+        Validate user's reason against dataset reasons
+        :param user_reason: Reason provided by user
+        :return: Tuple of (is_valid, matching_reasons)
+        """
+        # Convert user reason to lowercase for matching
+        user_reason_lower = user_reason.lower()
+        # Check against predefined reasons and current sample's reasons
+        matching_reasons = []
+        # Check predefined reasons
+        for reason in self.predefined_reasons:
+            if reason.lower() in user_reason_lower:
+                matching_reasons.append(reason)
+        # Check original sample's reasons
+        for orig_reason in self.current_reasons:
+            if orig_reason.lower() in user_reason_lower:
+                matching_reasons.append(orig_reason)
+        return len(matching_reasons) > 0, matching_reasons
+    def save_annotation(self, guess_index, reason, reason_validity):
+        """
+        Save annotation to a text file
+        :param guess_index: Index of the guessed boundary
+        :param reason: Reason for the guess
+        :param reason_validity: Validity of the reason
+        """
+        # Ensure logs directory exists
         os.makedirs('logs', exist_ok=True)
+        # Generate unique filename with timestamp
         timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
         filename = f'logs/annotation_{timestamp}.txt'
+        # Prepare annotation details
         annotation_details = [
             f"Timestamp: {timestamp}",
             f"Model: {self.current_sample['model']}",
             f"Dataset: {self.current_sample['dataset']}",
             f"Guess Index: {guess_index + 1}",
             f"True Boundary Index: {self.true_boundary_index + 1}",
+            f"Original Dataset Reasons: {self.current_reasons}",
+            f"User Reason: {reason}",
+            f"Reason Validity: {reason_validity[0]}",
+            f"Matching Reasons: {reason_validity[1]}",
+            "\nFull Text:\n" + "\n".join(f"{i+1}. {sent}" for i, sent in enumerate(self.current_sentences))
         ]
+        # Write to file
         with open(filename, 'w') as f:
             f.write("\n".join(annotation_details))
 def main():
     local_css()
+    # Fancy title with animation
     st.markdown("""
+    <h1 style='text-align: center; color: #2c3e50;
+    text-shadow: 2px 2px 4px rgba(0,0,0,0.3);
+    animation: fadeIn 2s;'>
     🕵️ Real or Fake Text Detective 🕵️‍♀️
     </h1>
     """, unsafe_allow_html=True)
+    # Game introduction
+    st.markdown("""
+    <div class='game-container'>
+    <p style='text-align: center; font-style: italic;'>
+    Sharpen your AI detection skills! Read carefully and identify where human writing transforms into machine-generated text.
+    </p>
+    </div>
+    """, unsafe_allow_html=True)
+    # Initialize game session state
     if 'game' not in st.session_state:
         st.session_state.game = RoFTGame('roft.csv')
         st.session_state.game.load_random_sample()
         st.session_state.total_points = 0
         st.session_state.rounds_played = 0
+    # Game container
+    st.markdown("<div class='game-container'>", unsafe_allow_html=True)
+    # Game information in sidebar with icons
     st.sidebar.markdown("## 🎮 Game Stats")
     st.sidebar.markdown(f"### 🏆 Total Points: {st.session_state.total_points}")
     st.sidebar.markdown(f"### 🎲 Rounds Played: {st.session_state.rounds_played}")
+        # Animated difficulty indicator
+    difficulty_map = {
+        'gpt2': '🟢 Easy',
+        'gpt2-xl': '🟠 Medium',
+        'ctrl': '🔴 Hard'
+    }
+    current_model = st.session_state.game.current_sample['model']
+    difficulty = difficulty_map.get(current_model, '⚪ Unknown')
+    st.sidebar.markdown(f"### 🎯 Difficulty: {difficulty}")
+    # Display sentences with enhanced styling and radio buttons
     st.subheader("🔍 Examine the Text Carefully")
+    selected_guess = st.radio(
+        "Where do you think the AI-generated text begins?",
+        options=[f"{i+1}. {sentence}" for i, sentence in enumerate(st.session_state.game.current_sentences)],
+        label_visibility="collapsed"
+    )
+    # Reason input with predefined options and visual enhancements
+    st.markdown("### 🧐 Explain Your Reasoning")
+    reason_options = st.session_state.game.predefined_reasons
+    selected_predefined_reasons = st.multiselect(
+        "Select indicators of AI generation",
+        options=reason_options
+    )
+    # Custom reason input
+    custom_reason = st.text_area("Additional detective notes (optional)")
+    # Combine predefined and custom reasons
+    full_reason = " ".join(selected_predefined_reasons)
+    if custom_reason:
+        full_reason += f" {custom_reason}"
+    # Guess submission
     if st.button("Submit Guess"):
+        if not full_reason.strip():
+            st.warning("Please provide a reason for your guess.")
         else:
+            # Convert guess to index (subtract 1 for 0-based indexing)
+            guess_index = int(selected_guess.split('.')[0]) - 1
+            # Check guess and update points
+            points_earned = st.session_state.game.check_guess(guess_index)
             st.session_state.total_points += points_earned
             st.session_state.rounds_played += 1
+            # If guess is correct, validate reason
+            if guess_index == st.session_state.game.true_boundary_index:
+                reason_validity = st.session_state.game.validate_reason(full_reason)
+                st.subheader("Results")
+                st.write(f"Your Guess: Sentence {selected_guess}")
+                st.write(f"Actual Boundary: Sentence {st.session_state.game.true_boundary_index + 1}")
+                st.write(f"Points Earned: {points_earned}")
+                # Display reason validation
+                st.write("Reason Validation:")
+                st.write(f"Valid Reason: {reason_validity[0]}")
+                if reason_validity[1]:
+                    st.write("Matching Reasons:", ", ".join(reason_validity[1]))
+                # Save annotation
+                st.session_state.game.save_annotation(guess_index, full_reason, reason_validity)
             else:
+                st.subheader("Results")
+                st.write(f"Your Guess: Sentence {selected_guess}")
+                st.write(f"Actual Boundary: Sentence {st.session_state.game.true_boundary_index + 1}")
+                st.write(f"Points Earned: {points_earned}")
+            # Option to continue
             if st.button("Next Round"):
                 st.session_state.game.load_random_sample()
                 st.experimental_rerun()
     st.markdown("</div>", unsafe_allow_html=True)
+    # Optional: Show metadata for current sample
+    if st.checkbox("Show Sample Metadata"):
+        st.write("Current Sample Details:")
+        sample = st.session_state.game.current_sample
+        st.write(f"Model: {sample['model']}")
+        st.write(f"Dataset: {sample['dataset']}")
+        st.write(f"Sampling Strategy (p): {sample['dec_strat_value']}")
+        st.write(f"Original Reasons: {st.session_state.game.current_reasons}")
 if __name__ == "__main__":
     main()