Spaces:

sepp81
/

knjdkjafk

Sleeping

App Files Community

sepp81 committed on Jan 3

Commit

6de7b7f

verified ·

1 Parent(s): ffc982a

Update app.py

Browse files

Files changed (1) hide show

app.py +49 -193

app.py CHANGED Viewed

@@ -11,7 +11,6 @@ def local_css():
     st.markdown("""
     <style>
     /* Global Styling */
     /* Game Container */
     .game-container {
@@ -20,19 +19,18 @@ def local_css():
         box-shadow: 0 4px 6px rgba(0,0,0,0.1);
         margin-bottom: 20px;
     }
     /* Sentences Styling */
     .sentence-container {
         border-left: 4px solid #3498db;
         padding: 10px;
         margin-bottom: 10px;
-        transition: all 0.3s ease;
     }
     .sentence-container:hover {
         transform: translateX(5px);
     }
     /* Buttons */
     .stButton>button {
         color: white;
@@ -41,46 +39,30 @@ def local_css():
         padding: 10px 20px;
         transition: all 0.3s ease;
     }
     .stButton>button:hover {
         transform: scale(1.05);
     }
     /* Radio Buttons */
     .stRadio>div {
         display: flex;
         flex-wrap: wrap;
         gap: 10px;
     }
     .stRadio>div>label {
         background-color: #ecf0f1;
         padding: 10px;
         border-radius: 10px;
         transition: all 0.3s ease;
     }
     .stRadio>div>label:hover {
         background-color: #3498db;
         color: white;
     }
     /* Sidebar */
     .css-1aumxhk {
         background-color: #2c3e50;
         color: white;
     }
-    /* Reason Validation */
-    .reason-valid {
-        color: #2ecc71;
-        font-weight: bold;
-    }
-    .reason-invalid {
-        color: #e74c3c;
-        font-weight: bold;
-    }
     </style>
     """, unsafe_allow_html=True)
@@ -88,7 +70,7 @@ class RoFTGame:
     def __init__(self, dataset_path):
         """
         Initialize the RoFT Game with the dataset
         :param dataset_path: Path to the roft.csv file
         """
         self.df = pd.read_csv(dataset_path)
@@ -96,15 +78,14 @@ class RoFTGame:
         self.current_sentences = None
         self.true_boundary_index = None
         self.current_guess_index = None
-        # Predefined reasons from the dataset description
         self.predefined_reasons = [
             "grammar",
-            "repetition",
-            "irrelevant",
-            "contradicts_sentence",
-            "contradicts_knowledge",
-            "common_sense",
-            "coreference",
             "generic"
         ]
@@ -112,46 +93,32 @@ class RoFTGame:
         """
         Load a random sample from the dataset
         """
-        # Filter for samples with valid generations and reasons
         valid_samples = self.df[
-            (self.df['gen_body'].notna()) &
-            (self.df['reason'].notna()) &
             (self.df['reason'] != '[]')
         ]
-        # Select a random sample
         self.current_sample = valid_samples.sample(n=1).iloc[0]
-        # Prepare sentences
         prompt_sentences = self.current_sample['prompt_body'].split('_SEP_')
         gen_sentences = self.current_sample['gen_body'].split('_SEP_')
-        # Combine and truncate to 10 sentences
         combined_sentences = prompt_sentences + gen_sentences
         self.current_sentences = combined_sentences[:10]
-        # Store true boundary
         self.true_boundary_index = self.current_sample['true_boundary_index']
-        # Parse reasons from the dataset
         try:
             self.current_reasons = ast.literal_eval(self.current_sample['reason'])
         except:
             self.current_reasons = []
-        # Reset current guess
         self.current_guess_index = None
     def check_guess(self, guess_index):
-        """
-        Check if the guess is correct
-        :param guess_index: Index of the guessed boundary
-        :return: Points earned
-        """
         self.current_guess_index = guess_index
-        # Calculate points based on closeness to true boundary
         if guess_index == self.true_boundary_index:
             return 5
         elif guess_index > self.true_boundary_index:
@@ -159,191 +126,80 @@ class RoFTGame:
         else:
             return 0
-    def validate_reason(self, user_reason):
-        """
-        Validate user's reason against dataset reasons
-        :param user_reason: Reason provided by user
-        :return: Tuple of (is_valid, matching_reasons)
-        """
-        # Convert user reason to lowercase for matching
-        user_reason_lower = user_reason.lower()
-        # Check against predefined reasons and current sample's reasons
-        matching_reasons = []
-        # Check predefined reasons
-        for reason in self.predefined_reasons:
-            if reason.lower() in user_reason_lower:
-                matching_reasons.append(reason)
-        # Check original sample's reasons
-        for orig_reason in self.current_reasons:
-            if orig_reason.lower() in user_reason_lower:
-                matching_reasons.append(orig_reason)
-        return len(matching_reasons) > 0, matching_reasons
-    def save_annotation(self, guess_index, reason, reason_validity):
-        """
-        Save annotation to a text file
-        :param guess_index: Index of the guessed boundary
-        :param reason: Reason for the guess
-        :param reason_validity: Validity of the reason
-        """
-        # Ensure logs directory exists
         os.makedirs('logs', exist_ok=True)
-        # Generate unique filename with timestamp
         timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
         filename = f'logs/annotation_{timestamp}.txt'
-        # Prepare annotation details
         annotation_details = [
             f"Timestamp: {timestamp}",
             f"Model: {self.current_sample['model']}",
             f"Dataset: {self.current_sample['dataset']}",
             f"Guess Index: {guess_index + 1}",
             f"True Boundary Index: {self.true_boundary_index + 1}",
-            f"Original Dataset Reasons: {self.current_reasons}",
-            f"User Reason: {reason}",
-            f"Reason Validity: {reason_validity[0]}",
-            f"Matching Reasons: {reason_validity[1]}",
-            "\nFull Text:\n" + "\n".join(f"{i+1}. {sent}" for i, sent in enumerate(self.current_sentences))
         ]
-        # Write to file
         with open(filename, 'w') as f:
             f.write("\n".join(annotation_details))
 def main():
     local_css()
-    # Fancy title with animation
     st.markdown("""
-    <h1 style='text-align: center; color: #2c3e50;
-    text-shadow: 2px 2px 4px rgba(0,0,0,0.3);
-    animation: fadeIn 2s;'>
     🕵️ Real or Fake Text Detective 🕵️‍♀️
     </h1>
     """, unsafe_allow_html=True)
-    # Game introduction
-    st.markdown("""
-    <div class='game-container'>
-    <p style='text-align: center; font-style: italic;'>
-    Sharpen your AI detection skills! Read carefully and identify where human writing transforms into machine-generated text.
-    </p>
-    </div>
-    """, unsafe_allow_html=True)
-    # Initialize game session state
     if 'game' not in st.session_state:
         st.session_state.game = RoFTGame('roft.csv')
         st.session_state.game.load_random_sample()
         st.session_state.total_points = 0
         st.session_state.rounds_played = 0
-    # Game container
-    st.markdown("<div class='game-container'>", unsafe_allow_html=True)
-    # Game information in sidebar with icons
     st.sidebar.markdown("## 🎮 Game Stats")
     st.sidebar.markdown(f"### 🏆 Total Points: {st.session_state.total_points}")
     st.sidebar.markdown(f"### 🎲 Rounds Played: {st.session_state.rounds_played}")
-        # Animated difficulty indicator
-    difficulty_map = {
-        'gpt2': '🟢 Easy',
-        'gpt2-xl': '🟠 Medium',
-        'ctrl': '🔴 Hard'
-    }
-    current_model = st.session_state.game.current_sample['model']
-    difficulty = difficulty_map.get(current_model, '⚪ Unknown')
-    st.sidebar.markdown(f"### 🎯 Difficulty: {difficulty}")
-    # Display sentences with enhanced styling
     st.subheader("🔍 Examine the Text Carefully")
     for i, sentence in enumerate(st.session_state.game.current_sentences):
-        st.markdown(f"""
-        <div class='sentence-container'>
-        <strong>{i+1}.</strong> {sentence}
-        </div>
-        """, unsafe_allow_html=True)
-    # Boundary selection with visual improvements
-    st.markdown("### 🚨 Detect AI Transition Point")
-    guess = st.radio(
-        "Where do you think the AI-generated text begins?",
-        options=[str(i+1) for i in range(len(st.session_state.game.current_sentences))]
-    )
-    # Reason input with predefined options and visual enhancements
-    st.markdown("### 🧐 Explain Your Reasoning")
-    reason_options = st.session_state.game.predefined_reasons
-    selected_predefined_reasons = st.multiselect(
-        "Select indicators of AI generation",
-        options=reason_options
-    )
-    # Custom reason input
-    custom_reason = st.text_area("Additional detective notes (optional)")
-    # Combine predefined and custom reasons
-    full_reason = " ".join(selected_predefined_reasons)
-    if custom_reason:
-        full_reason += f" {custom_reason}"
-    # Guess submission
     if st.button("Submit Guess"):
-        if not full_reason.strip():
-            st.warning("Please provide a reason for your guess.")
         else:
-            # Convert guess to index (subtract 1 for 0-based indexing)
-            guess_index = int(guess) - 1
-            # Check guess and update points
-            points_earned = st.session_state.game.check_guess(guess_index)
             st.session_state.total_points += points_earned
             st.session_state.rounds_played += 1
-            # Validate reason
-            reason_validity = st.session_state.game.validate_reason(full_reason)
-            # Save annotation
-            st.session_state.game.save_annotation(guess_index, full_reason, reason_validity)
-            # Show results
             st.subheader("Results")
-            st.write(f"Your Guess: Sentence {guess}")
             st.write(f"Actual Boundary: Sentence {st.session_state.game.true_boundary_index + 1}")
             st.write(f"Points Earned: {points_earned}")
-            # Display reason validation
-            st.write("Reason Validation:")
-            st.write(f"Valid Reason: {reason_validity[0]}")
-            if reason_validity[1]:
-                st.write("Matching Reasons:", ", ".join(reason_validity[1]))
-            # Option to continue
             if st.button("Next Round"):
                 st.session_state.game.load_random_sample()
                 st.experimental_rerun()
-    st.markdown("</div>", unsafe_allow_html=True)
-    # Optional: Show metadata for current sample
-    if st.checkbox("Show Sample Metadata"):
-        st.write("Current Sample Details:")
-        sample = st.session_state.game.current_sample
-        st.write(f"Model: {sample['model']}")
-        st.write(f"Dataset: {sample['dataset']}")
-        st.write(f"Sampling Strategy (p): {sample['dec_strat_value']}")
-        st.write(f"Original Reasons: {st.session_state.game.current_reasons}")
 if __name__ == "__main__":
     main()

     st.markdown("""
     <style>
     /* Global Styling */
     /* Game Container */
     .game-container {
         box-shadow: 0 4px 6px rgba(0,0,0,0.1);
         margin-bottom: 20px;
     }
     /* Sentences Styling */
     .sentence-container {
         border-left: 4px solid #3498db;
         padding: 10px;
         margin-bottom: 10px;
+        display: flex;
+        align-items: center;
+        justify-content: space-between;
     }
     .sentence-container:hover {
         transform: translateX(5px);
     }
     /* Buttons */
     .stButton>button {
         color: white;
         padding: 10px 20px;
         transition: all 0.3s ease;
     }
     .stButton>button:hover {
         transform: scale(1.05);
     }
     /* Radio Buttons */
     .stRadio>div {
         display: flex;
         flex-wrap: wrap;
         gap: 10px;
     }
     .stRadio>div>label {
         background-color: #ecf0f1;
         padding: 10px;
         border-radius: 10px;
         transition: all 0.3s ease;
     }
     .stRadio>div>label:hover {
         background-color: #3498db;
         color: white;
     }
     /* Sidebar */
     .css-1aumxhk {
         background-color: #2c3e50;
         color: white;
     }
     </style>
     """, unsafe_allow_html=True)
     def __init__(self, dataset_path):
         """
         Initialize the RoFT Game with the dataset
         :param dataset_path: Path to the roft.csv file
         """
         self.df = pd.read_csv(dataset_path)
         self.current_sentences = None
         self.true_boundary_index = None
         self.current_guess_index = None
         self.predefined_reasons = [
             "grammar",
+            "repetition",
+            "irrelevant",
+            "contradicts_sentence",
+            "contradicts_knowledge",
+            "common_sense",
+            "coreference",
             "generic"
         ]
         """
         Load a random sample from the dataset
         """
         valid_samples = self.df[
+            (self.df['gen_body'].notna()) &
+            (self.df['reason'].notna()) &
             (self.df['reason'] != '[]')
         ]
         self.current_sample = valid_samples.sample(n=1).iloc[0]
         prompt_sentences = self.current_sample['prompt_body'].split('_SEP_')
         gen_sentences = self.current_sample['gen_body'].split('_SEP_')
         combined_sentences = prompt_sentences + gen_sentences
         self.current_sentences = combined_sentences[:10]
         self.true_boundary_index = self.current_sample['true_boundary_index']
         try:
             self.current_reasons = ast.literal_eval(self.current_sample['reason'])
         except:
             self.current_reasons = []
         self.current_guess_index = None
     def check_guess(self, guess_index):
         self.current_guess_index = guess_index
         if guess_index == self.true_boundary_index:
             return 5
         elif guess_index > self.true_boundary_index:
         else:
             return 0
+    def save_annotation(self, guess_index, reason):
         os.makedirs('logs', exist_ok=True)
         timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
         filename = f'logs/annotation_{timestamp}.txt'
         annotation_details = [
             f"Timestamp: {timestamp}",
             f"Model: {self.current_sample['model']}",
             f"Dataset: {self.current_sample['dataset']}",
             f"Guess Index: {guess_index + 1}",
             f"True Boundary Index: {self.true_boundary_index + 1}",
+            f"User Reason: {reason}"
         ]
         with open(filename, 'w') as f:
             f.write("\n".join(annotation_details))
 def main():
     local_css()
     st.markdown("""
+    <h1 style='text-align: center; color: #2c3e50;'>
     🕵️ Real or Fake Text Detective 🕵️‍♀️
     </h1>
     """, unsafe_allow_html=True)
     if 'game' not in st.session_state:
         st.session_state.game = RoFTGame('roft.csv')
         st.session_state.game.load_random_sample()
         st.session_state.total_points = 0
         st.session_state.rounds_played = 0
     st.sidebar.markdown("## 🎮 Game Stats")
     st.sidebar.markdown(f"### 🏆 Total Points: {st.session_state.total_points}")
     st.sidebar.markdown(f"### 🎲 Rounds Played: {st.session_state.rounds_played}")
+    st.markdown("<div class='game-container'>", unsafe_allow_html=True)
     st.subheader("🔍 Examine the Text Carefully")
+    guess = None
     for i, sentence in enumerate(st.session_state.game.current_sentences):
+        col1, col2 = st.columns([9, 1])
+        with col1:
+            st.markdown(f"<div class='sentence-container'><strong>{i+1}.</strong> {sentence}</div>", unsafe_allow_html=True)
+        with col2:
+            if st.radio("", ["", str(i + 1)], key=f"guess_{i}"):
+                guess = i
     if st.button("Submit Guess"):
+        if guess is None:
+            st.warning("Please select where the AI-generated text begins.")
         else:
+            points_earned = st.session_state.game.check_guess(guess)
             st.session_state.total_points += points_earned
             st.session_state.rounds_played += 1
             st.subheader("Results")
+            st.write(f"Your Guess: Sentence {guess + 1}")
             st.write(f"Actual Boundary: Sentence {st.session_state.game.true_boundary_index + 1}")
             st.write(f"Points Earned: {points_earned}")
+            if points_earned > 0:
+                reason = st.text_area("Explain Your Reason")
+                if reason:
+                    st.session_state.game.save_annotation(guess, reason)
+                    st.success("Reason saved successfully.")
+            else:
+                st.info("You didn't get the boundary right. Try again in the next round!")
             if st.button("Next Round"):
                 st.session_state.game.load_random_sample()
                 st.experimental_rerun()
+    st.markdown("</div>", unsafe_allow_html=True)
 if __name__ == "__main__":
     main()