import streamlit as st import pandas as pd import numpy as np import random import os from datetime import datetime import ast # Custom CSS for enhanced styling def local_css(): st.markdown(""" """, unsafe_allow_html=True) class RoFTGame: def __init__(self, dataset_path): """ Initialize the RoFT Game with the dataset :param dataset_path: Path to the roft.csv file """ self.df = pd.read_csv(dataset_path) self.current_sample = None self.current_sentences = None self.true_boundary_index = None self.current_guess_index = None # Predefined reasons from the dataset description self.predefined_reasons = [ "grammar", "repetition", "irrelevant", "contradicts_sentence", "contradicts_knowledge", "common_sense", "coreference", "generic" ] def load_random_sample(self): """ Load a random sample from the dataset """ # Filter for samples with valid generations and reasons valid_samples = self.df[ (self.df['gen_body'].notna()) & (self.df['reason'].notna()) & (self.df['reason'] != '[]') ] # Select a random sample self.current_sample = valid_samples.sample(n=1).iloc[0] # Prepare sentences prompt_sentences = self.current_sample['prompt_body'].split('_SEP_') gen_sentences = self.current_sample['gen_body'].split('_SEP_') # Combine and truncate to 10 sentences combined_sentences = prompt_sentences + gen_sentences self.current_sentences = combined_sentences[:10] # Store true boundary self.true_boundary_index = self.current_sample['true_boundary_index'] # Parse reasons from the dataset try: self.current_reasons = ast.literal_eval(self.current_sample['reason']) except: self.current_reasons = [] # Reset current guess self.current_guess_index = None def check_guess(self, guess_index): """ Check if the guess is correct :param guess_index: Index of the guessed boundary :return: Points earned """ self.current_guess_index = guess_index # Calculate points based on closeness to true boundary if guess_index == self.true_boundary_index: return 5 elif guess_index > self.true_boundary_index: return max(5 - (guess_index - self.true_boundary_index), 0) else: return 0 def validate_reason(self, user_reason): """ Validate user's reason against dataset reasons :param user_reason: Reason provided by user :return: Tuple of (is_valid, matching_reasons) """ # Convert user reason to lowercase for matching user_reason_lower = user_reason.lower() # Check against predefined reasons and current sample's reasons matching_reasons = [] # Check predefined reasons for reason in self.predefined_reasons: if reason.lower() in user_reason_lower: matching_reasons.append(reason) # Check original sample's reasons for orig_reason in self.current_reasons: if orig_reason.lower() in user_reason_lower: matching_reasons.append(orig_reason) return len(matching_reasons) > 0, matching_reasons def save_annotation(self, guess_index, reason, reason_validity): """ Save annotation to a text file :param guess_index: Index of the guessed boundary :param reason: Reason for the guess :param reason_validity: Validity of the reason """ # Ensure logs directory exists os.makedirs('logs', exist_ok=True) # Generate unique filename with timestamp timestamp = datetime.now().strftime("%Y%m%d_%H%M%S") filename = f'logs/annotation_{timestamp}.txt' # Prepare annotation details annotation_details = [ f"Timestamp: {timestamp}", f"Model: {self.current_sample['model']}", f"Dataset: {self.current_sample['dataset']}", f"Guess Index: {guess_index + 1}", f"True Boundary Index: {self.true_boundary_index + 1}", f"Original Dataset Reasons: {self.current_reasons}", f"User Reason: {reason}", f"Reason Validity: {reason_validity[0]}", f"Matching Reasons: {reason_validity[1]}", "\nFull Text:\n" + "\n".join(f"{i+1}. {sent}" for i, sent in enumerate(self.current_sentences)) ] # Write to file with open(filename, 'w') as f: f.write("\n".join(annotation_details)) def main(): local_css() # Fancy title with animation st.markdown("""

🕵️ Real or Fake Text Detective 🕵️‍♀️

""", unsafe_allow_html=True) # Game introduction st.markdown("""

Sharpen your AI detection skills! Read carefully and identify where human writing transforms into machine-generated text.

""", unsafe_allow_html=True) # Initialize game session state if 'game' not in st.session_state: st.session_state.game = RoFTGame('roft.csv') st.session_state.game.load_random_sample() st.session_state.total_points = 0 st.session_state.rounds_played = 0 # Game container st.markdown("

", unsafe_allow_html=True) # Game information in sidebar with icons st.sidebar.markdown("## 🎮 Game Stats") st.sidebar.markdown(f"### 🏆 Total Points: {st.session_state.total_points}") st.sidebar.markdown(f"### 🎲 Rounds Played: {st.session_state.rounds_played}") # Animated difficulty indicator difficulty_map = { 'gpt2': '🟢 Easy', 'gpt2-xl': '🟠 Medium', 'ctrl': '🔴 Hard' } current_model = st.session_state.game.current_sample['model'] difficulty = difficulty_map.get(current_model, '⚪ Unknown') st.sidebar.markdown(f"### 🎯 Difficulty: {difficulty}") # Display sentences with enhanced styling and radio buttons st.subheader("🔍 Examine the Text Carefully") selected_guess = st.radio( "Where do you think the AI-generated text begins?", options=[f"{i+1}. {sentence}" for i, sentence in enumerate(st.session_state.game.current_sentences)], label_visibility="collapsed" ) # Reason input with predefined options and visual enhancements st.markdown("### 🧐 Explain Your Reasoning") reason_options = st.session_state.game.predefined_reasons selected_predefined_reasons = st.multiselect( "Select indicators of AI generation", options=reason_options ) # Custom reason input custom_reason = st.text_area("Additional detective notes (optional)") # Combine predefined and custom reasons full_reason = " ".join(selected_predefined_reasons) if custom_reason: full_reason += f" {custom_reason}" # Guess submission if st.button("Submit Guess"): if not full_reason.strip(): st.warning("Please provide a reason for your guess.") else: # Convert guess to index (subtract 1 for 0-based indexing) guess_index = int(selected_guess.split('.')[0]) - 1 # Check guess and update points points_earned = st.session_state.game.check_guess(guess_index) st.session_state.total_points += points_earned st.session_state.rounds_played += 1 # If guess is correct, validate reason if guess_index == st.session_state.game.true_boundary_index: reason_validity = st.session_state.game.validate_reason(full_reason) st.subheader("Results") st.write(f"Your Guess: Sentence {selected_guess}") st.write(f"Actual Boundary: Sentence {st.session_state.game.true_boundary_index + 1}") st.write(f"Points Earned: {points_earned}") # Display reason validation st.write("Reason Validation:") st.write(f"Valid Reason: {reason_validity[0]}") if reason_validity[1]: st.write("Matching Reasons:", ", ".join(reason_validity[1])) # Save annotation st.session_state.game.save_annotation(guess_index, full_reason, reason_validity) else: st.subheader("Results") st.write(f"Your Guess: Sentence {selected_guess}") st.write(f"Actual Boundary: Sentence {st.session_state.game.true_boundary_index + 1}") st.write(f"Points Earned: {points_earned}") # Option to continue if st.button("Next Round"): st.session_state.game.load_random_sample() st.experimental_rerun() st.markdown("

", unsafe_allow_html=True) # Optional: Show metadata for current sample if st.checkbox("Show Sample Metadata"): st.write("Current Sample Details:") sample = st.session_state.game.current_sample st.write(f"Model: {sample['model']}") st.write(f"Dataset: {sample['dataset']}") st.write(f"Sampling Strategy (p): {sample['dec_strat_value']}") st.write(f"Original Reasons: {st.session_state.game.current_reasons}") if __name__ == "__main__": main()