Spaces:

tsrivallabh
/

LLM-Powered-Fact-Checker

Sleeping

File size: 9,680 Bytes

import streamlit as st
from fact_checker import FactChecker
from openai import OpenAI
import os
from dotenv import load_dotenv
import csv
from datetime import datetime
import pandas as pd
import random

load_dotenv()

def store_feedback_csv(claim, result, feedback, csv_file="data/feedback_log.csv"):
    now = datetime.now().strftime("%Y-%m-%d %H:%M:%S")
    row = [
        now,
        claim,
        result.get("verdict", ""),
        result.get("confidence", ""),
        "|".join(result.get("evidence", [])),
        result.get("reasoning", ""),
        feedback
    ]
    header = ["datetime", "claim", "verdict", "confidence", "evidence", "reasoning", "feedback"]
    
    # Create file if it doesn't exist
    if not os.path.exists(csv_file):
        with open(csv_file, "w", newline='', encoding="utf-8") as f:
            writer = csv.writer(f)
            writer.writerow(header)
    
    # Append to existing file
    with open(csv_file, "a", newline='', encoding="utf-8") as f:
        writer = csv.writer(f)
        writer.writerow(row)

def initialize_services():
    return FactChecker(
        chroma_path="app/chroma_db",
        collection_name="pib_titles",
        groq_client=OpenAI(
            api_key=os.getenv("GROQ_API_KEY"),
            base_url="https://api.groq.com/openai/v1"
        )
    )

def main():
    # Add sticky title using HTML and CSS
    st.markdown("""
<style>
.sticky-title {
    position: sticky;
    top: 0;
    z-index: 999;
    background: white;
    padding-top: 1rem;
    padding-bottom: 1rem;
    margin-bottom: 1rem;
    border-bottom: 2px solid #f0f0f0;
}
</style>
<div class="sticky-title">
    <h1>🔍 Fact Checker</h1>
</div>
""", unsafe_allow_html=True)
    checker = initialize_services()

    # Initialize session state variables
    if "feedback_submitted" not in st.session_state:
        st.session_state.feedback_submitted = False
    if "last_claim" not in st.session_state:
        st.session_state.last_claim = ""
    if "result" not in st.session_state:
        st.session_state.result = None

    # --- Custom CSS for wider columns and better visuals ---
    st.markdown("""
<style>
/* Reduce max-width and remove side paddings/margins for full width */
.block-container {
    padding-top: 1rem;
    padding-bottom: 1rem;
    max-width: 100% !important;
    padding-left: 1rem !important;
    padding-right: 1rem !important;
     text-align: center;
}

/* Remove default margins on main content to reduce gaps */
main > div {
    margin-left: 0 !important;
    margin-right: 0 !important;
}

/* Stretch columns fully */
.css-1kyxreq, .css-1r6slb0 {
    width: 100% !important;
}

/* Style the DataFrame container for full width */
.stDataFrame {
    background: #f9f9f9 !important;
    border-radius: 12px;
    border: 1px solid #e0e0e0;
    padding: 0.5rem;
    width: 100% !important;
}

/* Style input area */
textarea, input[type="text"] {
    border: 2px solid #4CAF50 !important;
    border-radius: 6px !important;
    font-size: 1.1rem !important;
    background: #f4f8fc !important;
    width: 100% !important;
}

/* Style buttons */
button[kind="primary"] {
    background: #4CAF50 !important;
    color: white !important;
    border-radius: 6px !important;
    font-weight: bold !important;
}

/* Style scrollbars for DataFrame */
::-webkit-scrollbar {
    width: 8px;
    background: #f0f0f0;
}
::-webkit-scrollbar-thumb {
    background: #bdbdbd;
    border-radius: 4px;
}
</style>
""", unsafe_allow_html=True)


    # --- Layout ---
    spacer_col, left_col, right_col ,right_space= st.columns([1,9, 7,1], gap="large")

    with left_col:
        claim = st.text_area("Enter a claim to verify:", height=150)
        confidence_threshold = st.slider("Confidence Threshold", 0.0, 1.0, 0.5, 0.05)

        if st.button("Verify Claim"):
            if not claim.strip():
                st.error("Please enter a claim to verify")
                return

            with st.spinner("Analyzing..."):
                # Store result in session state
                st.session_state.result = checker.verify_claim(claim, confidence_threshold)
                st.session_state.last_claim = claim
                st.session_state.feedback_submitted = False  # Reset feedback state for new claim

            # Display results from session state
            if st.session_state.result:
                result = st.session_state.result

                # Show entity verification results
                st.subheader("Entity Verification Results")
                entities = result.get("entities", [])
                if entities:
                    for idx, entity_result in enumerate(entities, 1):
                        st.markdown(f"### Entity {idx}: {entity_result.get('entity', '')} ({entity_result.get('type', '')})")

                        if "error" in entity_result:
                            st.error(f"Error: {entity_result['error']}")
                            if "raw_response" in entity_result:
                                with st.expander("Show raw LLM response"):
                                    st.code(entity_result["raw_response"])
                            continue

                        verdict_color = {
                            "Valid": "green",
                            "Invalid": "red",
                            "Unverified": "orange"
                        }.get(entity_result.get("verdict", ""), "gray")
                        st.markdown(f"**Verdict:** :{verdict_color}[{entity_result.get('verdict', 'Unknown')}]")

                        # Confidence
                        st.metric("Confidence Score", f"{entity_result.get('confidence', 0):.2f}")

                        # Evidence
                        with st.expander("View Supporting Evidence"):
                            for i, evidence in enumerate(entity_result.get("evidence", []), 1):
                                st.markdown(f"{i}. {evidence}")

                        # Reasoning
                        st.markdown("**Analysis:**")
                        st.write(entity_result.get("reasoning", "No reasoning provided"))
                else:
                    st.write("No entities detected or verified.")

                # Show claim verification results
                st.subheader("Detected Claims and Verification Results")
                claims = result.get("claims", [])
                if not claims:
                    st.info("No check-worthy claims detected in the input.")
                else:
                    for idx, claim_result in enumerate(claims, 1):
                        st.markdown(f"### Claim {idx}")
                        st.markdown(f"> {claim_result.get('claim', '')}")

                        if "error" in claim_result:
                            st.error(f"Error: {claim_result['error']}")
                            if "raw_response" in claim_result:
                                with st.expander("Show raw LLM response"):
                                    st.code(claim_result["raw_response"])
                            continue

                        verdict_color = {
                            "True": "green",
                            "False": "red",
                            "Unverifiable": "orange"
                        }.get(claim_result.get("verdict", ""), "gray")
                        st.markdown(f"**Verdict:** :{verdict_color}[{claim_result.get('verdict', 'Unknown')}]")

                        # Confidence
                        st.metric("Confidence Score", f"{claim_result.get('confidence', 0):.2f}")

                        # Evidence
                        with st.expander("View Supporting Evidence"):
                            for i, evidence in enumerate(claim_result.get("evidence", []), 1):
                                st.markdown(f"{i}. {evidence}")

                        # Reasoning
                        st.markdown("**Analysis:**")
                        st.write(claim_result.get("reasoning", "No reasoning provided"))


            # Feedback system
            feedback_key = f"feedback_radio_{st.session_state.last_claim}"
            if not st.session_state.feedback_submitted:
                feedback = st.radio(
                    "Was this analysis helpful?",
                    ["", "👍 Yes", "👎 No"],
                    horizontal=True,
                    key=feedback_key
                )
                
                if feedback:
                    store_feedback_csv(st.session_state.last_claim, result, feedback)
                    st.session_state.feedback_submitted = True
                    st.rerun()  # Use st.rerun() instead of experimental_rerun()
            else:
                st.success("Thank you for your feedback! Your input helps improve the system.")

    with right_col:
        
        st.markdown("### 📋 All Claims")
        try:
            df = pd.read_csv("data/pib_titles.csv")["title"].to_frame()
            if not df.empty:
                st.markdown("""
<style>
.scrollable-cell {
    overflow-x: auto;
    white-space: nowrap;
    max-width: 100%;
    border: 1px solid #eee;
    padding: 6px 8px;
    font-family: monospace;
    background: #fafafa;
}
</style>
""", unsafe_allow_html=True)

            

            # Render each row as a scrollable div
            for idx, row in df.iterrows():
                st.markdown(
                    f'<div class="scrollable-cell">{row["title"]}</div>',
                    unsafe_allow_html=True
    )
        except Exception as e:
            st.warning(f"Unable to display full dataset: {e}")
    


if __name__ == "__main__":
    main()