Spaces:

Nugh75
/

Edurag_beta

Sleeping

App Files Files Community

Nugh75 committed on Jan 2

Commit

59310ba

1 Parent(s): ff94340

update ristrutturazione app.py

Browse files

Files changed (31) hide show

.gitattributes +0 -35
.gitignore +0 -51
.gradio/certificate.pem +0 -31
README.md +0 -12
Structure.txt +0 -8
app.py +0 -342
app/__init__.py +0 -0
app/__pycache__/__init__.cpython-310.pyc +0 -0
app/__pycache__/config.cpython-310.pyc +0 -0
app/__pycache__/document_handling.cpython-310.pyc +0 -0
app/__pycache__/llm_handling.cpython-310.pyc +0 -0
app/__pycache__/logging_config.cpython-310.pyc +0 -0
app/app.py +0 -0
app/config.py +0 -10
app/document_handling.py +0 -320
app/import pytest.py +0 -58
app/llm_handling.py +0 -118
app/llm_handling_2.py +0 -34
app/llm_handling_3.py +0 -76
app/logging_config.py +0 -12
app/test_llm_handling.py +0 -30
app_1.py +0 -275
faiss_index/index.faiss +0 -0
faiss_index/index.pkl +0 -3
faiss_index_E-learning/index.faiss +0 -0
faiss_index_E-learning/index.pkl +0 -3
faiss_index_E-learning/metadata.json +0 -16
faiss_index_default_db/index.faiss +0 -0
faiss_index_default_db/index.pkl +0 -3
rag_chatbot.log +0 -39
requirements.txt +0 -150

.gitattributes DELETED Viewed

@@ -1,35 +0,0 @@
-*.7z filter=lfs diff=lfs merge=lfs -text
-*.arrow filter=lfs diff=lfs merge=lfs -text
-*.bin filter=lfs diff=lfs merge=lfs -text
-*.bz2 filter=lfs diff=lfs merge=lfs -text
-*.ckpt filter=lfs diff=lfs merge=lfs -text
-*.ftz filter=lfs diff=lfs merge=lfs -text
-*.gz filter=lfs diff=lfs merge=lfs -text
-*.h5 filter=lfs diff=lfs merge=lfs -text
-*.joblib filter=lfs diff=lfs merge=lfs -text
-*.lfs.* filter=lfs diff=lfs merge=lfs -text
-*.mlmodel filter=lfs diff=lfs merge=lfs -text
-*.model filter=lfs diff=lfs merge=lfs -text
-*.msgpack filter=lfs diff=lfs merge=lfs -text
-*.npy filter=lfs diff=lfs merge=lfs -text
-*.npz filter=lfs diff=lfs merge=lfs -text
-*.onnx filter=lfs diff=lfs merge=lfs -text
-*.ot filter=lfs diff=lfs merge=lfs -text
-*.parquet filter=lfs diff=lfs merge=lfs -text
-*.pb filter=lfs diff=lfs merge=lfs -text
-*.pickle filter=lfs diff=lfs merge=lfs -text
-*.pkl filter=lfs diff=lfs merge=lfs -text
-*.pt filter=lfs diff=lfs merge=lfs -text
-*.pth filter=lfs diff=lfs merge=lfs -text
-*.rar filter=lfs diff=lfs merge=lfs -text
-*.safetensors filter=lfs diff=lfs merge=lfs -text
-saved_model/**/* filter=lfs diff=lfs merge=lfs -text
-*.tar.* filter=lfs diff=lfs merge=lfs -text
-*.tar filter=lfs diff=lfs merge=lfs -text
-*.tflite filter=lfs diff=lfs merge=lfs -text
-*.tgz filter=lfs diff=lfs merge=lfs -text
-*.wasm filter=lfs diff=lfs merge=lfs -text
-*.xz filter=lfs diff=lfs merge=lfs -text
-*.zip filter=lfs diff=lfs merge=lfs -text
-*.zst filter=lfs diff=lfs merge=lfs -text
-*tfevents* filter=lfs diff=lfs merge=lfs -text

.gitignore DELETED Viewed

@@ -1,51 +0,0 @@
-# File di sistema di macOS
-.DS_Store
-.AppleDouble
-.LSOverride
-# Cartelle di sistema di macOS
-**/.DS_Store
-**/._*
-**/.Spotlight-V100
-**/.Trashes
-**/.fseventsd
-# File di ambiente e configurazioni locali
-.env
-.venv
-venv/
-env/
-# File di cache e log
-*.log
-*.pyc
-__pycache__/
-.pytest_cache/
-*.egg-info/
-dist/
-build/
-# File di editor/IDE
-.vscode/
-.idea/
-*.swp
-*.swo
-*.sublime-workspace
-*.sublime-project
-# File di Jupyter Notebook
-.ipynb_checkpoints/
-# File di virtualenv
-bin/
-include/
-lib/
-lib64/
-pip-selfcheck.json
-pyvenv.cfg
-# File di Python
-*.py[cod]
-*$py.class
-*.so
-.Pythonsource venv/bin/activate

.gradio/certificate.pem DELETED Viewed

@@ -1,31 +0,0 @@
------BEGIN CERTIFICATE-----
-MIIFazCCA1OgAwIBAgIRAIIQz7DSQONZRGPgu2OCiwAwDQYJKoZIhvcNAQELBQAw
-TzELMAkGA1UEBhMCVVMxKTAnBgNVBAoTIEludGVybmV0IFNlY3VyaXR5IFJlc2Vh
-cmNoIEdyb3VwMRUwEwYDVQQDEwxJU1JHIFJvb3QgWDEwHhcNMTUwNjA0MTEwNDM4
-WhcNMzUwNjA0MTEwNDM4WjBPMQswCQYDVQQGEwJVUzEpMCcGA1UEChMgSW50ZXJu
-ZXQgU2VjdXJpdHkgUmVzZWFyY2ggR3JvdXAxFTATBgNVBAMTDElTUkcgUm9vdCBY
-MTCCAiIwDQYJKoZIhvcNAQEBBQADggIPADCCAgoCggIBAK3oJHP0FDfzm54rVygc
-h77ct984kIxuPOZXoHj3dcKi/vVqbvYATyjb3miGbESTtrFj/RQSa78f0uoxmyF+
-0TM8ukj13Xnfs7j/EvEhmkvBioZxaUpmZmyPfjxwv60pIgbz5MDmgK7iS4+3mX6U
-A5/TR5d8mUgjU+g4rk8Kb4Mu0UlXjIB0ttov0DiNewNwIRt18jA8+o+u3dpjq+sW
-T8KOEUt+zwvo/7V3LvSye0rgTBIlDHCNAymg4VMk7BPZ7hm/ELNKjD+Jo2FR3qyH
-B5T0Y3HsLuJvW5iB4YlcNHlsdu87kGJ55tukmi8mxdAQ4Q7e2RCOFvu396j3x+UC
-B5iPNgiV5+I3lg02dZ77DnKxHZu8A/lJBdiB3QW0KtZB6awBdpUKD9jf1b0SHzUv
-KBds0pjBqAlkd25HN7rOrFleaJ1/ctaJxQZBKT5ZPt0m9STJEadao0xAH0ahmbWn
-OlFuhjuefXKnEgV4We0+UXgVCwOPjdAvBbI+e0ocS3MFEvzG6uBQE3xDk3SzynTn
-jh8BCNAw1FtxNrQHusEwMFxIt4I7mKZ9YIqioymCzLq9gwQbooMDQaHWBfEbwrbw
-qHyGO0aoSCqI3Haadr8faqU9GY/rOPNk3sgrDQoo//fb4hVC1CLQJ13hef4Y53CI
-rU7m2Ys6xt0nUW7/vGT1M0NPAgMBAAGjQjBAMA4GA1UdDwEB/wQEAwIBBjAPBgNV
-HRMBAf8EBTADAQH/MB0GA1UdDgQWBBR5tFnme7bl5AFzgAiIyBpY9umbbjANBgkq
-hkiG9w0BAQsFAAOCAgEAVR9YqbyyqFDQDLHYGmkgJykIrGF1XIpu+ILlaS/V9lZL
-ubhzEFnTIZd+50xx+7LSYK05qAvqFyFWhfFQDlnrzuBZ6brJFe+GnY+EgPbk6ZGQ
-3BebYhtF8GaV0nxvwuo77x/Py9auJ/GpsMiu/X1+mvoiBOv/2X/qkSsisRcOj/KK
-NFtY2PwByVS5uCbMiogziUwthDyC3+6WVwW6LLv3xLfHTjuCvjHIInNzktHCgKQ5
-ORAzI4JMPJ+GslWYHb4phowim57iaztXOoJwTdwJx4nLCgdNbOhdjsnvzqvHu7Ur
-TkXWStAmzOVyyghqpZXjFaH3pO3JLF+l+/+sKAIuvtd7u+Nxe5AW0wdeRlN8NwdC
-jNPElpzVmbUq4JUagEiuTDkHzsxHpFKVK7q4+63SM1N95R1NbdWhscdCb+ZAJzVc
-oyi3B43njTOQ5yOf+1CceWxG1bQVs5ZufpsMljq4Ui0/1lvh+wjChP4kqKOJ2qxq
-4RgqsahDYVvTH9w7jXbyLeiNdd8XM2w9U/t7y0Ff/9yi0GE44Za4rF2LN9d11TPA
-mRGunUHBcnWEvgJBQl9nJEiU0Zsnvgc/ubhPgXRR4Xq37Z0j4r7g1SgEEzwxA57d
-emyPxgcYxn/eR44/KJ4EBs+lVDR3veyJm+kXQ99b21/+jh5Xos1AnX5iItreGCc=
------END CERTIFICATE-----

README.md DELETED Viewed

@@ -1,12 +0,0 @@
----
-title: Edurag Beta
-emoji: 🔥
-colorFrom: pink
-colorTo: blue
-sdk: gradio
-sdk_version: 5.9.1
-app_file: app.py
-pinned: false
----
-Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference

Structure.txt DELETED Viewed

@@ -1,8 +0,0 @@
-.
-├── app.py
-└── app
-    ├── __init__.py
-    ├── config.py
-    ├── document_handling.py
-    ├── llm_handling.py
-    └── logging_config.py

app.py DELETED Viewed

@@ -1,342 +0,0 @@
-import gradio as gr
-import logging
-# Ipotizziamo che tu abbia queste funzioni nel tuo progetto:
-# - list_databases(), create_database(), modify_database(), delete_database()...
-# - list_indexed_files(), upload_and_index(), delete_file_from_database(), etc.
-# - search_documents(), list_indexed_documents()...
-#
-# Se hanno nomi o posizioni diverse, adatta gli import di conseguenza
-from app.document_handling import (
-    list_databases,
-    create_database,
-    modify_database,
-    delete_database,
-    upload_and_index,
-    list_indexed_files,
-    delete_file_from_database,
-    list_indexed_documents,
-    search_documents,
-)
-from app.llm_handling import answer_question
-from app.logging_config import configure_logging
-configure_logging()
-def update_dropdowns():
-    """Aggiorna tutti i dropdown con la lista aggiornata dei database."""
-    databases = list_databases()
-    # Ritorniamo 6 update() perché nel codice ci sono 6 dropdown da sincronizzare
-    return [gr.update(choices=databases) for _ in range(6)]
-def extract_text_from_files(files):
-    """Estrae e concatena il testo da PDF, DOCX e TXT."""
-    text = ""
-    for file in files:
-        try:
-            if file.name.endswith('.pdf'):
-                text += extract_text_from_pdf(file.name)   # Definita in document_handling
-            elif file.name.endswith('.docx'):
-                text += extract_text_from_docx(file.name)  # Definita in document_handling
-            else:
-                with open(file.name, 'r', encoding='utf-8') as f:
-                    text += f.read()
-        except Exception as e:
-            logging.error(f"Errore durante la lettura del file {file.name}: {e}")
-    return text
-with gr.Blocks() as rag_chatbot:
-    gr.Markdown("# Chatbot basato su RAG")
-    databases = list_databases()
-    # Questi State() servono per la gestione dei dropdown.
-    # Se non ti servono come stati separati, puoi anche rimuoverli.
-    db_name_upload = gr.State()
-    db_name_list = gr.State()
-    db_name_chat = gr.State()
-    db_name_new = gr.State()
-    modify_db_old_name = gr.State()
-    delete_db_dropdown = gr.State()
-    # =============================================
-    #                 TAB: Chatbot
-    # =============================================
-    with gr.Tab("Chatbot"):
-        with gr.Row():
-            with gr.Column(scale=2):
-                # Dropdown per selezionare il DB
-                db_name_chat = gr.Dropdown(
-                    choices=databases,
-                    label="Seleziona Database",
-                    value="default_db"
-                )
-                # Chatbot component
-                chatbot = gr.Chatbot(label="Conversazione", type="messages")
-                # Input domanda
-                question_input = gr.Textbox(
-                    label="Fai una domanda",
-                    placeholder="Scrivi qui la tua domanda...",
-                    lines=2
-                )
-               # Bottoni azione
-                with gr.Row():
-                    ask_button = gr.Button("Invia")
-                    clear_button = gr.Button("Pulisci Chat")
-                # File upload con dimensioni ridotte
-                with gr.Row():
-                    file_input = gr.File(
-                        label="Carica PDF/Docx/TXT per la conversazione",
-                        file_types=[".pdf", ".docx", ".txt"],
-                        file_count="multiple",
-                        height="100px",  # Altezza ridotta
-                        scale=3  # Riduce la larghezza relativa
-                    )
-                    upload_button = gr.Button("Carica Documenti", scale=1)
-        # Stato chat
-        chat_state = gr.State([])
-        # ----------------------
-        #  FUNZIONI DI CALLBACK
-        # ----------------------
-        def chat_upload_and_respond(files, chat_history, db_name):
-            # Se chat_history è None, inizializziamo
-            if chat_history is None:
-                chat_history = []
-            # Estrai il testo dai file
-            text = extract_text_from_files(files)
-            # Aggiungo un messaggio "assistant" che mostra il testo caricato
-            chat_history.append({
-                "role": "assistant",
-                "content": f"📄 Contenuto dei documenti caricati:\n{text}"
-            })
-            return chat_history
-        def respond(message, chat_history, db_name):
-            if chat_history is None:
-                chat_history = []
-            # `answer_question` restituisce due messaggi (user + assistant) in lista
-            new_messages = answer_question(message, db_name)
-            # Li aggiungiamo in coda alla history
-            chat_history.extend(new_messages)
-            # Ritorniamo l'input svuotato (per pulire il Textbox) e la nuova history
-            return "", chat_history
-        def clear_chat():
-            # Svuota la chat
-            return [], []
-        # ------------------
-        #   EVENTI BOTTONE
-        # ------------------
-        upload_button.click(
-            fn=chat_upload_and_respond,
-            inputs=[file_input, chat_state, db_name_chat],
-            outputs=chatbot
-        )
-        ask_button.click(
-            fn=respond,
-            inputs=[question_input, chat_state, db_name_chat],
-            outputs=[question_input, chatbot]
-        )
-        clear_button.click(
-            fn=clear_chat,
-            outputs=[chatbot, chat_state]
-        )
-    # =============================================
-    #            TAB: Gestione Database
-    # =============================================
-    with gr.Tab("Gestione Database"):
-        gr.Markdown("## Operazioni sui Database")
-        with gr.Row():
-            with gr.Column():
-                gr.Markdown("### Crea Database")
-                db_name_input = gr.Textbox(label="Nome Nuovo Database")
-                create_db_button = gr.Button("Crea Database")
-                create_output = gr.Textbox(label="Stato Creazione")
-            with gr.Column():
-                gr.Markdown("### Rinomina Database")
-                modify_db_old_name = gr.Dropdown(choices=databases, label="Database da Rinominare")
-                modify_db_new_name = gr.Textbox(label="Nuovo Nome")
-                modify_db_button = gr.Button("Rinomina Database")
-                modify_output = gr.Textbox(label="Stato Modifica")
-            with gr.Column():
-                gr.Markdown("### Elimina Database")
-                delete_db_dropdown = gr.Dropdown(choices=databases, label="Database da Eliminare")
-                delete_db_button = gr.Button("Elimina Database")
-                delete_output = gr.Textbox(label="Stato Eliminazione")
-        # Eventi per i pulsanti di gestione DB
-        create_db_button.click(
-            create_database,           # funzione
-            inputs=db_name_input,      # input
-            outputs=create_output      # output
-        ).then(
-            update_dropdowns,
-            outputs=[db_name_upload, db_name_list, db_name_chat, db_name_new, modify_db_old_name, delete_db_dropdown]
-        )
-        modify_db_button.click(
-            modify_database,
-            inputs=[modify_db_old_name, modify_db_new_name],
-            outputs=modify_output
-        ).then(
-            update_dropdowns,
-            outputs=[db_name_upload, db_name_list, db_name_chat, db_name_new, modify_db_old_name, delete_db_dropdown]
-        )
-        delete_db_button.click(
-            delete_database,
-            inputs=delete_db_dropdown,
-            outputs=delete_output
-        ).then(
-            update_dropdowns,
-            outputs=[db_name_upload, db_name_list, db_name_chat, db_name_new, modify_db_old_name, delete_db_dropdown]
-        )
-    # =============================================
-    #         TAB: Gestione Documenti
-    # =============================================
-    with gr.Tab("Gestione Documenti"):
-        with gr.Column():
-            gr.Markdown("### Carica Documenti")
-            with gr.Row():
-                file_input = gr.File(
-                    label="Carica i tuoi documenti",
-                    file_types=[".txt", ".pdf", ".docx"],
-                    file_count="multiple"
-                )
-                db_name_upload = gr.Dropdown(
-                    choices=databases,
-                    label="Seleziona Database",
-                    value="default_db"
-                )
-            with gr.Row():
-                title_input = gr.Textbox(label="Titolo del documento")
-                author_input = gr.Textbox(label="Autore")
-            upload_button = gr.Button("Indicizza Documenti")
-            upload_output = gr.Textbox(label="Stato Upload")
-            with gr.Column():
-                gr.Markdown("### Documenti nel Database")
-                db_name_list = gr.Dropdown(
-                    choices=databases,
-                    label="Seleziona Database",
-                    value="default_db"
-                )
-                list_button = gr.Button("Visualizza Files")
-                list_output = gr.Textbox(label="Files nel Database")
-                delete_file_input = gr.Textbox(label="Nome file da eliminare")
-                delete_file_button = gr.Button("Elimina File")
-                delete_file_output = gr.Textbox(label="Stato Eliminazione")
-        # Eventi
-        upload_button.click(
-            upload_and_index,
-            inputs=[file_input, title_input, author_input, db_name_upload],
-            outputs=upload_output
-        ).then(
-            list_indexed_files,
-            inputs=db_name_list,
-            outputs=list_output
-        )
-        list_button.click(
-            list_indexed_files,
-            inputs=db_name_list,
-            outputs=list_output
-        )
-        delete_file_button.click(
-            delete_file_from_database,
-            inputs=[delete_file_input, db_name_list],
-            outputs=delete_file_output
-        ).then(
-            list_indexed_files,
-            inputs=db_name_list,
-            outputs=list_output
-        ).then(
-            update_dropdowns,
-            outputs=[db_name_upload, db_name_list, db_name_chat, db_name_new, modify_db_old_name, delete_db_dropdown]
-        )
-    # =============================================
-    #      TAB: Visualizza Documenti Indicizzati
-    # =============================================
-    with gr.Tab("Visualizza Documenti Indicizzati"):
-        with gr.Column():
-            gr.Markdown("### Documenti nel Database")
-            db_name_list = gr.Dropdown(
-                choices=databases,
-                label="Seleziona Database",
-                value="default_db",
-                interactive=True
-            )
-            list_button = gr.Button("Visualizza Documenti")
-            list_output = gr.Textbox(
-                label="Elenco Documenti",
-                lines=10,
-                interactive=False,
-                value="Clicca 'Visualizza Documenti' per vedere l'elenco"
-            )
-            list_button.click(
-                fn=list_indexed_documents,
-                inputs=[db_name_list],
-                outputs=[list_output],
-                api_name="list_docs"
-            )
-    # =============================================
-    #         TAB: Nuove Funzionalità
-    # =============================================
-    with gr.Tab("Nuove Funzionalità"):
-        gr.Markdown("## Cerca Documenti e Genera Riassunto")
-        db_name_new = gr.Dropdown(choices=databases, label="Seleziona Database", value="default_db")
-        search_input = gr.Textbox(label="Inserisci Termine di Ricerca")
-        search_button = gr.Button("Cerca Documenti")
-        search_output = gr.Textbox(label="Documenti Trovati")
-        summary_button = gr.Button("Genera Riassunto")
-        summary_output = gr.Textbox(label="Riassunto")
-        search_button.click(
-            search_documents,
-            inputs=[search_input, db_name_new],
-            outputs=search_output
-        )
-        # Esempio di eventuale generazione riassunto
-        # summary_button.click(
-        #     generate_summary,
-        #     inputs=db_name_new,
-        #     outputs=summary_output
-        # )
-# Avvio dell'app
-if __name__ == "__main__":
-    rag_chatbot.launch()

app/__init__.py DELETED Viewed

File without changes

app/__pycache__/__init__.cpython-310.pyc DELETED Viewed

Binary file (153 Bytes)

app/__pycache__/config.cpython-310.pyc DELETED Viewed

Binary file (337 Bytes)

app/__pycache__/document_handling.cpython-310.pyc DELETED Viewed

Binary file (9.51 kB)

app/__pycache__/llm_handling.cpython-310.pyc DELETED Viewed

Binary file (3.12 kB)

app/__pycache__/logging_config.cpython-310.pyc DELETED Viewed

Binary file (474 Bytes)

app/app.py DELETED Viewed

File without changes

app/config.py DELETED Viewed

@@ -1,10 +0,0 @@
-import os
-from dotenv import load_dotenv
-# Carica le variabili d'ambiente dal file .env
-load_dotenv()
-# Configurazione del modello
-OPENAI_API_KEY = os.getenv("OPENAI_API_KEY")
-if not OPENAI_API_KEY:
-    raise ValueError("OPENAI_API_KEY non trovata. Verifica il file .env")

app/document_handling.py DELETED Viewed

@@ -1,320 +0,0 @@
-import logging
-import gradio as gr  # Aggiunto import mancante
-from langchain_community.vectorstores import FAISS
-from langchain_huggingface import HuggingFaceEmbeddings
-import os
-import shutil
-import PyPDF2
-from docx import Document
-from langchain.text_splitter import RecursiveCharacterTextSplitter
-from dataclasses import dataclass
-import json
-from datetime import datetime
-# Initialize the text splitter
-text_splitter = RecursiveCharacterTextSplitter(chunk_size=500, chunk_overlap=100)
-# -------------- UTILITY FUNCTIONS --------------
-@dataclass
-class DocumentMetadata:
-    filename: str
-    title: str
-    author: str
-    upload_date: str
-    chunks: int
-    def to_dict(self):
-        return {
-            "filename": self.filename,
-            "title": self.title,
-            "author": self.author,
-            "upload_date": self.upload_date,
-            "chunks": self.chunks
-        }
-def save_metadata(metadata_list, db_name):
-    db_path = f"faiss_index_{db_name}"
-    metadata_file = os.path.join(db_path, "metadata.json")
-    existing_metadata = []
-    if os.path.exists(metadata_file):
-        with open(metadata_file, 'r') as f:
-            existing_metadata = json.load(f)
-    existing_metadata.extend([m.to_dict() for m in metadata_list])
-    with open(metadata_file, 'w') as f:
-        json.dump(existing_metadata, f, indent=2)
-def extract_text_from_pdf(file_path):
-    with open(file_path, 'rb') as f:
-        reader = PyPDF2.PdfReader(f)
-        text = ""
-        for page in reader.pages:
-            text += page.extract_text()
-        return text
-def extract_text_from_docx(file_path):
-    doc = Document(file_path)
-    text = ""
-    for para in doc.paragraphs:
-        text += para.text + "\n"
-    return text
-# -------------- CHATBOT TAB FUNCTIONS --------------
-def answer_question(question, db_name="default_db"):
-    db_path = f"faiss_index_{db_name}"
-    if not os.path.exists(db_path):
-        logging.warning(f"L'indice FAISS per il database {db_name} non esiste.")
-        return "Database non trovato."
-    embeddings = HuggingFaceEmbeddings(model_name="sentence-transformers/all-MiniLM-L6-v2")
-    vectorstore = FAISS.load_local(db_path, embeddings, allow_dangerous_deserialization=True)
-    # Perform a similarity search
-    docs = vectorstore.similarity_search(question)
-    if not docs:
-        return "Nessun documento corrispondente alla query."
-    # Collect the document contents
-    results = [doc.page_content for doc in docs]
-    return "\n\n".join(results)
-# -------------- DATABASE MANAGEMENT TAB FUNCTIONS --------------
-def create_database(db_name):
-    logging.info(f"Creating database: {db_name}")
-    db_path = f"faiss_index_{db_name}"
-    if os.path.exists(db_path):
-        return f"Il database {db_name} esiste già."
-    try:
-        os.makedirs(db_path)
-        logging.info(f"Database {db_name} created successfully.")
-        databases = list_databases()
-        return (f"Database {db_name} creato con successo.", databases)
-    except Exception as e:
-        logging.error(f"Errore nella creazione del database: {e}")
-        return (f"Errore nella creazione del database: {e}", [])
-def delete_database(db_name):
-    db_path = f"faiss_index_{db_name}"
-    if not os.path.exists(db_path):
-        return f"Il database {db_name} non esiste."
-    try:
-        shutil.rmtree(db_path)
-        logging.info(f"Database {db_name} eliminato con successo.")
-        return f"Database {db_name} eliminato con successo."
-    except OSError as e:
-        logging.error(f"Impossibile eliminare il database {db_name}: {e}")
-        return f"Impossibile eliminare il database {db_name}: {e}"
-def modify_database(old_db_name, new_db_name):
-    old_db_path = f"faiss_index_{old_db_name}"
-    new_db_path = f"faiss_index_{new_db_name}"
-    if not os.path.exists(old_db_path):
-        return f"Il database {old_db_name} non esiste."
-    if os.path.exists(new_db_path):
-        return f"Il database {new_db_name} esiste già."
-    try:
-        os.rename(old_db_path, new_db_path)
-        return f"Database {old_db_name} rinominato in {new_db_name} con successo."
-    except Exception as e:
-        return f"Errore durante la modifica del database: {e}"
-def list_databases():
-    try:
-        databases = []
-        for item in os.listdir():
-            if os.path.isdir(item) and item.startswith("faiss_index_"):
-                db_name = item.replace("faiss_index_", "")
-                databases.append(db_name)
-        # Ensure "default_db" is in the list
-        if "default_db" not in databases:
-            databases.append("default_db")
-        return databases
-    except Exception as e:
-        logging.error(f"Error listing databases: {e}")
-        return []
-# -------------- DOCUMENT MANAGEMENT TAB FUNCTIONS --------------
-def upload_and_index(files, title, author, db_name="default_db"):
-    if not files:
-        return "Nessun file caricato."
-    documents = []
-    doc_metadata = []
-    for file in files:
-        try:
-            if file.name.endswith('.pdf'):
-                text = extract_text_from_pdf(file.name)
-            elif file.name.endswith('.docx'):
-                text = extract_text_from_docx(file.name)
-            else:
-                with open(file.name, 'r', encoding='utf-8') as f:
-                    text = f.read()
-            chunks = text_splitter.split_text(text)
-            # Metadata per il documento
-            doc_meta = DocumentMetadata(
-                filename=os.path.basename(file.name),
-                title=title,
-                author=author,
-                upload_date=datetime.now().strftime("%Y-%m-%d %H:%M:%S"),
-                chunks=len(chunks)
-            )
-            # Metadata per ogni chunk
-            for i, chunk in enumerate(chunks):
-                chunk_metadata = {
-                    "content": chunk,
-                    "source": os.path.basename(file.name),
-                    "title": title,
-                    "author": author,
-                    "chunk_index": i,
-                    "total_chunks": len(chunks),
-                    "upload_date": doc_meta.upload_date
-                }
-                documents.append(chunk_metadata)
-            doc_metadata.append(doc_meta)
-        except Exception as e:
-            logging.error(f"Errore durante la lettura del file {file.name}: {e}")
-            continue
-    if documents:
-        try:
-            db_path = f"faiss_index_{db_name}"
-            os.makedirs(db_path, exist_ok=True)
-            embeddings = HuggingFaceEmbeddings(model_name="sentence-transformers/all-MiniLM-L6-v2")
-            texts = [doc["content"] for doc in documents]
-            metadatas = [{k: v for k, v in doc.items() if k != "content"} for doc in documents]
-            vectorstore = FAISS.from_texts(texts, embeddings, metadatas=metadatas)
-            vectorstore.save_local(db_path)
-            # Salva i metadati del documento
-            save_metadata(doc_metadata, db_name)
-            return f"Documenti indicizzati con successo nel database {db_name}!"
-        except Exception as e:
-            logging.error(f"Errore durante l'indicizzazione: {e}")
-            return f"Errore durante l'indicizzazione: {e}"
-    return "Nessun documento processato."
-def list_indexed_files(db_name="default_db"):
-    db_path = f"faiss_index_{db_name}"
-    metadata_file = os.path.join(db_path, "metadata.json")
-    if not os.path.exists(metadata_file):
-        return "Nessun file nel database."
-    try:
-        with open(metadata_file, 'r') as f:
-            metadata = json.load(f)
-        output = []
-        for doc in metadata:
-            output.append(
-                f"📄 {doc['title']}\n"
-                f"   Autore: {doc['author']}\n"
-                f"   File: {doc['filename']}\n"
-                f"   Chunks: {doc['chunks']}\n"
-                f"   Caricato il: {doc['upload_date']}\n"
-            )
-        return "\n".join(output) if output else "Nessun documento nel database."
-    except Exception as e:
-        logging.error(f"Errore nella lettura dei metadati: {e}")
-        return f"Errore nella lettura dei metadati: {e}"
-def delete_file_from_database(file_name, db_name="default_db"):
-    db_path = f"faiss_index_{db_name}"
-    file_list_path = os.path.join(db_path, "file_list.txt")
-    if not os.path.exists(file_list_path):
-        return "Database non trovato."
-    try:
-        # Leggi la lista dei file
-        with open(file_list_path, "r") as f:
-            files = f.readlines()
-        # Rimuovi il file dalla lista
-        files = [f.strip() for f in files if f.strip() != file_name]
-        # Riscrivi la lista aggiornata
-        with open(file_list_path, "w") as f:
-            for file in files:
-                f.write(f"{file}\n")
-        return f"File {file_name} rimosso dal database {db_name}."
-    except Exception as e:
-        return f"Errore durante la rimozione del file: {e}"
-# -------------- DOCUMENT VISUALIZATION TAB FUNCTIONS --------------
-def list_indexed_documents(db_name="default_db"):
-    db_path = f"faiss_index_{db_name}"
-    metadata_file = os.path.join(db_path, "metadata.json")
-    if not os.path.exists(db_path):
-        return f"Il database {db_name} non esiste."
-    if not os.path.exists(metadata_file):
-        return f"Nessun documento nel database {db_name}."
-    try:
-        with open(metadata_file, 'r') as f:
-            metadata = json.load(f)
-        if not metadata:
-            return "Nessun documento trovato nel database."
-        output_lines = ["📚 Documenti nel database:"]
-        for doc in metadata:
-            output_lines.extend([
-                f"\n📄 Documento: {doc['title']}",
-                f"   📝 Autore: {doc['author']}",
-                f"   📁 File: {doc['filename']}",
-                f"   🕒 Caricato il: {doc['upload_date']}",
-                f"   📑 Chunks: {doc['chunks']}"
-            ])
-        result = "\n".join(output_lines)
-        logging.info(f"Documenti trovati nel database {db_name}: {result}")
-        return result
-    except Exception as e:
-        error_msg = f"Errore nella lettura dei metadati: {e}"
-        logging.error(error_msg)
-        return error_msg
-# -------------- NEW FEATURES TAB FUNCTIONS --------------
-def search_documents(query, db_name="default_db"):
-    db_path = f"faiss_index_{db_name}"
-    if not os.path.exists(db_path):
-        logging.warning(f"L'indice FAISS per il database {db_name} non esiste.")
-        return "Database non trovato."
-    embeddings = HuggingFaceEmbeddings(model_name="sentence-transformers/all-MiniLM-L6-v2")
-    vectorstore = FAISS.load_local(db_path, embeddings, allow_dangerous_deserialization=True)
-    # Perform a similarity search
-    docs = vectorstore.similarity_search(query)
-    if not docs:
-        return "Nessun documento corrispondente alla query."
-    # Collect the document contents
-    results = [doc.page_content for doc in docs]
-    return "\n\n".join(results)
-def generate_summary(db_name="default_db"):
-    # Placeholder for summarization logic
-    return "This is a summary of the documents in the database."

app/import pytest.py DELETED Viewed

@@ -1,58 +0,0 @@
-import pytest
-from unittest.mock import Mock, patch
-import os
-from .llm_handling import answer_question
-# app/test_llm_handling.py
-@pytest.fixture
-def mock_embeddings():
-    with patch('langchain_community.embeddings.HuggingFaceEmbeddings') as mock:
-        yield mock
-@pytest.fixture
-def mock_vectorstore():
-    with patch('langchain_community.vectorstores.FAISS') as mock:
-        mock_instance = Mock()
-        mock_instance.as_retriever.return_value = Mock()
-        mock.load_local.return_value = mock_instance
-        yield mock
-@pytest.fixture
-def mock_chat_openai():
-    with patch('langchain_openai.ChatOpenAI') as mock:
-        yield mock
-def test_database_not_found():
-    result = answer_question("test question", "nonexistent_db")
-    assert len(result) == 2
-    assert result[0]["role"] == "user"
-    assert result[0]["content"] == "test question"
-    assert result[1]["role"] == "assistant"
-    assert result[1]["content"] == "Database non trovato"
-@patch('os.path.exists', return_value=True)
-def test_successful_answer(mock_exists, mock_embeddings, mock_vectorstore, mock_chat_openai):
-    mock_qa_chain = Mock()
-    mock_qa_chain.return_value = {"result": "Test answer"}
-    with patch('langchain.chains.RetrievalQA.from_chain_type', return_value=mock_qa_chain):
-        result = answer_question("test question", "test_db")
-        assert len(result) == 2
-        assert result[0]["role"] == "user"
-        assert result[0]["content"] == "test question"
-        assert result[1]["role"] == "assistant"
-        assert result[1]["content"] == "Test answer"
-@patch('os.path.exists', return_value=True)
-def test_error_handling(mock_exists, mock_embeddings):
-    mock_embeddings.side_effect = Exception("Test error")
-    result = answer_question("test question", "test_db")
-    assert len(result) == 2
-    assert result[0]["role"] == "user"
-    assert result[0]["content"] == "test question"
-    assert result[1]["role"] == "assistant"
-    assert "Si è verificato un errore: Test error" in result[1]["content"]

app/llm_handling.py DELETED Viewed

@@ -1,118 +0,0 @@
-import logging
-import os
-import shutil
-from openai import OpenAI
-from langchain_community.vectorstores import FAISS
-from langchain_community.embeddings import HuggingFaceEmbeddings
-import gradio as gr
-from app.config import OPENAI_API_KEY
-# Se hai funzioni per gestire i database (list_databases, ensure_default_db, ecc.),
-# importale dal modulo corretto:
-# from app.document_handling import list_databases, ensure_default_db
-logging.basicConfig(level=logging.INFO)
-def answer_question(question, db_name, chat_history=None):
-    """
-    Risponde alla domanda 'question' usando i documenti del database 'db_name'.
-    Restituisce una lista di 2 messaggi in formato:
-      [
-        {"role": "user", "content": <domanda>},
-        {"role": "assistant", "content": <risposta>}
-      ]
-    In questa versione, viene effettuato il log dei 'chunk' recuperati durante
-    la ricerca di similarità.
-    """
-    if chat_history is None:
-        chat_history = []
-    logging.info(f"Inizio elaborazione domanda: {question} per database: {db_name}")
-    try:
-        embeddings = HuggingFaceEmbeddings(model_name="sentence-transformers/all-MiniLM-L6-v2")
-        db_path = f"faiss_index_{db_name}"
-        if not os.path.exists(db_path):
-            logging.warning(f"Database {db_name} non trovato.")
-            return [
-                {"role": "user", "content": question},
-                {"role": "assistant", "content": "Database non trovato"}
-            ]
-        # Carica l'indice FAISS
-        vectorstore = FAISS.load_local(db_path, embeddings, allow_dangerous_deserialization=True)
-        # Cerca i documenti (chunk) più simili
-        relevant_docs = vectorstore.similarity_search(question, k=3)
-        # Logga i chunk recuperati
-        for idx, doc in enumerate(relevant_docs):
-            logging.info(f"--- Chunk {idx+1} ---")
-            logging.info(doc.page_content)
-            logging.info("---------------------")
-        # Prepara il contesto dai documenti
-        context = "\n".join([doc.page_content for doc in relevant_docs])
-        client = OpenAI(api_key=OPENAI_API_KEY)
-        messages = [
-            {"role": "system", "content": f"Usa questo contesto per rispondere: {context}"},
-            {"role": "user", "content": question}
-        ]
-        # Esegui la chiamata a OpenAI
-        response = client.chat.completions.create(
-            model="gpt-3.5-turbo",
-            messages=messages,
-            temperature=0,
-            max_tokens=2048
-        )
-        answer = response.choices[0].message.content
-        return [
-            {"role": "user", "content": question},
-            {"role": "assistant", "content": answer}
-        ]
-    except Exception as e:
-        logging.error(f"Errore durante la generazione della risposta: {e}")
-        return [
-            {"role": "user", "content": question},
-            {"role": "assistant", "content": f"Si è verificato un errore: {str(e)}"}
-        ]
-def delete_database(db_name):
-    """
-    Cancella il database FAISS corrispondente a 'db_name'.
-    Restituisce un messaggio di stato e l'aggiornamento del dropdown in Gradio.
-    """
-    db_path = f"faiss_index_{db_name}"
-    if not os.path.exists(db_path):
-        return f"Il database {db_name} non esiste.", gr.Dropdown.update(choices=[])
-    try:
-        shutil.rmtree(db_path)
-        logging.info(f"Database {db_name} eliminato con successo.")
-        # Se hai una funzione list_databases(), usala per aggiornare la dropdown
-        return f"Database {db_name} eliminato con successo.", gr.Dropdown.update(choices=[])
-    except OSError as e:
-        logging.error(f"Impossibile eliminare il database {db_name}: {e}")
-        return f"Impossibile eliminare il database {db_name}: {e}", gr.Dropdown.update(choices=[])
-if __name__ == "__main__":
-    # Se esiste una funzione ensure_default_db(), decommenta:
-    # ensure_default_db()
-    # Qui potresti testare la funzione answer_question o avviare
-    # il tuo server Gradio. Ad esempio:
-    #
-    # from app.interface import rag_chatbot
-    # rag_chatbot.launch(share=True)
-    pass

app/llm_handling_2.py DELETED Viewed

@@ -1,34 +0,0 @@
-import logging
-from langchain_openai import ChatOpenAI
-from app.config import OPENAI_API_KEY
-def answer_question(question):
-    logging.info(f"Chiamata all'LLM con domanda: {question}")
-    sys = (
-        "Sei un assistente AI per la lingua Italiana di nome Counselorbot. "
-        "Rispondi nella lingua usata per la domanda in modo chiaro, semplice ed esaustivo."
-    )
-    messages = [
-        {"role": "system", "content": sys},
-        {"role": "user", "content": question}
-    ]
-    logging.info(f"Messages sent to LLM: {messages}")
-    try:
-        llm = ChatOpenAI(
-            model="gpt-4o-mini",
-            openai_api_key=OPENAI_API_KEY,
-            temperature=0.6,
-            max_tokens=512,
-            top_p=0.9
-        )
-        response = llm.invoke(input=messages)
-        logging.info(f"Contesto RAG inviato all'LLM: {messages}")
-        logging.info(f"Risposta ricevuta dall'LLM: {response}")
-        answer = response.content.strip()
-        logging.info(f"Domanda: {question} | Risposta: {answer}")
-        return answer
-    except Exception as e:
-        logging.error(f"Errore durante la generazione della risposta: {e}")
-        return f"Errore durante la generazione della risposta: {e}"

app/llm_handling_3.py DELETED Viewed

@@ -1,76 +0,0 @@
-import logging
-from openai import OpenAI
-from langchain_community.vectorstores import FAISS
-from langchain_community.embeddings import HuggingFaceEmbeddings
-from app.config import OPENAI_API_KEY
-import gradio as gr
-import os
-import shutil
-logging.basicConfig(level=logging.INFO)
-def answer_question(question, db_name, chat_history=None):
-    if chat_history is None:
-        chat_history = []
-    logging.info(f"Inizio elaborazione domanda: {question} per database: {db_name}")
-    try:
-        embeddings = HuggingFaceEmbeddings(model_name="sentence-transformers/all-MiniLM-L6-v2")
-        db_path = f"faiss_index_{db_name}"
-        if not os.path.exists(db_path):
-            return [{"role": "user", "content": question},
-                   {"role": "assistant", "content": "Database non trovato"}]
-        vectorstore = FAISS.load_local(db_path, embeddings, allow_dangerous_deserialization=True)
-        relevant_docs = vectorstore.similarity_search(question, k=3)
-        # Prepara il contesto dai documenti
-        context = "\n".join([doc.page_content for doc in relevant_docs])
-        client = OpenAI(api_key=OPENAI_API_KEY)
-        messages = [
-            {"role": "system", "content": f"Usa questo contesto per rispondere: {context}"},
-            {"role": "user", "content": question}
-        ]
-        response = client.chat.completions.create(
-            model="gpt-3.5-turbo",  # Cambiato da gpt-4o-mini a un modello supportato
-            messages=messages,
-            temperature=0,
-            max_tokens=2048
-        )
-        answer = response.choices[0].message.content
-        return [
-            {"role": "user", "content": question},
-            {"role": "assistant", "content": answer}
-        ]
-    except Exception as e:
-        logging.error(f"Errore durante la generazione della risposta: {e}")
-        return [
-            {"role": "user", "content": question},
-            {"role": "assistant", "content": f"Si è verificato un errore: {str(e)}"}
-        ]
-# Nel document_handling.py, aggiornare delete_database per restituire anche l'aggiornamento del dropdown
-def delete_database(db_name):
-    db_path = f"faiss_index_{db_name}"
-    if not os.path.exists(db_path):
-        return f"Il database {db_name} non esiste.", gr.Dropdown.update(choices=list_databases())
-    try:
-        shutil.rmtree(db_path)
-        logging.info(f"Database {db_name} eliminato con successo.")
-        return f"Database {db_name} eliminato con successo.", gr.Dropdown.update(choices=list_databases())
-    except OSError as e:
-        logging.error(f"Impossibile eliminare il database {db_name}: {e}")
-        return f"Impossibile eliminare il database {db_name}: {e}", gr.Dropdown.update(choices=list_databases())
-# Manca la chiamata a ensure_default_db()
-if __name__ == "__main__":
-    ensure_default_db()  # Aggiungere questa chiamata
-    rag_chatbot.launch(share=True)

app/logging_config.py DELETED Viewed

@@ -1,12 +0,0 @@
-import logging
-from dotenv import load_dotenv
-# Carica variabili d'ambiente dal file .env
-load_dotenv()
-def configure_logging():
-    logging.basicConfig(
-        filename="rag_chatbot.log",
-        level=logging.INFO,
-        format="%(asctime)s - %(levelname)s - %(message)s"
-    )

app/test_llm_handling.py DELETED Viewed

@@ -1,30 +0,0 @@
-def test_database_not_found():
-    result = answer_question("test question", "nonexistent_db")
-    assert len(result) == 1
-    assert len(result[0]) == 2
-    assert result[0][0] == "test question"
-    assert result[0][1] == "Database non trovato"
-@patch('os.path.exists', return_value=True)
-def test_successful_answer(mock_exists, mock_embeddings, mock_vectorstore, mock_chat_openai):
-    mock_qa_chain = Mock()
-    mock_qa_chain.return_value = {"result": "Test answer"}
-    with patch('langchain.chains.RetrievalQA.from_chain_type', return_value=mock_qa_chain):
-        result = answer_question("test question", "test_db")
-        assert len(result) == 1
-        assert len(result[0]) == 2
-        assert result[0][0] == "test question"
-        assert result[0][1] == "Test answer"
-@patch('os.path.exists', return_value=True)
-def test_error_handling(mock_exists, mock_embeddings):
-    mock_embeddings.side_effect = Exception("Test error")
-    result = answer_question("test question", "test_db")
-    assert len(result) == 1
-    assert len(result[0]) == 2
-    assert result[0][0] == "test question"
-    assert "Si è verificato un errore: Test error" in result[0][1]

app_1.py DELETED Viewed

@@ -1,275 +0,0 @@
-import gradio as gr
-from app.document_handling import *
-from app.llm_handling import answer_question
-from app.logging_config import configure_logging
-configure_logging()
-def update_dropdowns():
-    """Aggiorna tutti i dropdown con la lista aggiornata dei database"""
-    databases = list_databases()
-    return [gr.update(choices=databases) for _ in range(6)]
-def extract_text_from_files(files):
-    text = ""
-    for file in files:
-        try:
-            if file.name.endswith('.pdf'):
-                text += extract_text_from_pdf(file.name)
-            elif file.name.endswith('.docx'):
-                text += extract_text_from_docx(file.name)
-            else:
-                with open(file.name, 'r', encoding='utf-8') as f:
-                    text += f.read()
-        except Exception as e:
-            logging.error(f"Errore durante la lettura del file {file.name}: {e}")
-    return text
-with gr.Blocks() as rag_chatbot:
-    gr.Markdown("# Chatbot basato su RAG")
-    databases = list_databases()
-    # Definizione dei dropdown prima del loro utilizzo
-    db_name_upload = gr.State()
-    db_name_list = gr.State()
-    db_name_chat = gr.State()
-    db_name_new = gr.State()
-    modify_db_old_name = gr.State()
-    delete_db_dropdown = gr.State()
-    with gr.Tab("Chatbot"):
-        with gr.Row():
-            with gr.Column(scale=2):
-                db_name_chat = gr.Dropdown(choices=databases, label="Seleziona Database", value="default_db")
-                # Aggiornato il tipo del chatbot
-                chatbot = gr.Chatbot(label="Conversazione", type="messages")
-                with gr.Row():
-                    # Aggiunta upload file direttamente nella chat
-                    file_input = gr.File(
-                        label="Carica PDF per la conversazione",
-                        file_types=[".pdf", ".docx", ".txt"],
-                        file_count="multiple"
-                    )
-                    upload_button = gr.Button("Carica Documenti")
-                question_input = gr.Textbox(
-                    label="Fai una domanda",
-                    placeholder="Scrivi qui la tua domanda...",
-                    lines=2
-                )
-                with gr.Row():
-                    ask_button = gr.Button("Invia")
-                    clear_button = gr.Button("Pulisci Chat")
-        chat_state = gr.State([])
-        def chat_upload_and_respond(files, chat_history, db_name):
-            # Estrai il testo dai file
-            text = extract_text_from_files(files)
-            # Aggiungi il testo alla chat come messaggio dell'utente
-            chat_history.append((None, "📄 Contenuto dei documenti caricati:"))
-            chat_history.append((None, text))
-            return chat_history
-        def respond(message, chat_history, db_name):
-            bot_message = answer_question(message, db_name)
-            chat_history.append((message, bot_message))
-            return "", chat_history
-        def clear_chat():
-            return [], []
-        # Eventi
-        upload_button.click(
-            chat_upload_and_respond,
-            inputs=[file_input, chat_state, db_name_chat],
-            outputs=[chatbot]
-        )
-        ask_button.click(
-            respond,
-            inputs=[question_input, chat_state, db_name_chat],
-            outputs=[question_input, chatbot]
-        )
-        clear_button.click(
-            clear_chat,
-            outputs=[chatbot, chat_state]
-        )
-    with gr.Tab("Gestione Database"):
-        gr.Markdown("## Operazioni sui Database")
-        with gr.Row():
-            with gr.Column():
-                gr.Markdown("### Crea Database")
-                db_name_input = gr.Textbox(label="Nome Nuovo Database")
-                create_db_button = gr.Button("Crea Database")
-                create_output = gr.Textbox(label="Stato Creazione")
-            with gr.Column():
-                gr.Markdown("### Rinomina Database")
-                modify_db_old_name = gr.Dropdown(choices=databases, label="Database da Rinominare")
-                modify_db_new_name = gr.Textbox(label="Nuovo Nome")
-                modify_db_button = gr.Button("Rinomina Database")
-                modify_output = gr.Textbox(label="Stato Modifica")
-            with gr.Column():
-                gr.Markdown("### Elimina Database")
-                delete_db_dropdown = gr.Dropdown(choices=databases, label="Database da Eliminare")
-                delete_db_button = gr.Button("Elimina Database")
-                delete_output = gr.Textbox(label="Stato Eliminazione")
-        # Eventi per i pulsanti di gestione database
-        create_db_button.click(
-            create_database,
-            inputs=db_name_input,
-            outputs=create_output
-        ).then(
-            update_dropdowns,
-            outputs=[db_name_upload, db_name_list, db_name_chat, db_name_new, modify_db_old_name, delete_db_dropdown]
-        )
-        modify_db_button.click(
-            modify_database,
-            inputs=[modify_db_old_name, modify_db_new_name],
-            outputs=modify_output
-        ).then(
-            update_dropdowns,
-            outputs=[db_name_upload, db_name_list, db_name_chat, db_name_new, modify_db_old_name, delete_db_dropdown]
-        )
-        delete_db_button.click(
-            delete_database,
-            inputs=delete_db_dropdown,
-            outputs=delete_output
-        ).then(
-            update_dropdowns,
-            outputs=[db_name_upload, db_name_list, db_name_chat, db_name_new, modify_db_old_name, delete_db_dropdown]
-        )
-    with gr.Tab("Gestione Documenti"):
-        with gr.Column():
-            gr.Markdown("### Carica Documenti")
-            with gr.Row():
-                file_input = gr.File(
-                    label="Carica i tuoi documenti",
-                    file_types=[".txt", ".pdf", ".docx"],
-                    file_count="multiple"
-                )
-                db_name_upload = gr.Dropdown(
-                    choices=databases,
-                    label="Seleziona Database",
-                    value="default_db"
-                )
-            with gr.Row():
-                title_input = gr.Textbox(label="Titolo del documento")
-                author_input = gr.Textbox(label="Autore")
-            upload_button = gr.Button("Indicizza Documenti")
-            upload_output = gr.Textbox(label="Stato Upload")
-            with gr.Column():
-                gr.Markdown("### Documenti nel Database")
-                db_name_list = gr.Dropdown(
-                    choices=databases,
-                    label="Seleziona Database",
-                    value="default_db"
-                )
-                list_button = gr.Button("Visualizza Files")
-                list_output = gr.Textbox(label="Files nel Database")
-                delete_file_input = gr.Textbox(label="Nome file da eliminare")
-                delete_file_button = gr.Button("Elimina File")
-                delete_file_output = gr.Textbox(label="Stato Eliminazione")
-        # Eventi modificati
-        upload_button.click(
-            upload_and_index,
-            inputs=[file_input, title_input, author_input, db_name_upload],
-            outputs=upload_output
-        ).then(
-            list_indexed_files,
-            inputs=db_name_list,
-            outputs=list_output
-        )
-        list_button.click(
-            list_indexed_files,
-            inputs=db_name_list,
-            outputs=list_output
-        )
-        delete_file_button.click(
-            delete_file_from_database,
-            inputs=[delete_file_input, db_name_list],
-            outputs=delete_file_output
-        ).then(
-            list_indexed_files,
-            inputs=db_name_list,
-            outputs=list_output
-        ).then(
-            update_dropdowns,
-            outputs=[db_name_upload, db_name_list, db_name_chat, db_name_new, modify_db_old_name, delete_db_dropdown]
-        )
-    with gr.Tab("Visualizza Documenti Indicizzati"):
-        with gr.Column():
-            gr.Markdown("### Documenti nel Database")
-            db_name_list = gr.Dropdown(
-                choices=databases,
-                label="Seleziona Database",
-                value="default_db",
-                interactive=True
-            )
-            list_button = gr.Button("Visualizza Documenti")
-            list_output = gr.Textbox(
-                label="Elenco Documenti",
-                lines=10,
-                interactive=False,
-                value="Clicca 'Visualizza Documenti' per vedere l'elenco"
-            )
-            # Evento click con aggiornamento
-            list_button.click(
-                fn=list_indexed_documents,
-                inputs=[db_name_list],
-                outputs=[list_output],
-                api_name="list_docs"
-            )
-    # Adding a new tab for new functionalities
-    with gr.Tab("Nuove Funzionalità"):
-        gr.Markdown("## Cerca Documenti e Genera Riassunto")
-        db_name_new = gr.Dropdown(choices=databases, label="Seleziona Database", value="default_db")
-        search_input = gr.Textbox(label="Inserisci Termine di Ricerca")
-        search_button = gr.Button("Cerca Documenti")
-        search_output = gr.Textbox(label="Documenti Trovati")
-        summary_button = gr.Button("Genera Riassunto")
-        summary_output = gr.Textbox(label="Riassunto")
-        search_button.click(
-            search_documents,
-            inputs=[search_input, db_name_new],
-            outputs=search_output
-        )
-        # summary_button.click(
-        #     generate_summary,
-        #     inputs=db_name_new,
-        #     outputs=summary_output
-        # )
-# Avvio dell'app
-if __name__ == "__main__":
-    rag_chatbot.launch()

faiss_index/index.faiss DELETED Viewed

Binary file (1.58 kB)

faiss_index/index.pkl DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:407d95e0808ddf251e3fb442241edd72c47961f5a38d5546021ef205b9fdeb57
-size 960117

faiss_index_E-learning/index.faiss DELETED Viewed

Binary file (66.1 kB)

faiss_index_E-learning/index.pkl DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:a0ec4d3c22f17861b941c079acdf82d250fdafd351e9b05ab3877110a3bbdade
-size 25352

faiss_index_E-learning/metadata.json DELETED Viewed

@@ -1,16 +0,0 @@
-[
-  {
-    "filename": "istruzioni obiettivi di apprendimento.pdf",
-    "title": "Obiettivi",
-    "author": "Daniele",
-    "upload_date": "2024-12-31 19:21:10",
-    "chunks": 6
-  },
-  {
-    "filename": "mastery_Bloom.pdf",
-    "title": "Mastery Learingi",
-    "author": "Bloom",
-    "upload_date": "2024-12-31 20:25:00",
-    "chunks": 43
-  }
-]

faiss_index_default_db/index.faiss DELETED Viewed

Binary file (309 kB)

faiss_index_default_db/index.pkl DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:4c797df1c4a8ddac75b4b083391220179ce5bbcd2b962b4dfbc7d960628cd0b2
-size 107706

rag_chatbot.log DELETED Viewed

@@ -1,39 +0,0 @@
-2024-12-31 11:17:51,910 - INFO - HTTP Request: GET http://127.0.0.1:7860/gradio_api/startup-events "HTTP/1.1 200 OK"
-2024-12-31 11:17:51,920 - INFO - HTTP Request: HEAD http://127.0.0.1:7860/ "HTTP/1.1 200 OK"
-2024-12-31 11:17:52,684 - INFO - HTTP Request: GET https://api.gradio.app/pkg-version "HTTP/1.1 200 OK"
-2024-12-31 11:17:52,832 - INFO - HTTP Request: GET https://api.gradio.app/v3/tunnel-request "HTTP/1.1 200 OK"
-2024-12-31 11:17:53,187 - INFO - HTTP Request: GET https://cdn-media.huggingface.co/frpc-gradio-0.3/frpc_darwin_arm64 "HTTP/1.1 200 OK"
-2024-12-31 11:18:15,815 - INFO - Chiamata all'LLM con domanda: cosa sai fare?
-2024-12-31 11:18:15,815 - INFO - Messages sent to LLM: [{'role': 'system', 'content': 'Sei un assistente AI per la lingua Italiana di nome Counselorbot. Rispondi nella lingua usata per la domanda in modo chiaro, semplice ed esaustivo.'}, {'role': 'user', 'content': 'cosa sai fare?'}]
-2024-12-31 11:18:19,608 - INFO - HTTP Request: POST https://api.openai.com/v1/chat/completions "HTTP/1.1 200 OK"
-2024-12-31 11:18:19,630 - INFO - Contesto RAG inviato all'LLM: [{'role': 'system', 'content': 'Sei un assistente AI per la lingua Italiana di nome Counselorbot. Rispondi nella lingua usata per la domanda in modo chiaro, semplice ed esaustivo.'}, {'role': 'user', 'content': 'cosa sai fare?'}]
-2024-12-31 11:18:19,630 - INFO - Risposta ricevuta dall'LLM: content="Io posso aiutarti in diversi modi! Ecco alcune delle cose che posso fare:\n\n1. **Rispondere a domande**: Posso fornire informazioni su vari argomenti, dalla storia alla scienza, dalla cultura alla tecnologia.\n2. **Spiegare concetti**: Se hai bisogno di chiarimenti su un argomento specifico, posso spiegartelo in modo semplice e comprensibile.\n3. **Correzione di testi**: Posso aiutarti a correggere errori grammaticali o stilistici nei tuoi scritti.\n4. **Suggerire idee**: Se hai bisogno di ispirazione per un progetto, un tema o una storia, posso offrirti spunti e suggerimenti.\n5. **Conversazione**: Posso intrattenere una conversazione su vari temi, per aiutarti a praticare l'italiano o semplicemente per fare due chiacchiere.\n\nSe hai una richiesta specifica, non esitare a chiedere!" additional_kwargs={'refusal': None} response_metadata={'token_usage': {'completion_tokens': 205, 'prompt_tokens': 53, 'total_tokens': 258, 'completion_tokens_details': {'accepted_prediction_tokens': 0, 'audio_tokens': 0, 'reasoning_tokens': 0, 'rejected_prediction_tokens': 0}, 'prompt_tokens_details': {'audio_tokens': 0, 'cached_tokens': 0}}, 'model_name': 'gpt-4o-mini-2024-07-18', 'system_fingerprint': 'fp_0aa8d3e20b', 'finish_reason': 'stop', 'logprobs': None} id='run-2b27a037-9811-4ee5-b903-4ac82f430d1f-0' usage_metadata={'input_tokens': 53, 'output_tokens': 205, 'total_tokens': 258, 'input_token_details': {'audio': 0, 'cache_read': 0}, 'output_token_details': {'audio': 0, 'reasoning': 0}}
-2024-12-31 11:18:19,630 - INFO - Domanda: cosa sai fare? | Risposta: Io posso aiutarti in diversi modi! Ecco alcune delle cose che posso fare:
-1. **Rispondere a domande**: Posso fornire informazioni su vari argomenti, dalla storia alla scienza, dalla cultura alla tecnologia.
-2. **Spiegare concetti**: Se hai bisogno di chiarimenti su un argomento specifico, posso spiegartelo in modo semplice e comprensibile.
-3. **Correzione di testi**: Posso aiutarti a correggere errori grammaticali o stilistici nei tuoi scritti.
-4. **Suggerire idee**: Se hai bisogno di ispirazione per un progetto, un tema o una storia, posso offrirti spunti e suggerimenti.
-5. **Conversazione**: Posso intrattenere una conversazione su vari temi, per aiutarti a praticare l'italiano o semplicemente per fare due chiacchiere.
-Se hai una richiesta specifica, non esitare a chiedere!
-2024-12-31 11:19:07,332 - INFO - Use pytorch device_name: mps
-2024-12-31 11:19:07,332 - INFO - Load pretrained SentenceTransformer: sentence-transformers/all-MiniLM-L6-v2
-2024-12-31 11:19:10,382 - INFO - Loading faiss.
-2024-12-31 11:19:10,935 - INFO - Successfully loaded faiss.
-2024-12-31 11:19:10,941 - INFO - Documenti indicizzati con successo.
-2024-12-31 11:19:36,358 - INFO - Chiamata all'LLM con domanda: quali sono le attività nel loogbook
-2024-12-31 11:19:36,359 - INFO - Messages sent to LLM: [{'role': 'system', 'content': 'Sei un assistente AI per la lingua Italiana di nome Counselorbot. Rispondi nella lingua usata per la domanda in modo chiaro, semplice ed esaustivo.'}, {'role': 'user', 'content': 'quali sono le attività nel loogbook'}]
-2024-12-31 11:19:41,564 - INFO - HTTP Request: POST https://api.openai.com/v1/chat/completions "HTTP/1.1 200 OK"
-2024-12-31 11:19:41,570 - INFO - Contesto RAG inviato all'LLM: [{'role': 'system', 'content': 'Sei un assistente AI per la lingua Italiana di nome Counselorbot. Rispondi nella lingua usata per la domanda in modo chiaro, semplice ed esaustivo.'}, {'role': 'user', 'content': 'quali sono le attività nel loogbook'}]
-2024-12-31 11:19:41,571 - INFO - Risposta ricevuta dall'LLM: content='Il "logbook" è un registro utilizzato per annotare attività, eventi o informazioni specifiche in vari contesti, come nel settore marittimo, aereo, medico o anche in ambito lavorativo. Le attività che possono essere registrate in un logbook variano a seconda del contesto, ma generalmente includono:\n\n1. **Data e ora**: Ogni registrazione inizia con la data e l\'ora dell\'attività.\n2. **Descrizione dell\'attività**: Una breve spiegazione di cosa è stato fatto (es. volo effettuato, manutenzione eseguita, visite mediche).\n3. **Luogo**: Dove è avvenuta l\'attività.\n4. **Persone coinvolte**: Chi ha partecipato o ha assistito all\'attività.\n5. **Osservazioni**: Note aggiuntive, commenti o risultati dell\'attività.\n6. **Firma**: Spesso è richiesta la firma di chi ha effettuato la registrazione per garantire la responsabilità e la veridicità delle informazioni.\n\nSe hai un contesto specifico in mente (ad esempio, un logbook per un aereo, una nave, un\'azienda o un\'attività di ricerca), fammi sapere e posso darti informazioni più dettagliate!' additional_kwargs={'refusal': None} response_metadata={'token_usage': {'completion_tokens': 270, 'prompt_tokens': 57, 'total_tokens': 327, 'completion_tokens_details': {'accepted_prediction_tokens': 0, 'audio_tokens': 0, 'reasoning_tokens': 0, 'rejected_prediction_tokens': 0}, 'prompt_tokens_details': {'audio_tokens': 0, 'cached_tokens': 0}}, 'model_name': 'gpt-4o-mini-2024-07-18', 'system_fingerprint': 'fp_0aa8d3e20b', 'finish_reason': 'stop', 'logprobs': None} id='run-e2c1baf6-3eaa-465e-be29-382f9fccefc0-0' usage_metadata={'input_tokens': 57, 'output_tokens': 270, 'total_tokens': 327, 'input_token_details': {'audio': 0, 'cache_read': 0}, 'output_token_details': {'audio': 0, 'reasoning': 0}}
-2024-12-31 11:19:41,571 - INFO - Domanda: quali sono le attività nel loogbook | Risposta: Il "logbook" è un registro utilizzato per annotare attività, eventi o informazioni specifiche in vari contesti, come nel settore marittimo, aereo, medico o anche in ambito lavorativo. Le attività che possono essere registrate in un logbook variano a seconda del contesto, ma generalmente includono:
-1. **Data e ora**: Ogni registrazione inizia con la data e l'ora dell'attività.
-2. **Descrizione dell'attività**: Una breve spiegazione di cosa è stato fatto (es. volo effettuato, manutenzione eseguita, visite mediche).
-3. **Luogo**: Dove è avvenuta l'attività.
-4. **Persone coinvolte**: Chi ha partecipato o ha assistito all'attività.
-5. **Osservazioni**: Note aggiuntive, commenti o risultati dell'attività.
-6. **Firma**: Spesso è richiesta la firma di chi ha effettuato la registrazione per garantire la responsabilità e la veridicità delle informazioni.
-Se hai un contesto specifico in mente (ad esempio, un logbook per un aereo, una nave, un'azienda o un'attività di ricerca), fammi sapere e posso darti informazioni più dettagliate!

requirements.txt DELETED Viewed

@@ -1,150 +0,0 @@
-aiofiles==23.2.1
-aiohappyeyeballs==2.4.4
-aiohttp==3.11.11
-aiosignal==1.3.2
-annotated-types==0.7.0
-anyio==4.7.0
-asgiref==3.8.1
-async-timeout==4.0.3
-attrs==24.3.0
-backoff==2.2.1
-bcrypt==4.2.1
-build==1.2.2.post1
-cachetools==5.5.0
-certifi==2024.12.14
-charset-normalizer==3.4.1
-chroma-hnswlib==0.7.6
-chromadb==0.6.0
-click==8.1.8
-coloredlogs==15.0.1
-dataclasses-json==0.6.7
-Deprecated==1.2.15
-distro==1.9.0
-durationpy==0.9
-exceptiongroup==1.2.2
-faiss-cpu==1.9.0.post1
-fastapi==0.115.6
-ffmpy==0.5.0
-filelock==3.16.1
-flatbuffers==24.12.23
-frozenlist==1.5.0
-fsspec==2024.12.0
-google-auth==2.37.0
-googleapis-common-protos==1.66.0
-gradio==5.9.1
-gradio_client==1.5.2
-grpcio==1.68.1
-h11==0.14.0
-httpcore==1.0.7
-httptools==0.6.4
-httpx==0.28.1
-httpx-sse==0.4.0
-huggingface-hub==0.27.0
-humanfriendly==10.0
-idna==3.10
-importlib_metadata==8.5.0
-importlib_resources==6.4.5
-Jinja2==3.1.5
-jiter==0.8.2
-joblib==1.4.2
-jsonpatch==1.33
-jsonpointer==3.0.0
-kubernetes==31.0.0
-langchain==0.3.13
-langchain-community==0.3.13
-langchain-core==0.3.28
-langchain-huggingface==0.1.2
-langchain-openai==0.2.14
-langchain-text-splitters==0.3.4
-langsmith==0.2.7
-lxml==5.3.0
-markdown-it-py==3.0.0
-MarkupSafe==2.1.5
-marshmallow==3.23.2
-mdurl==0.1.2
-mmh3==5.0.1
-monotonic==1.6
-mpmath==1.3.0
-multidict==6.1.0
-mypy-extensions==1.0.0
-networkx==3.4.2
-numpy==1.26.4
-oauthlib==3.2.2
-onnxruntime==1.20.1
-openai==1.58.1
-opentelemetry-api==1.29.0
-opentelemetry-exporter-otlp-proto-common==1.29.0
-opentelemetry-exporter-otlp-proto-grpc==1.29.0
-opentelemetry-instrumentation==0.50b0
-opentelemetry-instrumentation-asgi==0.50b0
-opentelemetry-instrumentation-fastapi==0.50b0
-opentelemetry-proto==1.29.0
-opentelemetry-sdk==1.29.0
-opentelemetry-semantic-conventions==0.50b0
-opentelemetry-util-http==0.50b0
-orjson==3.10.13
-overrides==7.7.0
-packaging==24.2
-pandas==2.2.3
-pillow==11.0.0
-posthog==3.7.4
-propcache==0.2.1
-protobuf==5.29.2
-pyasn1==0.6.1
-pyasn1_modules==0.4.1
-pydantic==2.10.4
-pydantic-settings==2.7.1
-pydantic_core==2.27.2
-pydub==0.25.1
-Pygments==2.18.0
-pypdf==5.1.0
-PyPDF2==3.0.1
-PyPika==0.48.9
-pyproject_hooks==1.2.0
-python-dateutil==2.9.0.post0
-python-docx==1.1.2
-python-dotenv==1.0.1
-python-multipart==0.0.20
-pytz==2024.2
-PyYAML==6.0.2
-regex==2024.11.6
-requests==2.32.3
-requests-oauthlib==2.0.0
-requests-toolbelt==1.0.0
-rich==13.9.4
-rsa==4.9
-ruff==0.8.4
-safehttpx==0.1.6
-safetensors==0.4.5
-scikit-learn==1.6.0
-scipy==1.14.1
-semantic-version==2.10.0
-sentence-transformers==3.3.1
-shellingham==1.5.4
-six==1.17.0
-sniffio==1.3.1
-SQLAlchemy==2.0.36
-starlette==0.41.3
-sympy==1.13.1
-tenacity==9.0.0
-threadpoolctl==3.5.0
-tiktoken==0.8.0
-tokenizers==0.21.0
-tomli==2.2.1
-tomlkit==0.13.2
-torch==2.5.1
-tqdm==4.67.1
-transformers==4.47.1
-typer==0.15.1
-typing-inspect==0.9.0
-typing_extensions==4.12.2
-tzdata==2024.2
-urllib3==2.3.0
-uvicorn==0.34.0
-uvloop==0.21.0
-watchfiles==1.0.3
-websocket-client==1.8.0
-websockets==14.1
-wrapt==1.17.0
-yarl==1.18.3
-zipp==3.21.0