Spaces:

DHEIVER
/

Ultralearning

Sleeping

App Files Community

DHEIVER committed on Dec 3, 2024

Commit

f2660e3

verified ·

1 Parent(s): cedb6bb

Update app.py

Browse files

Files changed (1) hide show

app.py +117 -231

app.py CHANGED Viewed

@@ -9,20 +9,20 @@ class Config:
     LOG_LEVEL = os.getenv('LOG_LEVEL', 'INFO')
     MODELS_CACHE_DIR = os.getenv('MODELS_CACHE_DIR', './models')
     HISTORY_FILE = os.getenv('HISTORY_FILE', 'learning_path_history.json')
-    MAX_AUDIO_LENGTH = int(os.getenv('MAX_AUDIO_LENGTH', '600'))  # segundos
     MAX_TEXT_LENGTH = int(os.getenv('MAX_TEXT_LENGTH', '1000'))
     SUPPORTED_AUDIO_FORMATS = ['.wav', '.mp3', '.ogg', '.flac']
-    # Configurações de visualização
     MAX_TOPICS = int(os.getenv('MAX_TOPICS', '10'))
     MAX_SUBTOPICS = int(os.getenv('MAX_SUBTOPICS', '5'))
     FIGURE_DPI = int(os.getenv('FIGURE_DPI', '300'))
-    # Configurações de modelo
     MODEL_TRANSCRIBER = os.getenv('MODEL_TRANSCRIBER', 'openai/whisper-base')
     MODEL_GENERATOR = os.getenv('MODEL_GENERATOR', 'gpt2')
-    # Configurações de retry
     MAX_RETRIES = int(os.getenv('MAX_RETRIES', '3'))
     RETRY_DELAY = int(os.getenv('RETRY_DELAY', '1'))
@@ -31,15 +31,16 @@ import logging
 import json
 from typing import Dict, Any, Optional, List, Tuple
 import os
 from config import Config
 class Utils:
     @staticmethod
     def setup_logging() -> logging.Logger:
         logger = logging.getLogger("LearningPathGenerator")
-        logger.setLevel(getattr(logging, Config.LOG_LEVEL))
-        # Configuração do arquivo de log
         handler = logging.FileHandler("app.log")
         formatter = logging.Formatter(
             '%(asctime)s - %(name)s - %(levelname)s - %(message)s'
@@ -56,7 +57,7 @@ class Utils:
                 json.dump(data, f, ensure_ascii=False, indent=2)
             return True
         except Exception as e:
-            logging.error(f"Erro ao salvar JSON: {str(e)}")
             return False
     @staticmethod
@@ -65,56 +66,24 @@ class Utils:
             with open(filename, 'r', encoding='utf-8') as f:
                 return json.load(f)
         except Exception as e:
-            logging.error(f"Erro ao carregar JSON: {str(e)}")
             return None
-# validators.py
-import os
-import soundfile as sf
-from typing import Tuple, Optional
-from config import Config
-class Validators:
-    @staticmethod
-    def validate_audio_file(file_path: str) -> Tuple[bool, Optional[str]]:
-        try:
-            if not os.path.exists(file_path):
-                return False, "Arquivo não encontrado"
-            # Verifica extensão
-            ext = os.path.splitext(file_path)[1].lower()
-            if ext not in Config.SUPPORTED_AUDIO_FORMATS:
-                return False, f"Formato não suportado. Use: {Config.SUPPORTED_AUDIO_FORMATS}"
-            # Verifica conteúdo
-            data, samplerate = sf.read(file_path)
-            duration = len(data) / samplerate
-            if duration > Config.MAX_AUDIO_LENGTH:
-                return False, f"Áudio muito longo. Máximo: {Config.MAX_AUDIO_LENGTH}s"
-            return True, None
-        except Exception as e:
-            return False, f"Erro na validação: {str(e)}"
     @staticmethod
-    def validate_path_name(name: str) -> Tuple[bool, Optional[str]]:
-        if not name:
-            return True, None
-        if len(name) > 100:
-            return False, "Nome muito longo. Máximo: 100 caracteres"
-        if not all(c.isprintable() for c in name):
-            return False, "Nome contém caracteres inválidos"
-        return True, None
 # models.py
 from transformers import pipeline
 import torch
-from typing import Dict, Optional
 import logging
 from config import Config
@@ -126,7 +95,6 @@ class ModelManager:
     def _initialize_models(self):
         try:
-            # Verifica GPU
             device = 0 if torch.cuda.is_available() else -1
             self.models["transcriber"] = pipeline(
@@ -142,82 +110,21 @@ class ModelManager:
             )
         except Exception as e:
-            self.logger.error(f"Erro ao inicializar modelos: {str(e)}")
             raise
-    def get_model(self, name: str):
         return self.models.get(name)
-# visualization.py
-import networkx as nx
-import matplotlib.pyplot as plt
-from io import BytesIO
-import base64
-from typing import Dict, List
-from config import Config
-class Visualizer:
-    @staticmethod
-    def create_mind_map(topics: List[str],
-                       subtopics: Dict[str, List[str]]) -> Optional[str]:
-        try:
-            plt.figure(figsize=(15, 10), dpi=Config.FIGURE_DPI)
-            G = nx.DiGraph()
-            # Adiciona nós e arestas
-            for i, topic in enumerate(topics[:Config.MAX_TOPICS]):
-                G.add_node(topic, level=i)
-                if topic in subtopics:
-                    for subtopic in subtopics[topic][:Config.MAX_SUBTOPICS]:
-                        subtopic_name = f"{topic}:\n{subtopic}"
-                        G.add_node(subtopic_name, level=i)
-                        G.add_edge(topic, subtopic_name)
-                if i > 0:
-                    G.add_edge(topics[i-1], topic)
-            # Layout e estilo
-            pos = nx.spring_layout(G, k=2, iterations=50)
-            # Desenha nós principais
-            nx.draw_networkx_nodes(G, pos,
-                                 nodelist=[n for n in G.nodes() if ":" not in n],
-                                 node_color='lightblue',
-                                 node_size=3000)
-            # Desenha subtópicos
-            nx.draw_networkx_nodes(G, pos,
-                                 nodelist=[n for n in G.nodes() if ":" in n],
-                                 node_color='lightgreen',
-                                 node_size=2000)
-            # Desenha arestas e labels
-            nx.draw_networkx_edges(G, pos, edge_color='gray', arrows=True)
-            nx.draw_networkx_labels(G, pos, font_size=8, font_weight='bold')
-            # Salva imagem
-            buf = BytesIO()
-            plt.savefig(buf, format='png', bbox_inches='tight')
-            buf.seek(0)
-            plt.close()
-            return f"data:image/png;base64,{base64.b64encode(buf.getvalue()).decode()}"
-        except Exception as e:
-            logging.error(f"Erro na visualização: {str(e)}")
-            return None
 # main.py
 import gradio as gr
 from typing import Dict, Any
-import sys
 import logging
 from config import Config
 from utils import Utils
-from validators import Validators
 from models import ModelManager
 from visualization import Visualizer
 class LearningPathGenerator:
     def __init__(self):
@@ -225,7 +132,6 @@ class LearningPathGenerator:
         self.model_manager = ModelManager()
         self.history_file = Config.HISTORY_FILE
-        # Inicialização do histórico
         if not os.path.exists(self.history_file):
             Utils.save_json([], self.history_file)
@@ -235,29 +141,15 @@ class LearningPathGenerator:
                      difficulty: str = "intermediate",
                      include_resources: bool = True) -> Dict[str, Any]:
         try:
-            # Validação do áudio
-            valid_audio, audio_error = Validators.validate_audio_file(audio_path)
-            if not valid_audio:
-                return self._error_response(audio_error)
-            # Validação do nome
-            valid_name, name_error = Validators.validate_path_name(path_name)
-            if not valid_name:
-                return self._error_response(name_error)
-            # Transcrição
             transcriber = self.model_manager.get_model("transcriber")
             transcription = transcriber(audio_path)["text"]
-            # Geração da análise
             generator = self.model_manager.get_model("generator")
-            analysis = self._generate_analysis(generator, transcription, difficulty)
-            # Criação do mapa mental
-            topics, subtopics = self._extract_topics(analysis)
             mind_map = Visualizer.create_mind_map(topics, subtopics)
-            # Salva no histórico
             if path_name:
                 self._save_to_history(transcription, analysis, path_name)
@@ -268,75 +160,121 @@ class LearningPathGenerator:
             }
         except Exception as e:
-            self.logger.error(f"Erro no processamento: {str(e)}")
             return self._error_response(str(e))
     def create_interface(self):
         with gr.Blocks(theme=gr.themes.Soft()) as app:
             gr.Markdown("""
-            # 🎓 Gerador de Trilha de Aprendizado
-            Carregue um arquivo de áudio descrevendo seus objetivos de aprendizado
-            e receba uma trilha personalizada com recursos!
             """)
-            with gr.Tab("Gerar Trilha"):
                 with gr.Row():
                     with gr.Column(scale=2):
                         audio_input = gr.Audio(
                             type="filepath",
-                            label="Upload do Áudio",
-                            description="Grave ou faça upload de um áudio descrevendo seus objetivos"
                         )
                         with gr.Row():
                             path_name = gr.Textbox(
-                                label="Nome da Trilha",
-                                placeholder="Dê um nome para sua trilha (opcional)"
                             )
                             difficulty = gr.Dropdown(
-                                choices=["iniciante", "intermediário", "avançado"],
-                                value="intermediário",
-                                label="Nível de Dificuldade"
                             )
-                        with gr.Row():
-                            include_resources = gr.Checkbox(
-                                label="Incluir Recursos Recomendados",
-                                value=True
-                            )
-                            process_btn = gr.Button(
-                                "Gerar Trilha de Aprendizado",
-                                variant="primary"
-                            )
-                with gr.Row():
-                    text_output = gr.Textbox(
-                        label="Transcrição do Áudio",
-                        lines=4
-                    )
-                with gr.Row():
-                    analysis_output = gr.Textbox(
-                        label="Análise e Trilha de Aprendizado",
-                        lines=10
-                    )
-                with gr.Row():
-                    mind_map_output = gr.Image(
-                        label="Mapa Mental da Trilha",
-                        elem_id="mind_map"
-                    )
-            with gr.Tab("Histórico"):
-                gr.Markdown("Trilhas Anteriores")
-                history_table = gr.Dataframe(
-                    headers=["Data", "Nome", "Transcrição", "Análise"],
-                    label="Histórico de Trilhas"
                 )
-                refresh_btn = gr.Button("Atualizar Histórico")
-            # Event handlers
             process_btn.click(
                 fn=self.process_audio,
                 inputs=[audio_input, path_name, difficulty, include_resources],
@@ -346,66 +284,14 @@ class LearningPathGenerator:
                     "mind_map": mind_map_output
                 }
             )
-            refresh_btn.click(
-                fn=self._load_history,
-                outputs=[history_table]
-            )
         return app
-    def _generate_analysis(self,
-                         generator,
-                         text: str,
-                         difficulty: str) -> str:
-        prompt = f"""
-        Com base no seguinte texto, crie uma trilha de aprendizado detalhada
-        para nível {difficulty}:
-        {text[:Config.MAX_TEXT_LENGTH]}
-        Trilha de aprendizado:
-        """
-        response = generator(
-            prompt,
-            max_length=300,
-            num_return_sequences=1
-        )[0]["generated_text"]
-        if include_resources:
-            response += self._generate_resources()
-        return response
-    def _generate_resources(self) -> str:
-        return """
-        Recursos Recomendados:
-        1. Livros:
-           - "Guia Essencial do Tema"
-           - "Técnicas Avançadas"
-        2. Cursos Online:
-           - Coursera: "Especialização no Tema"
-           - edX: "Curso Avançado"
-        3. Recursos Práticos:
-           - Tutoriais interativos
-           - Exercícios práticos
-           - Projetos do mundo real
-        """
-    def _error_response(self, error_msg: str) -> Dict[str, Any]:
-        return {
-            "transcription": f"Erro: {error_msg}",
-            "analysis": "Não foi possível gerar a análise devido a um erro.",
-            "mind_map": None
-        }
-# Execução do app
 if __name__ == "__main__":
     try:
         generator = LearningPathGenerator()
         app = generator.create_interface()
         app.launch(debug=Config.DEBUG)
-    except Exception as e:

     LOG_LEVEL = os.getenv('LOG_LEVEL', 'INFO')
     MODELS_CACHE_DIR = os.getenv('MODELS_CACHE_DIR', './models')
     HISTORY_FILE = os.getenv('HISTORY_FILE', 'learning_path_history.json')
+    MAX_AUDIO_LENGTH = int(os.getenv('MAX_AUDIO_LENGTH', '600'))  # seconds
     MAX_TEXT_LENGTH = int(os.getenv('MAX_TEXT_LENGTH', '1000'))
     SUPPORTED_AUDIO_FORMATS = ['.wav', '.mp3', '.ogg', '.flac']
+    # Visualization settings
     MAX_TOPICS = int(os.getenv('MAX_TOPICS', '10'))
     MAX_SUBTOPICS = int(os.getenv('MAX_SUBTOPICS', '5'))
     FIGURE_DPI = int(os.getenv('FIGURE_DPI', '300'))
+    # Model settings
     MODEL_TRANSCRIBER = os.getenv('MODEL_TRANSCRIBER', 'openai/whisper-base')
     MODEL_GENERATOR = os.getenv('MODEL_GENERATOR', 'gpt2')
+    # Retry settings
     MAX_RETRIES = int(os.getenv('MAX_RETRIES', '3'))
     RETRY_DELAY = int(os.getenv('RETRY_DELAY', '1'))
 import json
 from typing import Dict, Any, Optional, List, Tuple
 import os
+from datetime import datetime
 from config import Config
 class Utils:
     @staticmethod
     def setup_logging() -> logging.Logger:
         logger = logging.getLogger("LearningPathGenerator")
+        level = getattr(logging, Config.LOG_LEVEL)
+        logger.setLevel(level)
         handler = logging.FileHandler("app.log")
         formatter = logging.Formatter(
             '%(asctime)s - %(name)s - %(levelname)s - %(message)s'
                 json.dump(data, f, ensure_ascii=False, indent=2)
             return True
         except Exception as e:
+            logging.error(f"Error saving JSON: {str(e)}")
             return False
     @staticmethod
             with open(filename, 'r', encoding='utf-8') as f:
                 return json.load(f)
         except Exception as e:
+            logging.error(f"Error loading JSON: {str(e)}")
             return None
     @staticmethod
+    def extract_topics(analysis: str) -> Tuple[List[str], Dict[str, List[str]]]:
+        # Simple topic extraction logic - could be enhanced
+        topics = ["Main Topic", "Subtopic 1", "Subtopic 2"]
+        subtopics = {
+            "Main Topic": ["Detail 1", "Detail 2"],
+            "Subtopic 1": ["Point 1", "Point 2"],
+            "Subtopic 2": ["Item 1", "Item 2"]
+        }
+        return topics, subtopics
 # models.py
 from transformers import pipeline
 import torch
+from typing import Dict, Any
 import logging
 from config import Config
     def _initialize_models(self):
         try:
             device = 0 if torch.cuda.is_available() else -1
             self.models["transcriber"] = pipeline(
             )
         except Exception as e:
+            self.logger.error(f"Error initializing models: {str(e)}")
             raise
+    def get_model(self, name: str) -> Any:
         return self.models.get(name)
 # main.py
 import gradio as gr
 from typing import Dict, Any
 import logging
 from config import Config
 from utils import Utils
 from models import ModelManager
 from visualization import Visualizer
+from datetime import datetime
 class LearningPathGenerator:
     def __init__(self):
         self.model_manager = ModelManager()
         self.history_file = Config.HISTORY_FILE
         if not os.path.exists(self.history_file):
             Utils.save_json([], self.history_file)
                      difficulty: str = "intermediate",
                      include_resources: bool = True) -> Dict[str, Any]:
         try:
             transcriber = self.model_manager.get_model("transcriber")
             transcription = transcriber(audio_path)["text"]
             generator = self.model_manager.get_model("generator")
+            analysis = self._generate_analysis(generator, transcription, difficulty, include_resources)
+            topics, subtopics = Utils.extract_topics(analysis)
             mind_map = Visualizer.create_mind_map(topics, subtopics)
             if path_name:
                 self._save_to_history(transcription, analysis, path_name)
             }
         except Exception as e:
+            self.logger.error(f"Processing error: {str(e)}")
             return self._error_response(str(e))
+    def _generate_analysis(self,
+                         generator: Any,
+                         text: str,
+                         difficulty: str,
+                         include_resources: bool) -> str:
+        prompt = f"""
+        Based on the following text, create a detailed learning path
+        for {difficulty} level:
+        {text[:Config.MAX_TEXT_LENGTH]}
+        Learning path:
+        """
+        response = generator(
+            prompt,
+            max_length=300,
+            num_return_sequences=1
+        )[0]["generated_text"]
+        if include_resources:
+            response += self._generate_resources()
+        return response
+    def _generate_resources(self) -> str:
+        return """
+        Recommended Resources:
+        1. Books:
+           - "Essential Guide"
+           - "Advanced Techniques"
+        2. Online Courses:
+           - Coursera: "Topic Specialization"
+           - edX: "Advanced Course"
+        3. Practical Resources:
+           - Interactive tutorials
+           - Practice exercises
+           - Real-world projects
+        """
+    def _save_to_history(self, transcription: str, analysis: str, path_name: str):
+        history = Utils.load_json(self.history_file) or []
+        history.append({
+            "date": datetime.now().isoformat(),
+            "name": path_name,
+            "transcription": transcription,
+            "analysis": analysis
+        })
+        Utils.save_json(history, self.history_file)
+    def _error_response(self, error_msg: str) -> Dict[str, Any]:
+        return {
+            "transcription": f"Error: {error_msg}",
+            "analysis": "Could not generate analysis due to an error.",
+            "mind_map": None
+        }
     def create_interface(self):
         with gr.Blocks(theme=gr.themes.Soft()) as app:
             gr.Markdown("""
+            # 🎓 Learning Path Generator
+            Upload an audio file describing your learning goals
+            and receive a personalized learning path with resources!
             """)
+            with gr.Tab("Generate Path"):
                 with gr.Row():
                     with gr.Column(scale=2):
                         audio_input = gr.Audio(
                             type="filepath",
+                            label="Audio Upload",
+                            description="Record or upload an audio describing your goals"
                         )
                         with gr.Row():
                             path_name = gr.Textbox(
+                                label="Path Name",
+                                placeholder="Give your learning path a name (optional)"
                             )
                             difficulty = gr.Dropdown(
+                                choices=["beginner", "intermediate", "advanced"],
+                                value="intermediate",
+                                label="Difficulty Level"
                             )
+                        include_resources = gr.Checkbox(
+                            label="Include Recommended Resources",
+                            value=True
+                        )
+                        process_btn = gr.Button(
+                            "Generate Learning Path",
+                            variant="primary"
+                        )
+                text_output = gr.Textbox(
+                    label="Audio Transcription",
+                    lines=4
+                )
+                analysis_output = gr.Textbox(
+                    label="Analysis and Learning Path",
+                    lines=10
+                )
+                mind_map_output = gr.Image(
+                    label="Learning Path Mind Map"
                 )
             process_btn.click(
                 fn=self.process_audio,
                 inputs=[audio_input, path_name, difficulty, include_resources],
                     "mind_map": mind_map_output
                 }
             )
         return app
 if __name__ == "__main__":
     try:
         generator = LearningPathGenerator()
         app = generator.create_interface()
         app.launch(debug=Config.DEBUG)
+    except Exception as e:
+        logging.error(f"Application error: {str(e)}")
+        raise