File size: 12,139 Bytes
9616a51
55c034b
831e193
 
 
 
 
 
 
 
 
 
 
9616a51
831e193
 
 
b6ee9f7
 
831e193
 
 
 
97bc8ca
b58af47
97bc8ca
 
 
 
 
 
 
 
831e193
 
 
 
72b2a4f
915e40c
b58af47
915e40c
 
b58af47
 
 
915e40c
 
 
 
78a6940
 
 
 
 
b58af47
bcc273d
b58af47
bcc273d
 
9616a51
bcc273d
 
 
 
9616a51
b58af47
bcc273d
b58af47
bcc273d
 
 
 
 
b58af47
bcc273d
 
 
1ee3f25
9e07ef2
b58af47
9e07ef2
 
b58af47
 
 
 
 
 
9e07ef2
b58af47
 
9616a51
 
b58af47
9616a51
b58af47
 
9616a51
b58af47
9616a51
9e07ef2
 
b58af47
 
9e07ef2
 
 
 
b58af47
411ee97
b58af47
 
 
411ee97
78a6940
1910fa3
411ee97
b58af47
 
78a6940
411ee97
 
b58af47
831e193
 
1910fa3
72b2a4f
 
87370f4
 
 
 
 
72b2a4f
87370f4
 
 
40c546c
 
1ebc36b
 
 
 
 
 
72b2a4f
 
 
b58af47
9616a51
b4c7125
b58af47
e5d18d8
 
 
 
 
 
b58af47
e5d18d8
b58af47
bcc273d
 
9616a51
b58af47
 
 
 
e5d18d8
b58af47
1ebc36b
b58af47
0172e7f
 
 
b58af47
 
 
 
 
e5d18d8
1ebc36b
 
 
 
 
 
 
bcc273d
915e40c
b58af47
1ebc36b
 
 
 
7f28e14
1ebc36b
 
b58af47
 
 
 
 
1ebc36b
 
 
 
b58af47
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
9616a51
 
 
 
 
 
1ebc36b
9616a51
 
 
b58af47
 
9616a51
 
1ebc36b
9616a51
b58af47
 
9616a51
 
 
 
 
1ebc36b
 
9616a51
b58af47
1ebc36b
b58af47
915e40c
 
9616a51
b58af47
915e40c
 
87370f4
831e193
b58af47
915e40c
bcc273d
b58af47
5bd23d0
 
 
 
 
 
b58af47
5bd23d0
 
 
b58af47
5bd23d0
 
 
 
 
 
b58af47
 
 
 
 
 
 
9616a51
 
b58af47
9616a51
b58af47
9616a51
 
b58af47
9616a51
b58af47
 
 
 
5bd23d0
 
 
b58af47
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
# modules/morphosyntax/morphosyntax_interface.py

import streamlit as st
from streamlit_float import *
from streamlit_antd_components import *
from streamlit.components.v1 import html
import spacy
from spacy import displacy
import spacy_streamlit
import pandas as pd
import base64
import re

# Importaciones locales
from .morphosyntax_process import (
    process_morphosyntactic_input,
    format_analysis_results,
    perform_advanced_morphosyntactic_analysis,
    get_repeated_words_colors,
    highlight_repeated_words,
    POS_COLORS,
    POS_TRANSLATIONS
)

from ..utils.widget_utils import generate_unique_key
from ..database.morphosyntax_iterative_mongo_db import (
    store_student_morphosyntax_base,
    store_student_morphosyntax_iteration,
    get_student_morphosyntax_analysis,
    update_student_morphosyntax_analysis,
    delete_student_morphosyntax_analysis,
    get_student_morphosyntax_data
)

import logging
logger = logging.getLogger(__name__)

###########################################################################
def initialize_arc_analysis_state():
    """Create the arc-analysis state and the analysis cache if they are missing.

    Two entries of ``st.session_state`` are touched, each only when absent:

    * ``arc_analysis_state``: dict with ``base_id`` (None), ``original_text``
      (''), ``iteration_text`` ('') and ``analysis_count`` (0).
    * ``analysis_cache``: an empty dict.

    An info message is logged for every entry that gets created.
    """
    session = st.session_state

    # Arc-analysis bookkeeping.
    if 'arc_analysis_state' not in session:
        session['arc_analysis_state'] = dict(
            base_id=None,
            original_text='',
            iteration_text='',
            analysis_count=0,
        )
        logger.info("Estado de análisis de arcos inicializado")

    # Cache of analysis results.
    if 'analysis_cache' not in session:
        session['analysis_cache'] = {}
        logger.info("Caché de análisis inicializado")

###########################################################################
def reset_morpho_state():
    """Reset the morphosyntactic analysis state to its initial values.

    Does nothing when ``arc_analysis_state`` is not present in the session;
    otherwise the entry is replaced by a fresh dict of default values.
    """
    session = st.session_state
    if 'arc_analysis_state' not in session:
        return

    session['arc_analysis_state'] = dict(
        base_id=None,
        original_text='',
        iteration_text='',
        analysis_count=0,
    )

###########################################################################
def display_original_analysis(container, analysis, lang_code, morpho_t):
    """Show the original analysis inside ``container``.

    Writes a fixed subheader and then delegates to
    ``display_morphosyntax_results`` with the remaining arguments.
    """
    heading = "Análisis Original"
    with container:
        st.subheader(heading)
        display_morphosyntax_results(analysis, lang_code, morpho_t)

def display_iteration_analysis(container, analysis, lang_code, morpho_t):
    """Show the analysis of the changes inside ``container``.

    Writes a fixed subheader and then delegates to
    ``display_morphosyntax_results`` with the remaining arguments.
    """
    heading = "Análisis de Cambios"
    with container:
        st.subheader(heading)
        display_morphosyntax_results(analysis, lang_code, morpho_t)

def display_arc_diagram(doc, analysis):
    """Write one untitled dependency-arc diagram per sentence of ``doc``.

    Args:
        doc: Parsed document; only its ``sents`` iterable is read.
        analysis: Not read by this function.

    Exceptions raised while rendering are logged with ``logger.error`` and
    are not re-raised.
    """
    render_options = {
        "distance": 100,
        "arrow_spacing": 20,
        "word_spacing": 30
    }

    def _shrink_svg_height(match):
        # Only touches the height attribute inside the opening <svg ...> tag.
        return match.group(0).replace('height="450"', 'height="300"')

    def _pin_group_offset(match):
        # Keep the horizontal offset, force the vertical offset to 50.
        return f'<g transform="translate({match.group(1)},50)"'

    try:
        for sentence in doc.sents:
            # A fresh options dict per sentence, as each render call had before.
            svg = displacy.render(sentence, style="dep", options=dict(render_options))

            # Adjust size and position.
            svg = svg.replace('height="375"', 'height="200"')
            svg = re.sub(r'<svg[^>]*>', _shrink_svg_height, svg)
            svg = re.sub(
                r'<g [^>]*transform="translate\((\d+),(\d+)\)"',
                _pin_group_offset,
                svg
            )

            # Wrap in the styled container before writing it out.
            wrapped = f'<div class="arc-diagram-container">{svg}</div>'
            st.write(wrapped, unsafe_allow_html=True)
    except Exception as e:
        logger.error(f"Error en display_arc_diagram: {e!s}")

###########################################################################
def cache_analysis_results(key, result):
    """Store ``result`` under ``key`` in the session's analysis cache.

    The cache dict is created in ``st.session_state`` first when it does not
    exist yet. An info message containing the key is logged afterwards.
    """
    session = st.session_state
    if 'analysis_cache' not in session:
        session['analysis_cache'] = {}

    session['analysis_cache'][key] = result
    logger.info(f"Resultado almacenado en caché con clave: {key}")

def get_cached_analysis(key):
    """Return the cached analysis stored under ``key``.

    Returns None when the session has no analysis cache or when the cache
    has no entry for ``key``.
    """
    session = st.session_state
    if 'analysis_cache' in session:
        return session['analysis_cache'].get(key)
    return None

###########################################################################
def _render_iteration_section(lang_code, nlp_models):
    """Render the revision input and analyze/store the revision on request.

    Must be called only while ``arc_analysis_state['base_id']`` is set. The
    widgets are drawn on every rerun so that the "Analizar Cambios" click is
    actually observed on the rerun it triggers.
    """
    state = st.session_state.arc_analysis_state

    st.markdown('<hr class="divider">', unsafe_allow_html=True)

    # Text box for the revised version.
    st.subheader("Iteración / Cambios:")
    iteration_text = st.text_area(
        "Ingrese cambios o versión modificada",
        value=state.get('iteration_text', ''),
        key="iteration_text",
        height=100
    )

    iteration_button = st.button(
        "Analizar Cambios",
        type="primary",
        use_container_width=True
    )

    if iteration_button and iteration_text.strip():
        try:
            nlp = nlp_models[lang_code]
            doc_iter = nlp(iteration_text)
            analysis_iter = perform_advanced_morphosyntactic_analysis(
                iteration_text,
                nlp
            )

            # Use the text that was analyzed for this base_id, not whatever
            # currently sits in the (possibly edited) original text box.
            iteration_id = store_student_morphosyntax_iteration(
                st.session_state.username,
                state['base_id'],
                state['original_text'],
                iteration_text,
                analysis_iter['arc_diagrams']
            )

            if iteration_id:
                state['iteration_text'] = iteration_text
                # Kept so the diagram survives later reruns.
                state['iteration_doc'] = doc_iter
            else:
                logger.error("No se pudo guardar la iteración")

        except Exception as e:
            st.error("Error procesando iteración")
            logger.error(f"Error en iteración: {str(e)}")

    iteration_doc = state.get('iteration_doc')
    if iteration_doc is not None:
        # display_arc_diagram does not read its second argument.
        display_arc_diagram(iteration_doc, None)


def _render_arc_tab(lang_code, nlp_models):
    """Render the arc-diagram tab: base text, its diagram and the revision UI."""
    new_col, _, _ = st.columns([2, 1, 2])
    with new_col:
        if st.button("Nuevo Análisis", type="secondary", use_container_width=True):
            reset_morpho_state()

    # Read the state only after the reset above, which rebinds the dict.
    state = st.session_state.arc_analysis_state

    with st.container():
        # Original text input. The key changes with analysis_count so a new
        # widget (seeded from the stored text) is created after each analysis.
        text_input = st.text_area(
            "Ingrese su texto",
            value=state.get('original_text', ''),
            key=f"original_text_{state['analysis_count']}",
            height=100
        )

        analyze_button = st.button(
            "Analizar Texto",
            type="primary",
            use_container_width=True
        )

        # Process the original text; results are persisted in the state so
        # that they can be re-rendered on reruns where this button is False.
        if analyze_button and text_input.strip():
            try:
                nlp = nlp_models[lang_code]
                doc = nlp(text_input)
                analysis = perform_advanced_morphosyntactic_analysis(
                    text_input,
                    nlp
                )

                # Save to Mongo.
                base_id = store_student_morphosyntax_base(
                    st.session_state.username,
                    text_input,
                    analysis['arc_diagrams']
                )

                if base_id:
                    state['base_id'] = base_id
                    state['original_text'] = text_input
                    state['analysis_count'] += 1
                    state['base_doc'] = doc
                    # A previous revision diagram belongs to the old base.
                    state.pop('iteration_doc', None)
                else:
                    logger.error("No se pudo guardar el análisis base")

            except Exception as e:
                st.error("Error procesando análisis base")
                logger.error(f"Error: {str(e)}")

        # Render from persisted state, NOT from the button value: a Streamlit
        # button is True only during the rerun caused by its own click, so
        # anything nested under it vanishes on the next interaction.
        if state.get('base_id'):
            base_doc = state.get('base_doc')
            if base_doc is None:
                # base_id present without a parsed doc: re-parse the stored text.
                try:
                    base_doc = nlp_models[lang_code](state['original_text'])
                    state['base_doc'] = base_doc
                except Exception as e:
                    st.error("Error procesando análisis base")
                    logger.error(f"Error: {str(e)}")
                    return

            # display_arc_diagram does not read its second argument.
            display_arc_diagram(base_doc, None)
            _render_iteration_section(lang_code, nlp_models)


def display_morphosyntax_interface(lang_code, nlp_models, morpho_t):
    """Render the morphosyntax UI: three tabs, the first with arc diagrams.

    Args:
        lang_code: Key used to select the pipeline from ``nlp_models``.
        nlp_models: Mapping from language code to a callable that parses a
            text into a document (called as ``nlp_models[lang_code](text)``).
        morpho_t: Translation dictionary; not read by this function.

    The first tab lets the user analyze a base text and then a revised
    version; both are stored through the database helpers and their arc
    diagrams stay visible across Streamlit reruns. The other two tabs are
    placeholders. Any unexpected exception is reported with ``st.error`` and
    logged instead of propagating.
    """
    try:
        # CSS for a stable layout.
        st.markdown("""
            <style>
            .stTextArea textarea {
                font-size: 1rem;
                line-height: 1.5;
                min-height: 100px !important;
                height: 100px !important;
            }
            .arc-diagram-container {
                width: 100%;
                padding: 0.5rem;
                margin: 0.5rem 0;
            }
            .divider {
                height: 3px;
                border: none;
                background-color: #333;
                margin: 2rem 0;
            }
            </style>
        """, unsafe_allow_html=True)

        # Make sure the session entries exist.
        initialize_arc_analysis_state()

        # Three tabs.
        subtabs = st.tabs([
            "Análisis de Diagramas de Arco",
            "Análisis de Categorías",
            "Análisis Morfológico"
        ])

        # =========== Tab 1: arc diagram ===============
        with subtabs[0]:
            _render_arc_tab(lang_code, nlp_models)

        # =========== Tab 2: categories (placeholder) ============
        with subtabs[1]:
            st.info("Análisis de Categorías en desarrollo...")

        # =========== Tab 3: morphological analysis (placeholder) ============
        with subtabs[2]:
            st.info("Análisis Morfológico en desarrollo...")

    except Exception as e:
        st.error("Error en la interfaz")
        logger.error(f"Error general en la interfaz: {str(e)}")

###########################################################################
def display_morphosyntax_results(result, lang_code, morpho_t):
    """Show only the arc diagram of every sentence in the analyzed document.

    Args:
        result: Dictionary holding the processed document under ``'doc'``;
            when it is None nothing is rendered.
        lang_code: Language code; not read by this function.
        morpho_t: Translation dictionary; its ``'sentence'`` entry (default
            ``'Sentence'``) is used for the per-sentence subheader.

    A failure while rendering one sentence is logged and the remaining
    sentences are still processed; any other failure is logged and the
    function returns.
    """
    if result is None:
        return

    def _shrink_svg_height(match):
        return match.group(0).replace('height="450"', 'height="300"')

    def _pin_group_offset(match):
        return f'<g transform="translate({match.group(1)},50)"'

    try:
        document = result['doc']
        all_sentences = list(document.sents)
        for index, sentence in enumerate(all_sentences):
            try:
                label = morpho_t.get('sentence', 'Sentence')
                st.subheader(f"{label} {index+1}")

                svg = displacy.render(sentence, style="dep", options={
                    "distance": 100,
                    "arrow_spacing": 20,
                    "word_spacing": 30
                })
                svg = svg.replace('height="375"', 'height="200"')
                svg = re.sub(r'<svg[^>]*>', _shrink_svg_height, svg)
                svg = re.sub(
                    r'<g [^>]*transform="translate\((\d+),(\d+)\)"',
                    _pin_group_offset,
                    svg
                )

                wrapped = f'<div class="arc-diagram-container">{svg}</div>'
                st.write(wrapped, unsafe_allow_html=True)
            except Exception as e:
                # Best effort: log and move on to the next sentence.
                logger.error(f"Error en diagrama {index}: {e!s}")
    except Exception as e:
        logger.error(f"Error en display_morphosyntax_results: {e!s}")