File size: 14,362 Bytes
9616a51
55c034b
831e193
 
 
 
 
 
 
 
 
 
 
9616a51
831e193
 
 
b6ee9f7
 
831e193
 
 
 
97bc8ca
b58af47
a5fb792
97bc8ca
 
 
 
 
 
 
 
831e193
 
 
 
72b2a4f
915e40c
a5fb792
915e40c
 
a5fb792
 
 
 
 
915e40c
 
 
 
78a6940
 
 
 
 
a5fb792
bcc273d
a5fb792
bcc273d
 
9616a51
bcc273d
a5fb792
bcc273d
a5fb792
bcc273d
 
9616a51
a5fb792
bcc273d
a5fb792
bcc273d
 
 
 
a5fb792
bcc273d
a5fb792
bcc273d
 
 
1ee3f25
a5fb792
9e07ef2
a5fb792
9e07ef2
 
a5fb792
 
 
 
 
 
 
 
 
9e07ef2
a5fb792
 
9616a51
 
a5fb792
9616a51
a5fb792
 
9616a51
a5fb792
9616a51
9e07ef2
 
a5fb792
 
9e07ef2
 
 
 
a5fb792
411ee97
a5fb792
b58af47
a5fb792
411ee97
78a6940
1910fa3
a5fb792
411ee97
a5fb792
b58af47
a5fb792
78a6940
411ee97
 
a5fb792
831e193
a5fb792
 
 
831e193
1910fa3
72b2a4f
 
87370f4
 
 
 
 
72b2a4f
87370f4
 
 
40c546c
 
1ebc36b
 
 
 
 
 
72b2a4f
 
 
b58af47
9616a51
b4c7125
a5fb792
e5d18d8
 
 
 
 
 
a5fb792
e5d18d8
a5fb792
 
bcc273d
 
9616a51
a5fb792
 
 
 
 
 
 
 
e5d18d8
a5fb792
1ebc36b
a5fb792
0172e7f
 
 
a5fb792
 
 
 
 
 
 
 
e5d18d8
1ebc36b
 
 
a5fb792
 
 
 
1ebc36b
 
 
 
bcc273d
915e40c
a5fb792
1ebc36b
 
 
 
7f28e14
1ebc36b
 
a5fb792
 
 
 
 
 
 
 
 
 
 
 
1ebc36b
 
a5fb792
1ebc36b
 
a5fb792
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
9616a51
 
 
 
 
 
1ebc36b
9616a51
 
a5fb792
 
 
9616a51
 
1ebc36b
9616a51
a5fb792
 
 
 
 
 
9616a51
 
 
 
 
1ebc36b
 
9616a51
a5fb792
1ebc36b
a5fb792
915e40c
 
9616a51
a5fb792
915e40c
 
87370f4
831e193
a5fb792
915e40c
bcc273d
a5fb792
5bd23d0
 
 
 
 
 
a5fb792
5bd23d0
a5fb792
5bd23d0
 
 
 
 
 
 
a5fb792
 
 
 
 
 
 
 
 
 
 
9616a51
 
a5fb792
9616a51
a5fb792
9616a51
 
a5fb792
9616a51
a5fb792
 
 
 
5bd23d0
 
 
b58af47
a5fb792
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
# modules/morphosyntax/morphosyntax_interface.py

import streamlit as st
from streamlit_float import *
from streamlit_antd_components import *
from streamlit.components.v1 import html
import spacy
from spacy import displacy
import spacy_streamlit
import pandas as pd
import base64
import re

# Importaciones locales
from .morphosyntax_process import (
    process_morphosyntactic_input,
    format_analysis_results,
    perform_advanced_morphosyntactic_analysis,
    get_repeated_words_colors,
    highlight_repeated_words,
    POS_COLORS,
    POS_TRANSLATIONS
)

from ..utils.widget_utils import generate_unique_key

from ..database.morphosyntax_iterative_mongo_db import (
    store_student_morphosyntax_base,
    store_student_morphosyntax_iteration,
    get_student_morphosyntax_analysis,
    update_student_morphosyntax_analysis,
    delete_student_morphosyntax_analysis,
    get_student_morphosyntax_data
)

import logging
logger = logging.getLogger(__name__)

###########################################################################
def initialize_arc_analysis_state():
    """Ensure the arc-analysis state and the analysis cache exist in the session.

    Each entry is created only when its key is missing from
    ``st.session_state``; values that are already present are left untouched.
    """
    session = st.session_state

    if 'arc_analysis_state' not in session:
        session['arc_analysis_state'] = dict(
            base_id=None,             # id of the base analysis (ObjectId)
            original_text='',         # original text
            original_analysis=None,   # dict with the base analysis results
            iteration_text='',        # iteration text
            iteration_analysis=None,  # dict with the iteration results
            analysis_count=0,
        )
        logger.info("Estado de análisis de arcos inicializado")

    # The analysis cache lives next to the state, under its own key.
    if 'analysis_cache' not in session:
        session['analysis_cache'] = {}
        logger.info("Caché de análisis inicializado")


def reset_morpho_state():
    """Put the session's arc-analysis state back to its empty defaults.

    Nothing happens when ``arc_analysis_state`` has not been created yet.
    """
    session = st.session_state
    if 'arc_analysis_state' not in session:
        return

    session['arc_analysis_state'] = dict(
        base_id=None,
        original_text='',
        original_analysis=None,
        iteration_text='',
        iteration_analysis=None,
        analysis_count=0,
    )


def display_original_analysis(container, analysis, lang_code, morpho_t):
    """Render the base analysis inside ``container`` under its own heading.

    The arguments other than ``container`` are forwarded unchanged to
    ``display_morphosyntax_results``.
    """
    heading = "Análisis Original"
    with container:
        st.subheader(heading)
        display_morphosyntax_results(
            result=analysis,
            lang_code=lang_code,
            morpho_t=morpho_t,
        )


def display_iteration_analysis(container, analysis, lang_code, morpho_t):
    """Render the iteration (changes) analysis inside ``container`` under its own heading.

    The arguments other than ``container`` are forwarded unchanged to
    ``display_morphosyntax_results``.
    """
    heading = "Análisis de Cambios"
    with container:
        st.subheader(heading)
        display_morphosyntax_results(
            result=analysis,
            lang_code=lang_code,
            morpho_t=morpho_t,
        )


def display_arc_diagram(doc, analysis):
    """Render one untitled dependency-arc diagram per sentence of ``doc``.

    Args:
        doc: Object whose ``sents`` are rendered one at a time with displaCy.
        analysis: Not read by this function; kept in the signature for callers.

    Any exception raised while rendering is logged and swallowed.
    """
    render_options = {
        "distance": 100,
        "arrow_spacing": 20,
        "word_spacing": 30,
    }

    def _shrink_svg_tag(match):
        # Only the opening <svg ...> tag is rewritten.
        return match.group(0).replace('height="450"', 'height="300"')

    def _pin_group_offset(match):
        # Keep the horizontal offset, force the vertical one to 50.
        return f'<g transform="translate({match.group(1)},50)"'

    try:
        for sentence in doc.sents:
            markup = displacy.render(
                sentence,
                style="dep",
                options=dict(render_options),
            )

            # Size and position adjustments.
            markup = markup.replace('height="375"', 'height="200"')
            markup = re.sub(r'<svg[^>]*>', _shrink_svg_tag, markup)
            markup = re.sub(
                r'<g [^>]*transform="translate\((\d+),(\d+)\)"',
                _pin_group_offset,
                markup,
            )

            # Wrap in the styled container before writing it out.
            wrapped = f'<div class="arc-diagram-container">{markup}</div>'
            st.write(wrapped, unsafe_allow_html=True)

    except Exception as e:
        logger.error(f"Error en display_arc_diagram: {str(e)}")


def cache_analysis_results(key, result):
    """Store ``result`` in the session's analysis cache under ``key``.

    When the cache is missing, ``initialize_arc_analysis_state`` is called
    first to create it.
    """
    session = st.session_state
    cache_missing = 'analysis_cache' not in session
    if cache_missing:
        initialize_arc_analysis_state()

    session.analysis_cache[key] = result
    logger.info(f"Resultado almacenado en caché con clave: {key}")


def get_cached_analysis(key):
    """Return the cached analysis stored under ``key``, or ``None`` if absent.

    When the cache itself does not exist yet it is created through
    ``initialize_arc_analysis_state`` and ``None`` is returned.
    """
    session = st.session_state
    if 'analysis_cache' in session:
        return session.analysis_cache.get(key)

    initialize_arc_analysis_state()
    return None


def display_morphosyntax_interface(lang_code, nlp_models, morpho_t):
    """
    Main Streamlit interface for the morphosyntactic analysis.

    Renders three sub-tabs. Only the arc-diagram tab is functional; the other
    two show an "in development" notice.

    Args:
        lang_code: Key used to pick the model out of ``nlp_models``.
        nlp_models: Mapping from language code to a callable NLP model.
        morpho_t: Translation dict; not read by this function.

    Unexpected errors are shown with ``st.error`` and logged, never re-raised.
    """
    try:
        # CSS for a stable layout
        st.markdown("""
            <style>
            .stTextArea textarea {
                font-size: 1rem;
                line-height: 1.5;
                min-height: 100px !important;
                height: 100px !important;
            }
            .arc-diagram-container {
                width: 100%;
                padding: 0.5rem;
                margin: 0.5rem 0;
            }
            .divider {
                height: 3px;
                border: none;
                background-color: #333;
                margin: 2rem 0;
            }
            </style>
        """, unsafe_allow_html=True)

        # Create the session entries on first use
        initialize_arc_analysis_state()

        subtabs = st.tabs([
            "Análisis de Diagramas de Arco",
            "Análisis de Categorías",
            "Análisis Morfológico"
        ])

        # -------------------- Subtab 0: arc diagrams --------------------
        with subtabs[0]:
            _render_arc_diagram_tab(lang_code, nlp_models)

        # -------------------- Subtab 1: category analysis ---------------
        with subtabs[1]:
            st.info("Análisis de Categorías en desarrollo...")

        # -------------------- Subtab 2: morphological analysis ----------
        with subtabs[2]:
            st.info("Análisis Morfológico en desarrollo...")

    except Exception as e:
        st.error("Error en la interfaz de morfosintaxis")
        logger.error(f"Error general en la interfaz: {str(e)}")


def _rerun_app():
    """Trigger a script rerun with whichever rerun API this Streamlit exposes."""
    # ``st.experimental_rerun`` is only looked up when ``st.rerun`` is absent.
    rerun = getattr(st, "rerun", None) or st.experimental_rerun
    rerun()


def _render_arc_diagram_tab(lang_code, nlp_models):
    """Render the arc-diagram tab: reset button, base text input, results and iteration form."""
    reset_col, _, _ = st.columns([2, 1, 2])
    with reset_col:
        if st.button("Nuevo Análisis", type="secondary", use_container_width=True):
            reset_morpho_state()
            # Force a full refresh only in this case
            _rerun_app()

    with st.container():
        # Fetched after the reset handling, which replaces the state dict.
        state = st.session_state.arc_analysis_state

        text_input = st.text_area(
            "Texto original",
            value=state.get('original_text', ''),
            key=f"original_text_{state['analysis_count']}",
            height=100
        )

        analyze_col, _, _ = st.columns([2, 1, 2])
        with analyze_col:
            analyze_button = st.button(
                "Analizar Texto",
                type="primary",
                use_container_width=True
            )

        if analyze_button and text_input.strip():
            if not getattr(st.session_state, 'username', None):
                st.error("No se detectó username en session_state. Verifica tu login.")
                return
            _run_base_analysis(state, text_input, lang_code, nlp_models)

        # Render from the stored state rather than from the button value:
        # the button is only True on the run right after the click, so
        # anything nested under it would vanish when the iteration form is
        # submitted and the script reruns.
        if state.get('base_id') is not None:
            _render_base_and_iteration(state, lang_code, nlp_models)


def _run_base_analysis(state, text, lang_code, nlp_models):
    """Analyse the base text, store it, and record the result in ``state``."""
    try:
        analysis = perform_advanced_morphosyntactic_analysis(
            text,
            nlp_models[lang_code]
        )

        base_id = store_student_morphosyntax_base(
            st.session_state.username,
            text,
            analysis['arc_diagrams']
        )

        if not base_id:
            # Previously this case produced no feedback at all.
            st.error("Error procesando análisis base")
            logger.error("Error base: no se obtuvo base_id al guardar el análisis")
            return

        state.update({
            'base_id': base_id,
            'original_text': text,
            'original_analysis': analysis,
            'analysis_count': state['analysis_count'] + 1,
            # A new base analysis starts with an empty iteration
            'iteration_text': '',
            'iteration_analysis': None
        })

    except Exception as e:
        st.error("Error procesando análisis base")
        logger.error(f"Error base: {str(e)}")


def _render_base_and_iteration(state, lang_code, nlp_models):
    """Show the stored base diagram, the iteration form, and the iteration diagram if any."""
    nlp = nlp_models[lang_code]
    original_text = state['original_text']

    # Base diagram: the text is re-parsed on each run from the stored text.
    display_arc_diagram(nlp(original_text), state['original_analysis'])

    st.markdown('<hr class="divider">', unsafe_allow_html=True)

    st.subheader("Iteración / Cambios")
    with st.form("iteration_form"):
        iteration_text = st.text_area(
            "Texto de iteración",
            value=state.get('iteration_text', ''),
            key=f"iteration_text_{state['analysis_count']}",
            height=100
        )

        submit_col, _, _ = st.columns([2, 1, 2])
        with submit_col:
            submitted = st.form_submit_button(
                "Analizar Cambios",
                type="primary",
                use_container_width=True
            )

    if submitted and iteration_text.strip():
        try:
            analysis_iter = perform_advanced_morphosyntactic_analysis(
                iteration_text,
                nlp
            )

            iteration_id = store_student_morphosyntax_iteration(
                st.session_state.username,
                state['base_id'],
                original_text,
                iteration_text,
                analysis_iter['arc_diagrams']
            )

            if iteration_id:
                state.update({
                    'iteration_text': iteration_text,
                    'iteration_analysis': analysis_iter
                })

        except Exception as e:
            st.error("Error procesando iteración")
            logger.error(f"Error en iteración: {str(e)}")

    # Drawn from the state so the diagram is still there on later reruns.
    stored_iteration = state.get('iteration_text', '')
    if stored_iteration.strip() and state.get('iteration_analysis') is not None:
        display_arc_diagram(nlp(stored_iteration), state['iteration_analysis'])


def display_morphosyntax_results(result, lang_code, morpho_t):
    """
    Render a titled dependency-arc diagram for each sentence of ``result['doc']``.

    Args:
        result: Dict holding the processed document under ``'doc'``. A falsy
            value renders nothing.
        lang_code: Language code; not read by this function.
        morpho_t: Translation dict (optional, may be ``None``). Its
            ``'sentence'`` entry labels each diagram, defaulting to
            ``'Sentence'``.

    Errors are logged and swallowed. A failure on one sentence does not stop
    the remaining sentences from being rendered.
    """
    if not result:
        return
    try:
        # The translations are optional: without this fallback a ``None``
        # value made ``morpho_t.get`` fail for every sentence and nothing
        # was rendered.
        translations = morpho_t if morpho_t is not None else {}
        sentence_label = translations.get('sentence', 'Sentence')

        doc = result['doc']
        for i, sent in enumerate(doc.sents):
            try:
                st.subheader(f"{sentence_label} {i+1}")
                svg_html = displacy.render(
                    sent,
                    style="dep",
                    options={
                        "distance": 100,
                        "arrow_spacing": 20,
                        "word_spacing": 30
                    }
                )
                # Size and position adjustments
                svg_html = svg_html.replace('height="375"', 'height="200"')
                svg_html = re.sub(
                    r'<svg[^>]*>',
                    lambda m: m.group(0).replace('height="450"', 'height="300"'),
                    svg_html
                )
                svg_html = re.sub(
                    r'<g [^>]*transform="translate\((\d+),(\d+)\)"',
                    lambda m: f'<g transform="translate({m.group(1)},50)"',
                    svg_html
                )
                # Wrap in the styled container
                svg_html = f'<div class="arc-diagram-container">{svg_html}</div>'
                st.write(svg_html, unsafe_allow_html=True)
            except Exception as exc:
                logger.error(f"Error mostrando diagrama de la oración {i}: {str(exc)}")
                continue
    except Exception as e:
        logger.error(f"Error en display_morphosyntax_results: {str(e)}")