File size: 11,418 Bytes
55c034b
 
bcc273d
831e193
 
 
 
 
 
 
 
 
 
 
bcc273d
831e193
 
 
b6ee9f7
 
831e193
 
 
 
 
 
97bc8ca
831e193
97bc8ca
 
 
 
 
 
 
 
 
831e193
 
 
 
72b2a4f
915e40c
78a6940
 
915e40c
 
 
 
 
 
 
 
 
 
78a6940
 
 
 
 
915e40c
 
bcc273d
 
 
 
 
 
 
 
 
 
 
72b2a4f
bcc273d
 
 
 
 
 
 
 
 
 
 
1ee3f25
1966cb7
78a6940
411ee97
 
78a6940
 
411ee97
78a6940
1910fa3
411ee97
 
78a6940
 
 
411ee97
 
 
 
831e193
 
1910fa3
72b2a4f
 
87370f4
 
 
 
 
72b2a4f
87370f4
 
 
40c546c
 
1ebc36b
 
 
 
 
 
72b2a4f
 
 
1ebc36b
7f28e14
 
e5d18d8
 
 
 
 
 
 
 
 
 
bcc273d
 
 
 
1ebc36b
 
 
 
 
 
bcc273d
 
1ebc36b
 
 
 
 
e5d18d8
0172e7f
1ebc36b
 
0172e7f
 
 
1ebc36b
0172e7f
 
e5d18d8
1ebc36b
e5d18d8
915e40c
e5d18d8
 
1ebc36b
 
 
 
 
 
 
 
bcc273d
915e40c
1ebc36b
 
 
 
 
7f28e14
1ebc36b
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
411ee97
1ebc36b
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
915e40c
 
1ebc36b
915e40c
 
87370f4
831e193
1ebc36b
915e40c
bcc273d
0172e7f
 
5bd23d0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
407e78c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
#modules/morphosyntax/morphosyntax_interface.py

#Importaciones generales
import streamlit as st
from streamlit_float import *
from streamlit_antd_components import *
from streamlit.components.v1 import html
import spacy
from spacy import displacy
import spacy_streamlit
import pandas as pd
import base64
import re

#Importaciones locales
from .morphosyntax_process import (
    process_morphosyntactic_input,
    format_analysis_results,
    perform_advanced_morphosyntactic_analysis,
    get_repeated_words_colors,
    highlight_repeated_words,
    POS_COLORS,
    POS_TRANSLATIONS
)

from ..utils.widget_utils import generate_unique_key

from ..database.morphosintax_mongo_db import store_student_morphosyntax_result

from ..database.morphosyntax_iterative_mongo_db import (
    store_student_morphosyntax_base,
    store_student_morphosyntax_iteration,
    get_student_morphosyntax_analysis,
    update_student_morphosyntax_analysis,
    delete_student_morphosyntax_analysis,
    get_student_morphosyntax_data
)

import logging
logger = logging.getLogger(__name__)

###########################################################################
def initialize_arc_analysis_state():
    """Create the arc-analysis state and the analysis cache in the session.

    Each entry is only created when it is missing from ``st.session_state``,
    so values already stored for the current session are left untouched.
    """
    session = st.session_state

    # Arc-analysis state: both texts, both analyses and a run counter.
    if 'arc_analysis_state' not in session:
        empty_state = dict(
            original_text='',
            original_analysis=None,
            iteration_text='',
            iteration_analysis=None,
            analysis_count=0,
        )
        session.arc_analysis_state = empty_state
        logger.info("Estado de análisis de arcos inicializado")

    # Analysis cache: starts out as an empty dictionary.
    if 'analysis_cache' not in session:
        session.analysis_cache = {}
        logger.info("Caché de análisis inicializado")

###########################################################################

def reset_morpho_state():
    """Restore the arc-analysis state to its empty defaults.

    Nothing is created when ``arc_analysis_state`` is absent from the
    session; only an existing state is overwritten.
    """
    session = st.session_state
    if 'arc_analysis_state' not in session:
        return

    session.arc_analysis_state = dict(
        original_text='',
        original_analysis=None,
        iteration_text='',
        iteration_analysis=None,
        analysis_count=0,
    )
############################################################################

def display_original_analysis(container, analysis, lang_code, morpho_t):
    """Render the original analysis inside ``container``.

    Writes the "Análisis Original" subheader and then hands ``analysis``,
    ``lang_code`` and ``morpho_t`` to ``display_morphosyntax_results``.
    """
    heading = "Análisis Original"
    with container:
        st.subheader(heading)
        display_morphosyntax_results(
            result=analysis,
            lang_code=lang_code,
            morpho_t=morpho_t,
        )

def display_iteration_analysis(container, analysis, lang_code, morpho_t):
    """Render the analysis of the modified text inside ``container``.

    Writes the "Análisis de Cambios" subheader and then hands ``analysis``,
    ``lang_code`` and ``morpho_t`` to ``display_morphosyntax_results``.
    """
    heading = "Análisis de Cambios"
    with container:
        st.subheader(heading)
        display_morphosyntax_results(
            result=analysis,
            lang_code=lang_code,
            morpho_t=morpho_t,
        )

############################################################################

def cache_analysis_results(key, result):
    """Store ``result`` in the session's analysis cache under ``key``.

    When the session has no ``analysis_cache`` yet,
    ``initialize_arc_analysis_state`` is called first to create it.
    """
    session = st.session_state
    cache_missing = not hasattr(session, 'analysis_cache')
    if cache_missing:
        initialize_arc_analysis_state()

    session.analysis_cache[key] = result
    logger.info(f"Resultado almacenado en caché con clave: {key}")

def get_cached_analysis(key):
    """Return the cached analysis stored under ``key``, or ``None``.

    When the session has no ``analysis_cache`` yet, the state is initialized
    through ``initialize_arc_analysis_state`` and ``None`` is returned.
    """
    session = st.session_state
    if hasattr(session, 'analysis_cache'):
        return session.analysis_cache.get(key)

    # No cache existed, so there is nothing to look up: create it and report a miss.
    initialize_arc_analysis_state()
    return None


############################################################################
def _store_base_analysis(text, nlp, state):
    """Analyze ``text``, persist it as the base analysis and record it in ``state``.

    ``state`` is only updated when the store call returns a truthy id;
    otherwise an error is shown and a warning is logged.
    """
    analysis = perform_advanced_morphosyntactic_analysis(text, nlp)
    base_id = store_student_morphosyntax_base(
        st.session_state.username,
        text,
        analysis['arc_diagrams']
    )

    if not base_id:
        st.error("Error procesando análisis")
        logger.warning("No se pudo guardar el análisis base")
        return

    state.update({
        'base_id': base_id,
        'original_text': text,
        # Bumping the counter changes the key of the original text area.
        'analysis_count': state['analysis_count'] + 1
    })


def _render_iteration_area(base_id, base_text, lang_code, nlp, morpho_t):
    """Draw the base diagram and the iteration form; process a submitted iteration."""
    # Base diagram, rebuilt from the stored text on every script run.
    display_morphosyntax_results({'doc': nlp(base_text)}, lang_code, morpho_t)

    st.markdown('<hr class="divider">', unsafe_allow_html=True)

    with st.form("iteration_form"):
        iteration_text = st.text_area(
            "Texto modificado",
            value=base_text,
            height=100,
            label_visibility="collapsed"
        )

        submit_col, _, _ = st.columns([2, 1, 2])
        with submit_col:
            submitted = st.form_submit_button(
                "Analizar Cambios",
                type="primary",
                use_container_width=True
            )

    if not (submitted and iteration_text.strip()):
        return

    analysis_iter = perform_advanced_morphosyntactic_analysis(iteration_text, nlp)
    iteration_id = store_student_morphosyntax_iteration(
        st.session_state.username,
        base_id,
        base_text,
        iteration_text,
        analysis_iter['arc_diagrams']
    )

    # The iteration diagram is only shown once the iteration has been stored.
    if iteration_id:
        display_morphosyntax_results(
            {'doc': nlp(iteration_text)}, lang_code, morpho_t
        )


def display_morphosyntax_interface(lang_code, nlp_models, morpho_t):
    """Render the morphosyntax tab: arc-diagram analysis plus two placeholder subtabs.

    The arc-diagram subtab lets the user analyze a base text, stores it, and
    then offers a form to analyze a modified version of that text. The base
    analysis is tracked in ``st.session_state.arc_analysis_state`` so that the
    iteration form is still rendered (and its submission handled) on the
    script run triggered by the form itself.

    Args:
        lang_code: Key used to pick the NLP pipeline out of ``nlp_models``.
        nlp_models: Mapping from language code to a callable NLP pipeline.
        morpho_t: Translation dictionary, forwarded to the diagram renderer.

    Exceptions are not propagated: they are logged with their traceback and
    reported to the user through ``st.error``.
    """
    try:
        # CSS for a stable layout
        st.markdown("""
            <style>
            .stTextArea textarea {
                font-size: 1rem;
                line-height: 1.5;
                min-height: 100px !important;
                height: 100px !important;
            }
            .arc-diagram-container {
                width: 100%;
                padding: 0.5rem;
                margin: 0.5rem 0;
            }
            .divider {
                height: 3px;
                border: none;
                background-color: #333;
                margin: 2rem 0;
            }
            </style>
        """, unsafe_allow_html=True)

        # Keep the morphosyntax tab marked as the active one
        st.session_state.tab_states['morpho_active'] = True
        st.session_state.selected_tab = 1

        # The widgets below read the arc state unconditionally, so make sure
        # it exists before touching it.
        initialize_arc_analysis_state()

        subtabs = st.tabs([
            "Análisis de Diagramas de Arco",
            "Análisis de Categorías",
            "Análisis Morfológico"
        ])

        # Arc-diagram subtab
        with subtabs[0]:
            state = st.session_state.arc_analysis_state

            # Reset button
            reset_col, _, _ = st.columns([2, 1, 2])
            with reset_col:
                if st.button("Nuevo Análisis", type="secondary", use_container_width=True):
                    st.session_state.arc_analysis_state = {
                        'base_id': None,
                        'original_text': '',
                        'iteration_text': '',
                        'analysis_count': 0
                    }
                    st.rerun()

            analysis_container = st.container()

            with analysis_container:
                # Original text input; the label is hidden instead of empty.
                text_input = st.text_area(
                    "Texto original",
                    value=state.get('original_text', ''),
                    key=f"original_text_{state['analysis_count']}",
                    height=100,
                    label_visibility="collapsed"
                )

                analyze_col, _, _ = st.columns([2, 1, 2])
                with analyze_col:
                    analyze_button = st.button(
                        "Analizar Texto",
                        type="primary",
                        use_container_width=True
                    )

                try:
                    # A button is only True on the run caused by its click, so
                    # the click just records the base analysis in the state...
                    if analyze_button and text_input.strip():
                        _store_base_analysis(text_input, nlp_models[lang_code], state)

                    # ...and rendering is driven by the state, which is still
                    # set on the rerun caused by submitting the iteration form.
                    base_id = state.get('base_id')
                    base_text = state.get('original_text', '')
                    if base_id and base_text.strip():
                        _render_iteration_area(
                            base_id,
                            base_text,
                            lang_code,
                            nlp_models[lang_code],
                            morpho_t
                        )

                except Exception as e:
                    st.error("Error procesando análisis")
                    logger.exception("Error: %s", e)

        # The remaining subtabs are placeholders for now
        with subtabs[1]:
            st.info("Análisis de Categorías en desarrollo...")

        with subtabs[2]:
            st.info("Análisis Morfológico en desarrollo...")

    except Exception as e:
        st.error("Error en la interfaz")
        logger.exception("Error general en la interfaz: %s", e)

############################################################################

def display_morphosyntax_results(result, lang_code, morpho_t):
    """Render one dependency arc diagram per sentence of the analyzed document.

    Args:
        result: Dictionary whose ``'doc'`` entry is the processed document.
            ``None`` makes the function return without rendering anything.
        lang_code: Language code (not used inside this function).
        morpho_t: Translation dictionary; its ``'sentence'`` entry labels each
            diagram, falling back to ``'Sentence'``.

    Failures are logged rather than raised: an error in one sentence is
    logged and the remaining sentences are still processed.
    """
    if result is None:
        return

    svg_open_tag = re.compile(r'<svg[^>]*>')
    group_translate = re.compile(r'<g [^>]*transform="translate\((\d+),(\d+)\)"')

    def _shrink_svg_tag(match):
        # Lower the height declared on the opening <svg> tag.
        return match.group(0).replace('height="450"', 'height="300"')

    def _pin_group_offset(match):
        # Keep the horizontal offset and force the vertical one to 50.
        return f'<g transform="translate({match.group(1)},50)"'

    try:
        sentences = list(result['doc'].sents)
        for index, sentence in enumerate(sentences):
            try:
                st.subheader(f"{morpho_t.get('sentence', 'Sentence')} {index+1}")
                svg = displacy.render(
                    sentence,
                    style="dep",
                    options=dict(distance=100, arrow_spacing=20, word_spacing=30),
                )
                svg = svg.replace('height="375"', 'height="200"')
                svg = svg_open_tag.sub(_shrink_svg_tag, svg)
                svg = group_translate.sub(_pin_group_offset, svg)
                st.write(
                    f'<div class="arc-diagram-container">{svg}</div>',
                    unsafe_allow_html=True,
                )
            except Exception as err:
                logger.error(f"Error en diagrama {index}: {str(err)}")
    except Exception as err:
        logger.error(f"Error en display_morphosyntax_results: {str(err)}")