File size: 13,616 Bytes
55c034b
 
bcc273d
831e193
 
 
 
 
 
 
 
 
 
 
bcc273d
831e193
 
 
b6ee9f7
 
831e193
 
 
 
 
 
 
 
 
 
 
 
72b2a4f
915e40c
78a6940
 
915e40c
 
 
 
 
 
 
 
 
 
78a6940
 
 
 
 
915e40c
 
bcc273d
 
 
 
 
 
 
 
 
 
 
72b2a4f
bcc273d
 
 
 
 
 
 
 
 
 
 
1ee3f25
1966cb7
78a6940
411ee97
 
78a6940
 
411ee97
78a6940
1910fa3
411ee97
 
78a6940
 
 
411ee97
 
 
 
831e193
 
1910fa3
72b2a4f
 
87370f4
 
 
 
 
72b2a4f
87370f4
 
 
40c546c
 
72b2a4f
 
 
7f28e14
 
 
915e40c
e5d18d8
 
 
 
 
 
 
 
 
 
bcc273d
 
 
 
 
 
 
 
 
 
 
 
 
 
 
e5d18d8
 
0172e7f
e5d18d8
 
0172e7f
 
 
 
 
e5d18d8
 
 
915e40c
 
e5d18d8
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
bcc273d
915e40c
bcc273d
 
 
 
915e40c
e5d18d8
 
915e40c
e5d18d8
7f28e14
 
 
 
411ee97
7f28e14
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
411ee97
7f28e14
 
 
 
 
 
 
 
 
 
411ee97
7f28e14
 
 
 
 
 
 
 
 
 
 
e5d18d8
7f28e14
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
e5d18d8
bcc273d
915e40c
 
 
 
 
87370f4
831e193
1910fa3
915e40c
bcc273d
0172e7f
 
5bd23d0
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
407e78c
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
#modules/morphosyntax/morphosyntax_interface.py

#Importaciones generales
import streamlit as st
from streamlit_float import *
from streamlit_antd_components import *
from streamlit.components.v1 import html
import spacy
from spacy import displacy
import spacy_streamlit
import pandas as pd
import base64
import re

#Importaciones locales
from .morphosyntax_process import (
    process_morphosyntactic_input,
    format_analysis_results,
    perform_advanced_morphosyntactic_analysis,
    get_repeated_words_colors,
    highlight_repeated_words,
    POS_COLORS,
    POS_TRANSLATIONS
)

from ..utils.widget_utils import generate_unique_key
from ..database.morphosintax_mongo_db import store_student_morphosyntax_result
from ..database.chat_mongo_db import store_chat_history, get_chat_history

import logging
logger = logging.getLogger(__name__)

###########################################################################
def initialize_arc_analysis_state():
    """Create the arc-analysis state and the analysis cache in the session.

    Each entry is only created when it is missing from
    ``st.session_state``; values that already exist are left untouched.
    """
    session = st.session_state

    # Arc-analysis state: texts and analyses for the original and
    # iteration passes, plus a counter of analyses run so far.
    if 'arc_analysis_state' not in session:
        session.arc_analysis_state = dict(
            original_text='',
            original_analysis=None,
            iteration_text='',
            iteration_analysis=None,
            analysis_count=0,
        )
        logger.info("Estado de análisis de arcos inicializado")

    # Analysis cache: starts out as an empty mapping.
    if 'analysis_cache' not in session:
        session.analysis_cache = {}
        logger.info("Caché de análisis inicializado")

###########################################################################

def reset_morpho_state():
    """Restore the arc-analysis state to its initial, empty values.

    Does nothing when the state has not been created in the session yet.
    """
    if 'arc_analysis_state' not in st.session_state:
        return

    blank_state = {
        'original_text': '',
        'original_analysis': None,
        'iteration_text': '',
        'iteration_analysis': None,
        'analysis_count': 0,
    }
    st.session_state.arc_analysis_state = blank_state
############################################################################

def display_original_analysis(container, analysis, lang_code, morpho_t):
    """Render the original analysis inside ``container`` under its own subheader.

    Args:
        container: Streamlit container (context manager) to draw into.
        analysis: Analysis result forwarded to ``display_morphosyntax_results``.
        lang_code: Language code forwarded to the renderer.
        morpho_t: Translation mapping forwarded to the renderer.
    """
    with container:
        st.subheader("Análisis Original")
        display_morphosyntax_results(
            result=analysis,
            lang_code=lang_code,
            morpho_t=morpho_t,
        )

def display_iteration_analysis(container, analysis, lang_code, morpho_t):
    """Render the analysis of the edited text inside ``container``.

    Args:
        container: Streamlit container (context manager) to draw into.
        analysis: Analysis result forwarded to ``display_morphosyntax_results``.
        lang_code: Language code forwarded to the renderer.
        morpho_t: Translation mapping forwarded to the renderer.
    """
    with container:
        st.subheader("Análisis de Cambios")
        display_morphosyntax_results(
            result=analysis,
            lang_code=lang_code,
            morpho_t=morpho_t,
        )

############################################################################

def cache_analysis_results(key, result):
    """Store ``result`` in the session's analysis cache under ``key``.

    When the session has no cache yet, it is created first through
    ``initialize_arc_analysis_state``.
    """
    cache_exists = hasattr(st.session_state, 'analysis_cache')
    if not cache_exists:
        initialize_arc_analysis_state()

    cache = st.session_state.analysis_cache
    cache[key] = result
    logger.info(f"Resultado almacenado en caché con clave: {key}")

def get_cached_analysis(key):
    """Return the cached analysis stored under ``key``, or ``None``.

    When the session has no cache yet, it is created through
    ``initialize_arc_analysis_state`` and ``None`` is returned.
    """
    cache_exists = hasattr(st.session_state, 'analysis_cache')
    if cache_exists:
        cache = st.session_state.analysis_cache
        return cache.get(key)

    # No cache in the session yet: create it; there is nothing to return.
    initialize_arc_analysis_state()
    return None


############################################################################
def _analyze_with_model(text, nlp):
    """Parse ``text`` with ``nlp`` and pair the document with its advanced analysis."""
    return {
        'doc': nlp(text),
        'analysis': perform_advanced_morphosyntactic_analysis(text, nlp),
    }


def _store_arc_diagrams(text, analysis):
    """Persist the arc diagrams for ``text``; warn and log when storing fails.

    Returns the (truthy/falsy) value reported by
    ``store_student_morphosyntax_result``.
    """
    stored = store_student_morphosyntax_result(
        username=st.session_state.username,
        text=text,
        arc_diagrams=analysis['arc_diagrams']
    )
    if not stored:
        # A failed store used to leave the user with no diagram and no
        # explanation; surface it explicitly.
        st.warning("No se pudo guardar el análisis")
        logger.warning("No se pudo guardar el análisis morfosintáctico")
    return stored


def display_morphosyntax_interface(lang_code, nlp_models, morpho_t):
    """Render the morphosyntactic analysis tab.

    Builds three sub-tabs. The first one ("Análisis de Diagramas de Arco")
    lets the user analyze an original text and then re-analyze edited
    versions of it, drawing dependency-arc diagrams for each. The other two
    sub-tabs only show a placeholder notice.

    Args:
        lang_code: Key used to pick the pipeline from ``nlp_models``; also
            forwarded to the display helpers.
        nlp_models: Mapping from language code to a callable NLP pipeline
            (invoked as ``nlp_models[lang_code](text)``).
        morpho_t: Translation mapping forwarded to the display helpers.

    Exceptions are caught, reported with ``st.error`` and logged with their
    traceback; nothing is raised to the caller.
    """
    try:
        # CSS that keeps the layout stable
        st.markdown("""
            <style>
            .stTextArea textarea {
                font-size: 1rem;
                line-height: 1.5;
                min-height: 100px !important;
                height: 100px !important;
            }
            .arc-diagram-container {
                width: 100%;
                padding: 0.5rem;
                margin: 0.5rem 0;
            }
            </style>
        """, unsafe_allow_html=True)

        # Initialize state and keep this tab marked as the active one
        st.session_state.tab_states['morpho_active'] = True
        st.session_state.selected_tab = 1
        initialize_arc_analysis_state()
        state = st.session_state.arc_analysis_state

        arc_tab, categories_tab, morphology_tab = st.tabs([
            "Análisis de Diagramas de Arco",
            "Análisis de Categorías",
            "Análisis Morfológico"
        ])

        # Arc-diagram tab
        with arc_tab:
            # Reset button; the two unused columns only constrain its width.
            reset_col, _, _ = st.columns([2, 1, 2])
            with reset_col:
                if st.button("Nuevo Análisis", type="secondary", use_container_width=True):
                    reset_morpho_state()
                    st.rerun()

            # Separate containers so each input and each diagram keeps a
            # fixed position regardless of the order in which it is filled.
            original_input_container = st.container()
            original_diagram_container = st.container()
            iteration_input_container = st.container()
            iteration_diagram_container = st.container()

            # Original-text input. Widget keys carry the analysis counter so
            # a new analysis gets fresh widgets.
            with original_input_container:
                text_input = st.text_area(
                    # Streamlit discourages empty labels; give a real one
                    # and hide it instead.
                    "Texto original",
                    value=state['original_text'],
                    key=f"original_text_{state['analysis_count']}",
                    height=100,
                    label_visibility="collapsed"
                )

                analyze_col, _, _ = st.columns([2, 1, 2])
                with analyze_col:
                    analyze_button = st.button(
                        "Analizar Texto Original",
                        type="primary",
                        key=f"analyze_original_{state['analysis_count']}",
                        use_container_width=True
                    )

            # Process the original text
            if analyze_button and text_input.strip():
                try:
                    original_result = _analyze_with_model(text_input, nlp_models[lang_code])

                    state.update({
                        'original_text': text_input,
                        'original_analysis': original_result,
                        'iteration_text': text_input,
                        'analysis_count': state['analysis_count'] + 1
                    })

                    if _store_arc_diagrams(text_input, original_result['analysis']):
                        display_original_analysis(
                            original_diagram_container,
                            state['original_analysis'],
                            lang_code,
                            morpho_t
                        )

                except Exception as e:
                    st.error("Error al procesar texto original")
                    logger.exception("Error al procesar texto original: %s", e)

            # Iteration section: only offered once an original analysis exists
            if state.get('original_analysis'):
                with iteration_input_container:
                    st.markdown("---")

                    with st.form(key="iteration_form"):
                        iteration_text = st.text_area(
                            "Texto modificado",
                            value=state.get('iteration_text', ''),
                            key=f"iteration_{state['analysis_count']}",
                            height=100,
                            label_visibility="collapsed"
                        )

                        submitted = st.form_submit_button(
                            "Analizar Cambios",
                            type="primary",
                            use_container_width=True
                        )

                        if submitted and iteration_text.strip():
                            try:
                                # The language is part of the key: the same
                                # text parsed by a different model must not
                                # reuse another language's analysis.
                                cache_key = f"iter_{lang_code}_{iteration_text}"
                                iteration_result = get_cached_analysis(cache_key)

                                if iteration_result is None:
                                    logger.info("Generando nuevo análisis")
                                    iteration_result = _analyze_with_model(
                                        iteration_text,
                                        nlp_models[lang_code]
                                    )
                                    cache_analysis_results(cache_key, iteration_result)
                                else:
                                    logger.info("Usando resultado cacheado")

                                state.update({
                                    'iteration_text': iteration_text,
                                    'iteration_analysis': iteration_result
                                })

                                if _store_arc_diagrams(iteration_text, iteration_result['analysis']):
                                    # Each helper draws into the container it
                                    # is given, so the diagrams land in their
                                    # own sections rather than in this form.
                                    display_original_analysis(
                                        original_diagram_container,
                                        state['original_analysis'],
                                        lang_code,
                                        morpho_t
                                    )
                                    display_iteration_analysis(
                                        iteration_diagram_container,
                                        iteration_result,
                                        lang_code,
                                        morpho_t
                                    )

                            except Exception as e:
                                st.error("Error al procesar iteración")
                                logger.exception("Error al procesar iteración: %s", e)

        # Remaining sub-tabs are placeholders
        with categories_tab:
            st.info("Análisis de Categorías en desarrollo...")

        with morphology_tab:
            st.info("Análisis Morfológico en desarrollo...")

    except Exception as e:
        st.error("Error general en la interfaz")
        logger.exception("Error general en la interfaz: %s", e)

############################################################################

def display_morphosyntax_results(result, lang_code, morpho_t):
    """Render one dependency-arc diagram per sentence of an analyzed document.

    Args:
        result: Mapping holding the processed document under ``'doc'``.
            ``None`` renders nothing.
        lang_code: Language code. Not used here; kept so callers can pass it.
        morpho_t: Translation mapping; its ``'sentence'`` entry (default
            ``'Sentence'``) labels each diagram.

    Errors are logged with their traceback and never raised. A failure on
    one sentence skips only that sentence's diagram.
    """
    if result is None:
        return

    # Loop-invariant pieces, built once per call instead of once per sentence.
    svg_tag = re.compile(r'<svg[^>]*>')
    # Group 1 keeps whatever attributes precede ``transform`` so that the
    # rewrite only changes the vertical offset.
    group_translate = re.compile(r'(<g [^>]*)transform="translate\((\d+),\d+\)"')
    render_options = {
        "distance": 100,
        "arrow_spacing": 20,
        "word_spacing": 30
    }

    try:
        doc = result['doc']
        for i, sent in enumerate(doc.sents):
            try:
                st.subheader(f"{morpho_t.get('sentence', 'Sentence')} {i+1}")
                # Named ``svg`` to avoid shadowing the module-level ``html`` import.
                svg = displacy.render(sent, style="dep", options=render_options)

                # Shrink the rendered diagram: lower fixed heights and a
                # constant vertical offset for translated groups.
                svg = svg.replace('height="375"', 'height="200"')
                svg = svg_tag.sub(
                    lambda m: m.group(0).replace('height="450"', 'height="300"'),
                    svg
                )
                svg = group_translate.sub(
                    lambda m: f'{m.group(1)}transform="translate({m.group(2)},50)"',
                    svg
                )

                st.write(
                    f'<div class="arc-diagram-container">{svg}</div>',
                    unsafe_allow_html=True
                )
            except Exception as e:
                # Keep going: the remaining sentences can still be drawn.
                logger.exception("Error en diagrama %s: %s", i, e)
    except Exception as e:
        logger.exception("Error en display_morphosyntax_results: %s", e)