Spaces:
Runtime error
Runtime error
# modules/morphosyntax/morphosyntax_interface.py | |
import streamlit as st | |
from streamlit_float import * | |
from streamlit_antd_components import * | |
from streamlit.components.v1 import html | |
import spacy | |
from spacy import displacy | |
import spacy_streamlit | |
import pandas as pd | |
import base64 | |
import re | |
# Importaciones locales | |
from .morphosyntax_process import ( | |
process_morphosyntactic_input, | |
format_analysis_results, | |
perform_advanced_morphosyntactic_analysis, | |
get_repeated_words_colors, | |
highlight_repeated_words, | |
POS_COLORS, | |
POS_TRANSLATIONS | |
) | |
from ..utils.widget_utils import generate_unique_key | |
from ..database.morphosyntax_iterative_mongo_db import ( | |
store_student_morphosyntax_base, | |
store_student_morphosyntax_iteration, | |
get_student_morphosyntax_analysis, | |
update_student_morphosyntax_analysis, | |
delete_student_morphosyntax_analysis, | |
get_student_morphosyntax_data | |
) | |
import logging | |
logger = logging.getLogger(__name__) | |
########################################################################### | |
def initialize_arc_analysis_state(): | |
"""Inicializa el estado del an谩lisis de arcos y el cach茅 si no existen.""" | |
if 'arc_analysis_state' not in st.session_state: | |
st.session_state.arc_analysis_state = { | |
'base_id': None, # ID del an谩lisis base | |
'original_text': '', # Texto original | |
'original_analysis': None, # Resultado an谩lisis original | |
'iteration_text': '', # Texto de iteraci贸n | |
'iteration_analysis': None,# Resultado an谩lisis iteraci贸n | |
'analysis_count': 0 | |
} | |
logger.info("Estado de an谩lisis de arcos inicializado") | |
# Inicializar cach茅 de an谩lisis | |
if 'analysis_cache' not in st.session_state: | |
st.session_state.analysis_cache = {} | |
logger.info("Cach茅 de an谩lisis inicializado") | |
def reset_morpho_state(): | |
"""Resetea el estado del an谩lisis morfosint谩ctico en sesi贸n.""" | |
if 'arc_analysis_state' in st.session_state: | |
st.session_state.arc_analysis_state = { | |
'base_id': None, | |
'original_text': '', | |
'original_analysis': None, | |
'iteration_text': '', | |
'iteration_analysis': None, | |
'analysis_count': 0 | |
} | |
def display_original_analysis(container, analysis, lang_code, morpho_t): | |
"""Muestra el an谩lisis original en el contenedor especificado.""" | |
with container: | |
st.subheader("An谩lisis Original") | |
display_morphosyntax_results(analysis, lang_code, morpho_t) | |
def display_iteration_analysis(container, analysis, lang_code, morpho_t): | |
"""Muestra el an谩lisis de cambios en el contenedor especificado.""" | |
with container: | |
st.subheader("An谩lisis de Cambios") | |
display_morphosyntax_results(analysis, lang_code, morpho_t) | |
def display_arc_diagram(doc, analysis): | |
"""Muestra un diagrama de arco sin t铆tulo.""" | |
try: | |
for sent in doc.sents: | |
svg_html = displacy.render( | |
sent, | |
style="dep", | |
options={ | |
"distance": 100, | |
"arrow_spacing": 20, | |
"word_spacing": 30 | |
} | |
) | |
# Ajustar tama帽o y posici贸n | |
svg_html = svg_html.replace('height="375"', 'height="200"') | |
svg_html = re.sub( | |
r'<svg[^>]*>', | |
lambda m: m.group(0).replace('height="450"', 'height="300"'), | |
svg_html | |
) | |
svg_html = re.sub( | |
r'<g [^>]*transform="translate\((\d+),(\d+)\)"', | |
lambda m: f'<g transform="translate({m.group(1)},50)"', | |
svg_html | |
) | |
# Envolver en contenedor con estilo | |
svg_html = f'<div class="arc-diagram-container">{svg_html}</div>' | |
st.write(svg_html, unsafe_allow_html=True) | |
except Exception as e: | |
logger.error(f"Error en display_arc_diagram: {str(e)}") | |
def cache_analysis_results(key, result): | |
"""Almacena resultados de an谩lisis en cach茅.""" | |
if not hasattr(st.session_state, 'analysis_cache'): | |
initialize_arc_analysis_state() | |
st.session_state.analysis_cache[key] = result | |
logger.info(f"Resultado almacenado en cach茅 con clave: {key}") | |
def get_cached_analysis(key): | |
"""Recupera resultados de an谩lisis del cach茅.""" | |
if not hasattr(st.session_state, 'analysis_cache'): | |
initialize_arc_analysis_state() | |
return None | |
return st.session_state.analysis_cache.get(key) | |
def display_morphosyntax_interface(lang_code, nlp_models, morpho_t): | |
""" | |
Interfaz principal para el an谩lisis morfosint谩ctico. | |
Evita resets indebidos y conserva la pesta帽a activa. | |
""" | |
try: | |
# CSS para layout estable | |
st.markdown(""" | |
<style> | |
.stTextArea textarea { | |
font-size: 1rem; | |
line-height: 1.5; | |
min-height: 100px !important; | |
height: 100px !important; | |
} | |
.arc-diagram-container { | |
width: 100%; | |
padding: 0.5rem; | |
margin: 0.5rem 0; | |
} | |
.divider { | |
height: 3px; | |
border: none; | |
background-color: #333; | |
margin: 2rem 0; | |
} | |
</style> | |
""", unsafe_allow_html=True) | |
# Inicializar estados de an谩lisis si no existen | |
initialize_arc_analysis_state() | |
# ------------------------------------------------------------------ | |
# Si tuvieras un control de tabs global, puedes comentarlo: | |
# | |
# st.session_state.tab_states['morpho_active'] = True | |
# st.session_state.selected_tab = 1 | |
# ------------------------------------------------------------------ | |
# Crear subtabs | |
subtabs = st.tabs([ | |
"An谩lisis de Diagramas de Arco", | |
"An谩lisis de Categor铆as", | |
"An谩lisis Morfol贸gico" | |
]) | |
# -------------------- Subtab 0: Diagramas de Arco -------------------- | |
with subtabs[0]: | |
# Bot贸n de reset | |
col1, col2, col3 = st.columns([2, 1, 2]) | |
with col1: | |
if st.button("Nuevo An谩lisis", type="secondary", use_container_width=True): | |
reset_morpho_state() | |
# Forzar el rec谩lculo limpio | |
st.rerun() | |
# Container principal para an谩lisis base | |
analysis_container = st.container() | |
with analysis_container: | |
# Entrada de texto original | |
text_input_key = f"original_text_{st.session_state.arc_analysis_state['analysis_count']}" | |
text_input = st.text_area( | |
"Texto original", | |
value=st.session_state.arc_analysis_state.get('original_text', ''), | |
key=text_input_key, | |
height=100 | |
) | |
# Bot贸n de an谩lisis | |
col1, col2, col3 = st.columns([2, 1, 2]) | |
with col1: | |
analyze_button = st.button( | |
"Analizar Texto", | |
type="primary", | |
use_container_width=True | |
) | |
# Procesar texto original | |
if analyze_button and text_input.strip(): | |
try: | |
# Realizar an谩lisis base (SpaCy) | |
doc = nlp_models[lang_code](text_input) | |
analysis = perform_advanced_morphosyntactic_analysis( | |
text_input, | |
nlp_models[lang_code] | |
) | |
# Guardar an谩lisis base en BD y obtener ID | |
base_id = store_student_morphosyntax_base( | |
st.session_state.username, | |
text_input, | |
analysis['arc_diagrams'] | |
) | |
if base_id: | |
# Actualizar el estado en session_state | |
st.session_state.arc_analysis_state.update({ | |
'base_id': base_id, | |
'original_text': text_input, | |
'original_analysis': analysis, # guardamos el dict | |
'analysis_count': st.session_state.arc_analysis_state['analysis_count'] + 1 | |
}) | |
# Mostrar diagrama base | |
display_arc_diagram(doc, analysis) | |
# L铆nea divisora | |
st.markdown('<hr class="divider">', unsafe_allow_html=True) | |
# 脕rea de iteraci贸n: usar un formulario | |
with st.form("iteration_form"): | |
# Separamos la key para la iteraci贸n para que no se sobreescriba | |
iteration_text_key = f"iteration_text_{st.session_state.arc_analysis_state['analysis_count']}" | |
# Mostrar el texto de iteraci贸n que tengamos en session_state | |
iteration_text = st.text_area( | |
"Texto de iteraci贸n", | |
value=st.session_state.arc_analysis_state.get('iteration_text', text_input), | |
key=iteration_text_key, | |
height=100 | |
) | |
# Bot贸n de submit en el formulario | |
col1, col2, col3 = st.columns([2,1,2]) | |
with col1: | |
submitted = st.form_submit_button( | |
"Analizar Cambios", | |
type="primary", | |
use_container_width=True | |
) | |
# Procesar iteraci贸n | |
if submitted and iteration_text.strip(): | |
try: | |
doc_iter = nlp_models[lang_code](iteration_text) | |
analysis_iter = perform_advanced_morphosyntactic_analysis( | |
iteration_text, | |
nlp_models[lang_code] | |
) | |
# Guardar iteraci贸n | |
iteration_id = store_student_morphosyntax_iteration( | |
st.session_state.username, | |
base_id, | |
text_input, # Texto original | |
iteration_text, # Texto de iteraci贸n | |
analysis_iter['arc_diagrams'] | |
) | |
if iteration_id: | |
# Actualizar el estado de iteraci贸n en session_state | |
st.session_state.arc_analysis_state.update({ | |
'iteration_text': iteration_text, | |
'iteration_analysis': analysis_iter | |
}) | |
# Mostrar diagrama de iteraci贸n | |
display_arc_diagram(doc_iter, analysis_iter) | |
except Exception as e: | |
st.error("Error procesando iteraci贸n") | |
logger.error(f"Error en iteraci贸n: {str(e)}") | |
except Exception as e: | |
st.error("Error procesando an谩lisis base") | |
logger.error(f"Error base: {str(e)}") | |
# -------------------- Subtab 1: An谩lisis de Categor铆as ---------------- | |
with subtabs[1]: | |
st.info("An谩lisis de Categor铆as en desarrollo...") | |
# -------------------- Subtab 2: An谩lisis Morfol贸gico ------------------ | |
with subtabs[2]: | |
st.info("An谩lisis Morfol贸gico en desarrollo...") | |
except Exception as e: | |
st.error("Error en la interfaz de morfosintaxis") | |
logger.error(f"Error general en la interfaz: {str(e)}") | |
def display_morphosyntax_results(result, lang_code, morpho_t): | |
""" | |
Muestra solo el diagrama de arco. | |
Args: | |
result: Diccionario con el documento procesado y su an谩lisis | |
lang_code: C贸digo del idioma | |
morpho_t: Diccionario de traducciones (opcional) | |
""" | |
if result is None: | |
return | |
try: | |
doc = result['doc'] | |
sentences = list(doc.sents) | |
for i, sent in enumerate(sentences): | |
try: | |
st.subheader(f"{morpho_t.get('sentence', 'Sentence')} {i+1}") | |
svg_html = displacy.render( | |
sent, | |
style="dep", | |
options={ | |
"distance": 100, | |
"arrow_spacing": 20, | |
"word_spacing": 30 | |
} | |
) | |
svg_html = svg_html.replace('height="375"', 'height="200"') | |
svg_html = re.sub( | |
r'<svg[^>]*>', | |
lambda m: m.group(0).replace('height="450"', 'height="300"'), | |
svg_html | |
) | |
svg_html = re.sub( | |
r'<g [^>]*transform="translate\((\d+),(\d+)\)"', | |
lambda m: f'<g transform="translate({m.group(1)},50)"', | |
svg_html | |
) | |
svg_html = f'<div class="arc-diagram-container">{svg_html}</div>' | |
st.write(svg_html, unsafe_allow_html=True) | |
except Exception as exc: | |
logger.error(f"Error mostrando diagrama de la oraci贸n {i}: {str(exc)}") | |
continue | |
except Exception as e: | |
logger.error(f"Error en display_morphosyntax_results: {str(e)}") | |