v3 / modules /morphosyntax /morphosyntax_interface.py
AIdeaText's picture
Update modules/morphosyntax/morphosyntax_interface.py
bcc273d verified
raw
history blame
10 kB
#modules/morphosyntax/morphosyntax_interface.py
#Importaciones generales
import streamlit as st
from streamlit_float import *
from streamlit_antd_components import *
from streamlit.components.v1 import html
import spacy
from spacy import displacy
import spacy_streamlit
import pandas as pd
import base64
import re
#Importaciones locales
from .morphosyntax_process import (
process_morphosyntactic_input,
format_analysis_results,
perform_advanced_morphosyntactic_analysis,
get_repeated_words_colors,
highlight_repeated_words,
POS_COLORS,
POS_TRANSLATIONS
)
from ..utils.widget_utils import generate_unique_key
from ..database.morphosintax_mongo_db import store_student_morphosyntax_result
from ..database.chat_mongo_db import store_chat_history, get_chat_history
import logging
logger = logging.getLogger(__name__)
###########################################################################
def reset_morpho_state():
"""Resetea el estado del análisis morfosintáctico"""
if 'arc_analysis_state' in st.session_state:
st.session_state.arc_analysis_state = {
'original_text': '',
'original_analysis': None,
'iteration_text': '',
'iteration_analysis': None,
'analysis_count': 0
}
############################################################################
def display_original_analysis(container, analysis, lang_code, morpho_t):
"""Muestra el análisis original en el contenedor especificado"""
with container:
st.subheader("Análisis Original")
display_morphosyntax_results(analysis, lang_code, morpho_t)
def display_iteration_analysis(container, analysis, lang_code, morpho_t):
"""Muestra el análisis de cambios en el contenedor especificado"""
with container:
st.subheader("Análisis de Cambios")
display_morphosyntax_results(analysis, lang_code, morpho_t)
############################################################################
def display_morphosyntax_interface(lang_code, nlp_models, morpho_t):
try:
# CSS para layout estable
st.markdown("""
<style>
.stTextArea textarea {
font-size: 1rem;
line-height: 1.5;
min-height: 100px !important;
height: 100px !important;
}
.arc-diagram-container {
width: 100%;
padding: 0.5rem;
margin: 0.5rem 0;
}
</style>
""", unsafe_allow_html=True)
# Estado para subtabs
if 'morpho_subtab' not in st.session_state:
st.session_state.morpho_subtab = 0
# Crear subtabs
subtabs = st.tabs([
"Análisis de Diagramas de Arco",
"Análisis de Categorías",
"Análisis Morfológico"
])
# Tab de Diagramas de Arco
with subtabs[0]:
# Botón de reset
col1, col2, col3 = st.columns([2,1,2])
with col1:
if st.button("Nuevo Análisis", type="secondary", use_container_width=True):
reset_morpho_state()
st.rerun()
# Estado para análisis...
# Contenedores separados para cada tipo de análisis
original_input_container = st.container()
original_diagram_container = st.container()
iteration_input_container = st.container()
iteration_diagram_container = st.container()
# Sección de análisis original
with original_input_container:
text_key = f"original_text_{st.session_state.arc_analysis_state['analysis_count']}"
text_input = st.text_area(
"",
value=st.session_state.arc_analysis_state['original_text'],
key=text_key,
height=100
)
col1, col2, col3 = st.columns([2,1,2])
with col1:
analyze_button = st.button(
"Analizar Texto Original",
type="primary",
key=f"analyze_original_{st.session_state.arc_analysis_state['analysis_count']}"
)
# Procesar texto original
if analyze_button and text_input.strip():
try:
doc = nlp_models[lang_code](text_input)
analysis = perform_advanced_morphosyntactic_analysis(
text_input,
nlp_models[lang_code]
)
# Actualizar estado
st.session_state.arc_analysis_state.update({
'original_text': text_input,
'original_analysis': {'doc': doc, 'analysis': analysis},
'iteration_text': text_input,
'analysis_count': st.session_state.arc_analysis_state['analysis_count'] + 1
})
if store_student_morphosyntax_result(
username=st.session_state.username,
text=text_input,
arc_diagrams=analysis['arc_diagrams']
):
display_original_analysis(
original_diagram_container,
st.session_state.arc_analysis_state['original_analysis'],
lang_code,
morpho_t
)
except Exception as e:
st.error("Error al procesar texto original")
logger.error(f"Error: {str(e)}")
# Sección de iteración
if st.session_state.arc_analysis_state.get('original_analysis'):
with iteration_input_container:
st.markdown("---")
iteration_key = f"iteration_{st.session_state.arc_analysis_state['analysis_count']}"
# Usar un formulario para evitar recargas innecesarias
with st.form(key="iteration_form"):
iteration_text = st.text_area(
"",
value=st.session_state.arc_analysis_state['iteration_text'],
key=iteration_key,
height=100
)
iterate_button = st.form_submit_button(
"Analizar Cambios",
type="primary",
use_container_width=True
)
if iterate_button and iteration_text.strip():
try:
doc_iter = nlp_models[lang_code](iteration_text)
analysis_iter = perform_advanced_morphosyntactic_analysis(
iteration_text,
nlp_models[lang_code]
)
# Actualizar solo el análisis de iteración
st.session_state.arc_analysis_state.update({
'iteration_text': iteration_text,
'iteration_analysis': {'doc': doc_iter, 'analysis': analysis_iter}
})
if store_student_morphosyntax_result(
username=st.session_state.username,
text=iteration_text,
arc_diagrams=analysis_iter['arc_diagrams']
):
display_iteration_analysis(
iteration_diagram_container,
{'doc': doc_iter, 'analysis': analysis_iter},
lang_code,
morpho_t
)
except Exception as e:
st.error("Error al procesar iteración")
logger.error(f"Error: {str(e)}")
# Otros subtabs...
except Exception as e:
st.error("Error general en la interfaz")
logger.error(f"Error: {str(e)}")
############################################################################
def display_morphosyntax_results(result, lang_code, morpho_t):
"""
Muestra solo el diagrama de arco.
Args:
result: Diccionario con el documento procesado y su análisis
lang_code: Código del idioma
morpho_t: Diccionario de traducciones
"""
if result is None:
return
try:
doc = result['doc']
sentences = list(doc.sents)
for i, sent in enumerate(sentences):
try:
st.subheader(f"{morpho_t.get('sentence', 'Sentence')} {i+1}")
html = displacy.render(sent, style="dep", options={
"distance": 100,
"arrow_spacing": 20,
"word_spacing": 30
})
html = html.replace('height="375"', 'height="200"')
html = re.sub(r'<svg[^>]*>', lambda m: m.group(0).replace('height="450"', 'height="300"'), html)
html = re.sub(r'<g [^>]*transform="translate\((\d+),(\d+)\)"',
lambda m: f'<g transform="translate({m.group(1)},50)"', html)
html = f'<div class="arc-diagram-container">{html}</div>'
st.write(html, unsafe_allow_html=True)
except Exception as e:
logger.error(f"Error en diagrama {i}: {str(e)}")
continue
except Exception as e:
logger.error(f"Error en display_morphosyntax_results: {str(e)}")