# streamlit_app.py (Agentic-RAG-Diabetes-Assistant): Streamlit chat front end for the diabetes RAG agent.

# Prefer pysqlite3 over the standard-library sqlite3 module when it is
# installed (the original note gives ChromaDB compatibility as the reason).
try:
    __import__("pysqlite3")
except ImportError:
    # Best effort only: keep the stock sqlite3 module. A log or warning could
    # be emitted here if needed, e.g.
    # print("Warning: pysqlite3-binary not found or could not be loaded. ChromaDB might fail.")
    pass
else:
    import sys

    # Re-register the loaded module under the name "sqlite3" (removing its
    # "pysqlite3" entry) so later `import sqlite3` statements resolve to it.
    sys.modules["sqlite3"] = sys.modules.pop("pysqlite3")

import streamlit as st
import os
import io
import contextlib
import logging
import warnings

# Quiet Hugging Face / Transformers output. This has to happen before the
# project modules are imported further down.
os.environ.update(
    {
        "TRANSFORMERS_VERBOSITY": "error",
        "TOKENIZERS_PARALLELISM": "false",
    }
)

logging.getLogger("transformers").setLevel(logging.ERROR)
# Same filter for both warning categories, registered in the original order.
for _noisy_category in (UserWarning, FutureWarning):
    warnings.filterwarnings("ignore", category=_noisy_category, module="transformers")

from typing import List, Tuple
from langchain_core.messages import BaseMessage, HumanMessage, AIMessage
from langchain_core.runnables import RunnableConfig
from langgraph.errors import GraphRecursionError

# --- Project imports ---
# These resolve against the local `src` package, so the script must be started
# from a location where `src` is importable. If any import fails, the error is
# shown in the Streamlit page and the script run is halted with st.stop().
try:
    from src import config  # Settings read below: RECURSION_LIMIT, DOCUMENTS_PATH
    from src.components import vectorstore  # Queried via _collection.count() to decide whether to index
    from src.indexing import index_documents  # Called once when the vector store is empty
    from src.graph import app  # Compiled graph; invoked per user query
    from src.agent import AgentState  # Not referenced in the visible code; presumably kept for type hints
except ImportError as e:
    st.error(f"Error importing project modules: {e}. Make sure the script is run from the project root or paths are configured correctly.")
    st.stop()

# --- Constants ---
# Label shown when the agent's final state carries no usable confidence value.
UNKNOWN_CONFIDENCE = "N/A"
# Avatars passed to st.chat_message for each side of the conversation.
USER_AVATAR = "👤"
ASSISTANT_AVATAR = "🤖"

# --- Helper Function to Run the Agent and Capture Logs ---
def _append_exchange(chat_history: List[BaseMessage], query: str, answer: str) -> List[BaseMessage]:
    """Return a new history list: ``chat_history`` plus this query/answer pair.

    The input list is not mutated; list concatenation builds a fresh list.
    """
    return chat_history + [
        HumanMessage(content=query),
        AIMessage(content=answer),
    ]


def run_agent_with_logging(query: str, chat_history: List[BaseMessage]) -> Tuple[str, List[BaseMessage], str, str]:
    """
    Run the Agentic RAG graph for one user query and capture its stdout output.

    Everything printed to stdout while the graph runs is redirected into an
    in-memory buffer and returned as ``logs``. Exceptions raised during the run
    are not propagated: they are reported with ``st.error``, turned into an
    apology answer with confidence ``"Error"``, and their traceback is appended
    to the logs.

    Args:
        query: The user's question; passed to the graph as ``"original_query"``.
        chat_history: Prior conversation messages; passed to the graph as
            ``"chat_history"``. This list is never mutated.

    Returns:
        Tuple[str, List[BaseMessage], str, str]: final_answer, new_history, confidence, logs
            - final_answer: text to show the user (an error text on failure).
            - new_history: ``chat_history`` plus the new Human/AI message pair.
            - confidence: ``"Alta"``, ``"Baja"``, ``"Error"`` or ``UNKNOWN_CONFIDENCE``.
            - logs: captured stdout plus any traceback text.
    """
    import traceback

    inputs = {
        "original_query": query,
        "chat_history": chat_history,
    }
    run_config = RunnableConfig(recursion_limit=config.RECURSION_LIMIT)
    log_stream = io.StringIO()

    try:
        # Redirect stdout so the graph's print statements end up in the logs.
        with contextlib.redirect_stdout(log_stream):
            print("--- Starting Agent Execution ---")
            final_state = app.invoke(inputs, config=run_config)
            print("--- Agent Execution Finished ---")

        # Use `or` rather than a .get() default: a state that contains the key
        # with a None/empty value must also fall back to the placeholder text,
        # otherwise AIMessage(content=None) fails and the run is misreported as
        # a generic exception.
        final_answer = (
            final_state.get("final_answer")
            or "Error: No se pudo obtener la respuesta final del estado."
        )
        confidence_raw = final_state.get("generation_confidence")  # Might be None
        error_message = final_state.get("error_message")

        # Map the graph's confidence value to the label shown in the UI. The
        # error message is consulted only when no confidence value was set.
        if confidence_raw == "high":
            confidence = "Alta"
        elif confidence_raw == "low":
            confidence = "Baja"
        elif error_message:
            confidence = "Error"  # Indicate error via confidence
            final_answer = f"Error: {error_message}"
        else:
            confidence = UNKNOWN_CONFIDENCE

        # The answer stored in history may itself be an error text.
        new_history = _append_exchange(chat_history, query, final_answer)

    except GraphRecursionError as e:
        # The graph exceeded its recursion limit.
        st.error(f"Error: Límite de recursión del grafo alcanzado: {e}")
        final_answer = "Lo siento, el proceso se complicó y no pude completar tu solicitud. Intenta reformular la pregunta o simplificarla."
        confidence = "Error"
        new_history = _append_exchange(chat_history, query, final_answer)
        print("\n--- GRAPH RECURSION ERROR ---", file=log_stream)
        print(e, file=log_stream)
        traceback.print_exc(file=log_stream)

    except Exception as e:
        # Top-level boundary for the UI: report the failure instead of crashing the page.
        st.error(f"Error during agent execution: {e}")
        final_answer = f"Lo siento, ocurrió un error grave al procesar tu solicitud: {e}"
        confidence = "Error"
        new_history = _append_exchange(chat_history, query, final_answer)
        print("\n--- EXCEPTION CAUGHT ---", file=log_stream)
        traceback.print_exc(file=log_stream)

    return final_answer, new_history, confidence, log_stream.getvalue()

# --- Streamlit App ---

# Page chrome: browser-tab title and icon, then the visible heading and caption.
# NOTE(review): some Streamlit releases require set_page_config to run before
# other st.* commands; keep it first here and confirm against the pinned version.
st.set_page_config(page_title="Asistente Diabetes", page_icon="🩸")
st.title("Asistente de Diabetes")
st.caption("Consulta información sobre diabetes basada en documentos médicos.")

# --- Initialization and Indexing ---
# Seed the per-session flags the first time this session runs the script.
if "initialized" not in st.session_state:
    st.session_state["initialized"] = False
    st.session_state["indexing_done"] = False
    st.session_state["error_message"] = None

# Repeat the checks on every rerun until one of them completes successfully.
if not st.session_state.initialized:
    with st.status("Inicializando sistema...", expanded=True) as init_status:
        try:
            docs_dir = config.DOCUMENTS_PATH
            st.write(f"Verificando directorio de documentos: '{docs_dir}'...")
            if not os.path.exists(docs_dir):
                # No documents folder yet: create it, tell the user, and halt this run.
                os.makedirs(docs_dir)
                st.warning(f"Directorio '{docs_dir}' creado. Por favor, añade documentos PDF y refresca la página.")
                st.session_state.error_message = "Directorio de documentos creado. Añade PDFs."
                st.stop()

            pdf_names = [name for name in os.listdir(docs_dir) if name.lower().endswith('.pdf')]
            if pdf_names:
                st.write(f"Encontrados {len(pdf_names)} archivos PDF.")
                st.write("Verificando base de datos vectorial...")
                try:
                    entry_count = vectorstore._collection.count()
                    if entry_count != 0:
                        # The store already has entries, so indexing is skipped.
                        st.write(f"Base de datos vectorial contiene {entry_count} entradas. Saltando indexación.")
                        st.session_state.indexing_done = True
                    else:
                        st.write("Base de datos vacía. Indexando documentos (esto puede tardar)...")
                        # Collect whatever the indexer prints so it can be shown in the page.
                        index_log = io.StringIO()
                        with contextlib.redirect_stdout(index_log):
                            indexed_ok = index_documents()
                        st.text_area("Log de Indexación", index_log.getvalue(), height=150)
                        if not indexed_ok:
                            st.error("La indexación falló. Revisa los logs.")
                            st.session_state.error_message = "La indexación falló."
                            st.stop()
                        else:
                            st.write("Indexación completada.")
                            st.session_state.indexing_done = True
                except Exception as db_error:
                    st.error(f"Error al verificar/indexar la base de datos: {db_error}")
                    st.session_state.error_message = f"Error de base de datos: {db_error}"
                    st.stop()
            else:
                st.warning(f"No se encontraron archivos PDF en '{docs_dir}'. El asistente no tendrá documentos para consultar.")
                # Nothing to index; continue so the chat is still usable without documents.
                st.session_state.indexing_done = True

            if st.session_state.indexing_done:
                init_status.update(label="Inicialización completa.", state="complete", expanded=False)
                st.session_state.initialized = True
            else:
                init_status.update(label="Inicialización fallida.", state="error", expanded=True)

        except Exception as fatal_error:
            st.error(f"Error fatal durante la inicialización: {fatal_error}")
            st.session_state.error_message = f"Error fatal: {fatal_error}"
            st.stop()

# --- Chat History Management ---
# Two parallel histories live in the session state:
#   "messages"          - dicts used for rendering ("role", "content", and for
#                         assistant entries "confidence" and "logs")
#   "langchain_history" - LangChain BaseMessage objects handed back to the agent
for history_key in ("messages", "langchain_history"):
    if history_key not in st.session_state:
        st.session_state[history_key] = []

# Replay the stored conversation.
for entry in st.session_state.messages:
    role = entry["role"]
    is_user = role == "user"
    with st.chat_message(role, avatar=USER_AVATAR if is_user else ASSISTANT_AVATAR):
        st.markdown(entry["content"])
        if role != "assistant":
            continue
        # Only assistant entries get the confidence line and the logs expander.
        shown_confidence = entry.get("confidence", UNKNOWN_CONFIDENCE)
        st.markdown(f"*Confianza en la respuesta: {shown_confidence}*")
        stored_logs = entry.get("logs")
        if stored_logs:
            with st.expander("Ver Logs de Ejecución"):
                st.text(stored_logs)

# --- Chat Input ---
prompt = st.chat_input("Escribe tu consulta sobre diabetes...")
if prompt:
    # Record the user's turn and show it.
    st.session_state.messages.append({"role": "user", "content": prompt})
    with st.chat_message("user", avatar=USER_AVATAR):
        st.markdown(prompt)

    # Run the agent while a spinner is displayed.
    with st.spinner("Pensando..."):
        agent_result = run_agent_with_logging(prompt, st.session_state.langchain_history)
    answer_text, updated_history, confidence_label, run_logs = agent_result

    # Persist both histories: LangChain messages for the agent, dicts for rendering.
    st.session_state.langchain_history = updated_history
    st.session_state.messages.append(
        {
            "role": "assistant",
            "content": answer_text,
            "confidence": confidence_label,
            "logs": run_logs,
        }
    )

    # Show the assistant's reply with its confidence label and execution logs.
    with st.chat_message("assistant", avatar=ASSISTANT_AVATAR):
        st.markdown(answer_text)
        st.markdown(f"*Confianza en la respuesta: {confidence_label}*")
        with st.expander("Ver Logs de Ejecución"):
            st.text(run_logs)

# If initialization has not completed and a reason was recorded, show it.
if not st.session_state.initialized:
    failure_reason = st.session_state.error_message
    if failure_reason:
        st.error(f"El sistema no pudo inicializarse correctamente: {failure_reason}")