Spaces:

mrcamcam
/

arize_demo

Sleeping

App Files Files Community

Cam committed on Apr 6

Commit

604eb35

1 Parent(s): 9019284

adjusted app.py due to initialization error

Browse files

Files changed (1) hide show

app.py +91 -134

app.py CHANGED Viewed

@@ -1,72 +1,21 @@
-import streamlit as st
-import os
-import sys
-import uuid
-import logging
-from pathlib import Path
-import subprocess
-# Configure page first (must be the first Streamlit command)
-st.set_page_config(
-    page_title="Assurant 10-K Analysis & Risk Assessment App",
-    page_icon="📊",
-    layout="wide"
-)
-# Run setup script if environment variable is set
-if os.environ.get('STREAMLIT_RUN_SETUP', 'false').lower() == 'true':
-    try:
-        st.write("Setting up environment...")
-        subprocess.call(['bash', 'setup.sh'])
-        st.write("Setup completed!")
-    except Exception as e:
-        st.error(f"Setup failed: {e}")
-# Suppress PyTorch warnings that might appear in the console
-os.environ['PYTHONWARNINGS'] = 'ignore::RuntimeWarning'
-# Configure logging before imports
-logging.basicConfig(
-    level=logging.INFO,
-    format="%(asctime)s - %(name)s - %(levelname)s - %(message)s",
-    handlers=[logging.StreamHandler()]
-)
-logger = logging.getLogger(__name__)
-# Determine the project root directory
-project_root = Path(__file__).parent.absolute()
-logger.info(f"Project root directory: {project_root}")
-# Add the project root to the Python path if it's not already there
-if str(project_root) not in sys.path:
-    sys.path.insert(0, str(project_root))
-    logger.info(f"Added project root to path: {project_root}")
-# Verify the src directory exists
-src_dir = project_root / "src"
-if not src_dir.exists():
-    logger.error(f"Source directory not found: {src_dir}")
-    st.error("Application structure is incorrect. The 'src' directory is missing.")
-else:
-    logger.info(f"Source directory found: {src_dir}")
-# Import the necessary modules using direct imports
-try:
-    # Use absolute imports based on the project structure
-    from src.llamaindex_app.main import init_openai_client, setup_instrumentation, process_interaction
-    from src.llamaindex_app.classifier import QueryClassifier
-    from src.llamaindex_app.index_manager import IndexManager
-    from src.llamaindex_app.config import Settings
-    logger.info("Successfully imported all required modules")
-except ImportError as e:
-    logger.error(f"Import error: {e}")
 def init_app():
     """Initialize everything just once using st.session_state."""
     if "initialized" not in st.session_state:
         try:
-            st.session_state["initialized"] = True
             logger.info("Starting app initialization")
             # Load settings
@@ -87,21 +36,29 @@ def init_app():
             # (3) index manager & query engine
             with st.spinner("Loading index and query engine..."):
                 index_manager = IndexManager(openai_client=openai_client)
                 query_engine = index_manager.get_query_engine()
                 st.session_state["query_engine"] = query_engine
                 logger.info("Index and query engine loaded")
             # (4) classifier
             with st.spinner("Initializing query classifier..."):
-                classifier = QueryClassifier(
-                    query_engine=query_engine,
-                    openai_client=openai_client
-                )
-                st.session_state["classifier"] = classifier
-                logger.info("Query classifier initialized")
-            st.session_state["chat_history"] = []  # store chat Q&A pairs
             logger.info("App initialization complete")
             st.success("App initialized successfully!")
@@ -115,6 +72,9 @@ def init_app():
     return "initialized" in st.session_state and st.session_state["initialized"]
 def main():
     """Main Streamlit app function."""
     st.title("Assurant 10-K Analysis & Risk Assessment App")
@@ -135,6 +95,10 @@ def main():
         # Debug section in sidebar
         if st.checkbox("Show debug info"):
             st.subheader("Debug Information")
             st.write("Python Path:")
             for path in sys.path:
                 st.write(f"- {path}")
@@ -158,18 +122,6 @@ def main():
                 if settings.OPENAI_ORG_ID:
                     st.write(f"- OpenAI Organization: {settings.OPENAI_ORG_ID}")
-    # Check if the required modules are properly imported
-    if 'src.llamaindex_app.classifier' not in sys.modules:
-        st.error("Failed to import required modules. Please check your project structure and try again.")
-        st.info("""
-        Troubleshooting steps:
-        1. Ensure you have proper __init__.py files in src/ and src/llamaindex_app/ directories
-        2. Verify that all Python modules are in the correct locations
-        3. Check that your imports use absolute paths (src.llamaindex_app.module)
-        4. Make sure all requirements are installed
-        """)
-        return
     # Initialize the app
     initialization_status = init_app()
@@ -178,51 +130,64 @@ def main():
         st.warning("Please check your environment variables and connection settings.")
         return
-    # Query section
-    st.subheader("Ask a question about Assurant's 10-K")
-    user_question = st.text_input("Your question:", placeholder="e.g., How did Assurant perform last quarter?")
-    submit = st.button("Submit Question")
-    if submit and user_question.strip():
-        # retrieve references from st.session_state
-        query_engine = st.session_state["query_engine"]
-        classifier = st.session_state["classifier"]
-        tracer = st.session_state["tracer"]
-        session_id = str(uuid.uuid4())
-        with st.spinner("Analyzing your question..."):
             try:
-                # Log the question being processed
-                logger.info(f"Processing query: {user_question}")
-                response, error = process_interaction(
-                    query_engine,
-                    classifier,
-                    tracer,
-                    user_question,
-                    session_id
-                )
-                # Store in st.session_state so we can display entire conversation
-                if error:
-                    st.session_state["chat_history"].append(("user", user_question))
-                    st.session_state["chat_history"].append(("assistant", f"Error: {error}"))
-                    st.error(f"Error: {error}")
-                    logger.error(f"Query processing error: {error}")
-                else:
-                    st.session_state["chat_history"].append(("user", user_question))
-                    st.session_state["chat_history"].append(("assistant", response.response))
-                    logger.info("Query processed successfully")
-                    # If there are any sources
-                    if getattr(response, "source_nodes", None):
-                        source_text = "\n".join(
-                            f"- {node.metadata.get('file_name', 'Unknown source')}"
-                            for node in response.source_nodes
-                        )
-                        st.session_state["chat_history"].append(("assistant_sources", source_text))
-                        logger.info(f"Found {len(response.source_nodes)} source nodes")
             except Exception as e:
                 st.error(f"Error processing your question: {str(e)}")
                 logger.error(f"Process interaction error: {str(e)}", exc_info=True)
@@ -245,12 +210,4 @@ def main():
             # Add a separator between conversations
             if idx < len(st.session_state.get("chat_history", [])) - 1 and role == "assistant":
-                st.markdown("---")
-if __name__ == "__main__":
-    try:
-        main()
-    except Exception as e:
-        logger.error(f"Unhandled exception in main app: {str(e)}", exc_info=True)
-        st.error(f"An unexpected error occurred: {str(e)}")
-        st.warning("Please check the logs for more details.")

+# Modify the init_app function in app.py to ensure proper initialization and handling of errors:
 def init_app():
     """Initialize everything just once using st.session_state."""
+    # Initialize empty collections to prevent KeyError
+    if "chat_history" not in st.session_state:
+        st.session_state["chat_history"] = []
+    # Create a flag for initialization attempts
+    if "initialization_attempted" not in st.session_state:
+        st.session_state["initialization_attempted"] = False
     if "initialized" not in st.session_state:
+        st.session_state["initialization_attempted"] = True
         try:
+            # Add key presence checks before starting initialization
+            st.session_state["initialized"] = False  # Mark as not initialized until complete
             logger.info("Starting app initialization")
             # Load settings
             # (3) index manager & query engine
             with st.spinner("Loading index and query engine..."):
+                # Create these objects explicitly
                 index_manager = IndexManager(openai_client=openai_client)
                 query_engine = index_manager.get_query_engine()
+                # Store them in session_state
+                st.session_state["index_manager"] = index_manager
                 st.session_state["query_engine"] = query_engine
                 logger.info("Index and query engine loaded")
             # (4) classifier
             with st.spinner("Initializing query classifier..."):
+                # Create classifier only when we are sure query_engine exists
+                if "query_engine" in st.session_state:
+                    classifier = QueryClassifier(
+                        query_engine=st.session_state["query_engine"],
+                        openai_client=openai_client
+                    )
+                    st.session_state["classifier"] = classifier
+                    logger.info("Query classifier initialized")
+                else:
+                    raise ValueError("Query engine not initialized properly")
+            st.session_state["initialized"] = True  # Now mark as fully initialized
             logger.info("App initialization complete")
             st.success("App initialized successfully!")
     return "initialized" in st.session_state and st.session_state["initialized"]
+# Modify the main function to handle errors more gracefully:
 def main():
     """Main Streamlit app function."""
     st.title("Assurant 10-K Analysis & Risk Assessment App")
         # Debug section in sidebar
         if st.checkbox("Show debug info"):
             st.subheader("Debug Information")
+            st.write("Session State Keys:")
+            for key in st.session_state:
+                st.write(f"- {key}: {'Present' if st.session_state[key] is not None else 'None'}")
             st.write("Python Path:")
             for path in sys.path:
                 st.write(f"- {path}")
                 if settings.OPENAI_ORG_ID:
                     st.write(f"- OpenAI Organization: {settings.OPENAI_ORG_ID}")
     # Initialize the app
     initialization_status = init_app()
         st.warning("Please check your environment variables and connection settings.")
         return
+    # Safety check - if we've attempted initialization but still don't have key components
+    if st.session_state.get("initialization_attempted", False) and not st.session_state.get("initialized", False):
+        st.warning("The application is still initializing or had problems during initialization. Please wait or refresh the page.")
+        return
+    # Query section - Only show if properly initialized
+    if st.session_state.get("initialized", False):
+        st.subheader("Ask a question about Assurant's 10-K")
+        user_question = st.text_input("Your question:", placeholder="e.g., How did Assurant perform last quarter?")
+        submit = st.button("Submit Question")
+        if submit and user_question.strip():
+            # Safely retrieve references from st.session_state with error handling
             try:
+                # Check that all required components exist
+                required_keys = ["query_engine", "classifier", "tracer"]
+                missing_keys = [key for key in required_keys if key not in st.session_state]
+                if missing_keys:
+                    st.error(f"Missing required components: {', '.join(missing_keys)}")
+                    return
+                query_engine = st.session_state["query_engine"]
+                classifier = st.session_state["classifier"]
+                tracer = st.session_state["tracer"]
+                session_id = str(uuid.uuid4())
+                with st.spinner("Analyzing your question..."):
+                    # Log the question being processed
+                    logger.info(f"Processing query: {user_question}")
+                    response, error = process_interaction(
+                        query_engine,
+                        classifier,
+                        tracer,
+                        user_question,
+                        session_id
+                    )
+                    # Store in st.session_state so we can display entire conversation
+                    if error:
+                        st.session_state["chat_history"].append(("user", user_question))
+                        st.session_state["chat_history"].append(("assistant", f"Error: {error}"))
+                        st.error(f"Error: {error}")
+                        logger.error(f"Query processing error: {error}")
+                    else:
+                        st.session_state["chat_history"].append(("user", user_question))
+                        st.session_state["chat_history"].append(("assistant", response.response))
+                        logger.info("Query processed successfully")
+                        # If there are any sources
+                        if getattr(response, "source_nodes", None):
+                            source_text = "\n".join(
+                                f"- {node.metadata.get('file_name', 'Unknown source')}"
+                                for node in response.source_nodes
+                            )
+                            st.session_state["chat_history"].append(("assistant_sources", source_text))
+                            logger.info(f"Found {len(response.source_nodes)} source nodes")
             except Exception as e:
                 st.error(f"Error processing your question: {str(e)}")
                 logger.error(f"Process interaction error: {str(e)}", exc_info=True)
             # Add a separator between conversations
             if idx < len(st.session_state.get("chat_history", [])) - 1 and role == "assistant":
+                st.markdown("---")