erwallace · erwallace · May 23, 2025 · May 22, 2025 · May 22, 2025 · May 22, 2025
diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
@@ -1,3 +1,4 @@
+exclude: ^vectorstore/
 repos:
   - repo: https://github.com/pre-commit/pre-commit-hooks
     rev: v4.5.0

diff --git a/src/paper_query/base_chatbot.py b/src/paper_query/base_chatbot.py
@@ -15,7 +15,7 @@ def main():
     parser.add_argument(
         "--model",
         type=str,
-        default="gpt-4o",
+        default="gpt-4.1",
         help="Model name to use for the chatbot",
     )
     parser.add_argument(

diff --git a/src/paper_query/code_query_chatbot.py b/src/paper_query/code_query_chatbot.py
@@ -18,7 +18,7 @@ def main():
     parser.add_argument(
         "--model",
         type=str,
-        default="gpt-4o",
+        default="gpt-4.1",
         help="Model name to use for the chatbot",
     )
     parser.add_argument(

diff --git a/src/paper_query/constants/__init__.py b/src/paper_query/constants/__init__.py
@@ -1,6 +1,6 @@
 from ._api_keys import GROQ_API_KEY, HUGGINGFACE_API_KEY, OPENAI_API_KEY
 from ._paths import PERSIST_DIRECTORY, assets_dir, data_dir, project_dir, src_dir, test_dir
-from ._strings import RAG_DOC_ID
+from ._strings import RAG_DOC_ID, STREAMLIT_CHEAP_MODEL, STREAMLIT_EXPENSIVE_MODEL
 
 __all__ = [
     "OPENAI_API_KEY",
@@ -13,4 +13,6 @@
     "data_dir",
     "assets_dir",
     "RAG_DOC_ID",
+    "STREAMLIT_CHEAP_MODEL",
+    "STREAMLIT_EXPENSIVE_MODEL",
 ]
diff --git a/src/paper_query/constants/_strings.py b/src/paper_query/constants/_strings.py
@@ -1 +1,4 @@
 RAG_DOC_ID = "file"
+
+STREAMLIT_CHEAP_MODEL = "GPT-4.1-nano"
+STREAMLIT_EXPENSIVE_MODEL = "GPT-4.1"
diff --git a/src/paper_query/hybrid_query_chatbot.py b/src/paper_query/hybrid_query_chatbot.py
@@ -18,7 +18,7 @@ def main():
     parser.add_argument(
         "--model",
         type=str,
-        default="gpt-4o",
+        default="gpt-4.1",
         help="Model name to use for the chatbot",
     )
     parser.add_argument(

diff --git a/src/paper_query/paper_query_chatbot.py b/src/paper_query/paper_query_chatbot.py
@@ -18,7 +18,7 @@ def main():
     parser.add_argument(
         "--model",
         type=str,
-        default="gpt-4o",
+        default="gpt-4.1",
         help="Model name to use for the chatbot",
     )
     parser.add_argument(

diff --git a/src/paper_query/paper_query_plus_chatbot.py b/src/paper_query/paper_query_plus_chatbot.py
@@ -19,7 +19,7 @@ def main():
     parser.add_argument(
         "--model",
         type=str,
-        default="gpt-4o",
+        default="gpt-4.1",
         help="Model name to use for the chatbot",
     )
     parser.add_argument(

diff --git a/src/paper_query/ui/components/chat_interface.py b/src/paper_query/ui/components/chat_interface.py
@@ -6,24 +6,33 @@ def display_chat_interface() -> None:
     if "messages" not in st.session_state:
         st.session_state.messages = []
 
-    for message in st.session_state.messages:
-        with st.chat_message(message["role"]):
-            st.markdown(message["content"])
+    message_container = st.container()
 
-    if "chatbot_confirmed" in st.session_state and st.session_state.chatbot_confirmed:
+    # Display all past messages in the message container
+    with message_container:
+        for message in st.session_state.messages:
+            with st.chat_message(message["role"]):
+                st.markdown(message["content"])
+
+    # Create the input at the bottom
+    if "chatbot_ready" in st.session_state and st.session_state.chatbot_ready:
         if user_input := st.chat_input("What is your question?", key="user_input"):
-            st.chat_message("user").markdown(user_input)
+            # Add user message to UI
+            with message_container:
+                st.chat_message("user").markdown(user_input)
             st.session_state.messages.append({"role": "user", "content": user_input})
 
-            with st.chat_message("assistant"):
-                message_placeholder = st.empty()
-                full_response = ""
+            # Add assistant response to UI
+            with message_container:
+                with st.chat_message("assistant"):
+                    message_placeholder = st.empty()
+                    full_response = ""
 
-                for response_chunk in st.session_state.chatbot.stream_response(user_input):
-                    full_response += response_chunk
-                    message_placeholder.markdown(full_response)
+                    for response_chunk in st.session_state.chatbot.stream_response(user_input):
+                        full_response += response_chunk
+                        message_placeholder.markdown(full_response)
 
-                message_placeholder.markdown(full_response)
+                    message_placeholder.markdown(full_response)
 
             st.session_state.messages.append({"role": "assistant", "content": full_response})
     else:

diff --git a/src/paper_query/ui/components/sidebar_inputs.py b/src/paper_query/ui/components/sidebar_inputs.py
@@ -17,7 +17,7 @@ def get_class_params(cls) -> list[str]:
     ]
 
 
-def model_name_input(name: str = "gpt-4o") -> str:
+def model_name_input(name: str = "gpt-4.1") -> str:
     """Get the model name from the sidebar."""
     return st.sidebar.text_input("Model Name", value=name, key="model_name_input")
 

diff --git a/src/paper_query/ui/components/text.py b/src/paper_query/ui/components/text.py
@@ -0,0 +1,55 @@
+from paper_query.constants import STREAMLIT_EXPENSIVE_MODEL
+
+ABOUT = f"""
+**StrainRelief is a tool for calculating ligand strain energy with quantum mechanical
+accuracy**.
+
+##### What is ligand strain energy?
+Ligand strain energy is the energy difference between the bound and unbound conformations
+of a ligand. It's an important component in structure-based small molecule drug design.
+
+##### How does StrainRelief work?
+StrainRelief uses a MACE Neural Network Potential (NNP) trained on a large database of
+Density Functional Theory (DFT) calculations to estimate ligand strain of neutral molecules
+with quantum accuracy.
+
+##### About this chatbot
+This chatbot is built using a hybrid retrieval and cached augmented generation (RAG/CAG)
+approach:
+
+1. The full StrainRelief [paper](https://arxiv.org/abs/2503.13352) is loaded and cached
+in the context window for all queries
+2. Reference papers cited in StrainRelief are embedded and available for retrieval
+3. The StrainRelief code [repository](https://github.com/prescient-design/StrainRelief)
+is embedded and available for retrieval
+
+The chatbot currently has a naive modular framework. When you ask a question, the
+system:
+- Retrieves relevant information from the references and code
+- Combines this with the full paper context
+- Uses the LLM to generate a response based on all available information
+
+The chatbot uses the following components:
+- **LLM**: {STREAMLIT_EXPENSIVE_MODEL} from OpenAI for generating responses
+- **Embedding**: OpenAI embeddings for vector search
+- **Vector Database**: ChromaDB for storing and retrieving embedded documents
+
+Feel free to ask about the StrainRelief methodology, implementation details, or
+how to use the tool for drug discovery applications.
+        """
+
+ABSTRACT = """
+:gray[**Abstract**: Ligand strain energy, the energy difference between the
+bound and unbound conformations of a ligand, is an important component of
+structure-based small molecule drug design. A large majority of observed
+ligands in protein-small molecule co-crystal structures bind in low-strain
+conformations, making strain energy a useful filter for structure-based drug
+design. In this work we present a tool for calculating ligand strain with a
+high accuracy. StrainRelief uses a MACE Neural Network Potential (NNP),
+trained on a large database of Density Functional Theory (DFT) calculations
+to estimate ligand strain of neutral molecules with quantum accuracy. We show
+that this tool estimates strain energy differences relative to DFT to within
+1.4 kcal/mol, more accurately than alternative NNPs. These results highlight
+the utility of NNPs in drug discovery, and provide a useful tool for drug
+discovery teams.]
+"""
diff --git a/src/paper_query/ui/components/validate_key.py b/src/paper_query/ui/components/validate_key.py
@@ -0,0 +1,37 @@
+import streamlit as st
+from loguru import logger
+from openai import OpenAI
+
+from paper_query.constants import STREAMLIT_CHEAP_MODEL, STREAMLIT_EXPENSIVE_MODEL
+
+
+def validate_openai_api_key(api_key: str) -> None:
+    """Validate an OpenAI API key and update the session state accordingly.
+
+    A key is checked by listing the available models with it. A key that passes
+    selects ``STREAMLIT_EXPENSIVE_MODEL``; a missing or rejected key selects
+    ``STREAMLIT_CHEAP_MODEL``. The last key that passed is remembered in
+    ``st.session_state.last_validated_key`` so it is not re-checked on every call.
+
+    Args:
+        api_key: The key entered by the user; an empty value means no key.
+    """
+    # Use .get(): `last_validated_key` may not exist yet on the first call with a key.
+    last_validated_key = st.session_state.get("last_validated_key")
+    if api_key and api_key != last_validated_key:
+        try:
+            client = OpenAI(api_key=api_key)
+            client.models.list()
+            logger.debug("API key validation successful.")
+            st.session_state.model_name = STREAMLIT_EXPENSIVE_MODEL
+            st.session_state.last_validated_key = api_key
+        except Exception as e:
+            # Any failure of the check above is reported to the user as an invalid key.
+            logger.error(f"API key validation failed: {e}")
+            st.sidebar.error("Invalid API key. Please check your OpenAI API key.")
+            st.session_state.model_name = STREAMLIT_CHEAP_MODEL
+            st.session_state.last_validated_key = None  # Reset if validation fails
+    elif not api_key:
+        # Reset to cheap model if key is cleared
+        st.session_state.model_name = STREAMLIT_CHEAP_MODEL
+        st.session_state.last_validated_key = None
diff --git a/src/paper_query/ui/custom_app.py b/src/paper_query/ui/custom_app.py
@@ -20,7 +20,7 @@ def streamlit_chatbot():
     chatbot_args = get_chatbot_params(selected_chatbot_class)
 
     if st.sidebar.button("Confirm Chatbot", key="confirm_chatbot_button"):
-        st.session_state.chatbot_confirmed = True
+        st.session_state.chatbot_ready = True
         st.session_state.chatbot = selected_chatbot_class(**chatbot_args)
         st.sidebar.success(f"{selected_label} is ready!")
         st.title(f"{selected_label} Chatbot")

diff --git a/src/paper_query/ui/strain_relief_app.py b/src/paper_query/ui/strain_relief_app.py
@@ -4,59 +4,71 @@
 from loguru import logger
 
 from paper_query.chatbots import HybridQueryChatbot
-from paper_query.constants import assets_dir
+from paper_query.constants import STREAMLIT_CHEAP_MODEL, STREAMLIT_EXPENSIVE_MODEL, assets_dir
 from paper_query.ui.components.chat_interface import display_chat_interface
+from paper_query.ui.components.text import ABOUT, ABSTRACT
+from paper_query.ui.components.validate_key import validate_openai_api_key
 
 # Configure logger to use DEBUG level
 logger.remove()
 logger.add(sys.stderr, level="DEBUG")
 
 
+def initialize_session_state():
+    """Populate any missing session state entries with their default values."""
+    defaults = {
+        "chatbot_ready": True,
+        "chatbot": None,
+        "model_name": STREAMLIT_CHEAP_MODEL,
+    }
+    for key, value in defaults.items():
+        if key not in st.session_state:
+            st.session_state[key] = value
+
+
 def strain_relief_chatbot():
     """Chatbot for the StrainRelief paper."""
-    st.session_state.chatbot_confirmed = True
-    if "chatbot" not in st.session_state:
-        st.session_state.chatbot = HybridQueryChatbot(
-            model_name="gpt-4o",
-            model_provider="openai",
-            paper_path=str(assets_dir / "strainrelief_preprint.pdf"),
-            references_dir=str(assets_dir / "references"),
-        )
+    initialize_session_state()
 
     st.title("The StrainRelief Chatbot")
+    chat_tab, about_tab = st.tabs(["Chat", "About"])
 
-    st.markdown(
-        "This retrieval augmented generation (RAG) chatbot is designed to answer questions about "
-        "the StrainRelief. The chatbot has access to the [paper](https://arxiv.org/abs/2503.13352),"
-        " all references, and the code "
-        "[repository](https://github.com/prescient-design/StrainRelief)."
+    st.sidebar.title("API Configuration")
+    # Enter API key in sidebar
+    openai_api_key = st.sidebar.text_input(
+        "OpenAI API Key",
+        type="password",
+        help="If you don't have an API key, you can get one from [OpenAI](https://platform.openai.com/api-keys).",
+        key="api_input",
     )
-    if "messages" not in st.session_state:
-        st.markdown(
-            ":gray[**Abstract**: Ligand strain energy, the energy difference between the bound and "
-            "unbound conformations of a ligand, is an important component of structure-based small "
-            "molecule drug design. A large majority of observed ligands in protein-small molecule "
-            "co-crystal structures bind in low-strain conformations, making strain energy a useful "
-            "filter for structure-based drug design. In this work we present a tool for "
-            "calculating ligand strain with a high accuracy. StrainRelief uses a MACE Neural "
-            "Network Potential (NNP), trained on a large database of Density Functional Theory "
-            "(DFT) calculations to estimate ligand strain of neutral molecules with quantum "
-            "accuracy. We show that this tool estimates strain energy differences relative to DFT "
-            "to within 1.4 kcal/mol, more accurately than alternative NNPs. These results "
-            "highlight the utility of NNPs in drug discovery, and provide a useful tool for drug "
-            "discovery teams.]"
-        )
-
-    display_chat_interface()
 
+    validate_openai_api_key(openai_api_key)
+    # Display current model
+    st.sidebar.markdown(f"Using **{st.session_state.model_name}** model.")
 
-if __name__ == "__main__":
-    if sys.platform != "linux":  # Skip for GitHub actions
-        # Get API keys from Streamlit secrets
-        from paper_query import constants
+    st.session_state.chatbot = HybridQueryChatbot(
+        model_name=st.session_state.model_name.lower(),
+        model_provider="openai",
+        paper_path=str(assets_dir / "strainrelief_preprint.pdf"),
+        references_dir=str(assets_dir / "references"),
+    )
+
+    with chat_tab:
+        if "messages" not in st.session_state:
+            st.markdown(ABSTRACT)
+
+            # Show info message only when using nano model
+            if st.session_state.model_name == STREAMLIT_CHEAP_MODEL:
+                st.info(
+                    f"You are currently using {STREAMLIT_CHEAP_MODEL}. Add a valid OpenAI API key "
+                    f"to access the more powerful {STREAMLIT_EXPENSIVE_MODEL} model."
+                )
 
-        constants.OPENAI_API_KEY = st.secrets["OPENAI_API_KEY"]
-        constants.GROQ_API_KEY = st.secrets["GROQ_API_KEY"]
-        constants.HUGGINGFACE_API_KEY = st.secrets["HUGGINGFACE_API_KEY"]
+        display_chat_interface()
 
+    with about_tab:
+        st.markdown(ABOUT)
+
+
+if __name__ == "__main__":
     strain_relief_chatbot()
diff --git a/test/data/test_loaders.py b/test/data/test_loaders.py
@@ -22,7 +22,7 @@ def test_pypdf_loader_w_images(test_assets_dir):
     """Test the pypdf_loader_w_images function."""
     path = test_assets_dir / "example_pdf.pdf"
     # TODO: change to free model
-    doc = pypdf_loader_w_images(path, "gpt-4o-mini", "openai")
+    doc = pypdf_loader_w_images(path, "gpt-4.1-nano", "openai")
     assert isinstance(doc, Document)
 
 

diff --git a/test/ui/components/test_sidebar_inputs.py b/test/ui/components/test_sidebar_inputs.py
@@ -13,8 +13,8 @@
 
 
 def test_model_name_input():
-    assert model_name_input() == "gpt-4o"
-    assert model_name_input("gpt-4o-mini") == "gpt-4o-mini"
+    assert model_name_input() == "gpt-4.1"
+    assert model_name_input("gpt-4.1-nano") == "gpt-4.1-nano"
 
 
 def test_model_provider_input():
@@ -38,7 +38,7 @@ def test_code_dir_input():
 
 
 def test_get_param():
-    assert get_param("model_name") == "gpt-4o"
+    assert get_param("model_name") == "gpt-4.1"
     assert get_param("model_provider") == "openai"
     assert get_param("paper_path") == str(assets_dir / "strainrelief_preprint.pdf")
     assert get_param("references_dir") == str(assets_dir / "references")
@@ -48,4 +48,4 @@ def test_get_param():
 
 
 def test_get_chatbot_params():
-    assert get_chatbot_params(BaseChatbot) == {"model_name": "gpt-4o", "model_provider": "openai"}
+    assert get_chatbot_params(BaseChatbot) == {"model_name": "gpt-4.1", "model_provider": "openai"}
diff --git a/test/ui/components/test_validate_key.py b/test/ui/components/test_validate_key.py
@@ -0,0 +1,22 @@
+import pytest
+import streamlit as st
+from paper_query.constants import OPENAI_API_KEY, STREAMLIT_CHEAP_MODEL, STREAMLIT_EXPENSIVE_MODEL
+from paper_query.ui.components.validate_key import validate_openai_api_key
+
+
+@pytest.mark.app
+@pytest.mark.parametrize(
+    "api_key, last_key, model_name",
+    [
+        (OPENAI_API_KEY, OPENAI_API_KEY, STREAMLIT_EXPENSIVE_MODEL),
+        (None, None, STREAMLIT_CHEAP_MODEL),
+        ("invalid_key", None, STREAMLIT_CHEAP_MODEL),
+    ],
+)
+def test_validate_openai_api_key_correct(api_key, last_key, model_name):
+    """Check the session state left by validate_openai_api_key for each kind of key."""
+    st.session_state.last_validated_key = True  # differs from every key, forcing a fresh check
+
+    validate_openai_api_key(api_key)
+    assert st.session_state.last_validated_key == last_key
+    assert st.session_state.model_name == model_name
diff --git a/test/ui/test_custom_app.py b/test/ui/test_custom_app.py
@@ -31,7 +31,7 @@ def test_confirm_chatbot(app):
 @pytest.mark.app
 def test_model_selection(app):
     """Test model selection text input."""
-    assert app.sidebar.text_input("model_name_input").value == "gpt-4o"
+    assert app.sidebar.text_input("model_name_input").value == "gpt-4.1"
     app.sidebar.text_input("model_name_input").set_value(MODEL_NAME)
     assert app.sidebar.text_input("model_name_input").value == MODEL_NAME