diff --git a/.env.example b/.env.example
index e4767a97..fdee9af0 100644
--- a/.env.example
+++ b/.env.example
@@ -1,8 +1,11 @@
 # Copy this file to a new file named .env and replace the placeholders with your actual keys.
+# REMOVE "pragma: allowlist secret" when you replace with actual keys.
 # DO NOT fill your keys directly into this file.
 
 # OpenAI API Key
 OPENAI_API_KEY=YOUR_OPENAI_API_KEY_GOES_HERE  # pragma: allowlist secret
 
-# Serp API key
-SERP_API_KEY=YOUR_SERP_API_KEY_GOES_HERE  # pragma: allowlist secret
+# PQA API Key to use LiteratureSearch tool (optional) -- it also requires OpenAI key
+PQA_API_KEY=YOUR_PQA_API_KEY_GOES_HERE # pragma: allowlist secret
+
+# Optional: add TogetherAI, Fireworks, or Anthropic API key here to use their models
diff --git a/README.md b/README.md
index 12a9964f..f520c334 100644
--- a/README.md
+++ b/README.md
@@ -1,14 +1,17 @@
-MD-Agent is a LLM-agent based toolset for Molecular Dynamics.
+MDAgent is a LLM-agent based toolset for Molecular Dynamics.
 It's built using Langchain and uses a collection of tools to set up and execute molecular dynamics simulations, particularly in OpenMM.
 
 
 ## Environment Setup
 To use the OpenMM features in the agent, please set up a conda environment, following these steps.
-- Create conda environment: `conda env create -n mdagent -f environment.yaml`
-- Activate your environment: `conda activate mdagent`
+```
+conda env create -n mdagent -f environment.yaml
+conda activate mdagent
+```
+
+If you already have a conda environment, you can install dependencies before you activate it with the following step.
+- Install the necessary conda dependencies: `conda env update -n <YOUR_CONDA_ENV_HERE> -f environment.yaml`
 
-If you already have a conda environment, you can install dependencies with the following step.
-- Install the necessary conda dependencies: `conda install -c conda-forge openmm pdbfixer mdtraj`
 
 
 ## Installation
@@ -16,23 +19,30 @@ If you already have a conda environment, you can install dependencies with the f
 pip install git+https://github.com/ur-whitelab/md-agent.git
 ```
 
-
 ## Usage
-The first step is to set up your API keys in your environment. An OpenAI key is necessary for this project.
+The next step is to set up your API keys in your environment. An API key for LLM provider is necessary for this project. Supported LLM providers are OpenAI, TogetherAI, Fireworks, and Anthropic.
 Other tools require API keys, such as paper-qa for literature searches. We recommend setting up the keys in a .env file. You can use the provided .env.example file as a template.
 1. Copy the `.env.example` file and rename it to `.env`: `cp .env.example .env`
 2. Replace the placeholder values in `.env` with your actual keys
 
-<!-- ## Using Streamlit Interface
-If you'd like to use MDAgent via the streamlit app, make sure you have completed the steps above. Then, in your terminal, run `streamlit run st_app.py` in the project root directory.
+You can ask MDAgent to conduct molecular dynamics tasks using OpenAI's GPT model
+```
+from mdagent import MDAgent
+
+agent = MDAgent(model="gpt-3.5-turbo")
+agent.run("Simulate protein 1ZNI at 300 K for 0.1 ps and calculate the RMSD over time.")
+```
+Note: to distinguish Together models from the rest, you'll need to add "together\" prefix in model flag, such as `agent = MDAgent(model="together/meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo")`
 
-From there you may upload files to use during the run. Note: the app is currently limited to uploading .pdb and .cif files, and the max size is defaulted at 200MB.
-- To upload larger files, instead run `streamlit run st_app.py --server.maxUploadSize=some_large_number`
-- To add different file types, you can add your desired file type to the list in the [streamlit app file](https://github.com/ur-whitelab/md-agent/blob/main/st_app.py). -->
+## LLM Providers
+By default, we support LLMs through OpenAI API. However, feel free to use other LLM providers. Make sure to install the necessary package for it. Here's list of packages required for alternative LLM providers we support:
+- `pip install langchain-together` to use models from TogetherAI
+- `pip install langchain-anthropic` to use models from Anthropic
+- `pip install langchain-fireworks` to use models from Fireworks
 
 
 ## Contributing
 
-We welcome contributions to MD-Agent! If you're interested in contributing to the project, please check out our [Contributor's Guide](CONTRIBUTING.md) for detailed instructions on getting started, feature development, and the pull request process.
+We welcome contributions to MDAgent! If you're interested in contributing to the project, please check out our [Contributor's Guide](CONTRIBUTING.md) for detailed instructions on getting started, feature development, and the pull request process.
 
-We value and appreciate all contributions to MD-Agent.
+We value and appreciate all contributions to MDAgent.
diff --git a/mdagent/agent/agent.py b/mdagent/agent/agent.py
index f67df6de..2adc7330 100644
--- a/mdagent/agent/agent.py
+++ b/mdagent/agent/agent.py
@@ -4,7 +4,7 @@
 from langchain.agents import AgentExecutor, OpenAIFunctionsAgent
 from langchain.agents.structured_chat.base import StructuredChatAgent
 
-from ..tools import get_tools, make_all_tools
+from ..tools import get_relevant_tools, make_all_tools
 from ..utils import PathRegistry, SetCheckpoint, _make_llm
 from .memory import MemoryManager
 from .prompt import openaifxn_prompt, structured_prompt
@@ -76,7 +76,7 @@ def _initialize_tools_and_agent(self, user_input=None):
         else:
             if self.top_k_tools != "all" and user_input is not None:
                 # retrieve only tools relevant to user input
-                self.tools = get_tools(
+                self.tools = get_relevant_tools(
                     query=user_input,
                     llm=self.tools_llm,
                     top_k_tools=self.top_k_tools,
diff --git a/mdagent/tools/__init__.py b/mdagent/tools/__init__.py
index 79c851ff..bf02a575 100644
--- a/mdagent/tools/__init__.py
+++ b/mdagent/tools/__init__.py
@@ -1,3 +1,3 @@
-from .maketools import get_tools, make_all_tools
+from .maketools import get_relevant_tools, make_all_tools
 
-__all__ = ["get_tools", "make_all_tools"]
+__all__ = ["get_relevant_tools", "make_all_tools"]
diff --git a/mdagent/tools/base_tools/__init__.py b/mdagent/tools/base_tools/__init__.py
index dab5d3fc..23a1fd21 100644
--- a/mdagent/tools/base_tools/__init__.py
+++ b/mdagent/tools/base_tools/__init__.py
@@ -45,7 +45,6 @@
 )
 from .simulation_tools.create_simulation import ModifyBaseSimulationScriptTool
 from .simulation_tools.setup_and_run import SetUpandRunFunction
-from .util_tools.git_issues_tool import SerpGitTool
 from .util_tools.registry_tools import ListRegistryPaths, MapPath2Name
 from .util_tools.search_tools import Scholar2ResultLLM
 
@@ -87,7 +86,6 @@
     "RDFTool",
     "RMSDCalculator",
     "Scholar2ResultLLM",
-    "SerpGitTool",
     "SetUpandRunFunction",
     "SimulationOutputFigures",
     "SmallMolPDB",
diff --git a/mdagent/tools/base_tools/preprocess_tools/pdb_get.py b/mdagent/tools/base_tools/preprocess_tools/pdb_get.py
index 675390f0..6212a6c9 100644
--- a/mdagent/tools/base_tools/preprocess_tools/pdb_get.py
+++ b/mdagent/tools/base_tools/preprocess_tools/pdb_get.py
@@ -1,7 +1,6 @@
 from typing import Optional
 
 import requests
-import streamlit as st
 from langchain.tools import BaseTool
 from rdkit import Chem
 from rdkit.Chem import AllChem
@@ -36,7 +35,6 @@ def get_pdb(query_string: str, path_registry: PathRegistry):
         results = r.json()["result_set"]
         pdbid = max(results, key=lambda x: x["score"])["identifier"]
         print(f"PDB file found with this ID: {pdbid}")
-        st.markdown(f"PDB file found with this ID: {pdbid}", unsafe_allow_html=True)
         url = f"https://files.rcsb.org/download/{pdbid}.{filetype}"
         pdb = requests.get(url)
         filename = path_registry.write_file_name(
diff --git a/mdagent/tools/base_tools/simulation_tools/setup_and_run.py b/mdagent/tools/base_tools/simulation_tools/setup_and_run.py
index 413ce5e1..d6dfe023 100644
--- a/mdagent/tools/base_tools/simulation_tools/setup_and_run.py
+++ b/mdagent/tools/base_tools/simulation_tools/setup_and_run.py
@@ -7,7 +7,6 @@
 from typing import Any, Dict, List, Optional, Type
 
 import requests
-import streamlit as st
 from langchain.tools import BaseTool
 from openff.toolkit.topology import Molecule
 from openmm import (
@@ -251,7 +250,6 @@ def __init__(
 
     def setup_system(self):
         print("Building system...")
-        st.markdown("Building system", unsafe_allow_html=True)
         self.pdb_id = self.params["pdb_id"]
         self.pdb_path = self.path_registry.get_mapped_path(self.pdb_id)
         self.pdb = PDBFile(self.pdb_path)
@@ -285,7 +283,6 @@ def setup_system(self):
 
     def setup_integrator(self):
         print("Setting up integrator...")
-        st.markdown("Setting up integrator", unsafe_allow_html=True)
         int_params = self.int_params
         integrator_type = int_params.get("integrator_type", "LangevinMiddle")
 
@@ -310,7 +307,6 @@ def setup_integrator(self):
 
     def create_simulation(self):
         print("Creating simulation...")
-        st.markdown("Creating simulation", unsafe_allow_html=True)
         self.simulation = Simulation(
             self.modeller.topology,
             self.system,
@@ -838,12 +834,10 @@ def remove_leading_spaces(text):
             file.write(script_content)
 
         print(f"Standalone simulation script written to {directory}/{filename}")
-        st.markdown("Standalone simulation script written", unsafe_allow_html=True)
 
     def run(self):
         # Minimize and Equilibrate
         print("Performing energy minimization...")
-        st.markdown("Performing energy minimization", unsafe_allow_html=True)
 
         self.simulation.minimizeEnergy()
         print("Minimization complete!")
@@ -857,7 +851,6 @@ def run(self):
             )
         self.path_registry.map_path(f"top_{self.sim_id}", top_name, top_description)
         print("Initial Positions saved to initial_positions.pdb")
-        st.markdown("Minimization complete! Equilibrating...", unsafe_allow_html=True)
         print("Equilibrating...")
         _temp = self.int_params["Temperature"]
         self.simulation.context.setVelocitiesToTemperature(_temp)
@@ -865,11 +858,9 @@ def run(self):
         self.simulation.step(_eq_steps)
         # Simulate
         print("Simulating...")
-        st.markdown("Simulating...", unsafe_allow_html=True)
         self.simulation.currentStep = 0
         self.simulation.step(self.sim_params["Number of Steps"])
         print("Done!")
-        st.markdown("Done!", unsafe_allow_html=True)
         if not self.save:
             if os.path.exists("temp_trajectory.dcd"):
                 os.remove("temp_trajectory.dcd")
@@ -950,7 +941,6 @@ def _run(self, **input_args):
             openmmsim.create_simulation()
 
             print("simulation set!")
-            st.markdown("simulation set!", unsafe_allow_html=True)
         except ValueError as e:
             msg = str(e) + f"This were the inputs {input_args}"
             if "No template for" in msg:
@@ -1492,11 +1482,9 @@ def check_system_params(cls, values):
         forcefield_files = values.get("forcefield_files")
         if forcefield_files is None or forcefield_files is []:
             print("Setting default forcefields")
-            st.markdown("Setting default forcefields", unsafe_allow_html=True)
             forcefield_files = ["amber14-all.xml", "amber14/tip3pfb.xml"]
         elif len(forcefield_files) == 0:
             print("Setting default forcefields v2")
-            st.markdown("Setting default forcefields", unsafe_allow_html=True)
             forcefield_files = ["amber14-all.xml", "amber14/tip3pfb.xml"]
         else:
             for file in forcefield_files:
diff --git a/mdagent/tools/base_tools/util_tools/__init__.py b/mdagent/tools/base_tools/util_tools/__init__.py
index 079e5904..87f60934 100644
--- a/mdagent/tools/base_tools/util_tools/__init__.py
+++ b/mdagent/tools/base_tools/util_tools/__init__.py
@@ -1,4 +1,3 @@
-from .git_issues_tool import SerpGitTool
 from .registry_tools import ListRegistryPaths, MapPath2Name
 from .search_tools import Scholar2ResultLLM
 
@@ -6,5 +5,4 @@
     "ListRegistryPaths",
     "MapPath2Name",
     "Scholar2ResultLLM",
-    "SerpGitTool",
 ]
diff --git a/mdagent/tools/base_tools/util_tools/git_issues_tool.py b/mdagent/tools/base_tools/util_tools/git_issues_tool.py
deleted file mode 100644
index 1feb0852..00000000
--- a/mdagent/tools/base_tools/util_tools/git_issues_tool.py
+++ /dev/null
@@ -1,168 +0,0 @@
-from typing import List, Optional
-
-import requests
-import tiktoken
-from langchain.prompts import PromptTemplate
-from langchain.tools import BaseTool
-from langchain_core.output_parsers import StrOutputParser
-from serpapi import GoogleSearch
-
-
-class GitToolFunctions:
-    """Class to store the functions of the tool."""
-
-    def __init__(self, llm):
-        self.llm = llm
-
-    def _prompt_summary(self, query: str, output: str):
-        prompt_template = """You're receiving the following github issues and comments.
-                            They come after looking for issues
-                            in the openmm repo for the query: {query}.
-                            The responses have the following format:
-                            Issue: body of the issue
-                            Comment: comments in response to the issue.
-                            There are up to 5 comments per issue.
-                            Some of the comments do not address the issue.
-                            You job is to decide:
-                            1) if the issue is relevant to the query.
-                            2) if the comments are relevant to the issue.
-                            Then, make a summary of the issue and comments.
-                            Only keeping the relevant information.
-                            If there are PDB files shared,
-                            just add a few lines from them, not all of it.
-                            If a comment is not relevant,
-                            do not include it in the summary.
-                            And if the issue is not relevant,
-                            do not include it in the summary.
-                            Keep in the summary all possible solutions given
-                            in the comments if they are appropiate.
-                            The summary should have at most 2.5k tokens.
-                            The answer you have to summarize is:
-                            {output}
-
-                            you:"""
-        prompt = PromptTemplate(
-            template=prompt_template, input_variables=["query", "output"]
-        )
-        llm_chain = prompt | self.llm | StrOutputParser()
-
-        return llm_chain.invoke({"query": query, "output": output})
-
-    """Function to get the number of requests remaining for the Github API """
-
-    def get_requests_remaining(self):
-        url = "https://api.github.com/rate_limit"
-        response = requests.get(url)
-        return response.json()["rate"]["remaining"]
-
-    def make_encoding(self):
-        return tiktoken.encoding_for_model("gpt-4")
-
-
-class SerpGitTool(BaseTool):
-    name = "Openmm_Github_Issues_Search"
-    description = """ Tool that searches inside
-                    github issues in openmm. Make
-                    your query as if you were googling something.
-                    Input: Trying to run a simulation with a
-                    custom forcefield error: error_code.
-                    Output: Relevant issues with your query.
-                    Input: """
-    serp_key: Optional[str]
-
-    def __init__(self, serp_key, llm):
-        super().__init__()
-        self.serp_key = serp_key
-        self.llm = llm
-
-    def _run(self, query: str):
-        fxns = GitToolFunctions(self.llm)
-        # print("this is the key", self.serp_key)
-        params = {
-            "engine": "google",
-            "q": "site:github.com/openmm/openmm/issues " + query,
-            "api_key": self.serp_key,
-        }
-        encoding = fxns.make_encoding()
-        search = GoogleSearch(params)
-        results = search.get_dict()
-        organic_results = results.get("organic_results")
-        if organic_results is None:
-            if results.get("error"):
-                return "Failed. Error: " + results.get("error")
-            else:
-                return "Failed. Error: No 'organic_results' found"
-        issues_numbers: List = (
-            []
-        )  # list that will contain issue id numbers retrieved from the google search
-        number_of_results = (
-            3  # number of results to be retrieved from the google search
-        )
-        print(len(organic_results), "results found with SERP API")
-        for result in organic_results:
-            if (
-                len(issues_numbers) == number_of_results
-            ):  # break if we have enough results
-                break
-            link = result["link"]
-            number = int(link.split("/")[-1])
-            # check if number is integer
-            if isinstance(number, int):
-                issues_numbers.append(number)
-
-        # search for issues
-
-        number_of_requests = len(issues_numbers) * 2  # 1 for comments, 1 for issues
-        remaining_requests = fxns.get_requests_remaining()
-        print("remaining requests", remaining_requests)
-        if remaining_requests > number_of_requests:
-            issues_dict = {}
-            print("number of issues", len(issues_numbers))
-            for number in issues_numbers:
-                url_comments = f"https://api.github.com/repos/openmm/openmm/issues/{number}/comments"
-                url_issues = (
-                    f"https://api.github.com/repos/openmm/openmm/issues/{number}"
-                )
-                response_issues = requests.get(url_issues)
-                response_comments = requests.get(url_comments)
-
-                if (
-                    response_issues.status_code == 200
-                    and response_comments.status_code == 200
-                ):
-                    issues = response_issues.json()
-                    issue = issues["title"]
-                    body = issues["body"]
-                    comments = response_comments.json()
-                    body += f"\n\n Comments for issue {number}: \n"
-                    for i, comment in enumerate(comments):
-                        body += f"Answer#{i}:{comment['body']} \n"
-                        if i > 5:  # up to 5 comments per issue should be enough,
-                            # some issues have more than 100 comments
-                            break  # TODO definitely summarize comments
-                            # if there are more than x amount of comments.
-                    issues_dict[f"{number}"] = [issue, body]
-                else:
-                    print(f"Error: {response_comments.status_code} for issue {number}")
-                    continue
-
-                # prepare the output
-                output = ""
-                for key in issues_dict.keys():
-                    output += f"Issue {key}: {issues_dict[key][0]} \n"
-                    output += f"Body: {issues_dict[key][1]} \n"
-
-            num_tokens = len(encoding.encode(str(output)))
-            if num_tokens > 4000:
-                # summarize output
-                output = fxns._prompt_summary(query, output)
-            return "Succeeded. " + output
-        else:
-            return (
-                "Failed. Not enough requests remaining for Github API. "
-                "Try again later"
-            )
-
-    def _arun(self, query) -> str:
-        """Use the tool asynchronously."""
-        raise NotImplementedError("Name2PDB does not support async")
diff --git a/mdagent/tools/maketools.py b/mdagent/tools/maketools.py
index ab985d43..a7f514a1 100644
--- a/mdagent/tools/maketools.py
+++ b/mdagent/tools/maketools.py
@@ -1,11 +1,12 @@
 import os
 
-import streamlit as st
+import numpy as np
 from dotenv import load_dotenv
 from langchain import agents
 from langchain.base_language import BaseLanguageModel
-from langchain_chroma import Chroma
 from langchain_openai import OpenAIEmbeddings
+from sklearn.feature_extraction.text import TfidfVectorizer
+from sklearn.metrics.pairwise import cosine_similarity
 
 from mdagent.utils import PathRegistry
 
@@ -73,7 +74,7 @@ def make_all_tools(
         all_tools += [
             ModifyBaseSimulationScriptTool(path_registry=path_instance, llm=llm),
         ]
-        if "OPENAI_API_KEY" in os.environ:
+        if "OPENAI_API_KEY" in os.environ and "PQA_API_KEY" in os.environ:
             all_tools += [Scholar2ResultLLM(llm=llm, path_registry=path_instance)]
         if human:
             all_tools += [agents.load_tools(["human"], llm)[0]]
@@ -131,46 +132,44 @@ def make_all_tools(
     return all_tools
 
 
-def get_tools(
-    query,
-    llm: BaseLanguageModel,
-    top_k_tools=15,
-    human=False,
-):
-    ckpt_dir = PathRegistry.get_instance().ckpt_dir
+def get_relevant_tools(query, llm: BaseLanguageModel, top_k_tools=15, human=False):
+    """
+    Get most relevant tools for the query using vector similarity search.
+    Query and tools are vectorized using either OpenAI embeddings or TF-IDF.
+
+    If an OpenAI API key is available, it uses embeddings for a more
+    sophisticated search. Otherwise, it falls back to using TF-IDF for
+    simpler, term-based matching.
+
+    Returns:
+    - A list of the most relevant tools, or None if no tools are found.
+    """
 
     all_tools = make_all_tools(llm, human=human)
+    if not all_tools:
+        return None
+
+    tool_texts = [f"{tool.name} {tool.description}" for tool in all_tools]
 
-    # set vector DB for all tools
-    vectordb = Chroma(
-        collection_name="all_tools_vectordb",
-        embedding_function=OpenAIEmbeddings(),
-        persist_directory=f"{ckpt_dir}/all_tools_vectordb",
-    )
-    # vectordb.delete_collection()      #<--- to clear previous vectordb directory
-    for i, tool in enumerate(all_tools):
-        vectordb.add_texts(
-            texts=[tool.description],
-            ids=[tool.name],
-            metadatas=[{"tool_name": tool.name, "index": i}],
-        )
-
-    # retrieve 'k' tools
-    k = min(top_k_tools, vectordb._collection.count())
+    # convert texts to vectors
+    if "OPENAI_API_KEY" in os.environ:
+        embeddings = OpenAIEmbeddings(model="text-embedding-3-small")
+        try:
+            tool_vectors = np.array(embeddings.embed_documents(tool_texts))
+            query_vector = np.array(embeddings.embed_query(query)).reshape(1, -1)
+        except Exception as e:
+            print(f"Error generating embeddings for tool retrieval: {e}")
+            return None
+    else:
+        vectorizer = TfidfVectorizer()
+        tool_vectors = vectorizer.fit_transform(tool_texts)
+        query_vector = vectorizer.transform([query])
+
+    similarities = cosine_similarity(query_vector, tool_vectors).flatten()
+    k = min(max(top_k_tools, 1), len(all_tools))
     if k == 0:
         return None
-    docs = vectordb.similarity_search(query, k=k)
-    retrieved_tools = []
-    for d in docs:
-        index = d.metadata.get("index")
-        if index is not None and 0 <= index < len(all_tools):
-            retrieved_tools.append(all_tools[index])
-        else:
-            print(f"Invalid index {index}.")
-            print("Some tools may be duplicated.")
-            print(f"Try to delete vector DB at {ckpt_dir}/all_tools_vectordb.")
-            st.markdown(
-                "Invalid index. Some tools may be duplicated Try to delete VDB.",
-                unsafe_allow_html=True,
-            )
+    top_k_indices = np.argsort(similarities)[-k:][::-1]
+    retrieved_tools = [all_tools[i] for i in top_k_indices]
+
     return retrieved_tools
diff --git a/mdagent/utils/makellm.py b/mdagent/utils/makellm.py
index 9eaf6738..d9f0b70f 100644
--- a/mdagent/utils/makellm.py
+++ b/mdagent/utils/makellm.py
@@ -1,6 +1,15 @@
+import importlib.util
+
 from langchain.callbacks.streaming_stdout import StreamingStdOutCallbackHandler
 
 
+def check_package_exists(package_name, model):
+    if not importlib.util.find_spec(package_name):
+        raise ImportError(
+            f"The package required to run model '{model}' is missing: '{package_name}'."
+        )
+
+
 def _make_llm(model, temp, streaming):
     if model.startswith("gpt-3.5-turbo") or model.startswith("gpt-4"):
         from langchain_openai import ChatOpenAI
@@ -13,6 +22,7 @@ def _make_llm(model, temp, streaming):
             callbacks=[StreamingStdOutCallbackHandler()] if streaming else None,
         )
     elif model.startswith("accounts/fireworks"):
+        check_package_exists("langchain_fireworks", model)
         from langchain_fireworks import ChatFireworks
 
         llm = ChatFireworks(
@@ -24,6 +34,7 @@ def _make_llm(model, temp, streaming):
         )
     elif model.startswith("together/"):
         # user needs to add 'together/' prefix to use TogetherAI provider
+        check_package_exists("langchain_together", model)
         from langchain_together import ChatTogether
 
         llm = ChatTogether(
@@ -34,6 +45,7 @@ def _make_llm(model, temp, streaming):
             callbacks=[StreamingStdOutCallbackHandler()] if streaming else None,
         )
     elif model.startswith("claude"):
+        check_package_exists("langchain_anthropic", model)
         from langchain_anthropic import ChatAnthropic
 
         llm = ChatAnthropic(
diff --git a/setup.py b/setup.py
index cba4e7f5..85ae8841 100644
--- a/setup.py
+++ b/setup.py
@@ -17,19 +17,12 @@
     license="MIT",
     packages=find_packages(),
     install_requires=[
-        "chromadb",
-        "google-search-results",
         "langchain==0.2.12",
-        "langchain-anthropic==0.1.22",
-        "langchain-chroma",
         "langchain-community",
-        "langchain-fireworks==0.1.7",
         "langchain-openai==0.1.19",
-        "langchain-together==0.1.4",
         "matplotlib",
         "nbformat",
         "openai",
-        "outlines",
         "paper-qa==4.0.0rc8 ",
         "paper-scraper @ git+https://github.com/blackadad/paper-scraper.git",
         "pandas",
@@ -38,8 +31,6 @@
         "rdkit",
         "requests",
         "seaborn",
-        "streamlit",
-        "tiktoken",
         "scikit-learn",
         "scipy==1.14.0",
     ],
diff --git a/tests/test_analysis/test_inertia.py b/tests/test_analysis/test_inertia.py
index 961ff477..67a7c91a 100644
--- a/tests/test_analysis/test_inertia.py
+++ b/tests/test_analysis/test_inertia.py
@@ -57,4 +57,4 @@ def test_plot_moi_multiple_frames(mock_close, mock_savefig, moi_functions):
     result = moi_functions.plot_moi()
     assert "Plot of moments of inertia over time saved" in result
     mock_savefig.assert_called_once()
-    mock_close.assert_called_once()
+    mock_close.mock_close.call_count >= 1
diff --git a/tests/test_utils/test_top_k_tools.py b/tests/test_utils/test_top_k_tools.py
new file mode 100644
index 00000000..2f3dda3b
--- /dev/null
+++ b/tests/test_utils/test_top_k_tools.py
@@ -0,0 +1,96 @@
+import os
+from unittest.mock import MagicMock, patch
+
+import numpy as np
+import pytest
+
+from mdagent.tools.maketools import get_relevant_tools
+
+
+@pytest.fixture
+def mock_llm():
+    return MagicMock()
+
+
+@pytest.fixture
+def mock_tools():
+    Tool = MagicMock()
+    tool1 = Tool(name="Tool1", description="This is the first tool")
+    tool2 = Tool(name="Tool2", description="This is the second tool")
+    tool3 = Tool(name="Tool3", description="This is the third tool")
+    return [tool1, tool2, tool3]
+
+
+@patch("mdagent.tools.maketools.make_all_tools")
+@patch("mdagent.tools.maketools.OpenAIEmbeddings")
+def test_get_relevant_tools_with_openai_embeddings(
+    mock_openai_embeddings, mock_make_all_tools, mock_llm, mock_tools
+):
+    mock_make_all_tools.return_value = mock_tools
+    mock_embed_documents = mock_openai_embeddings.return_value.embed_documents
+    mock_embed_query = mock_openai_embeddings.return_value.embed_query
+    mock_embed_documents.return_value = np.random.rand(3, 512)
+    mock_embed_query.return_value = np.random.rand(512)
+
+    with patch.dict(
+        os.environ, {"OPENAI_API_KEY": "test_key"}  # pragma: allowlist secret
+    ):
+        relevant_tools = get_relevant_tools("test query", mock_llm, top_k_tools=2)
+        assert len(relevant_tools) == 2
+        assert relevant_tools[0] in mock_tools
+        assert relevant_tools[1] in mock_tools
+
+
+@patch("mdagent.tools.maketools.make_all_tools")
+@patch("mdagent.tools.maketools.TfidfVectorizer")
+def test_get_relevant_tools_with_tfidf(
+    mock_tfidf_vectorizer, mock_make_all_tools, mock_llm, mock_tools
+):
+    mock_make_all_tools.return_value = mock_tools
+    mock_vectorizer = mock_tfidf_vectorizer.return_value
+    mock_vectorizer.fit_transform.return_value = np.random.rand(3, 10)
+    mock_vectorizer.transform.return_value = np.random.rand(1, 10)
+
+    with patch.dict(os.environ, {}, clear=True):  # ensure OPENAI_API_KEY is not set
+        relevant_tools = get_relevant_tools("test query", mock_llm, top_k_tools=2)
+        assert len(relevant_tools) == 2
+        assert relevant_tools[0] in mock_tools
+        assert relevant_tools[1] in mock_tools
+
+
+@patch("mdagent.tools.maketools.make_all_tools")
+def test_get_relevant_tools_with_no_tools(mock_make_all_tools, mock_llm):
+    mock_make_all_tools.return_value = []
+
+    with patch.dict(os.environ, {}, clear=True):
+        relevant_tools = get_relevant_tools("test query", mock_llm)
+        assert relevant_tools is None
+
+
+@patch("mdagent.tools.maketools.make_all_tools")
+@patch("mdagent.tools.maketools.OpenAIEmbeddings")
+def test_get_relevant_tools_with_openai_exception(
+    mock_openai_embeddings, mock_make_all_tools, mock_llm, mock_tools
+):
+    mock_make_all_tools.return_value = mock_tools
+    mock_embed_documents = mock_openai_embeddings.return_value.embed_documents
+    mock_embed_documents.side_effect = Exception("Embedding error")
+
+    with patch.dict(
+        os.environ, {"OPENAI_API_KEY": "test_key"}  # pragma: allowlist secret
+    ):
+        relevant_tools = get_relevant_tools("test query", mock_llm)
+        assert relevant_tools is None
+
+
+@patch("mdagent.tools.maketools.make_all_tools")
+def test_get_relevant_tools_top_k(mock_make_all_tools, mock_llm, mock_tools):
+    mock_make_all_tools.return_value = mock_tools
+
+    with patch.dict(os.environ, {}, clear=True):
+        relevant_tools = get_relevant_tools("test query", mock_llm, top_k_tools=1)
+        assert len(relevant_tools) == 1
+        assert relevant_tools[0] in mock_tools
+
+        relevant_tools = get_relevant_tools("test query", mock_llm, top_k_tools=5)
+        assert len(relevant_tools) == len(mock_tools)