diff --git a/.github/scripts/check_version_consistency.py b/.github/scripts/check_version_consistency.py
new file mode 100755
index 000000000000..daf78a8d2c1a
--- /dev/null
+++ b/.github/scripts/check_version_consistency.py
@@ -0,0 +1,66 @@
+#!/usr/bin/env python3
+import os
+import re
+import sys
+from typing import Set, Tuple
+
+
+def find_version_references(directory: str) -> Tuple[Set[str], Set[str]]:
+    """Collect image versions referenced in text files under ``directory``.
+
+    Returns ``(openhands_versions, runtime_versions)``: sets of ``'X.YY'``
+    strings found after ``openhands:`` and ``runtime:`` respectively.
+    """
+    # A single capture group makes findall() yield 'X.YY' strings, which is
+    # what the declared return type promises.
+    patterns = (
+        re.compile(r'openhands:(\d\.\d{2})'),
+        re.compile(r'runtime:(\d\.\d{2})'),
+    )
+    found: Tuple[Set[str], Set[str]] = (set(), set())
+    suffixes = ('.md', '.mdx', '.yml', '.yaml', '.txt', '.html', '.py', '.js', '.ts')
+
+    for root, dirs, files in os.walk(directory):
+        # Prune the real .git directory only; a substring test on the path
+        # would also skip .github and any checkout path containing '.git'.
+        dirs[:] = [d for d in dirs if d != '.git']
+        for file in files:
+            if not file.endswith(suffixes):
+                continue
+            file_path = os.path.join(root, file)
+            try:
+                with open(file_path, 'r', encoding='utf-8') as f:
+                    content = f.read()
+            except (OSError, UnicodeDecodeError) as e:
+                print(f'Error reading {file_path}: {e}', file=sys.stderr)
+                continue
+            for pattern, versions in zip(patterns, found):
+                versions.update(pattern.findall(content))
+    return found
+
+
+def main():
+    """Scan the repository and exit non-zero on inconsistent versions.
+
+    More than one distinct version for an image is an error (exit code 1);
+    finding no reference at all only prints a warning.
+    """
+    script_dir = os.path.dirname(__file__)
+    repo_root = os.path.abspath(os.path.join(script_dir, '..', '..'))
+    found = find_version_references(repo_root)
+
+    inconsistent = False
+    # Fixed order so the report reads openhands first, then runtime.
+    for image, versions in zip(('openhands', 'runtime'), found):
+        if not versions:
+            print(f'Warning: No {image} version references found', file=sys.stderr)
+        elif len(versions) > 1:
+            print(f'Error: Multiple {image} versions found:', file=sys.stderr)
+            print('Found versions:', sorted(versions), file=sys.stderr)
+            inconsistent = True
+
+    sys.exit(1 if inconsistent else 0)
+
+
+if __name__ == '__main__':
+    main()
diff --git a/.github/workflows/lint.yml b/.github/workflows/lint.yml
index 1bfc8c91c6a4..789a938e1d7e 100644
--- a/.github/workflows/lint.yml
+++ b/.github/workflows/lint.yml
@@ -53,3 +53,16 @@ jobs:
         run: pip install pre-commit==3.7.0
       - name: Run pre-commit hooks
         run: pre-commit run --files openhands/**/* evaluation/**/* tests/**/* --show-diff-on-failure --config ./dev_config/python/.pre-commit-config.yaml
+
+  # Check version consistency across documentation
+  check-version-consistency:
+    name: Check version consistency
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v4
+      - name: Set up python
+        uses: actions/setup-python@v5
+        with:
+          python-version: 3.12
+      - name: Run version consistency check
+        run: .github/scripts/check_version_consistency.py
diff --git a/.github/workflows/openhands-resolver.yml b/.github/workflows/openhands-resolver.yml
index 2db2907eba9a..028316ee05d5 100644
--- a/.github/workflows/openhands-resolver.yml
+++ b/.github/workflows/openhands-resolver.yml
@@ -185,12 +185,17 @@ jobs:
 
       - name: Install OpenHands
         uses: actions/github-script@v7
+        env:
+          COMMENT_BODY: ${{ github.event.comment.body || '' }}
+          REVIEW_BODY: ${{ github.event.review.body || '' }}
+          LABEL_NAME: ${{ github.event.label.name || '' }}
+          EVENT_NAME: ${{ github.event_name }}
         with:
           script: |
-            const commentBody = `${{ github.event.comment.body || '' }}`.trim();
-            const reviewBody = `${{ github.event.review.body || '' }}`.trim();
-            const labelName = `${{ github.event.label.name || '' }}`.trim();
-            const eventName = `${{ github.event_name }}`.trim();
+            const commentBody = process.env.COMMENT_BODY.trim();
+            const reviewBody = process.env.REVIEW_BODY.trim();
+            const labelName = process.env.LABEL_NAME.trim();
+            const eventName = process.env.EVENT_NAME.trim();
 
             // Check conditions
             const isExperimentalLabel = labelName === "fix-me-experimental";
diff --git a/Development.md b/Development.md
index 1eaa3054773b..fbdaac497e91 100644
--- a/Development.md
+++ b/Development.md
@@ -8,7 +8,7 @@ Otherwise, you can clone the OpenHands project directly.
 * Linux, Mac OS, or [WSL on Windows](https://learn.microsoft.com/en-us/windows/wsl/install)  [Ubuntu <= 22.04]
 * [Docker](https://docs.docker.com/engine/install/) (For those on MacOS, make sure to allow the default Docker socket to be used from advanced settings!)
 * [Python](https://www.python.org/downloads/) = 3.12
-* [NodeJS](https://nodejs.org/en/download/package-manager) >= 18.17.1
+* [NodeJS](https://nodejs.org/en/download/package-manager) >= 20.x
 * [Poetry](https://python-poetry.org/docs/#installing-with-the-official-installer) >= 1.8
 * OS-specific dependencies:
   - Ubuntu: build-essential => `sudo apt-get install build-essential`
diff --git a/Makefile b/Makefile
index c4e1949b9621..e1f14c410f43 100644
--- a/Makefile
+++ b/Makefile
@@ -81,10 +81,10 @@ check-nodejs:
 	@if command -v node > /dev/null; then \
 		NODE_VERSION=$(shell node --version | sed -E 's/v//g'); \
 		IFS='.' read -r -a NODE_VERSION_ARRAY <<< "$$NODE_VERSION"; \
-		if [ "$${NODE_VERSION_ARRAY[0]}" -gt 18 ] || ([ "$${NODE_VERSION_ARRAY[0]}" -eq 18 ] && [ "$${NODE_VERSION_ARRAY[1]}" -gt 17 ]) || ([ "$${NODE_VERSION_ARRAY[0]}" -eq 18 ] && [ "$${NODE_VERSION_ARRAY[1]}" -eq 17 ] && [ "$${NODE_VERSION_ARRAY[2]}" -ge 1 ]); then \
+		if [ "$${NODE_VERSION_ARRAY[0]}" -ge 20 ]; then \
 			echo "$(BLUE)Node.js $$NODE_VERSION is already installed.$(RESET)"; \
 		else \
-			echo "$(RED)Node.js 18.17.1 or later is required. Please install Node.js 18.17.1 or later to continue.$(RESET)"; \
+			echo "$(RED)Node.js 20.x or later is required. Please install Node.js 20.x or later to continue.$(RESET)"; \
 			exit 1; \
 		fi; \
 	else \
diff --git a/docs/i18n/fr/docusaurus-plugin-content-docs/current/usage/how-to/cli-mode.md b/docs/i18n/fr/docusaurus-plugin-content-docs/current/usage/how-to/cli-mode.md
index b00df2c1f2a2..9156d7ac46ff 100644
--- a/docs/i18n/fr/docusaurus-plugin-content-docs/current/usage/how-to/cli-mode.md
+++ b/docs/i18n/fr/docusaurus-plugin-content-docs/current/usage/how-to/cli-mode.md
@@ -52,7 +52,7 @@ LLM_API_KEY="sk_test_12345"
 ```bash
 docker run -it \
     --pull=always \
-    -e SANDBOX_RUNTIME_CONTAINER_IMAGE=docker.all-hands.dev/all-hands-ai/runtime:0.16-nikolaik \
+    -e SANDBOX_RUNTIME_CONTAINER_IMAGE=docker.all-hands.dev/all-hands-ai/runtime:0.17-nikolaik \
     -e SANDBOX_USER_ID=$(id -u) \
     -e WORKSPACE_MOUNT_PATH=$WORKSPACE_BASE \
     -e LLM_API_KEY=$LLM_API_KEY \
@@ -61,7 +61,7 @@ docker run -it \
     -v /var/run/docker.sock:/var/run/docker.sock \
     --add-host host.docker.internal:host-gateway \
     --name openhands-app-$(date +%Y%m%d%H%M%S) \
-    docker.all-hands.dev/all-hands-ai/openhands:0.16 \
+    docker.all-hands.dev/all-hands-ai/openhands:0.17 \
     python -m openhands.core.cli
 ```
 
diff --git a/docs/i18n/fr/docusaurus-plugin-content-docs/current/usage/how-to/headless-mode.md b/docs/i18n/fr/docusaurus-plugin-content-docs/current/usage/how-to/headless-mode.md
index a1610bb11562..9d1172770549 100644
--- a/docs/i18n/fr/docusaurus-plugin-content-docs/current/usage/how-to/headless-mode.md
+++ b/docs/i18n/fr/docusaurus-plugin-content-docs/current/usage/how-to/headless-mode.md
@@ -46,7 +46,7 @@ LLM_API_KEY="sk_test_12345"
 ```bash
 docker run -it \
     --pull=always \
-    -e SANDBOX_RUNTIME_CONTAINER_IMAGE=docker.all-hands.dev/all-hands-ai/runtime:0.16-nikolaik \
+    -e SANDBOX_RUNTIME_CONTAINER_IMAGE=docker.all-hands.dev/all-hands-ai/runtime:0.17-nikolaik \
     -e SANDBOX_USER_ID=$(id -u) \
     -e WORKSPACE_MOUNT_PATH=$WORKSPACE_BASE \
     -e LLM_API_KEY=$LLM_API_KEY \
@@ -56,6 +56,6 @@ docker run -it \
     -v /var/run/docker.sock:/var/run/docker.sock \
     --add-host host.docker.internal:host-gateway \
     --name openhands-app-$(date +%Y%m%d%H%M%S) \
-    docker.all-hands.dev/all-hands-ai/openhands:0.16 \
+    docker.all-hands.dev/all-hands-ai/openhands:0.17 \
     python -m openhands.core.main -t "write a bash script that prints hi" --no-auto-continue
 ```
diff --git a/docs/i18n/fr/docusaurus-plugin-content-docs/current/usage/installation.mdx b/docs/i18n/fr/docusaurus-plugin-content-docs/current/usage/installation.mdx
index 87b7afb07cd2..ddfef195b661 100644
--- a/docs/i18n/fr/docusaurus-plugin-content-docs/current/usage/installation.mdx
+++ b/docs/i18n/fr/docusaurus-plugin-content-docs/current/usage/installation.mdx
@@ -13,16 +13,16 @@
 La façon la plus simple d'exécuter OpenHands est avec Docker.
 
 ```bash
-docker pull docker.all-hands.dev/all-hands-ai/runtime:0.16-nikolaik
+docker pull docker.all-hands.dev/all-hands-ai/runtime:0.17-nikolaik
 
 docker run -it --rm --pull=always \
-    -e SANDBOX_RUNTIME_CONTAINER_IMAGE=docker.all-hands.dev/all-hands-ai/runtime:0.16-nikolaik \
+    -e SANDBOX_RUNTIME_CONTAINER_IMAGE=docker.all-hands.dev/all-hands-ai/runtime:0.17-nikolaik \
     -e LOG_ALL_EVENTS=true \
     -v /var/run/docker.sock:/var/run/docker.sock \
     -p 3000:3000 \
     --add-host host.docker.internal:host-gateway \
     --name openhands-app \
-    docker.all-hands.dev/all-hands-ai/openhands:0.16
+    docker.all-hands.dev/all-hands-ai/openhands:0.17
 ```
 
 Vous pouvez également exécuter OpenHands en mode [headless scriptable](https://docs.all-hands.dev/modules/usage/how-to/headless-mode), en tant que [CLI interactive](https://docs.all-hands.dev/modules/usage/how-to/cli-mode), ou en utilisant l'[Action GitHub OpenHands](https://docs.all-hands.dev/modules/usage/how-to/github-action).
diff --git a/docs/i18n/fr/docusaurus-plugin-content-docs/current/usage/runtimes.md b/docs/i18n/fr/docusaurus-plugin-content-docs/current/usage/runtimes.md
index d12524fc012c..67d054c4791f 100644
--- a/docs/i18n/fr/docusaurus-plugin-content-docs/current/usage/runtimes.md
+++ b/docs/i18n/fr/docusaurus-plugin-content-docs/current/usage/runtimes.md
@@ -13,7 +13,7 @@ C'est le Runtime par défaut qui est utilisé lorsque vous démarrez OpenHands.
 
 ```
 docker run # ...
-    -e SANDBOX_RUNTIME_CONTAINER_IMAGE=docker.all-hands.dev/all-hands-ai/runtime:0.16-nikolaik \
+    -e SANDBOX_RUNTIME_CONTAINER_IMAGE=docker.all-hands.dev/all-hands-ai/runtime:0.17-nikolaik \
     -v /var/run/docker.sock:/var/run/docker.sock \
     # ...
 ```
diff --git a/docs/i18n/zh-Hans/docusaurus-plugin-content-docs/current/usage/how-to/cli-mode.md b/docs/i18n/zh-Hans/docusaurus-plugin-content-docs/current/usage/how-to/cli-mode.md
index cf0bbdd10dd6..e6760ee2d63b 100644
--- a/docs/i18n/zh-Hans/docusaurus-plugin-content-docs/current/usage/how-to/cli-mode.md
+++ b/docs/i18n/zh-Hans/docusaurus-plugin-content-docs/current/usage/how-to/cli-mode.md
@@ -50,7 +50,7 @@ LLM_API_KEY="sk_test_12345"
 ```bash
 docker run -it \
     --pull=always \
-    -e SANDBOX_RUNTIME_CONTAINER_IMAGE=docker.all-hands.dev/all-hands-ai/runtime:0.16-nikolaik \
+    -e SANDBOX_RUNTIME_CONTAINER_IMAGE=docker.all-hands.dev/all-hands-ai/runtime:0.17-nikolaik \
     -e SANDBOX_USER_ID=$(id -u) \
     -e WORKSPACE_MOUNT_PATH=$WORKSPACE_BASE \
     -e LLM_API_KEY=$LLM_API_KEY \
@@ -59,7 +59,7 @@ docker run -it \
     -v /var/run/docker.sock:/var/run/docker.sock \
     --add-host host.docker.internal:host-gateway \
     --name openhands-app-$(date +%Y%m%d%H%M%S) \
-    docker.all-hands.dev/all-hands-ai/openhands:0.16 \
+    docker.all-hands.dev/all-hands-ai/openhands:0.17 \
     python -m openhands.core.cli
 ```
 
diff --git a/docs/i18n/zh-Hans/docusaurus-plugin-content-docs/current/usage/how-to/headless-mode.md b/docs/i18n/zh-Hans/docusaurus-plugin-content-docs/current/usage/how-to/headless-mode.md
index 6a95fa0fe5a5..c38831e4a462 100644
--- a/docs/i18n/zh-Hans/docusaurus-plugin-content-docs/current/usage/how-to/headless-mode.md
+++ b/docs/i18n/zh-Hans/docusaurus-plugin-content-docs/current/usage/how-to/headless-mode.md
@@ -47,7 +47,7 @@ LLM_API_KEY="sk_test_12345"
 ```bash
 docker run -it \
     --pull=always \
-    -e SANDBOX_RUNTIME_CONTAINER_IMAGE=docker.all-hands.dev/all-hands-ai/runtime:0.16-nikolaik \
+    -e SANDBOX_RUNTIME_CONTAINER_IMAGE=docker.all-hands.dev/all-hands-ai/runtime:0.17-nikolaik \
     -e SANDBOX_USER_ID=$(id -u) \
     -e WORKSPACE_MOUNT_PATH=$WORKSPACE_BASE \
     -e LLM_API_KEY=$LLM_API_KEY \
@@ -57,6 +57,6 @@ docker run -it \
     -v /var/run/docker.sock:/var/run/docker.sock \
     --add-host host.docker.internal:host-gateway \
     --name openhands-app-$(date +%Y%m%d%H%M%S) \
-    docker.all-hands.dev/all-hands-ai/openhands:0.16 \
+    docker.all-hands.dev/all-hands-ai/openhands:0.17 \
     python -m openhands.core.main -t "write a bash script that prints hi" --no-auto-continue
 ```
diff --git a/docs/i18n/zh-Hans/docusaurus-plugin-content-docs/current/usage/installation.mdx b/docs/i18n/zh-Hans/docusaurus-plugin-content-docs/current/usage/installation.mdx
index 432eaeeff0e4..6de97bfc3bc5 100644
--- a/docs/i18n/zh-Hans/docusaurus-plugin-content-docs/current/usage/installation.mdx
+++ b/docs/i18n/zh-Hans/docusaurus-plugin-content-docs/current/usage/installation.mdx
@@ -11,16 +11,16 @@
 在 Docker 中运行 OpenHands 是最简单的方式。
 
 ```bash
-docker pull docker.all-hands.dev/all-hands-ai/runtime:0.16-nikolaik
+docker pull docker.all-hands.dev/all-hands-ai/runtime:0.17-nikolaik
 
 docker run -it --rm --pull=always \
-    -e SANDBOX_RUNTIME_CONTAINER_IMAGE=docker.all-hands.dev/all-hands-ai/runtime:0.16-nikolaik \
+    -e SANDBOX_RUNTIME_CONTAINER_IMAGE=docker.all-hands.dev/all-hands-ai/runtime:0.17-nikolaik \
     -e LOG_ALL_EVENTS=true \
     -v /var/run/docker.sock:/var/run/docker.sock \
     -p 3000:3000 \
     --add-host host.docker.internal:host-gateway \
     --name openhands-app \
-    docker.all-hands.dev/all-hands-ai/openhands:0.16
+    docker.all-hands.dev/all-hands-ai/openhands:0.17
 ```
 
 你也可以在可脚本化的[无头模式](https://docs.all-hands.dev/modules/usage/how-to/headless-mode)下运行 OpenHands，作为[交互式 CLI](https://docs.all-hands.dev/modules/usage/how-to/cli-mode)，或使用 [OpenHands GitHub Action](https://docs.all-hands.dev/modules/usage/how-to/github-action)。
diff --git a/docs/i18n/zh-Hans/docusaurus-plugin-content-docs/current/usage/runtimes.md b/docs/i18n/zh-Hans/docusaurus-plugin-content-docs/current/usage/runtimes.md
index d93207442a07..c6a7fc29053c 100644
--- a/docs/i18n/zh-Hans/docusaurus-plugin-content-docs/current/usage/runtimes.md
+++ b/docs/i18n/zh-Hans/docusaurus-plugin-content-docs/current/usage/runtimes.md
@@ -11,7 +11,7 @@
 
 ```
 docker run # ...
-    -e SANDBOX_RUNTIME_CONTAINER_IMAGE=docker.all-hands.dev/all-hands-ai/runtime:0.16-nikolaik \
+    -e SANDBOX_RUNTIME_CONTAINER_IMAGE=docker.all-hands.dev/all-hands-ai/runtime:0.17-nikolaik \
     -v /var/run/docker.sock:/var/run/docker.sock \
     # ...
 ```
diff --git a/docs/modules/usage/how-to/headless-mode.md b/docs/modules/usage/how-to/headless-mode.md
index dd5cee783f0a..2d085d813c3c 100644
--- a/docs/modules/usage/how-to/headless-mode.md
+++ b/docs/modules/usage/how-to/headless-mode.md
@@ -12,7 +12,7 @@ To run OpenHands in headless mode with Python,
 and then run:
 
 ```bash
-poetry run python -m openhands.core.main -t "write a bash script that prints hi"
+poetry run python -m openhands.core.main -t "write a bash script that prints hi" --no-auto-continue
 ```
 
 You'll need to be sure to set your model, API key, and other settings via environment variables
diff --git a/evaluation/benchmarks/EDA/run_infer.py b/evaluation/benchmarks/EDA/run_infer.py
index c866b5090bdd..e8cee3df3e20 100644
--- a/evaluation/benchmarks/EDA/run_infer.py
+++ b/evaluation/benchmarks/EDA/run_infer.py
@@ -63,7 +63,7 @@ def get_config(
     config = AppConfig(
         default_agent=metadata.agent_class,
         run_as_openhands=False,
-        runtime='eventstream',
+        runtime='docker',
         max_iterations=metadata.max_iterations,
         sandbox=SandboxConfig(
             base_container_image='python:3.12-bookworm',
diff --git a/evaluation/benchmarks/agent_bench/run_infer.py b/evaluation/benchmarks/agent_bench/run_infer.py
index f008c9dc8a8a..a64c66f22cdc 100644
--- a/evaluation/benchmarks/agent_bench/run_infer.py
+++ b/evaluation/benchmarks/agent_bench/run_infer.py
@@ -43,7 +43,7 @@ def get_config(
     config = AppConfig(
         default_agent=metadata.agent_class,
         run_as_openhands=False,
-        runtime=os.environ.get('RUNTIME', 'eventstream'),
+        runtime=os.environ.get('RUNTIME', 'docker'),
         max_iterations=metadata.max_iterations,
         sandbox=SandboxConfig(
             base_container_image='python:3.12-slim',
diff --git a/evaluation/benchmarks/aider_bench/run_infer.py b/evaluation/benchmarks/aider_bench/run_infer.py
index e059a6b46f6a..bc850dbc6261 100644
--- a/evaluation/benchmarks/aider_bench/run_infer.py
+++ b/evaluation/benchmarks/aider_bench/run_infer.py
@@ -50,7 +50,7 @@ def get_config(
     config = AppConfig(
         default_agent=metadata.agent_class,
         run_as_openhands=False,
-        runtime=os.environ.get('RUNTIME', 'eventstream'),
+        runtime=os.environ.get('RUNTIME', 'docker'),
         max_iterations=metadata.max_iterations,
         sandbox=SandboxConfig(
             base_container_image='python:3.11-bookworm',
diff --git a/evaluation/benchmarks/biocoder/run_infer.py b/evaluation/benchmarks/biocoder/run_infer.py
index 2da7b09f0fcf..c33c75e5a221 100644
--- a/evaluation/benchmarks/biocoder/run_infer.py
+++ b/evaluation/benchmarks/biocoder/run_infer.py
@@ -61,7 +61,7 @@ def get_config(
     config = AppConfig(
         default_agent=metadata.agent_class,
         run_as_openhands=False,
-        runtime='eventstream',
+        runtime='docker',
         max_iterations=metadata.max_iterations,
         sandbox=SandboxConfig(
             base_container_image=BIOCODER_BENCH_CONTAINER_IMAGE,
diff --git a/evaluation/benchmarks/bird/run_infer.py b/evaluation/benchmarks/bird/run_infer.py
index d35084fdbc82..14946ebacb2f 100644
--- a/evaluation/benchmarks/bird/run_infer.py
+++ b/evaluation/benchmarks/bird/run_infer.py
@@ -74,7 +74,7 @@ def get_config(
     config = AppConfig(
         default_agent=metadata.agent_class,
         run_as_openhands=False,
-        runtime='eventstream',
+        runtime='docker',
         max_iterations=metadata.max_iterations,
         sandbox=SandboxConfig(
             base_container_image='python:3.12-bookworm',
diff --git a/evaluation/benchmarks/browsing_delegation/run_infer.py b/evaluation/benchmarks/browsing_delegation/run_infer.py
index 38fb6cae25ce..016b6c3f582e 100644
--- a/evaluation/benchmarks/browsing_delegation/run_infer.py
+++ b/evaluation/benchmarks/browsing_delegation/run_infer.py
@@ -39,7 +39,7 @@ def get_config(
     config = AppConfig(
         default_agent=metadata.agent_class,
         run_as_openhands=False,
-        runtime='eventstream',
+        runtime='docker',
         max_iterations=metadata.max_iterations,
         sandbox=SandboxConfig(
             base_container_image='python:3.12-bookworm',
diff --git a/evaluation/benchmarks/commit0_bench/run_infer.py b/evaluation/benchmarks/commit0_bench/run_infer.py
index 1ef347931feb..d8f1f64b1a6b 100644
--- a/evaluation/benchmarks/commit0_bench/run_infer.py
+++ b/evaluation/benchmarks/commit0_bench/run_infer.py
@@ -124,7 +124,7 @@ def get_config(
         default_agent=metadata.agent_class,
         run_as_openhands=False,
         max_iterations=metadata.max_iterations,
-        runtime=os.environ.get('RUNTIME', 'eventstream'),
+        runtime=os.environ.get('RUNTIME', 'docker'),
         sandbox=SandboxConfig(
             base_container_image=base_container_image,
             enable_auto_lint=True,
diff --git a/evaluation/benchmarks/discoverybench/run_infer.py b/evaluation/benchmarks/discoverybench/run_infer.py
index 55e958d9fd9c..0d5b47410c2d 100644
--- a/evaluation/benchmarks/discoverybench/run_infer.py
+++ b/evaluation/benchmarks/discoverybench/run_infer.py
@@ -65,7 +65,7 @@ def get_config(
     config = AppConfig(
         default_agent=metadata.agent_class,
         run_as_openhands=False,
-        runtime='eventstream',
+        runtime='docker',
         max_iterations=metadata.max_iterations,
         sandbox=SandboxConfig(
             base_container_image='python:3.12-bookworm',
diff --git a/evaluation/benchmarks/gaia/run_infer.py b/evaluation/benchmarks/gaia/run_infer.py
index 99c29b211dc4..8aaa479e92be 100644
--- a/evaluation/benchmarks/gaia/run_infer.py
+++ b/evaluation/benchmarks/gaia/run_infer.py
@@ -50,7 +50,7 @@ def get_config(
     config = AppConfig(
         default_agent=metadata.agent_class,
         run_as_openhands=False,
-        runtime='eventstream',
+        runtime='docker',
         max_iterations=metadata.max_iterations,
         sandbox=SandboxConfig(
             base_container_image='python:3.12-bookworm',
diff --git a/evaluation/benchmarks/gorilla/run_infer.py b/evaluation/benchmarks/gorilla/run_infer.py
index 64263242d751..e453b1f570ba 100644
--- a/evaluation/benchmarks/gorilla/run_infer.py
+++ b/evaluation/benchmarks/gorilla/run_infer.py
@@ -43,7 +43,7 @@ def get_config(
     config = AppConfig(
         default_agent=metadata.agent_class,
         run_as_openhands=False,
-        runtime='eventstream',
+        runtime='docker',
         max_iterations=metadata.max_iterations,
         sandbox=SandboxConfig(
             base_container_image='python:3.12-bookworm',
diff --git a/evaluation/benchmarks/gpqa/run_infer.py b/evaluation/benchmarks/gpqa/run_infer.py
index d9e1caec7768..08e66827924e 100644
--- a/evaluation/benchmarks/gpqa/run_infer.py
+++ b/evaluation/benchmarks/gpqa/run_infer.py
@@ -64,7 +64,7 @@ def get_config(
     config = AppConfig(
         default_agent=metadata.agent_class,
         run_as_openhands=False,
-        runtime='eventstream',
+        runtime='docker',
         max_iterations=metadata.max_iterations,
         sandbox=SandboxConfig(
             base_container_image='python:3.12-bookworm',
diff --git a/evaluation/benchmarks/humanevalfix/run_infer.py b/evaluation/benchmarks/humanevalfix/run_infer.py
index 3b5a5bca2ff8..b2fb6d677a9c 100644
--- a/evaluation/benchmarks/humanevalfix/run_infer.py
+++ b/evaluation/benchmarks/humanevalfix/run_infer.py
@@ -85,7 +85,7 @@ def get_config(
     config = AppConfig(
         default_agent=metadata.agent_class,
         run_as_openhands=False,
-        runtime='eventstream',
+        runtime='docker',
         max_iterations=metadata.max_iterations,
         sandbox=SandboxConfig(
             base_container_image='python:3.12-bookworm',
diff --git a/evaluation/benchmarks/logic_reasoning/run_infer.py b/evaluation/benchmarks/logic_reasoning/run_infer.py
index 0a1447f06171..d84c5f8ca8cb 100644
--- a/evaluation/benchmarks/logic_reasoning/run_infer.py
+++ b/evaluation/benchmarks/logic_reasoning/run_infer.py
@@ -48,7 +48,7 @@ def get_config(
     config = AppConfig(
         default_agent=metadata.agent_class,
         run_as_openhands=False,
-        runtime='eventstream',
+        runtime='docker',
         max_iterations=metadata.max_iterations,
         sandbox=SandboxConfig(
             base_container_image='xingyaoww/od-eval-logic-reasoning:v1.0',
diff --git a/evaluation/benchmarks/miniwob/run_infer.py b/evaluation/benchmarks/miniwob/run_infer.py
index dd93fbaf0a75..acc1431c81f1 100644
--- a/evaluation/benchmarks/miniwob/run_infer.py
+++ b/evaluation/benchmarks/miniwob/run_infer.py
@@ -58,7 +58,7 @@ def get_config(
     config = AppConfig(
         default_agent=metadata.agent_class,
         run_as_openhands=False,
-        runtime=os.environ.get('RUNTIME', 'eventstream'),
+        runtime=os.environ.get('RUNTIME', 'docker'),
         max_iterations=metadata.max_iterations,
         sandbox=SandboxConfig(
             base_container_image='xingyaoww/od-eval-miniwob:v1.0',
diff --git a/evaluation/benchmarks/mint/run_infer.py b/evaluation/benchmarks/mint/run_infer.py
index 7106f4a59d86..a98fa8d91805 100644
--- a/evaluation/benchmarks/mint/run_infer.py
+++ b/evaluation/benchmarks/mint/run_infer.py
@@ -106,7 +106,7 @@ def get_config(
     config = AppConfig(
         default_agent=metadata.agent_class,
         run_as_openhands=False,
-        runtime='eventstream',
+        runtime='docker',
         max_iterations=metadata.max_iterations,
         sandbox=SandboxConfig(
             base_container_image='xingyaoww/od-eval-mint:v1.0',
diff --git a/evaluation/benchmarks/ml_bench/run_infer.py b/evaluation/benchmarks/ml_bench/run_infer.py
index ab94b925ab14..1c084fc14916 100644
--- a/evaluation/benchmarks/ml_bench/run_infer.py
+++ b/evaluation/benchmarks/ml_bench/run_infer.py
@@ -80,7 +80,7 @@ def get_config(
     config = AppConfig(
         default_agent=metadata.agent_class,
         run_as_openhands=False,
-        runtime='eventstream',
+        runtime='docker',
         max_iterations=metadata.max_iterations,
         sandbox=SandboxConfig(
             base_container_image='public.ecr.aws/i5g0m1f6/ml-bench',
diff --git a/evaluation/benchmarks/scienceagentbench/run_infer.py b/evaluation/benchmarks/scienceagentbench/run_infer.py
index db4abf0f4828..ebe1b783cfed 100644
--- a/evaluation/benchmarks/scienceagentbench/run_infer.py
+++ b/evaluation/benchmarks/scienceagentbench/run_infer.py
@@ -62,7 +62,7 @@ def get_config(
     config = AppConfig(
         default_agent=metadata.agent_class,
         run_as_openhands=False,
-        runtime=os.environ.get('RUNTIME', 'eventstream'),
+        runtime=os.environ.get('RUNTIME', 'docker'),
         max_budget_per_task=4,
         max_iterations=metadata.max_iterations,
         sandbox=SandboxConfig(
diff --git a/evaluation/benchmarks/swe_bench/eval_infer.py b/evaluation/benchmarks/swe_bench/eval_infer.py
index 95f65245f22f..c5d479dd50d5 100644
--- a/evaluation/benchmarks/swe_bench/eval_infer.py
+++ b/evaluation/benchmarks/swe_bench/eval_infer.py
@@ -76,7 +76,7 @@ def get_config(instance: pd.Series) -> AppConfig:
     )
     config = AppConfig(
         run_as_openhands=False,
-        runtime=os.environ.get('RUNTIME', 'eventstream'),
+        runtime=os.environ.get('RUNTIME', 'docker'),
         sandbox=SandboxConfig(
             base_container_image=base_container_image,
             use_host_network=False,
diff --git a/evaluation/benchmarks/swe_bench/run_infer.py b/evaluation/benchmarks/swe_bench/run_infer.py
index be4761da13e7..61c045037bbb 100644
--- a/evaluation/benchmarks/swe_bench/run_infer.py
+++ b/evaluation/benchmarks/swe_bench/run_infer.py
@@ -121,7 +121,7 @@ def get_config(
         default_agent=metadata.agent_class,
         run_as_openhands=False,
         max_iterations=metadata.max_iterations,
-        runtime=os.environ.get('RUNTIME', 'eventstream'),
+        runtime=os.environ.get('RUNTIME', 'docker'),
         sandbox=SandboxConfig(
             base_container_image=base_container_image,
             enable_auto_lint=True,
diff --git a/evaluation/benchmarks/the_agent_company/scripts/summarise_results.py b/evaluation/benchmarks/the_agent_company/scripts/summarise_results.py
new file mode 100644
index 000000000000..e30ae9de3cc9
--- /dev/null
+++ b/evaluation/benchmarks/the_agent_company/scripts/summarise_results.py
@@ -0,0 +1,316 @@
+###########################################################################################################
+# Adapted from https://github.com/TheAgentCompany/TheAgentCompany/blob/main/evaluation/summarise_results.py
+###########################################################################################################
+
+
+import glob
+import json
+import os
+import re
+import sys
+from typing import Dict, Tuple
+
+
+def calculate_cost(model: str, prompt_tokens: int, completion_tokens: int) -> float:
+    """
+    Estimate the USD cost of a single model call from its token counts.
+
+    The model family is picked by case-insensitive substring match on `model`,
+    checked in the order written below; rates are USD per token.
+
+    Raises:
+        ValueError: if `model` matches none of the known families.
+    """
+    name = model.lower()
+    if 'claude-3-5-sonnet' in name:
+        # https://www.anthropic.com/pricing#anthropic-api, accessed 12/11/2024
+        return 0.000003 * prompt_tokens + 0.000015 * completion_tokens
+    if 'gpt-4o' in name:
+        # https://openai.com/api/pricing/, accessed 12/11/2024
+        return 0.0000025 * prompt_tokens + 0.00001 * completion_tokens
+    if 'gemini-1.5-pro' in name:
+        # https://ai.google.dev/pricing#1_5pro, accessed 12/11/2024
+        # cost of the whole call is doubled once the prompt exceeds 128k tokens
+        base = 0.00000125 * prompt_tokens + 0.000005 * completion_tokens
+        return base * 2 if prompt_tokens > 128000 else base
+    if 'gemini-2.0-flash-exp' in name:
+        # price unknown for gemini-2.0-flash-exp, assuming same price as gemini-1.5-flash
+        base = 0.000000075 * prompt_tokens + 0.0000003 * completion_tokens
+        return base * 2 if prompt_tokens > 128000 else base
+    if 'qwen2-72b' in name:
+        # assuming hosted on Together
+        # https://www.together.ai/pricing, accessed 12/11/2024
+        return 0.0000009 * (prompt_tokens + completion_tokens)
+    if 'qwen2p5-72b' in name:
+        # assuming hosted on Together
+        # https://www.together.ai/pricing, accessed 12/14/2024
+        return 0.0000012 * (prompt_tokens + completion_tokens)
+    if 'llama-v3p1-405b-instruct' in name:
+        # assuming hosted on Fireworks AI
+        # https://fireworks.ai/pricing, accessed 12/11/2024
+        return 0.000003 * (prompt_tokens + completion_tokens)
+    if 'llama-v3p1-70b-instruct' in name or 'llama-v3p3-70b-instruct' in name:
+        # assuming hosted on Fireworks AI
+        return 0.0000009 * (prompt_tokens + completion_tokens)
+    if 'amazon.nova-pro-v1:0' in name:
+        # assuming hosted on Amazon Bedrock
+        # https://aws.amazon.com/bedrock/pricing/, accessed 12/11/2024
+        return 0.0000008 * prompt_tokens + 0.0000032 * completion_tokens
+
+    raise ValueError(f'Unknown model: {model}')
+
+
+def analyze_eval_json_file(filepath: str) -> Tuple[int, int]:
+    """
+    Read one eval JSON file and return the (total, result) pair of its final_score.
+
+    Args:
+        filepath: Path to the JSON file
+
+    Returns:
+        (total, result) from the top-level 'final_score' object, each defaulting
+        to 0 when absent; (0, 0) after printing a message if anything fails
+    """
+    try:
+        with open(filepath, 'r') as fh:
+            payload = json.load(fh)
+        scores = payload.get('final_score', {})
+        return (scores.get('total', 0), scores.get('result', 0))
+    except Exception as err:
+        if isinstance(err, json.JSONDecodeError):
+            print(f'Error decoding JSON in {filepath}: {err}')
+        else:
+            print(f'Error processing {filepath}: {err}')
+        return (0, 0)
+
+
+def analyze_traj_json_file(filepath: str) -> Tuple[int, float]:
+    """
+    Count the LLM calls recorded in one trajectory JSON file and price them.
+
+    Returns (steps, cost): the number of model responses counted and the sum of
+    calculate_cost() over their token usage. Assumes no prompt caching at all.
+    """
+    with open(filepath, 'r') as fh:
+        trajectory = json.load(fh)
+    step_count: int = 0
+    total_cost: float = 0.0
+    last_seen_id = None
+    for entry in trajectory:
+        if 'tool_call_metadata' not in entry:
+            continue
+        response = entry['tool_call_metadata']['model_response']
+        if response['id'] == last_seen_id:
+            # openhands repeats the same model response metadata on each action
+            # and observation that a single LLM call produced; count it once.
+            continue
+        last_seen_id = response['id']
+        step_count += 1
+        tokens = response['usage']
+        total_cost += calculate_cost(
+            response['model'], tokens['prompt_tokens'], tokens['completion_tokens']
+        )
+    return (step_count, total_cost)
+
+
+def analyze_folder(
+    folder_path: str,
+) -> Tuple[Dict[str, Tuple[int, int]], Dict[str, Tuple[int, float]]]:
+    """
+    Gather per-task results from every eval_*.json and traj_*.json in a folder.
+
+    Args:
+        folder_path: Path to the folder containing JSON files
+
+    Returns:
+        (eval_results, traj_results), both keyed by the part of the filename
+        between the 'eval_' / 'traj_' prefix and the '.json' suffix:
+        - eval_results: key -> (total, result)
+        - traj_results: key -> (steps, cost)
+    """
+    eval_glob = os.path.join(folder_path, 'eval_*.json')
+    traj_glob = os.path.join(folder_path, 'traj_*.json')
+
+    # Score files: key -> (total, result).
+    eval_results = {}
+    for eval_path in glob.glob(eval_glob):
+        total, result = analyze_eval_json_file(eval_path)
+        name_match = re.search(r'eval_(.+)\.json', os.path.basename(eval_path))
+        eval_results[name_match.group(1)] = (total, result)
+
+    # Trajectory files: key -> (steps, cost).
+    traj_results = {}
+    for traj_path in glob.glob(traj_glob):
+        steps, cost = analyze_traj_json_file(traj_path)
+        name_match = re.search(r'traj_(.+)\.json', os.path.basename(traj_path))
+        traj_results[name_match.group(1)] = (steps, cost)
+
+    return eval_results, traj_results
+
+
+def get_task_nature_category(task_name: str) -> str:
+    """
+    Return the task's nature category: the lower-cased text before the first '-'
+    when it is one of sde/pm/ds/admin/hr/finance, otherwise 'other'.
+    """
+    prefix = task_name.split('-')[0].lower()
+    # Return the normalized prefix so 'SDE-x' is bucketed as 'sde', not dropped.
+    known = ('sde', 'pm', 'ds', 'admin', 'hr', 'finance')
+    return prefix if prefix in known else 'other'
+
+
+def calculate_score(total: int, result: int) -> float:
+    """
+    Calculate the score as a number between 0 and 1.
+
+    Formula: score = (result / total) * 0.5 + (result // total) * 0.5
+    - (result / total) * 0.5: completion ratio, scaled to the 0-0.5 range.
+    - (result // total) * 0.5: all-or-nothing bonus, 0.5 once result reaches total.
+
+    Args:
+        total: Total possible points
+        result: Actual points achieved
+
+    Returns:
+        Score between 0 and 1; 0.0 when total is not positive (e.g. the (0, 0)
+        placeholder of an unreadable eval file) instead of dividing by zero.
+    """
+    return 0.0 if total <= 0 else (result / total * 0.5) + (result // total * 0.5)
+
+
+def is_perfect_completion(total: int, result: int) -> bool:
+    """
+    Tell whether a task earned every available point.
+
+    Args:
+        total: Total possible points
+        result: Actual points achieved
+
+    Returns:
+        True if total is positive and result equals it, False otherwise
+    """
+    return not (total <= 0 or total != result)
+
+
+def main():
+    """
+    Print a Markdown report for the results folder named by the only CLI argument.
+
+    Exits with status 1 on bad usage or when the folder does not exist, and just
+    prints a notice when it holds no eval_*.json file. A task without a matching
+    traj_*.json is still reported, with 'N/A' in its Steps and Cost columns.
+    """
+    if len(sys.argv) != 2:
+        print('Usage: poetry run python summarise_results.py <folder_path>')
+        sys.exit(1)
+
+    folder_path = sys.argv[1]
+
+    if not os.path.isdir(folder_path):
+        print(f"Error: '{folder_path}' is not a valid directory")
+        sys.exit(1)
+
+    eval_results, traj_results = analyze_folder(folder_path)
+
+    if not eval_results:
+        print(f'No eval_*.json files found in {folder_path}')
+        return
+
+    # Create list of results with completion ratios for sorting
+    detailed_results = [
+        (
+            task_name,
+            total,
+            result,
+            calculate_score(total, result),
+            is_perfect_completion(total, result),
+            get_task_nature_category(task_name),
+        )
+        for task_name, (total, result) in eval_results.items()
+    ]
+
+    # Sort by score in descending order
+    detailed_results.sort(key=lambda x: (-x[3], x[0]))
+    scores = [score for _, _, _, score, _, _ in detailed_results]
+    num_tasks = len(detailed_results)
+
+    # Calculate perfect completion stats
+    perfect_completions = sum(
+        1 for _, _, _, _, is_perfect, _ in detailed_results if is_perfect
+    )
+
+    # Print header
+    print('\n# Evaluation Results Report')
+    print('\n## Results per File')
+    print('\n*Sorted by score (⭐ indicates perfect completion)*\n')
+
+    # Print table header
+    print(
+        '| Filename | Total | Result | Score | Steps | Cost (assuming no prompt caching)|'
+    )
+    print('|----------|--------|---------|-------|-------|------|')
+
+    # Print individual file results
+    for task_name, total, result, score, is_perfect, _ in detailed_results:
+        perfect_marker = ' ⭐' if is_perfect else ''
+        # An eval file can exist without its trajectory file.
+        steps_cell, cost_cell = 'N/A', 'N/A'
+        if task_name in traj_results:
+            steps, cost = traj_results[task_name]
+            steps_cell, cost_cell = str(steps), f'{cost:.2f}'
+        print(
+            f'| {task_name} | {total:,} | {result:,} | {score:.2f}{perfect_marker} | {steps_cell} | {cost_cell} |'
+        )
+
+    # Print summary section
+    print('\n## Summary\n')
+    print(f'**Tasks Evaluated:** {len(eval_results)}\n')
+    print(
+        f'**Perfect Completions:** {perfect_completions}/{num_tasks} ({(perfect_completions/num_tasks*100):.2f}%)\n'
+    )
+
+    avg_score = sum(scores) / num_tasks
+    avg_steps_cell = avg_cost_cell = 'N/A'  # kept when no trajectory was found
+    if traj_results:
+        num_trajs = len(traj_results)
+        avg_steps_cell = f'{sum(s for s, _ in traj_results.values()) / num_trajs:.2f}'
+        avg_cost_cell = f'{sum(c for _, c in traj_results.values()) / num_trajs:.2f}'
+    print(f'**Overall Score:** {avg_score * 100:.2f}%\n')
+    print(f'**Average Steps:** {avg_steps_cell}\n')
+    print(f'**Average Cost (USD):** {avg_cost_cell}\n')
+
+    # Additional statistics; scores is sorted, so the median sits in the middle
+    mid = num_tasks // 2
+    if num_tasks % 2:
+        median_score = scores[mid]
+    else:
+        # Even count: average the two middle scores.
+        median_score = (scores[mid - 1] + scores[mid]) / 2
+
+    print('\n## Statistics\n')
+    print('| Metric | Value |')
+    print('|---------|--------|')
+    print(f'| Highest Task Score | {max(scores)*100:.2f}% |')
+    print(f'| Lowest Task Score | {min(scores)*100:.2f}% |')
+    print(f'| Median Task Score | {median_score*100:.2f}% |')
+    print(f'| Average Task Score | {avg_score*100:.2f}% |')
+
+    # compute avg score per nature category; categories without tasks are skipped
+    print('\n## Statistics per Nature Category\n')
+    print('| Metric | Value |')
+    print('|---------|--------|')
+    for task_nature in ['sde', 'pm', 'ds', 'admin', 'hr', 'finance', 'other']:
+        nature_rows = [row for row in detailed_results if row[5] == task_nature]
+        if not nature_rows:
+            continue
+        num_of_tasks = len(nature_rows)
+        nature_score = sum(row[3] for row in nature_rows) / num_of_tasks
+        nature_perfect = sum(1 for row in nature_rows if row[4])
+        print(
+            f'| Perfect Completions for {task_nature} | {nature_perfect}/{num_of_tasks} ({nature_perfect/num_of_tasks*100:.2f}%) |'
+        )
+        print(f'| Average Score for {task_nature} | {nature_score*100:.2f}% |')
+
+
+if __name__ == '__main__':
+    main()
diff --git a/evaluation/benchmarks/toolqa/run_infer.py b/evaluation/benchmarks/toolqa/run_infer.py
index f88163a048f5..6f6f1a0e2048 100644
--- a/evaluation/benchmarks/toolqa/run_infer.py
+++ b/evaluation/benchmarks/toolqa/run_infer.py
@@ -44,7 +44,7 @@ def get_config(
     config = AppConfig(
         default_agent=metadata.agent_class,
         run_as_openhands=False,
-        runtime='eventstream',
+        runtime='docker',
         max_iterations=metadata.max_iterations,
         sandbox=SandboxConfig(
             base_container_image='python:3.12-bookworm',
diff --git a/evaluation/benchmarks/webarena/run_infer.py b/evaluation/benchmarks/webarena/run_infer.py
index d18918cf969f..ac51a201a712 100644
--- a/evaluation/benchmarks/webarena/run_infer.py
+++ b/evaluation/benchmarks/webarena/run_infer.py
@@ -53,7 +53,7 @@ def get_config(
     config = AppConfig(
         default_agent=metadata.agent_class,
         run_as_openhands=False,
-        runtime='eventstream',
+        runtime='docker',
         max_iterations=metadata.max_iterations,
         sandbox=SandboxConfig(
             base_container_image='python:3.12-bookworm',
diff --git a/evaluation/integration_tests/run_infer.py b/evaluation/integration_tests/run_infer.py
index 2da68b9b82b9..fe85d23bf585 100644
--- a/evaluation/integration_tests/run_infer.py
+++ b/evaluation/integration_tests/run_infer.py
@@ -42,7 +42,7 @@ def get_config(
     config = AppConfig(
         default_agent=metadata.agent_class,
         run_as_openhands=False,
-        runtime=os.environ.get('RUNTIME', 'eventstream'),
+        runtime=os.environ.get('RUNTIME', 'docker'),
         max_iterations=metadata.max_iterations,
         sandbox=SandboxConfig(
             # use default base_container_image
diff --git a/frontend/__tests__/api/github.test.ts b/frontend/__tests__/api/github.test.ts
new file mode 100644
index 000000000000..5a659d4b71e6
--- /dev/null
+++ b/frontend/__tests__/api/github.test.ts
@@ -0,0 +1,47 @@
+import { describe, expect, it, vi } from "vitest";
+import { retrieveLatestGitHubCommit } from "../../src/api/github";
+
+describe("retrieveLatestGitHubCommit", () => {
+  const { githubGetMock } = vi.hoisted(() => ({
+    githubGetMock: vi.fn(),
+  }));
+
+  vi.mock("../../src/api/github-axios-instance", () => ({
+    github: {
+      get: githubGetMock,
+    },
+  }));
+
+  it("should return the latest commit when repository has commits", async () => {
+    const mockCommit = {
+      sha: "123abc",
+      commit: {
+        message: "Initial commit",
+      },
+    };
+
+    githubGetMock.mockResolvedValueOnce({
+      data: [mockCommit],
+    });
+
+    const result = await retrieveLatestGitHubCommit("user/repo");
+    expect(result).toEqual(mockCommit);
+  });
+
+  it("should return null when repository is empty", async () => {
+    const error = new Error("Repository is empty");
+    (error as any).response = { status: 409 }; // status this test maps to "empty"
+    githubGetMock.mockRejectedValueOnce(error);
+
+    const result = await retrieveLatestGitHubCommit("user/empty-repo");
+    expect(result).toBeNull(); // a 409 rejection resolves to null
+  });
+
+  it("should throw error for other error cases", async () => {
+    const error = new Error("Network error");
+    (error as any).response = { status: 500 }; // non-409 status: must propagate
+    githubGetMock.mockRejectedValueOnce(error);
+
+    await expect(retrieveLatestGitHubCommit("user/repo")).rejects.toThrow();
+  });
+});
diff --git a/frontend/__tests__/components/context-menu/account-settings-context-menu.test.tsx b/frontend/__tests__/components/context-menu/account-settings-context-menu.test.tsx
index ad5b6a0a3443..89780e07aef7 100644
--- a/frontend/__tests__/components/context-menu/account-settings-context-menu.test.tsx
+++ b/frontend/__tests__/components/context-menu/account-settings-context-menu.test.tsx
@@ -28,8 +28,8 @@ describe("AccountSettingsContextMenu", () => {
     expect(
       screen.getByTestId("account-settings-context-menu"),
     ).toBeInTheDocument();
-    expect(screen.getByText("Account Settings")).toBeInTheDocument();
-    expect(screen.getByText("Logout")).toBeInTheDocument();
+    expect(screen.getByText("ACCOUNT_SETTINGS$SETTINGS")).toBeInTheDocument();
+    expect(screen.getByText("ACCOUNT_SETTINGS$LOGOUT")).toBeInTheDocument();
   });
 
   it("should call onClickAccountSettings when the account settings option is clicked", async () => {
@@ -42,7 +42,7 @@ describe("AccountSettingsContextMenu", () => {
       />,
     );
 
-    const accountSettingsOption = screen.getByText("Account Settings");
+    const accountSettingsOption = screen.getByText("ACCOUNT_SETTINGS$SETTINGS");
     await user.click(accountSettingsOption);
 
     expect(onClickAccountSettingsMock).toHaveBeenCalledOnce();
@@ -58,7 +58,7 @@ describe("AccountSettingsContextMenu", () => {
       />,
     );
 
-    const logoutOption = screen.getByText("Logout");
+    const logoutOption = screen.getByText("ACCOUNT_SETTINGS$LOGOUT");
     await user.click(logoutOption);
 
     expect(onLogoutMock).toHaveBeenCalledOnce();
@@ -74,7 +74,7 @@ describe("AccountSettingsContextMenu", () => {
       />,
     );
 
-    const logoutOption = screen.getByText("Logout");
+    const logoutOption = screen.getByText("ACCOUNT_SETTINGS$LOGOUT");
     await user.click(logoutOption);
 
     expect(onLogoutMock).not.toHaveBeenCalled();
@@ -90,7 +90,7 @@ describe("AccountSettingsContextMenu", () => {
       />,
     );
 
-    const accountSettingsButton = screen.getByText("Account Settings");
+    const accountSettingsButton = screen.getByText("ACCOUNT_SETTINGS$SETTINGS");
     await user.click(accountSettingsButton);
     await user.click(document.body);
 
diff --git a/frontend/__tests__/components/features/conversation-panel/conversation-card.test.tsx b/frontend/__tests__/components/features/conversation-panel/conversation-card.test.tsx
new file mode 100644
index 000000000000..749bc6c48de0
--- /dev/null
+++ b/frontend/__tests__/components/features/conversation-panel/conversation-card.test.tsx
@@ -0,0 +1,274 @@
+import { render, screen, within } from "@testing-library/react";
+import { afterEach, describe, expect, it, test, vi } from "vitest";
+import userEvent from "@testing-library/user-event";
+import { formatTimeDelta } from "#/utils/format-time-delta";
+import { ConversationCard } from "#/components/features/conversation-panel/conversation-card";
+
+describe("ConversationCard", () => {
+  const onClick = vi.fn();
+  const onDelete = vi.fn();
+  const onChangeTitle = vi.fn();
+
+  afterEach(() => {
+    vi.clearAllMocks();
+  });
+
+  it("should render the conversation card", () => {
+    render(
+      <ConversationCard
+        onDelete={onDelete}
+        onClick={onClick}
+        onChangeTitle={onChangeTitle}
+        name="Conversation 1"
+        repo={null}
+        lastUpdated="2021-10-01T12:00:00Z"
+      />,
+    );
+    const expectedDate = `${formatTimeDelta(new Date("2021-10-01T12:00:00Z"))} ago`;
+
+    const card = screen.getByTestId("conversation-card");
+    const title = within(card).getByTestId("conversation-card-title");
+
+    expect(title).toHaveValue("Conversation 1");
+    within(card).getByText(expectedDate); // getBy* throws if not found
+  });
+
+  it("should render the repo if available", () => {
+    const { rerender } = render(
+      <ConversationCard
+        onDelete={onDelete}
+        onClick={onClick}
+        onChangeTitle={onChangeTitle}
+        name="Conversation 1"
+        repo={null}
+        lastUpdated="2021-10-01T12:00:00Z"
+      />,
+    );
+
+    expect(
+      screen.queryByTestId("conversation-card-repo"),
+    ).not.toBeInTheDocument();
+
+    rerender(
+      <ConversationCard
+        onDelete={onDelete}
+        onClick={onClick}
+        onChangeTitle={onChangeTitle}
+        name="Conversation 1"
+        repo="org/repo"
+        lastUpdated="2021-10-01T12:00:00Z"
+      />,
+    );
+
+    screen.getByTestId("conversation-card-repo"); // throws if not rendered
+  });
+
+  it("should call onClick when the card is clicked", async () => {
+    const user = userEvent.setup();
+    render(
+      <ConversationCard
+        onDelete={onDelete}
+        onClick={onClick}
+        onChangeTitle={onChangeTitle}
+        name="Conversation 1"
+        repo={null}
+        lastUpdated="2021-10-01T12:00:00Z"
+      />,
+    );
+
+    const card = screen.getByTestId("conversation-card");
+    await user.click(card);
+
+    expect(onClick).toHaveBeenCalled();
+  });
+
+  it("should toggle a context menu when clicking the ellipsis button", async () => {
+    const user = userEvent.setup();
+    render(
+      <ConversationCard
+        onDelete={onDelete}
+        onClick={onClick}
+        onChangeTitle={onChangeTitle}
+        name="Conversation 1"
+        repo={null}
+        lastUpdated="2021-10-01T12:00:00Z"
+      />,
+    );
+
+    expect(screen.queryByTestId("context-menu")).not.toBeInTheDocument();
+
+    const ellipsisButton = screen.getByTestId("ellipsis-button");
+    await user.click(ellipsisButton);
+
+    screen.getByTestId("context-menu"); // open after the first click
+
+    await user.click(ellipsisButton);
+
+    expect(screen.queryByTestId("context-menu")).not.toBeInTheDocument();
+  });
+
+  it("should call onDelete when the delete button is clicked", async () => {
+    const user = userEvent.setup();
+    render(
+      <ConversationCard
+        onClick={onClick}
+        onDelete={onDelete}
+        onChangeTitle={onChangeTitle}
+        name="Conversation 1"
+        repo={null}
+        lastUpdated="2021-10-01T12:00:00Z"
+      />,
+    );
+
+    const ellipsisButton = screen.getByTestId("ellipsis-button");
+    await user.click(ellipsisButton);
+
+    const menu = screen.getByTestId("context-menu");
+    const deleteButton = within(menu).getByTestId("delete-button");
+
+    await user.click(deleteButton);
+
+    expect(onDelete).toHaveBeenCalled();
+  });
+
+  test("clicking the repo should not trigger the onClick handler", async () => {
+    const user = userEvent.setup();
+    render(
+      <ConversationCard
+        onClick={onClick}
+        onDelete={onDelete}
+        onChangeTitle={onChangeTitle}
+        name="Conversation 1"
+        repo="org/repo"
+        lastUpdated="2021-10-01T12:00:00Z"
+      />,
+    );
+
+    const repo = screen.getByTestId("conversation-card-repo");
+    await user.click(repo);
+
+    expect(onClick).not.toHaveBeenCalled();
+  });
+
+  test("conversation title should call onChangeTitle when changed and blurred", async () => {
+    const user = userEvent.setup();
+    render(
+      <ConversationCard
+        onClick={onClick}
+        onDelete={onDelete}
+        name="Conversation 1"
+        repo={null}
+        lastUpdated="2021-10-01T12:00:00Z"
+        onChangeTitle={onChangeTitle}
+      />,
+    );
+
+    const title = screen.getByTestId("conversation-card-title");
+
+    await user.clear(title);
+    await user.type(title, "New Conversation Name   "); // note trailing spaces
+    await user.tab(); // move focus away to blur the title
+
+    expect(onChangeTitle).toHaveBeenCalledWith("New Conversation Name");
+    expect(title).toHaveValue("New Conversation Name");
+  });
+
+  it("should reset title and not call onChangeTitle when the title is empty", async () => {
+    const user = userEvent.setup();
+    render(
+      <ConversationCard
+        onClick={onClick}
+        onDelete={onDelete}
+        onChangeTitle={onChangeTitle}
+        name="Conversation 1"
+        repo={null}
+        lastUpdated="2021-10-01T12:00:00Z"
+      />,
+    );
+
+    const title = screen.getByTestId("conversation-card-title");
+
+    await user.clear(title);
+    await user.tab();
+
+    expect(onChangeTitle).not.toHaveBeenCalled();
+    expect(title).toHaveValue("Conversation 1");
+  });
+
+  test("clicking the title should not trigger the onClick handler", async () => {
+    const user = userEvent.setup();
+    render(
+      <ConversationCard
+        onClick={onClick}
+        onDelete={onDelete}
+        onChangeTitle={onChangeTitle}
+        name="Conversation 1"
+        repo={null}
+        lastUpdated="2021-10-01T12:00:00Z"
+      />,
+    );
+
+    const title = screen.getByTestId("conversation-card-title");
+    await user.click(title);
+
+    expect(onClick).not.toHaveBeenCalled();
+  });
+
+  test("clicking the delete button should not trigger the onClick handler", async () => {
+    const user = userEvent.setup();
+    render(
+      <ConversationCard
+        onClick={onClick}
+        onDelete={onDelete}
+        onChangeTitle={onChangeTitle}
+        name="Conversation 1"
+        repo={null}
+        lastUpdated="2021-10-01T12:00:00Z"
+      />,
+    );
+
+    const ellipsisButton = screen.getByTestId("ellipsis-button");
+    await user.click(ellipsisButton);
+
+    const menu = screen.getByTestId("context-menu");
+    const deleteButton = within(menu).getByTestId("delete-button");
+
+    await user.click(deleteButton);
+
+    expect(onClick).not.toHaveBeenCalled();
+  });
+
+  describe("state indicator", () => {
+    it("should render the 'cold' indicator by default", () => {
+      render(
+        <ConversationCard
+          onClick={onClick}
+          onDelete={onDelete}
+          onChangeTitle={onChangeTitle}
+          name="Conversation 1"
+          repo={null}
+          lastUpdated="2021-10-01T12:00:00Z"
+        />,
+      );
+
+      screen.getByTestId("cold-indicator"); // throws if not rendered
+    });
+
+    it("should render the other indicators when provided", () => {
+      render(
+        <ConversationCard
+          onClick={onClick}
+          onDelete={onDelete}
+          onChangeTitle={onChangeTitle}
+          name="Conversation 1"
+          repo={null}
+          lastUpdated="2021-10-01T12:00:00Z"
+          state="warm"
+        />,
+      );
+
+      expect(screen.queryByTestId("cold-indicator")).not.toBeInTheDocument();
+      screen.getByTestId("warm-indicator"); // throws if not rendered
+    });
+  });
+});
diff --git a/frontend/__tests__/components/features/conversation-panel/conversation-panel.test.tsx b/frontend/__tests__/components/features/conversation-panel/conversation-panel.test.tsx
new file mode 100644
index 000000000000..5a1d703b22ce
--- /dev/null
+++ b/frontend/__tests__/components/features/conversation-panel/conversation-panel.test.tsx
@@ -0,0 +1,267 @@
+import { render, screen, within } from "@testing-library/react";
+import { beforeAll, beforeEach, describe, expect, it, vi } from "vitest";
+import {
+  QueryClientProvider,
+  QueryClient,
+  QueryClientConfig,
+} from "@tanstack/react-query";
+import userEvent from "@testing-library/user-event";
+import { ConversationPanel } from "#/components/features/conversation-panel/conversation-panel";
+import OpenHands from "#/api/open-hands";
+import { AuthProvider } from "#/context/auth-context";
+
+describe("ConversationPanel", () => {
+  const onCloseMock = vi.fn();
+
+  const renderConversationPanel = (config?: QueryClientConfig) =>
+    render(<ConversationPanel onClose={onCloseMock} />, {
+      wrapper: ({ children }) => (
+        <AuthProvider>
+          <QueryClientProvider client={new QueryClient(config)}>
+            {children}
+          </QueryClientProvider>
+        </AuthProvider>
+      ),
+    });
+
+  const { endSessionMock } = vi.hoisted(() => ({
+    endSessionMock: vi.fn(),
+  }));
+
+  beforeAll(() => {
+    vi.mock("react-router", async (importOriginal) => ({
+      ...(await importOriginal<typeof import("react-router")>()),
+      Link: ({ children }: React.PropsWithChildren) => children,
+      useNavigate: vi.fn(() => vi.fn()),
+      useLocation: vi.fn(() => ({ pathname: "/conversation" })),
+      useParams: vi.fn(() => ({ conversationId: "2" })),
+    }));
+
+    vi.mock("#/hooks/use-end-session", async (importOriginal) => ({
+      ...(await importOriginal<typeof import("#/hooks/use-end-session")>()),
+      useEndSession: vi.fn(() => endSessionMock),
+    }));
+  });
+
+  beforeEach(() => {
+    vi.clearAllMocks();
+    vi.restoreAllMocks();
+  });
+
+  it("should render the conversations", async () => {
+    renderConversationPanel();
+    const cards = await screen.findAllByTestId("conversation-card");
+
+    expect(cards).toHaveLength(3);
+  });
+
+  it("should display an empty state when there are no conversations", async () => {
+    const getUserConversationsSpy = vi.spyOn(OpenHands, "getUserConversations");
+    getUserConversationsSpy.mockResolvedValue([]);
+
+    renderConversationPanel();
+
+    const emptyState = await screen.findByText("No conversations found");
+    expect(emptyState).toBeInTheDocument();
+  });
+
+  it("should handle an error when fetching conversations", async () => {
+    const getUserConversationsSpy = vi.spyOn(OpenHands, "getUserConversations");
+    getUserConversationsSpy.mockRejectedValue(
+      new Error("Failed to fetch conversations"),
+    );
+
+    renderConversationPanel({
+      defaultOptions: {
+        queries: {
+          retry: false,
+        },
+      },
+    });
+
+    const error = await screen.findByText("Failed to fetch conversations");
+    expect(error).toBeInTheDocument();
+  });
+
+  it("should cancel deleting a conversation", async () => {
+    const user = userEvent.setup();
+    renderConversationPanel();
+
+    let cards = await screen.findAllByTestId("conversation-card");
+    expect(
+      within(cards[0]).queryByTestId("delete-button"),
+    ).not.toBeInTheDocument();
+
+    const ellipsisButton = within(cards[0]).getByTestId("ellipsis-button");
+    await user.click(ellipsisButton);
+    const deleteButton = screen.getByTestId("delete-button");
+
+    // Click the first delete button
+    await user.click(deleteButton);
+
+    // Cancel the deletion
+    const cancelButton = screen.getByText("Cancel");
+    await user.click(cancelButton);
+
+    expect(screen.queryByText("Cancel")).not.toBeInTheDocument();
+
+    // Ensure the conversation is not deleted
+    cards = await screen.findAllByTestId("conversation-card");
+    expect(cards).toHaveLength(3);
+  });
+
+  it("should call endSession after deleting a conversation that is the current session", async () => {
+    const user = userEvent.setup();
+    renderConversationPanel();
+
+    let cards = await screen.findAllByTestId("conversation-card");
+    const ellipsisButton = within(cards[1]).getByTestId("ellipsis-button");
+    await user.click(ellipsisButton);
+    const deleteButton = screen.getByTestId("delete-button");
+
+    // Click the second delete button
+    await user.click(deleteButton);
+
+    // Confirm the deletion
+    const confirmButton = screen.getByText("Confirm");
+    await user.click(confirmButton);
+
+    expect(screen.queryByText("Confirm")).not.toBeInTheDocument();
+
+    // Ensure the conversation is deleted
+    cards = await screen.findAllByTestId("conversation-card");
+    expect(cards).toHaveLength(2);
+
+    expect(endSessionMock).toHaveBeenCalledOnce();
+  });
+
+  it("should delete a conversation", async () => {
+    const user = userEvent.setup();
+    renderConversationPanel();
+
+    let cards = await screen.findAllByTestId("conversation-card");
+    const ellipsisButton = within(cards[0]).getByTestId("ellipsis-button");
+    await user.click(ellipsisButton);
+    const deleteButton = screen.getByTestId("delete-button");
+
+    // Click the first delete button
+    await user.click(deleteButton);
+
+    // Confirm the deletion
+    const confirmButton = screen.getByText("Confirm");
+    await user.click(confirmButton);
+
+    expect(screen.queryByText("Confirm")).not.toBeInTheDocument();
+
+    // Ensure it is deleted; NOTE(review): assumes the earlier deletion persists
+    cards = await screen.findAllByTestId("conversation-card");
+    expect(cards).toHaveLength(1);
+  });
+
+  it("should rename a conversation", async () => {
+    const updateUserConversationSpy = vi.spyOn(
+      OpenHands,
+      "updateUserConversation",
+    );
+
+    const user = userEvent.setup();
+    renderConversationPanel();
+    const cards = await screen.findAllByTestId("conversation-card");
+    const title = within(cards[0]).getByTestId("conversation-card-title");
+
+    await user.clear(title);
+    await user.type(title, "Conversation 1 Renamed");
+    await user.tab();
+
+    // Ensure the rename is sent for the first card, expected to have id "3"
+    expect(updateUserConversationSpy).toHaveBeenCalledWith("3", {
+      name: "Conversation 1 Renamed",
+    });
+  });
+
+  it("should not rename a conversation when the name is unchanged", async () => {
+    const updateUserConversationSpy = vi.spyOn(
+      OpenHands,
+      "updateUserConversation",
+    );
+
+    const user = userEvent.setup();
+    renderConversationPanel();
+    const cards = await screen.findAllByTestId("conversation-card");
+    const title = within(cards[0]).getByTestId("conversation-card-title");
+
+    await user.click(title);
+    await user.tab();
+
+    // Ensure the conversation is not renamed
+    expect(updateUserConversationSpy).not.toHaveBeenCalled();
+
+    await user.type(title, "Conversation 1");
+    await user.click(title);
+    await user.tab();
+
+    expect(updateUserConversationSpy).toHaveBeenCalledTimes(1);
+
+    await user.click(title);
+    await user.tab();
+
+    expect(updateUserConversationSpy).toHaveBeenCalledTimes(1);
+  });
+
+  it("should call onClose after clicking a card", async () => {
+    const user = userEvent.setup();
+    renderConversationPanel();
+    const cards = await screen.findAllByTestId("conversation-card");
+
+    await user.click(cards[0]);
+
+    expect(onCloseMock).toHaveBeenCalledOnce();
+  });
+
+  describe("New Conversation Button", () => {
+    it("should display a confirmation modal when clicking", async () => {
+      const user = userEvent.setup();
+      renderConversationPanel();
+
+      expect(
+        screen.queryByTestId("confirm-new-conversation-modal"),
+      ).not.toBeInTheDocument();
+
+      const newProjectButton = screen.getByTestId("new-conversation-button");
+      await user.click(newProjectButton);
+
+      const modal = screen.getByTestId("confirm-new-conversation-modal");
+      expect(modal).toBeInTheDocument();
+    });
+
+    it("should call endSession and close panel after confirming", async () => {
+      const user = userEvent.setup();
+      renderConversationPanel();
+
+      const newProjectButton = screen.getByTestId("new-conversation-button");
+      await user.click(newProjectButton);
+
+      const confirmButton = screen.getByText("Confirm");
+      await user.click(confirmButton);
+
+      expect(endSessionMock).toHaveBeenCalledOnce();
+      expect(onCloseMock).toHaveBeenCalledOnce();
+    });
+
+    it("should close the modal when cancelling", async () => {
+      const user = userEvent.setup();
+      renderConversationPanel();
+
+      const newProjectButton = screen.getByTestId("new-conversation-button");
+      await user.click(newProjectButton);
+
+      const cancelButton = screen.getByText("Cancel");
+      await user.click(cancelButton);
+
+      expect(endSessionMock).not.toHaveBeenCalled();
+      expect(
+        screen.queryByTestId("confirm-new-conversation-modal"),
+      ).not.toBeInTheDocument();
+    });
+  });
+});
diff --git a/frontend/__tests__/components/features/sidebar/sidebar.test.tsx b/frontend/__tests__/components/features/sidebar/sidebar.test.tsx
new file mode 100644
index 000000000000..40d0ea4a48bc
--- /dev/null
+++ b/frontend/__tests__/components/features/sidebar/sidebar.test.tsx
@@ -0,0 +1,46 @@
+import { screen } from "@testing-library/react";
+import userEvent from "@testing-library/user-event";
+import { describe, expect, it } from "vitest";
+import { renderWithProviders } from "test-utils";
+import { createRoutesStub } from "react-router";
+import { Sidebar } from "#/components/features/sidebar/sidebar";
+import { MULTI_CONVO_UI_IS_ENABLED } from "#/utils/constants";
+
+// Renders <Sidebar /> inside a stub router whose only route matches
+// "/conversation/:conversationId", starting at "/conversation/123".
+function renderSidebar() {
+  const conversationRoute = {
+    path: "/conversation/:conversationId",
+    Component: Sidebar,
+  };
+  const RouterStub = createRoutesStub([conversationRoute]);
+  renderWithProviders(<RouterStub initialEntries={["/conversation/123"]} />);
+}
+
+describe("Sidebar", () => {
+  // Both cases are skipped unless MULTI_CONVO_UI_IS_ENABLED is truthy; the
+  // skip condition is evaluated once and shared by the two registrations.
+  const itWithMultiConvoUi = it.skipIf(!MULTI_CONVO_UI_IS_ENABLED);
+
+  itWithMultiConvoUi(
+    "should have the conversation panel open by default",
+    () => {
+      renderSidebar();
+
+      const panel = screen.getByTestId("conversation-panel");
+      expect(panel).toBeInTheDocument();
+    },
+  );
+
+  itWithMultiConvoUi("should toggle the conversation panel", async () => {
+    const user = userEvent.setup();
+    renderSidebar();
+
+    // A single click on the toggle must remove the initially open panel.
+    const toggle = screen.getByTestId("toggle-conversation-panel");
+    await user.click(toggle);
+
+    const panel = screen.queryByTestId("conversation-panel");
+    expect(panel).not.toBeInTheDocument();
+  });
+});
diff --git a/frontend/__tests__/components/user-actions.test.tsx b/frontend/__tests__/components/user-actions.test.tsx
index a83b88a38923..143af7d7113f 100644
--- a/frontend/__tests__/components/user-actions.test.tsx
+++ b/frontend/__tests__/components/user-actions.test.tsx
@@ -58,7 +58,7 @@ describe("UserActions", () => {
     const userAvatar = screen.getByTestId("user-avatar");
     await user.click(userAvatar);
 
-    const accountSettingsOption = screen.getByText("Account Settings");
+    const accountSettingsOption = screen.getByText("ACCOUNT_SETTINGS$SETTINGS");
     await user.click(accountSettingsOption);
 
     expect(onClickAccountSettingsMock).toHaveBeenCalledOnce();
@@ -79,7 +79,7 @@ describe("UserActions", () => {
     const userAvatar = screen.getByTestId("user-avatar");
     await user.click(userAvatar);
 
-    const logoutOption = screen.getByText("Logout");
+    const logoutOption = screen.getByText("ACCOUNT_SETTINGS$LOGOUT");
     await user.click(logoutOption);
 
     expect(onLogoutMock).toHaveBeenCalledOnce();
@@ -99,7 +99,7 @@ describe("UserActions", () => {
     const userAvatar = screen.getByTestId("user-avatar");
     await user.click(userAvatar);
 
-    const logoutOption = screen.getByText("Logout");
+    const logoutOption = screen.getByText("ACCOUNT_SETTINGS$LOGOUT");
     await user.click(logoutOption);
 
     expect(onLogoutMock).not.toHaveBeenCalled();
diff --git a/frontend/__tests__/routes/_oh.app.test.tsx b/frontend/__tests__/routes/_oh.app.test.tsx
new file mode 100644
index 000000000000..2addbc5fe604
--- /dev/null
+++ b/frontend/__tests__/routes/_oh.app.test.tsx
@@ -0,0 +1,83 @@
+import { createRoutesStub } from "react-router";
+import { afterEach, beforeAll, describe, expect, it, vi } from "vitest";
+import { renderWithProviders } from "test-utils";
+import { screen, waitFor } from "@testing-library/react";
+import toast from "react-hot-toast";
+import App from "#/routes/_oh.app/route";
+import OpenHands from "#/api/open-hands";
+import { MULTI_CONVO_UI_IS_ENABLED } from "#/utils/constants";
+
+describe("App", () => {
+  const RouteStub = createRoutesStub([
+    { Component: App, path: "/conversation/:conversationId" },
+  ]);
+  // Mock handed out by the mocked useEndSession hook registered in beforeAll.
+  const { endSessionMock } = vi.hoisted(() => ({
+    endSessionMock: vi.fn(),
+  }));
+
+  beforeAll(() => {
+    vi.mock("#/hooks/use-end-session", () => ({
+      useEndSession: vi.fn(() => endSessionMock),
+    }));
+    // The terminal hook is replaced by a bare vi.fn() for these tests.
+    vi.mock("#/hooks/use-terminal", () => ({
+      useTerminal: vi.fn(),
+    }));
+  });
+
+  afterEach(() => {
+    vi.clearAllMocks();
+  });
+
+  it("should render", async () => {
+    renderWithProviders(<RouteStub initialEntries={["/conversation/123"]} />);
+    await screen.findByTestId("app-route");
+  });
+
+  it.skipIf(!MULTI_CONVO_UI_IS_ENABLED)(
+    "should call endSession if the user does not have permission to view conversation",
+    async () => {
+      const errorToastSpy = vi.spyOn(toast, "error");
+      const getConversationSpy = vi.spyOn(OpenHands, "getConversation");
+      // A null conversation stands in for the "no permission" case here.
+      getConversationSpy.mockResolvedValue(null);
+      renderWithProviders(
+        <RouteStub initialEntries={["/conversation/9999"]} />,
+      );
+
+      await waitFor(() => {
+        expect(endSessionMock).toHaveBeenCalledOnce();
+        expect(errorToastSpy).toHaveBeenCalledOnce();
+      });
+    },
+  );
+
+  it("should not call endSession if the user has permission", async () => {
+    const errorToastSpy = vi.spyOn(toast, "error");
+    const getConversationSpy = vi.spyOn(OpenHands, "getConversation");
+
+    getConversationSpy.mockResolvedValue({
+      conversation_id: "9999",
+      lastUpdated: "",
+      name: "",
+      repo: "",
+      state: "cold",
+    });
+    const { rerender } = renderWithProviders(
+      <RouteStub initialEntries={["/conversation/9999"]} />,
+    );
+    // NOTE(review): these negative checks can pass on waitFor's first attempt.
+    await waitFor(() => {
+      expect(endSessionMock).not.toHaveBeenCalled();
+      expect(errorToastSpy).not.toHaveBeenCalled();
+    });
+    // Re-render on a path that carries no conversation id and check again.
+    rerender(<RouteStub initialEntries={["/conversation"]} />);
+
+    await waitFor(() => {
+      expect(endSessionMock).not.toHaveBeenCalled();
+      expect(errorToastSpy).not.toHaveBeenCalled();
+    });
+  });
+});
diff --git a/frontend/package-lock.json b/frontend/package-lock.json
index 62ed141b8fa8..973a16d01049 100644
--- a/frontend/package-lock.json
+++ b/frontend/package-lock.json
@@ -14,7 +14,7 @@
         "@react-router/serve": "^7.1.1",
         "@react-types/shared": "^3.25.0",
         "@reduxjs/toolkit": "^2.5.0",
-        "@tanstack/react-query": "^5.62.10",
+        "@tanstack/react-query": "^5.62.11",
         "@vitejs/plugin-react": "^4.3.2",
         "@xterm/addon-fit": "^0.10.0",
         "@xterm/xterm": "^5.4.0",
@@ -27,12 +27,12 @@
         "isbot": "^5.1.19",
         "jose": "^5.9.4",
         "monaco-editor": "^0.52.2",
-        "posthog-js": "^1.203.1",
+        "posthog-js": "^1.203.2",
         "react": "^19.0.0",
         "react-dom": "^19.0.0",
         "react-highlight": "^0.15.0",
         "react-hot-toast": "^2.4.1",
-        "react-i18next": "^15.2.0",
+        "react-i18next": "^15.4.0",
         "react-icons": "^5.4.0",
         "react-markdown": "^9.0.1",
         "react-redux": "^9.2.0",
@@ -43,11 +43,12 @@
         "sirv-cli": "^3.0.0",
         "socket.io-client": "^4.8.1",
         "tailwind-merge": "^2.6.0",
-        "vite": "^5.4.9",
+        "vite": "^5.4.11",
         "web-vitals": "^3.5.2",
         "ws": "^8.18.0"
       },
       "devDependencies": {
+        "@mswjs/socket.io-binding": "^0.1.1",
         "@playwright/test": "^1.49.1",
         "@react-router/dev": "^7.1.1",
         "@tailwindcss/typography": "^0.5.15",
@@ -77,7 +78,7 @@
         "eslint-plugin-react-hooks": "^4.6.2",
         "husky": "^9.1.6",
         "jsdom": "^25.0.1",
-        "lint-staged": "^15.2.11",
+        "lint-staged": "^15.3.0",
         "msw": "^2.6.6",
         "postcss": "^8.4.47",
         "prettier": "^3.4.2",
@@ -1626,6 +1627,21 @@
         "node": ">=18"
       }
     },
+    "node_modules/@mswjs/socket.io-binding": {
+      "version": "0.1.1",
+      "resolved": "https://registry.npmjs.org/@mswjs/socket.io-binding/-/socket.io-binding-0.1.1.tgz",
+      "integrity": "sha512-mtFDHC5XMeti43toe3HBynD4uBxvUA2GfJVC6TDfhOQlH+G2hf5znNTSa75A30XdWL0P6aNqUKpcNo6L0Wop+A==",
+      "dev": true,
+      "license": "MIT",
+      "dependencies": {
+        "@mswjs/interceptors": "^0.37.1",
+        "engine.io-parser": "^5.2.3",
+        "socket.io-parser": "^4.2.4"
+      },
+      "peerDependencies": {
+        "@mswjs/interceptors": "*"
+      }
+    },
     "node_modules/@nextui-org/accordion": {
       "version": "2.2.6",
       "resolved": "https://registry.npmjs.org/@nextui-org/accordion/-/accordion-2.2.6.tgz",
@@ -5355,9 +5371,9 @@
       }
     },
     "node_modules/@tanstack/react-query": {
-      "version": "5.62.10",
-      "resolved": "https://registry.npmjs.org/@tanstack/react-query/-/react-query-5.62.10.tgz",
-      "integrity": "sha512-1e1WpHM5oGf27nWM/NWLY62/X9pbMBWa6ErWYmeuK0OqB9/g9UzA59ogiWbxCmS2wtAFQRhOdHhfSofrkhPl2g==",
+      "version": "5.62.11",
+      "resolved": "https://registry.npmjs.org/@tanstack/react-query/-/react-query-5.62.11.tgz",
+      "integrity": "sha512-Xb1nw0cYMdtFmwkvH9+y5yYFhXvLRCnXoqlzSw7UkqtCVFq3cG8q+rHZ2Yz1XrC+/ysUaTqbLKJqk95mCgC1oQ==",
       "license": "MIT",
       "dependencies": {
         "@tanstack/query-core": "5.62.9"
@@ -8134,9 +8150,9 @@
       "license": "MIT"
     },
     "node_modules/es-abstract": {
-      "version": "1.23.7",
-      "resolved": "https://registry.npmjs.org/es-abstract/-/es-abstract-1.23.7.tgz",
-      "integrity": "sha512-OygGC8kIcDhXX+6yAZRGLqwi2CmEXCbLQixeGUgYeR+Qwlppqmo7DIDr8XibtEBZp+fJcoYpoatp5qwLMEdcqQ==",
+      "version": "1.23.8",
+      "resolved": "https://registry.npmjs.org/es-abstract/-/es-abstract-1.23.8.tgz",
+      "integrity": "sha512-lfab8IzDn6EpI1ibZakcgS6WsfEBiB+43cuJo+wgylx1xKXf+Sp+YR3vFuQwC/u3sxYwV8Cxe3B0DpVUu/WiJQ==",
       "dev": true,
       "license": "MIT",
       "dependencies": {
@@ -8175,8 +8191,10 @@
         "object-inspect": "^1.13.3",
         "object-keys": "^1.1.1",
         "object.assign": "^4.1.7",
+        "own-keys": "^1.0.0",
         "regexp.prototype.flags": "^1.5.3",
         "safe-array-concat": "^1.1.3",
+        "safe-push-apply": "^1.0.0",
         "safe-regex-test": "^1.1.0",
         "string.prototype.trim": "^1.2.10",
         "string.prototype.trimend": "^1.0.9",
@@ -11189,13 +11207,13 @@
       "license": "MIT"
     },
     "node_modules/lint-staged": {
-      "version": "15.2.11",
-      "resolved": "https://registry.npmjs.org/lint-staged/-/lint-staged-15.2.11.tgz",
-      "integrity": "sha512-Ev6ivCTYRTGs9ychvpVw35m/bcNDuBN+mnTeObCL5h+boS5WzBEC6LHI4I9F/++sZm1m+J2LEiy0gxL/R9TBqQ==",
+      "version": "15.3.0",
+      "resolved": "https://registry.npmjs.org/lint-staged/-/lint-staged-15.3.0.tgz",
+      "integrity": "sha512-vHFahytLoF2enJklgtOtCtIjZrKD/LoxlaUusd5nh7dWv/dkKQJY74ndFSzxCdv7g0ueGg1ORgTSt4Y9LPZn9A==",
       "dev": true,
       "license": "MIT",
       "dependencies": {
-        "chalk": "~5.3.0",
+        "chalk": "~5.4.1",
         "commander": "~12.1.0",
         "debug": "~4.4.0",
         "execa": "~8.0.1",
@@ -11217,9 +11235,9 @@
       }
     },
     "node_modules/lint-staged/node_modules/chalk": {
-      "version": "5.3.0",
-      "resolved": "https://registry.npmjs.org/chalk/-/chalk-5.3.0.tgz",
-      "integrity": "sha512-dLitG79d+GV1Nb/VYcCDFivJeK1hiukt9QjRNVOsUtTy1rR1YJsmpGGTZ3qJos+uw7WmWF4wUwBd9jxjocFC2w==",
+      "version": "5.4.1",
+      "resolved": "https://registry.npmjs.org/chalk/-/chalk-5.4.1.tgz",
+      "integrity": "sha512-zgVZuo2WcZgfUEmsn6eO3kINexW8RAE4maiQ8QNs8CtpPCSyMiYsULR3HQYkm3w8FIA3SberyMJMSldGsW+U3w==",
       "dev": true,
       "license": "MIT",
       "engines": {
@@ -13280,6 +13298,24 @@
       "dev": true,
       "license": "MIT"
     },
+    "node_modules/own-keys": {
+      "version": "1.0.1",
+      "resolved": "https://registry.npmjs.org/own-keys/-/own-keys-1.0.1.tgz",
+      "integrity": "sha512-qFOyK5PjiWZd+QQIh+1jhdb9LpxTF0qs7Pm8o5QHYZ0M3vKqSqzsZaEB6oWlxZ+q2sJBMI/Ktgd2N5ZwQoRHfg==",
+      "dev": true,
+      "license": "MIT",
+      "dependencies": {
+        "get-intrinsic": "^1.2.6",
+        "object-keys": "^1.1.1",
+        "safe-push-apply": "^1.0.0"
+      },
+      "engines": {
+        "node": ">= 0.4"
+      },
+      "funding": {
+        "url": "https://github.com/sponsors/ljharb"
+      }
+    },
     "node_modules/p-limit": {
       "version": "3.1.0",
       "resolved": "https://registry.npmjs.org/p-limit/-/p-limit-3.1.0.tgz",
@@ -13563,14 +13599,14 @@
       }
     },
     "node_modules/pkg-types": {
-      "version": "1.2.1",
-      "resolved": "https://registry.npmjs.org/pkg-types/-/pkg-types-1.2.1.tgz",
-      "integrity": "sha512-sQoqa8alT3nHjGuTjuKgOnvjo4cljkufdtLMnO2LBP/wRwuDlo1tkaEdMxCRhyGRPacv/ztlZgDPm2b7FAmEvw==",
+      "version": "1.3.0",
+      "resolved": "https://registry.npmjs.org/pkg-types/-/pkg-types-1.3.0.tgz",
+      "integrity": "sha512-kS7yWjVFCkIw9hqdJBoMxDdzEngmkr5FXeWZZfQ6GoYacjVnsW6l2CcYW/0ThD0vF4LPJgVYnrg4d0uuhwYQbg==",
       "dev": true,
       "license": "MIT",
       "dependencies": {
         "confbox": "^0.1.8",
-        "mlly": "^1.7.2",
+        "mlly": "^1.7.3",
         "pathe": "^1.1.2"
       }
     },
@@ -13774,9 +13810,9 @@
       "license": "MIT"
     },
     "node_modules/posthog-js": {
-      "version": "1.203.1",
-      "resolved": "https://registry.npmjs.org/posthog-js/-/posthog-js-1.203.1.tgz",
-      "integrity": "sha512-r/WiSyz6VNbIKEV/30+aD5gdrYkFtmZwvqNa6h9frl8hG638v098FrXaq3EYzMcCdkQf3phaZTDIAFKegpiTjw==",
+      "version": "1.203.2",
+      "resolved": "https://registry.npmjs.org/posthog-js/-/posthog-js-1.203.2.tgz",
+      "integrity": "sha512-3aLpEhM4i9sQQtobRmDttJ3rTW1+gwQ9HL7QiOeDueE2T7CguYibYS7weY1UhXMerx5lh1A7+szlOJTTibifLQ==",
       "license": "MIT",
       "dependencies": {
         "core-js": "^3.38.1",
@@ -13792,9 +13828,9 @@
       "license": "Apache-2.0"
     },
     "node_modules/preact": {
-      "version": "10.25.3",
-      "resolved": "https://registry.npmjs.org/preact/-/preact-10.25.3.tgz",
-      "integrity": "sha512-dzQmIFtM970z+fP9ziQ3yG4e3ULIbwZzJ734vaMVUTaKQ2+Ru1Ou/gjshOYVHCcd1rpAelC6ngjvjDXph98unQ==",
+      "version": "10.25.4",
+      "resolved": "https://registry.npmjs.org/preact/-/preact-10.25.4.tgz",
+      "integrity": "sha512-jLdZDb+Q+odkHJ+MpW/9U5cODzqnB+fy2EiHSZES7ldV5LK7yjlVzTp7R8Xy6W6y75kfK8iWYtFVH7lvjwrCMA==",
       "license": "MIT",
       "funding": {
         "type": "opencollective",
@@ -14124,9 +14160,9 @@
       }
     },
     "node_modules/react-i18next": {
-      "version": "15.2.0",
-      "resolved": "https://registry.npmjs.org/react-i18next/-/react-i18next-15.2.0.tgz",
-      "integrity": "sha512-iJNc8111EaDtVTVMKigvBtPHyrJV+KblWG73cUxqp+WmJCcwkzhWNFXmkAD5pwP2Z4woeDj/oXDdbjDsb3Gutg==",
+      "version": "15.4.0",
+      "resolved": "https://registry.npmjs.org/react-i18next/-/react-i18next-15.4.0.tgz",
+      "integrity": "sha512-Py6UkX3zV08RTvL6ZANRoBh9sL/ne6rQq79XlkHEdd82cZr2H9usbWpUNVadJntIZP2pu3M2rL1CN+5rQYfYFw==",
       "license": "MIT",
       "dependencies": {
         "@babel/runtime": "^7.25.0",
@@ -14895,6 +14931,30 @@
       ],
       "license": "MIT"
     },
+    "node_modules/safe-push-apply": {
+      "version": "1.0.0",
+      "resolved": "https://registry.npmjs.org/safe-push-apply/-/safe-push-apply-1.0.0.tgz",
+      "integrity": "sha512-iKE9w/Z7xCzUMIZqdBsp6pEQvwuEebH4vdpjcDWnyzaI6yl6O9FHvVpmGelvEHNsoY6wGblkxR6Zty/h00WiSA==",
+      "dev": true,
+      "license": "MIT",
+      "dependencies": {
+        "es-errors": "^1.3.0",
+        "isarray": "^2.0.5"
+      },
+      "engines": {
+        "node": ">= 0.4"
+      },
+      "funding": {
+        "url": "https://github.com/sponsors/ljharb"
+      }
+    },
+    "node_modules/safe-push-apply/node_modules/isarray": {
+      "version": "2.0.5",
+      "resolved": "https://registry.npmjs.org/isarray/-/isarray-2.0.5.tgz",
+      "integrity": "sha512-xHjhDr3cNBK0BzdUJSPXZntQUx/mwMS5Rw4A7lPJ90XGAO6ISP/ePDNuo0vhqOZU+UD5JoodwCAAoZQd3FeAKw==",
+      "dev": true,
+      "license": "MIT"
+    },
     "node_modules/safe-regex-test": {
       "version": "1.1.0",
       "resolved": "https://registry.npmjs.org/safe-regex-test/-/safe-regex-test-1.1.0.tgz",
diff --git a/frontend/package.json b/frontend/package.json
index 16434074e8d9..1048fea0df75 100644
--- a/frontend/package.json
+++ b/frontend/package.json
@@ -13,7 +13,7 @@
     "@react-router/serve": "^7.1.1",
     "@react-types/shared": "^3.25.0",
     "@reduxjs/toolkit": "^2.5.0",
-    "@tanstack/react-query": "^5.62.10",
+    "@tanstack/react-query": "^5.62.11",
     "@vitejs/plugin-react": "^4.3.2",
     "@xterm/addon-fit": "^0.10.0",
     "@xterm/xterm": "^5.4.0",
@@ -26,12 +26,12 @@
     "isbot": "^5.1.19",
     "jose": "^5.9.4",
     "monaco-editor": "^0.52.2",
-    "posthog-js": "^1.203.1",
+    "posthog-js": "^1.203.2",
     "react": "^19.0.0",
     "react-dom": "^19.0.0",
     "react-highlight": "^0.15.0",
     "react-hot-toast": "^2.4.1",
-    "react-i18next": "^15.2.0",
+    "react-i18next": "^15.4.0",
     "react-icons": "^5.4.0",
     "react-markdown": "^9.0.1",
     "react-redux": "^9.2.0",
@@ -42,7 +42,7 @@
     "sirv-cli": "^3.0.0",
     "socket.io-client": "^4.8.1",
     "tailwind-merge": "^2.6.0",
-    "vite": "^5.4.9",
+    "vite": "^5.4.11",
     "web-vitals": "^3.5.2",
     "ws": "^8.18.0"
   },
@@ -75,6 +75,7 @@
     ]
   },
   "devDependencies": {
+    "@mswjs/socket.io-binding": "^0.1.1",
     "@playwright/test": "^1.49.1",
     "@react-router/dev": "^7.1.1",
     "@tailwindcss/typography": "^0.5.15",
@@ -104,7 +105,7 @@
     "eslint-plugin-react-hooks": "^4.6.2",
     "husky": "^9.1.6",
     "jsdom": "^25.0.1",
-    "lint-staged": "^15.2.11",
+    "lint-staged": "^15.3.0",
     "msw": "^2.6.6",
     "postcss": "^8.4.47",
     "prettier": "^3.4.2",
diff --git a/frontend/src/api/github.ts b/frontend/src/api/github.ts
index b315e2d930a7..492955ae69d9 100644
--- a/frontend/src/api/github.ts
+++ b/frontend/src/api/github.ts
@@ -106,15 +106,28 @@ export const retrieveGitHubUser = async () => {
 
 export const retrieveLatestGitHubCommit = async (
   repository: string,
-): Promise<GitHubCommit> => {
-  const response = await github.get<GitHubCommit[]>(
-    `/repos/${repository}/commits`,
-    {
-      params: {
-        per_page: 1,
+): Promise<GitHubCommit | null> => {
+  try {
+    const response = await github.get<GitHubCommit[]>(
+      `/repos/${repository}/commits`,
+      {
+        params: {
+          per_page: 1,
+        },
       },
-    },
-  );
-
-  return response.data[0];
+    );
+    return response.data[0] || null;
+  } catch (error) {
+    if (!error || typeof error !== "object") {
+      throw new Error("Unknown error occurred");
+    }
+    const axiosError = error as { response?: { status: number } };
+    if (axiosError.response?.status === 409) {
+      // Repository is empty, no commits yet
+      return null;
+    }
+    throw new Error(
+      error instanceof Error ? error.message : "Unknown error occurred",
+    );
+  }
 };
diff --git a/frontend/src/api/open-hands.ts b/frontend/src/api/open-hands.ts
index 84d254102c08..1534be879ca5 100644
--- a/frontend/src/api/open-hands.ts
+++ b/frontend/src/api/open-hands.ts
@@ -8,8 +8,10 @@ import {
   GetConfigResponse,
   GetVSCodeUrlResponse,
   AuthenticateResponse,
+  Conversation,
 } from "./open-hands.types";
 import { openHands } from "./open-hands-axios";
+import { ApiSettings } from "#/services/settings";
 
 class OpenHands {
   /**
@@ -219,6 +221,52 @@ class OpenHands {
     return data;
   }
 
+  /** List the conversations returned by `GET /api/conversations`. */
+  static async getUserConversations(): Promise<Conversation[]> {
+    const { data } = await openHands.get<Conversation[]>("/api/conversations");
+    return data;
+  }
+
+  /** Delete the conversation identified by `conversationId`. */
+  static async deleteUserConversation(conversationId: string): Promise<void> {
+    await openHands.delete(`/api/conversations/${conversationId}`);
+  }
+
+  /** Send a partial update; the id travels in the URL, not in the payload. */
+  static async updateUserConversation(
+    conversationId: string,
+    conversation: Partial<Omit<Conversation, "conversation_id">>,
+  ): Promise<void> {
+    await openHands.put(`/api/conversations/${conversationId}`, conversation);
+  }
+
+  /** Create a conversation and store its id in `localStorage`. */
+  static async createConversation(
+    githubToken?: string,
+    selectedRepository?: string,
+  ): Promise<Conversation> {
+    const { data } = await openHands.post<Conversation>("/api/conversations", {
+      github_token: githubToken,
+      selected_repository: selectedRepository,
+    });
+
+    // TODO: remove this once we have a multi-conversation UI
+    localStorage.setItem("latest_conversation_id", data.conversation_id);
+
+    return data;
+  }
+
+  /** Fetch one conversation; the response body is typed as nullable. */
+  static async getConversation(
+    conversationId: string,
+  ): Promise<Conversation | null> {
+    const { data } = await openHands.get<Conversation | null>(
+      `/api/conversations/${conversationId}`,
+    );
+
+    return data;
+  }
+
   static async searchEvents(
     conversationId: string,
     params: {
@@ -248,20 +296,22 @@ class OpenHands {
     return data;
   }
 
-  static async newConversation(params: {
-    githubToken?: string;
-    selectedRepository?: string;
-  }): Promise<{ conversation_id: string }> {
-    const { data } = await openHands.post<{
-      conversation_id: string;
-    }>("/api/conversations", {
-      github_token: params.githubToken,
-      selected_repository: params.selectedRepository,
-    });
-    // TODO: remove this once we have a multi-conversation UI
-    localStorage.setItem("latest_conversation_id", data.conversation_id);
+  /**
+   * Get the settings from the server (no default fallback is applied here).
+   */
+  static async getSettings(): Promise<ApiSettings> {
+    const { data } = await openHands.get<ApiSettings>("/api/settings");
     return data;
   }
+
+  /**
+   * Post the settings to the server; nothing is validated before sending.
+   * @returns whether the server answered with HTTP 200
+   */
+  static async saveSettings(settings: Partial<ApiSettings>): Promise<boolean> {
+    const { status } = await openHands.post("/api/settings", settings);
+    return status === 200;
+  }
 }
 
 export default OpenHands;
diff --git a/frontend/src/api/open-hands.types.ts b/frontend/src/api/open-hands.types.ts
index 919d370751ca..c17d2016816d 100644
--- a/frontend/src/api/open-hands.types.ts
+++ b/frontend/src/api/open-hands.types.ts
@@ -1,3 +1,5 @@
+import { ProjectState } from "#/components/features/conversation-panel/conversation-state-indicator";
+
 export interface ErrorResponse {
   error: string;
 }
@@ -57,3 +59,11 @@ export interface AuthenticateResponse {
   message?: string;
   error?: string;
 }
+
+export interface Conversation {
+  conversation_id: string; // presumably the id used in /api/conversations/{id}
+  name: string;
+  repo: string | null;
+  lastUpdated: string; // presumably ISO 8601, as ConversationCard expects
+  state: ProjectState;
+}
diff --git a/frontend/src/components/features/context-menu/account-settings-context-menu.tsx b/frontend/src/components/features/context-menu/account-settings-context-menu.tsx
index 960eb2d7a8c6..bf695cbc6ba7 100644
--- a/frontend/src/components/features/context-menu/account-settings-context-menu.tsx
+++ b/frontend/src/components/features/context-menu/account-settings-context-menu.tsx
@@ -1,7 +1,9 @@
+import { useTranslation } from "react-i18next";
 import { ContextMenu } from "./context-menu";
 import { ContextMenuListItem } from "./context-menu-list-item";
 import { ContextMenuSeparator } from "./context-menu-separator";
 import { useClickOutsideElement } from "#/hooks/use-click-outside-element";
+import { I18nKey } from "#/i18n/declaration";
 
 interface AccountSettingsContextMenuProps {
   onClickAccountSettings: () => void;
@@ -17,6 +19,7 @@ export function AccountSettingsContextMenu({
   isLoggedIn,
 }: AccountSettingsContextMenuProps) {
   const ref = useClickOutsideElement<HTMLUListElement>(onClose);
+  const { t } = useTranslation();
 
   return (
     <ContextMenu
@@ -25,11 +28,11 @@ export function AccountSettingsContextMenu({
       className="absolute left-full -top-1 z-10"
     >
       <ContextMenuListItem onClick={onClickAccountSettings}>
-        Account Settings
+        {t(I18nKey.ACCOUNT_SETTINGS$SETTINGS)}
       </ContextMenuListItem>
       <ContextMenuSeparator />
       <ContextMenuListItem onClick={onLogout} isDisabled={!isLoggedIn}>
-        Logout
+        {t(I18nKey.ACCOUNT_SETTINGS$LOGOUT)}
       </ContextMenuListItem>
     </ContextMenu>
   );
diff --git a/frontend/src/components/features/context-menu/context-menu-list-item.tsx b/frontend/src/components/features/context-menu/context-menu-list-item.tsx
index 606090229cd9..b35ca44395a1 100644
--- a/frontend/src/components/features/context-menu/context-menu-list-item.tsx
+++ b/frontend/src/components/features/context-menu/context-menu-list-item.tsx
@@ -1,18 +1,20 @@
 import { cn } from "#/utils/utils";
 
 interface ContextMenuListItemProps {
-  onClick: () => void;
+  testId?: string;
+  onClick: (event: React.MouseEvent<HTMLButtonElement>) => void;
   isDisabled?: boolean;
 }
 
 export function ContextMenuListItem({
   children,
+  testId,
   onClick,
   isDisabled,
 }: React.PropsWithChildren<ContextMenuListItemProps>) {
   return (
     <button
-      data-testid="context-menu-list-item"
+      data-testid={testId || "context-menu-list-item"}
       type="button"
       onClick={onClick}
       disabled={isDisabled}
diff --git a/frontend/src/components/features/context-menu/context-menu.tsx b/frontend/src/components/features/context-menu/context-menu.tsx
index d704e209f531..d4d47708da4b 100644
--- a/frontend/src/components/features/context-menu/context-menu.tsx
+++ b/frontend/src/components/features/context-menu/context-menu.tsx
@@ -2,7 +2,7 @@ import React from "react";
 import { cn } from "#/utils/utils";
 
 interface ContextMenuProps {
-  ref: React.RefObject<HTMLUListElement | null>;
+  ref?: React.RefObject<HTMLUListElement | null>;
   testId?: string;
   children: React.ReactNode;
   className?: React.HTMLAttributes<HTMLUListElement>["className"];
diff --git a/frontend/src/components/features/conversation-panel/confirm-delete-modal.tsx b/frontend/src/components/features/conversation-panel/confirm-delete-modal.tsx
new file mode 100644
index 000000000000..2316ca1de7d3
--- /dev/null
+++ b/frontend/src/components/features/conversation-panel/confirm-delete-modal.tsx
@@ -0,0 +1,36 @@
+import { ModalButton } from "#/components/shared/buttons/modal-button";
+import {
+  BaseModalDescription,
+  BaseModalTitle,
+} from "#/components/shared/modals/confirmation-modals/base-modal";
+import { ModalBackdrop } from "#/components/shared/modals/modal-backdrop";
+import { ModalBody } from "#/components/shared/modals/modal-body";
+
+interface ConfirmDeleteModalProps {
+  onConfirm: () => void; // click handler of the "Confirm" button
+  onCancel: () => void; // click handler of the "Cancel" button
+}
+/** Modal that asks the user to confirm or cancel a deletion. */
+export function ConfirmDeleteModal(props: ConfirmDeleteModalProps) {
+  const { onConfirm, onCancel } = props;
+  const title = "Are you sure you want to delete this project?";
+  const description = "All data associated with this project will be lost.";
+  return (
+    <ModalBackdrop>
+      <ModalBody className="items-start">
+        <div className="flex flex-col gap-2">
+          <BaseModalTitle title={title} />
+          <BaseModalDescription description={description} />
+        </div>
+        <div className="flex flex-col gap-2 w-full">
+          <ModalButton
+            onClick={onConfirm}
+            className="bg-[#4465DB]"
+            text="Confirm"
+          />
+          <ModalButton onClick={onCancel} className="bg-danger" text="Cancel" />
+        </div>
+      </ModalBody>
+    </ModalBackdrop>
+  );
+}
diff --git a/frontend/src/components/features/conversation-panel/conversation-card.tsx b/frontend/src/components/features/conversation-panel/conversation-card.tsx
new file mode 100644
index 000000000000..bba98607bb23
--- /dev/null
+++ b/frontend/src/components/features/conversation-panel/conversation-card.tsx
@@ -0,0 +1,102 @@
+import React from "react";
+import { formatTimeDelta } from "#/utils/format-time-delta";
+import { ConversationRepoLink } from "./conversation-repo-link";
+import {
+  ProjectState,
+  ConversationStateIndicator,
+} from "./conversation-state-indicator";
+import { ContextMenu } from "../context-menu/context-menu";
+import { ContextMenuListItem } from "../context-menu/context-menu-list-item";
+import { EllipsisButton } from "./ellipsis-button";
+
+interface ProjectCardProps {
+  onClick: () => void; // fired when the card itself is clicked
+  onDelete: () => void; // fired by the "Delete" context-menu item
+  onChangeTitle: (title: string) => void; // receives the trimmed title on blur
+  name: string;
+  repo: string | null; // the repo link is rendered only when truthy
+  lastUpdated: string; // ISO 8601
+  state?: ProjectState; // the component falls back to "cold"
+}
+
+/** One conversation row: editable title, state indicator, delete menu. */
+export function ConversationCard({
+  onClick,
+  onDelete,
+  onChangeTitle,
+  name,
+  repo,
+  lastUpdated,
+  state = "cold",
+}: ProjectCardProps) {
+  const [contextMenuVisible, setContextMenuVisible] = React.useState(false);
+  const inputRef = React.useRef<HTMLInputElement>(null);
+
+  const handleBlur = () => {
+    const input = inputRef.current;
+    if (!input) return;
+    // Trim before testing so whitespace-only input counts as empty and the
+    // previous name is restored instead of saving a blank title.
+    const trimmed = input.value.trim();
+    if (trimmed) onChangeTitle(trimmed);
+    input.value = trimmed || name;
+  };
+
+  const handleInputClick = (event: React.MouseEvent<HTMLInputElement>) => {
+    event.stopPropagation();
+  };
+
+  const handleDelete = (event: React.MouseEvent<HTMLButtonElement>) => {
+    event.stopPropagation();
+    onDelete();
+  };
+
+  return (
+    <div
+      data-testid="conversation-card"
+      onClick={onClick}
+      className="h-[100px] w-full px-[18px] py-4 border-b border-neutral-600"
+    >
+      <div className="flex items-center justify-between">
+        <input
+          ref={inputRef}
+          data-testid="conversation-card-title"
+          onClick={handleInputClick}
+          onBlur={handleBlur}
+          type="text"
+          defaultValue={name}
+          className="text-sm leading-6 font-semibold bg-transparent"
+        />
+
+        <div className="flex items-center gap-2 relative">
+          <ConversationStateIndicator state={state} />
+          <EllipsisButton
+            onClick={(event) => {
+              event.stopPropagation();
+              setContextMenuVisible((prev) => !prev);
+            }}
+          />
+          {contextMenuVisible && (
+            <ContextMenu testId="context-menu" className="absolute left-full">
+              <ContextMenuListItem
+                testId="delete-button"
+                onClick={handleDelete}
+              >
+                Delete
+              </ContextMenuListItem>
+            </ContextMenu>
+          )}
+        </div>
+      </div>
+      {repo && (
+        <ConversationRepoLink
+          repo={repo}
+          onClick={(e) => e.stopPropagation()}
+        />
+      )}
+      <p className="text-xs text-neutral-400">
+        <time>{formatTimeDelta(new Date(lastUpdated))} ago</time>
+      </p>
+    </div>
+  );
+}
diff --git a/frontend/src/components/features/conversation-panel/conversation-panel.tsx b/frontend/src/components/features/conversation-panel/conversation-panel.tsx
new file mode 100644
index 000000000000..608856c68db0
--- /dev/null
+++ b/frontend/src/components/features/conversation-panel/conversation-panel.tsx
@@ -0,0 +1,138 @@
+import React from "react";
+import { useLocation, useNavigate, useParams } from "react-router";
+import { ConversationCard } from "./conversation-card";
+import { useUserConversations } from "#/hooks/query/use-user-conversations";
+import { useDeleteConversation } from "#/hooks/mutation/use-delete-conversation";
+import { ConfirmDeleteModal } from "./confirm-delete-modal";
+import { NewConversationButton } from "./new-conversation-button";
+import { LoadingSpinner } from "#/components/shared/loading-spinner";
+import { useUpdateConversation } from "#/hooks/mutation/use-update-conversation";
+import { useEndSession } from "#/hooks/use-end-session";
+import { ExitConversationModal } from "./exit-conversation-modal";
+
+interface ConversationPanelProps {
+  /** Called after a card is opened and when the exit modal is confirmed. */
+  onClose: () => void;
+}
+
+/**
+ * Lists the user's conversations as cards and hosts the delete and
+ * exit-conversation confirmation modals.
+ */
+export function ConversationPanel({ onClose }: ConversationPanelProps) {
+  const { conversationId: activeConversationId } = useParams();
+  const navigate = useNavigate();
+  const { pathname } = useLocation();
+
+  const endSession = useEndSession();
+
+  const [isDeleteModalOpen, setIsDeleteModalOpen] = React.useState(false);
+  const [isExitModalOpen, setIsExitModalOpen] = React.useState(false);
+  const [pendingDeleteId, setPendingDeleteId] = React.useState<string | null>(
+    null,
+  );
+
+  const { data: conversations, isFetching, error } = useUserConversations();
+
+  const { mutate: deleteConversation } = useDeleteConversation();
+  const { mutate: updateConversation } = useUpdateConversation();
+
+  // Open the confirmation modal and remember which conversation it targets.
+  const requestDelete = (conversationId: string) => {
+    setIsDeleteModalOpen(true);
+    setPendingDeleteId(conversationId);
+  };
+
+  // Delete the remembered conversation; does nothing when none is selected.
+  const confirmDelete = () => {
+    if (!pendingDeleteId) return;
+
+    deleteConversation({ conversationId: pendingDeleteId });
+    setIsDeleteModalOpen(false);
+
+    // Deleting the conversation in the current route also ends the session.
+    if (activeConversationId === pendingDeleteId) endSession();
+  };
+
+  // Only send an update when the title actually changed.
+  const renameConversation = (
+    conversationId: string,
+    previousTitle: string,
+    nextTitle: string,
+  ) => {
+    if (previousTitle === nextTitle) return;
+
+    updateConversation({
+      id: conversationId,
+      conversation: { name: nextTitle },
+    });
+  };
+
+  // Navigate to the clicked conversation, then close the panel.
+  const openConversation = (conversationId: string) => {
+    navigate(`/conversations/${conversationId}`);
+    onClose();
+  };
+
+  const isOnConversationRoute = pathname.startsWith("/conversation");
+  const hasNoConversations = conversations?.length === 0;
+
+  return (
+    <div
+      data-testid="conversation-panel"
+      className="w-[350px] h-full border border-neutral-700 bg-neutral-800 rounded-xl"
+    >
+      <div className="pt-4 px-4 flex items-center justify-between">
+        {isOnConversationRoute && (
+          <NewConversationButton onClick={() => setIsExitModalOpen(true)} />
+        )}
+        {isFetching && <LoadingSpinner size="small" />}
+      </div>
+      {error && (
+        <div className="flex flex-col items-center justify-center h-full">
+          <p className="text-danger">{error.message}</p>
+        </div>
+      )}
+      {hasNoConversations && (
+        <div className="flex flex-col items-center justify-center h-full">
+          <p className="text-neutral-400">No conversations found</p>
+        </div>
+      )}
+      {conversations?.map((conversation) => (
+        <ConversationCard
+          key={conversation.conversation_id}
+          onClick={() => openConversation(conversation.conversation_id)}
+          onDelete={() => requestDelete(conversation.conversation_id)}
+          onChangeTitle={(title) =>
+            renameConversation(
+              conversation.conversation_id,
+              conversation.name,
+              title,
+            )
+          }
+          name={conversation.name}
+          repo={conversation.repo}
+          lastUpdated={conversation.lastUpdated}
+          state={conversation.state}
+        />
+      ))}
+
+      {isDeleteModalOpen && (
+        <ConfirmDeleteModal
+          onConfirm={confirmDelete}
+          onCancel={() => setIsDeleteModalOpen(false)}
+        />
+      )}
+
+      {isExitModalOpen && (
+        <ExitConversationModal
+          onConfirm={() => {
+            endSession();
+            onClose();
+          }}
+          onClose={() => setIsExitModalOpen(false)}
+        />
+      )}
+    </div>
+  );
+}
diff --git a/frontend/src/components/features/conversation-panel/conversation-repo-link.tsx b/frontend/src/components/features/conversation-panel/conversation-repo-link.tsx
new file mode 100644
index 000000000000..c2e527c2a6f9
--- /dev/null
+++ b/frontend/src/components/features/conversation-panel/conversation-repo-link.tsx
@@ -0,0 +1,28 @@
+interface ConversationRepoLinkProps {
+  /** Path appended to `https://github.com/` to form the link target. */
+  repo: string;
+  /** Optional click handler forwarded to the anchor element. */
+  onClick?: (event: React.MouseEvent<HTMLAnchorElement>) => void;
+}
+
+/**
+ * Renders the repository name as a link to its GitHub page in a new tab.
+ */
+export function ConversationRepoLink({
+  repo,
+  onClick,
+}: ConversationRepoLinkProps) {
+  return (
+    <a
+      data-testid="conversation-card-repo"
+      href={`https://github.com/${repo}`}
+      // Link types such as noopener belong in `rel`, not `target`.
+      target="_blank"
+      rel="noopener noreferrer"
+      onClick={onClick}
+      className="text-xs text-neutral-400 hover:text-neutral-200"
+    >
+      {repo}
+    </a>
+  );
+}
diff --git a/frontend/src/components/features/conversation-panel/conversation-state-indicator.tsx b/frontend/src/components/features/conversation-panel/conversation-state-indicator.tsx
new file mode 100644
index 000000000000..b42a13606def
--- /dev/null
+++ b/frontend/src/components/features/conversation-panel/conversation-state-indicator.tsx
@@ -0,0 +1,48 @@
+import ColdIcon from "./state-indicators/cold.svg?react";
+import CoolingIcon from "./state-indicators/cooling.svg?react";
+import FinishedIcon from "./state-indicators/finished.svg?react";
+import RunningIcon from "./state-indicators/running.svg?react";
+import WaitingIcon from "./state-indicators/waiting.svg?react";
+import WarmIcon from "./state-indicators/warm.svg?react";
+
+type SVGIcon = React.FunctionComponent<React.SVGProps<SVGSVGElement>>;
+
+/** States for which an indicator icon exists. */
+export type ProjectState =
+  | "cold"
+  | "cooling"
+  | "finished"
+  | "running"
+  | "waiting"
+  | "warm";
+
+// Lookup table from state to the SVG component rendered for it.
+const ICON_BY_STATE: Record<ProjectState, SVGIcon> = {
+  cold: ColdIcon,
+  cooling: CoolingIcon,
+  finished: FinishedIcon,
+  running: RunningIcon,
+  waiting: WaitingIcon,
+  warm: WarmIcon,
+};
+
+interface ConversationStateIndicatorProps {
+  state: ProjectState;
+}
+
+/**
+ * Renders the icon for `state` inside a wrapper whose test id is
+ * `<state>-indicator`.
+ */
+export function ConversationStateIndicator(
+  props: ConversationStateIndicatorProps,
+) {
+  const { state } = props;
+  const Icon = ICON_BY_STATE[state];
+
+  return (
+    <div data-testid={`${state}-indicator`}>
+      <Icon />
+    </div>
+  );
+}
diff --git a/frontend/src/components/features/conversation-panel/ellipsis-button.tsx b/frontend/src/components/features/conversation-panel/ellipsis-button.tsx
new file mode 100644
index 000000000000..bd8732f7cd47
--- /dev/null
+++ b/frontend/src/components/features/conversation-panel/ellipsis-button.tsx
@@ -0,0 +1,23 @@
+import { FaEllipsisV } from "react-icons/fa";
+
+interface EllipsisButtonProps {
+  /** Click handler forwarded to the underlying button element. */
+  onClick: (event: React.MouseEvent<HTMLButtonElement>) => void;
+}
+
+/**
+ * Icon-only button showing a vertical ellipsis.
+ */
+export function EllipsisButton({ onClick }: EllipsisButtonProps) {
+  return (
+    <button
+      data-testid="ellipsis-button"
+      type="button"
+      // The button has no text content, so give it an accessible name.
+      aria-label="More options"
+      onClick={onClick}
+    >
+      <FaEllipsisV fill="#a3a3a3" />
+    </button>
+  );
+}
diff --git a/frontend/src/components/features/conversation-panel/exit-conversation-modal.tsx b/frontend/src/components/features/conversation-panel/exit-conversation-modal.tsx
new file mode 100644
index 000000000000..6442598cbbc4
--- /dev/null
+++ b/frontend/src/components/features/conversation-panel/exit-conversation-modal.tsx
@@ -0,0 +1,39 @@
+import { ModalBackdrop } from "#/components/shared/modals/modal-backdrop";
+import { ModalBody } from "#/components/shared/modals/modal-body";
+import { ModalButton } from "#/components/shared/buttons/modal-button";
+import { BaseModalTitle } from "#/components/shared/modals/confirmation-modals/base-modal";
+
+interface ExitConversationModalProps {
+  /** Passed as the click handler of the "Confirm" button. */
+  onConfirm: () => void;
+  /** Passed as the click handler of the "Cancel" button. */
+  onClose: () => void;
+}
+
+/**
+ * Confirmation dialog warning that creating a new conversation replaces the
+ * active one, with "Confirm" and "Cancel" buttons.
+ */
+export function ExitConversationModal(props: ExitConversationModalProps) {
+  const { onConfirm, onClose } = props;
+
+  return (
+    <ModalBackdrop>
+      <ModalBody testID="confirm-new-conversation-modal">
+        <BaseModalTitle title="Creating a new conversation will replace your active conversation" />
+        <div className="flex w-full gap-2">
+          <ModalButton
+            text="Confirm"
+            onClick={onConfirm}
+            className="bg-[#C63143] flex-1"
+          />
+          <ModalButton
+            text="Cancel"
+            onClick={onClose}
+            className="bg-neutral-700 flex-1"
+          />
+        </div>
+      </ModalBody>
+    </ModalBackdrop>
+  );
+}
diff --git a/frontend/src/components/features/conversation-panel/new-conversation-button.tsx b/frontend/src/components/features/conversation-panel/new-conversation-button.tsx
new file mode 100644
index 000000000000..b7563952cfce
--- /dev/null
+++ b/frontend/src/components/features/conversation-panel/new-conversation-button.tsx
@@ -0,0 +1,22 @@
+interface NewConversationButtonProps {
+  /** Click handler attached to the button. */
+  onClick: () => void;
+}
+
+/**
+ * Button labelled "+ New Project" that calls `onClick` when clicked.
+ */
+export function NewConversationButton(props: NewConversationButtonProps) {
+  const { onClick } = props;
+
+  return (
+    <button
+      data-testid="new-conversation-button"
+      type="button"
+      onClick={onClick}
+      className="font-bold bg-[#4465DB] px-2 py-1 rounded"
+    >
+      + New Project
+    </button>
+  );
+}
diff --git a/frontend/src/components/features/conversation-panel/state-indicators/cold.svg b/frontend/src/components/features/conversation-panel/state-indicators/cold.svg
new file mode 100644
index 000000000000..95b513851439
--- /dev/null
+++ b/frontend/src/components/features/conversation-panel/state-indicators/cold.svg
@@ -0,0 +1,4 @@
+<svg width="18" height="18" viewBox="0 0 18 18" fill="none" xmlns="http://www.w3.org/2000/svg">
+<path d="M9.87012 2C9.87012 1.44772 9.4224 1 8.87012 1C8.31783 1 7.87012 1.44772 7.87012 2V8C7.87012 8.55228 8.31783 9 8.87012 9C9.4224 9 9.87012 8.55228 9.87012 8V2Z" fill="#A7A9AC"/>
+<path d="M10.8698 2.42001V2.56001C10.8698 2.93001 11.0698 3.28001 11.4098 3.43001C13.6798 4.43001 15.2198 6.80001 14.9698 9.48001C14.6998 12.47 12.0998 14.87 9.08979 14.92C5.73979 14.97 2.98979 12.26 2.98979 8.92001C2.98979 6.57001 4.34979 4.54001 6.30979 3.56001C6.63979 3.40001 6.85979 3.08001 6.85979 2.72001V2.55001C6.85979 1.86001 6.13979 1.43001 5.50979 1.73001C2.43979 3.20001 0.449793 6.62001 1.13979 10.41C1.70979 13.57 4.23979 16.14 7.38979 16.76C12.5098 17.76 16.9998 13.86 16.9998 8.92001C16.9998 5.61001 14.9898 2.78001 12.1198 1.56001C11.5298 1.31001 10.8698 1.78001 10.8698 2.42001Z" fill="#A7A9AC"/>
+</svg>
diff --git a/frontend/src/components/features/conversation-panel/state-indicators/cooling.svg b/frontend/src/components/features/conversation-panel/state-indicators/cooling.svg
new file mode 100644
index 000000000000..ef65bfa11c06
--- /dev/null
+++ b/frontend/src/components/features/conversation-panel/state-indicators/cooling.svg
@@ -0,0 +1,4 @@
+<svg width="18" height="18" viewBox="0 0 18 18" fill="none" xmlns="http://www.w3.org/2000/svg">
+<path d="M9.87012 2.02002C9.87012 1.46773 9.4224 1.02002 8.87012 1.02002C8.31783 1.02002 7.87012 1.46773 7.87012 2.02002V8.02002C7.87012 8.5723 8.31783 9.02002 8.87012 9.02002C9.4224 9.02002 9.87012 8.5723 9.87012 8.02002V2.02002Z" fill="#EFC818"/>
+<path d="M10.8698 2.44003V2.58003C10.8698 2.95003 11.0698 3.30003 11.4098 3.45003C13.6798 4.45003 15.2198 6.82003 14.9698 9.50003C14.6998 12.49 12.0998 14.89 9.08979 14.94C5.73979 14.99 2.98979 12.28 2.98979 8.94003C2.98979 6.59003 4.34979 4.56003 6.30979 3.58003C6.63979 3.42003 6.85979 3.10003 6.85979 2.74003V2.57003C6.85979 1.88003 6.13979 1.45003 5.50979 1.75003C2.43979 3.23003 0.449793 6.64003 1.13979 10.43C1.70979 13.59 4.23979 16.16 7.38979 16.78C12.5098 17.78 16.9998 13.88 16.9998 8.94003C16.9998 5.63003 14.9898 2.80003 12.1198 1.58003C11.5298 1.33003 10.8698 1.80003 10.8698 2.44003Z" fill="#EFC818"/>
+</svg>
diff --git a/frontend/src/components/features/conversation-panel/state-indicators/finished.svg b/frontend/src/components/features/conversation-panel/state-indicators/finished.svg
new file mode 100644
index 000000000000..311d524d1774
--- /dev/null
+++ b/frontend/src/components/features/conversation-panel/state-indicators/finished.svg
@@ -0,0 +1,4 @@
+<svg width="18" height="18" viewBox="0 0 18 18" fill="none" xmlns="http://www.w3.org/2000/svg">
+<path d="M9 16.8599C13.4183 16.8599 17 13.2781 17 8.85986C17 4.44159 13.4183 0.859863 9 0.859863C4.58172 0.859863 1 4.44159 1 8.85986C1 13.2781 4.58172 16.8599 9 16.8599Z" fill="#779FD4"/>
+<path d="M4.61035 8.43014L7.86035 12.0301L13.3904 6.64014" stroke="#231F20" stroke-width="2" stroke-miterlimit="10" stroke-linecap="round"/>
+</svg>
diff --git a/frontend/src/components/features/conversation-panel/state-indicators/running.svg b/frontend/src/components/features/conversation-panel/state-indicators/running.svg
new file mode 100644
index 000000000000..5537583da544
--- /dev/null
+++ b/frontend/src/components/features/conversation-panel/state-indicators/running.svg
@@ -0,0 +1,4 @@
+<svg width="18" height="18" viewBox="0 0 18 18" fill="none" xmlns="http://www.w3.org/2000/svg">
+<path d="M9.04004 3.10986C12.06 3.10986 14.57 5.34986 14.98 8.25986C15.05 8.74986 15.47 9.10986 15.96 9.10986C16.57 9.10986 17.04 8.56986 16.96 7.96986C16.41 4.08986 13.07 1.10986 9.04004 1.10986C4.62004 1.10986 1.04004 4.68986 1.04004 9.10986C1.04004 13.1399 4.02004 16.4799 7.90004 17.0299C8.50004 17.1199 9.04004 16.6399 9.04004 16.0299C9.04004 15.5399 8.68004 15.1199 8.19004 15.0499C5.28004 14.6399 3.04004 12.1299 3.04004 9.10986C3.04004 5.79986 5.73004 3.10986 9.04004 3.10986Z" fill="#60BB46"/>
+<path d="M12.3504 9.11L7.40039 6.25V11.96L12.3504 9.11Z" fill="#60BB46"/>
+</svg>
diff --git a/frontend/src/components/features/conversation-panel/state-indicators/waiting.svg b/frontend/src/components/features/conversation-panel/state-indicators/waiting.svg
new file mode 100644
index 000000000000..a73aa2b27653
--- /dev/null
+++ b/frontend/src/components/features/conversation-panel/state-indicators/waiting.svg
@@ -0,0 +1,4 @@
+<svg width="18" height="18" viewBox="0 0 18 18" fill="none" xmlns="http://www.w3.org/2000/svg">
+<path d="M6.76039 6.99002C8.478 6.99002 9.87039 5.59763 9.87039 3.88002C9.87039 2.16241 8.478 0.77002 6.76039 0.77002C5.04279 0.77002 3.65039 2.16241 3.65039 3.88002C3.65039 5.59763 5.04279 6.99002 6.76039 6.99002Z" fill="#FFE165"/>
+<path d="M1.0802 17.0799C1.0802 17.0799 0.610196 11.5499 3.0102 9.67992C4.7902 8.29992 7.3302 9.44992 9.7802 7.95992C11.5802 6.86992 13.6102 4.10992 14.5202 2.49992C14.9302 1.77992 15.9102 1.62992 16.6102 2.05992C17.3802 2.51992 17.6102 3.53992 17.1102 4.28992C16.2302 5.58992 14.1802 8.85992 13.1202 10.3699C10.7602 13.7599 11.4302 17.0799 11.4302 17.0799H1.0702H1.0802Z" fill="#FFE165"/>
+</svg>
diff --git a/frontend/src/components/features/conversation-panel/state-indicators/warm.svg b/frontend/src/components/features/conversation-panel/state-indicators/warm.svg
new file mode 100644
index 000000000000..e7432e75315d
--- /dev/null
+++ b/frontend/src/components/features/conversation-panel/state-indicators/warm.svg
@@ -0,0 +1,4 @@
+<svg width="18" height="18" viewBox="0 0 18 18" fill="none" xmlns="http://www.w3.org/2000/svg">
+<path d="M9.87012 2.08984C9.87012 1.53756 9.4224 1.08984 8.87012 1.08984C8.31783 1.08984 7.87012 1.53756 7.87012 2.08984V8.08984C7.87012 8.64213 8.31783 9.08984 8.87012 9.08984C9.4224 9.08984 9.87012 8.64213 9.87012 8.08984V2.08984Z" fill="#60BB46"/>
+<path d="M10.8702 2.50988V2.64988C10.8702 3.01988 11.0702 3.36988 11.4102 3.51988C13.6802 4.51988 15.2202 6.88988 14.9702 9.56988C14.7002 12.5599 12.1002 14.9599 9.09021 15.0099C5.74021 15.0599 2.99021 12.3499 2.99021 9.00988C2.99021 6.65988 4.35021 4.62988 6.31021 3.64988C6.64021 3.48988 6.86021 3.16988 6.86021 2.80988V2.63988C6.86021 1.94988 6.14021 1.51988 5.51021 1.81988C2.42021 3.30988 0.430214 6.71988 1.12021 10.5199C1.69021 13.6799 4.22021 16.2499 7.37021 16.8699C12.4902 17.8699 16.9802 13.9699 16.9802 9.02988C16.9802 5.71988 14.9702 2.88988 12.1002 1.66988C11.5102 1.41988 10.8502 1.88988 10.8502 2.52988L10.8702 2.50988Z" fill="#60BB46"/>
+</svg>
diff --git a/frontend/src/components/features/github/github-repositories-suggestion-box.tsx b/frontend/src/components/features/github/github-repositories-suggestion-box.tsx
index 227ef8a5bdcb..f5bd2a740068 100644
--- a/frontend/src/components/features/github/github-repositories-suggestion-box.tsx
+++ b/frontend/src/components/features/github/github-repositories-suggestion-box.tsx
@@ -31,17 +31,6 @@ export function GitHubRepositoriesSuggestionBox({
     }
   };
 
-  if (isGitHubErrorReponse(repositories)) {
-    return (
-      <SuggestionBox
-        title="Error Fetching Repositories"
-        content={
-          <p className="text-danger text-center">{repositories.message}</p>
-        }
-      />
-    );
-  }
-
   const isLoggedIn = !!user && !isGitHubErrorReponse(user);
 
   return (
diff --git a/frontend/src/components/features/project-menu/ProjectMenuCard.tsx b/frontend/src/components/features/project-menu/ProjectMenuCard.tsx
index f9a0e1686c23..bebf4a5ae921 100644
--- a/frontend/src/components/features/project-menu/ProjectMenuCard.tsx
+++ b/frontend/src/components/features/project-menu/ProjectMenuCard.tsx
@@ -1,5 +1,6 @@
 import React from "react";
 import posthog from "posthog-js";
+import { useTranslation } from "react-i18next";
 import EllipsisH from "#/icons/ellipsis-h.svg?react";
 import { ProjectMenuCardContextMenu } from "./project.menu-card-context-menu";
 import { ProjectMenuDetailsPlaceholder } from "./project-menu-details-placeholder";
@@ -7,6 +8,7 @@ import { ProjectMenuDetails } from "./project-menu-details";
 import { ConnectToGitHubModal } from "#/components/shared/modals/connect-to-github-modal";
 import { ModalBackdrop } from "#/components/shared/modals/modal-backdrop";
 import { DownloadModal } from "#/components/shared/download-modal";
+import { I18nKey } from "#/i18n/declaration";
 
 interface ProjectMenuCardProps {
   isConnectedToGitHub: boolean;
@@ -21,6 +23,8 @@ export function ProjectMenuCard({
   isConnectedToGitHub,
   githubData,
 }: ProjectMenuCardProps) {
+  const { t } = useTranslation();
+
   const [contextMenuIsOpen, setContextMenuIsOpen] = React.useState(false);
   const [connectToGitHubModalOpen, setConnectToGitHubModalOpen] =
     React.useState(false);
@@ -71,7 +75,7 @@ export function ProjectMenuCard({
         <button
           type="button"
           onClick={toggleMenuVisibility}
-          aria-label="Open project menu"
+          aria-label={t(I18nKey.PROJECT_MENU_CARD$OPEN)}
         >
           <EllipsisH width={36} height={36} />
         </button>
diff --git a/frontend/src/components/features/project-menu/project-menu-details-placeholder.tsx b/frontend/src/components/features/project-menu/project-menu-details-placeholder.tsx
index f9556d8c0a39..47a6a381809c 100644
--- a/frontend/src/components/features/project-menu/project-menu-details-placeholder.tsx
+++ b/frontend/src/components/features/project-menu/project-menu-details-placeholder.tsx
@@ -30,7 +30,9 @@ export function ProjectMenuDetailsPlaceholder({
             "hover:underline hover:underline-offset-2",
           )}
         >
-          {!isConnectedToGitHub ? "Connect to GitHub" : "Connected"}
+          {!isConnectedToGitHub
+            ? t(I18nKey.PROJECT_MENU_DETAILS_PLACEHOLDER$CONNECT_TO_GITHUB)
+            : t(I18nKey.PROJECT_MENU_DETAILS_PLACEHOLDER$CONNECTED)}
           <CloudConnection width={12} height={12} />
         </span>
       </button>
diff --git a/frontend/src/components/features/sidebar/sidebar.tsx b/frontend/src/components/features/sidebar/sidebar.tsx
index 5afc1aa9d24e..3d2e9a3e60b0 100644
--- a/frontend/src/components/features/sidebar/sidebar.tsx
+++ b/frontend/src/components/features/sidebar/sidebar.tsx
@@ -1,7 +1,7 @@
 import React from "react";
 import { useLocation } from "react-router";
+import FolderIcon from "#/icons/docs.svg?react";
 import { useAuth } from "#/context/auth-context";
-import { useSettings } from "#/context/settings-context";
 import { useGitHubUser } from "#/hooks/query/use-github-user";
 import { useIsAuthed } from "#/hooks/query/use-is-authed";
 import { UserActions } from "./user-actions";
@@ -13,21 +13,28 @@ import { LoadingSpinner } from "#/components/shared/loading-spinner";
 import { AccountSettingsModal } from "#/components/shared/modals/account-settings/account-settings-modal";
 import { ExitProjectConfirmationModal } from "#/components/shared/modals/exit-project-confirmation-modal";
 import { SettingsModal } from "#/components/shared/modals/settings/settings-modal";
+import { useSettingsUpToDate } from "#/context/settings-up-to-date-context";
+import { useSettings } from "#/hooks/query/use-settings";
+import { ConversationPanel } from "../conversation-panel/conversation-panel";
+import { cn } from "#/utils/utils";
+import { MULTI_CONVO_UI_IS_ENABLED } from "#/utils/constants";
 
 export function Sidebar() {
   const location = useLocation();
-
   const user = useGitHubUser();
   const { data: isAuthed } = useIsAuthed();
-
   const { logout } = useAuth();
-  const { settingsAreUpToDate } = useSettings();
+  const { data: settings, isError: settingsIsError } = useSettings();
+  const { isUpToDate: settingsAreUpToDate } = useSettingsUpToDate();
 
   const [accountSettingsModalOpen, setAccountSettingsModalOpen] =
     React.useState(false);
   const [settingsModalIsOpen, setSettingsModalIsOpen] = React.useState(false);
   const [startNewProjectModalIsOpen, setStartNewProjectModalIsOpen] =
     React.useState(false);
+  const [conversationPanelIsOpen, setConversationPanelIsOpen] = React.useState(
+    MULTI_CONVO_UI_IS_ENABLED,
+  );
 
   React.useEffect(() => {
     // If the github token is invalid, open the account settings modal again
@@ -54,7 +61,7 @@ export function Sidebar() {
 
   return (
     <>
-      <aside className="h-[40px] md:h-auto px-1 flex flex-row md:flex-col gap-1">
+      <aside className="h-[40px] md:h-auto px-1 flex flex-row md:flex-col gap-1 relative">
         <nav className="flex flex-row md:flex-col items-center gap-[18px]">
           <div className="w-[34px] h-[34px] flex items-center justify-center">
             <AllHandsLogoButton onClick={handleClickLogo} />
@@ -70,18 +77,45 @@ export function Sidebar() {
             />
           )}
           <SettingsButton onClick={() => setSettingsModalIsOpen(true)} />
+          {MULTI_CONVO_UI_IS_ENABLED && (
+            <button
+              data-testid="toggle-conversation-panel"
+              type="button"
+              onClick={() => setConversationPanelIsOpen((prev) => !prev)}
+              className={cn(
+                conversationPanelIsOpen ? "border-b-2 border-[#FFE165]" : "",
+              )}
+            >
+              <FolderIcon width={28} height={28} />
+            </button>
+          )}
           <DocsButton />
           <ExitProjectButton
             onClick={() => setStartNewProjectModalIsOpen(true)}
           />
         </nav>
+
+        {conversationPanelIsOpen && (
+          <div
+            className="absolute h-full left-[calc(100%+12px)] top-0 z-20" // 12px padding (sidebar parent)
+          >
+            <ConversationPanel
+              onClose={() => setConversationPanelIsOpen(false)}
+            />
+          </div>
+        )}
       </aside>
+
       {accountSettingsModalOpen && (
         <AccountSettingsModal onClose={handleAccountSettingsModalClose} />
       )}
-      {showSettingsModal && (
-        <SettingsModal onClose={() => setSettingsModalIsOpen(false)} />
-      )}
+      {/* Parenthesized so that a settings load error also opens the modal. */}
+      {(settingsIsError || showSettingsModal) && (
+        <SettingsModal
+          settings={settings}
+          onClose={() => setSettingsModalIsOpen(false)}
+        />
+      )}
       {startNewProjectModalIsOpen && (
         <ExitProjectConfirmationModal
           onClose={() => setStartNewProjectModalIsOpen(false)}
diff --git a/frontend/src/components/features/sidebar/user-avatar.tsx b/frontend/src/components/features/sidebar/user-avatar.tsx
index 8bec1eac40c6..12a18847d01c 100644
--- a/frontend/src/components/features/sidebar/user-avatar.tsx
+++ b/frontend/src/components/features/sidebar/user-avatar.tsx
@@ -1,3 +1,4 @@
+import { Tooltip } from "@nextui-org/react";
 import { LoadingSpinner } from "#/components/shared/loading-spinner";
 import DefaultUserAvatar from "#/icons/default-user.svg?react";
 import { cn } from "#/utils/utils";
@@ -10,7 +11,7 @@ interface UserAvatarProps {
 }
 
 export function UserAvatar({ onClick, avatarUrl, isLoading }: UserAvatarProps) {
-  return (
+  const buttonContent = (
     <button
       data-testid="user-avatar"
       type="button"
@@ -31,4 +32,10 @@ export function UserAvatar({ onClick, avatarUrl, isLoading }: UserAvatarProps) {
       {isLoading && <LoadingSpinner size="small" />}
     </button>
   );
+
+  return (
+    <Tooltip content="Account settings" closeDelay={100}>
+      {buttonContent}
+    </Tooltip>
+  );
 }
diff --git a/frontend/src/components/layout/resizable-panel.tsx b/frontend/src/components/layout/resizable-panel.tsx
new file mode 100644
index 000000000000..0f7ecc4e5183
--- /dev/null
+++ b/frontend/src/components/layout/resizable-panel.tsx
@@ -0,0 +1,211 @@
+import React, { CSSProperties, JSX, useEffect, useRef, useState } from "react";
+import {
+  VscChevronDown,
+  VscChevronLeft,
+  VscChevronRight,
+  VscChevronUp,
+} from "react-icons/vsc";
+import { twMerge } from "tailwind-merge";
+import { IconButton } from "../shared/buttons/icon-button";
+
+/** Direction in which the two panes are laid out. */
+export enum Orientation {
+  HORIZONTAL = "horizontal",
+  VERTICAL = "vertical",
+}
+
+/** Which pane, if any, is currently hidden. */
+enum Collapse {
+  COLLAPSED = "collapsed", // first pane hidden
+  SPLIT = "split", // both panes visible
+  FILLED = "filled", // second pane hidden, first pane grows
+}
+
+type ResizablePanelProps = {
+  firstChild: React.ReactNode;
+  firstClassName: string | undefined;
+  secondChild: React.ReactNode;
+  secondClassName: string | undefined;
+  className: string | undefined;
+  orientation: Orientation;
+  /** Initial pixel size of the first pane along the layout axis. */
+  initialSize: number;
+};
+
+/**
+ * Two-pane container with a draggable divider and collapse/expand buttons.
+ *
+ * The first pane has an explicit pixel size; the second pane takes the
+ * remaining space.
+ */
+export function ResizablePanel({
+  firstChild,
+  firstClassName,
+  secondChild,
+  secondClassName,
+  className,
+  orientation,
+  initialSize,
+}: ResizablePanelProps): JSX.Element {
+  const [firstSize, setFirstSize] = useState<number>(initialSize);
+  // Pointer coordinate where the current drag began; null when idle.
+  const [dividerPosition, setDividerPosition] = useState<number | null>(null);
+  const firstRef = useRef<HTMLDivElement>(null);
+  const secondRef = useRef<HTMLDivElement>(null);
+  const [collapse, setCollapse] = useState<Collapse>(Collapse.SPLIT);
+  const isHorizontal = orientation === Orientation.HORIZONTAL;
+
+  // While a drag is in progress, track the mouse on the document.
+  useEffect(() => {
+    if (dividerPosition == null || !firstRef.current) {
+      return undefined;
+    }
+    const getFirstSizeFromEvent = (e: MouseEvent) => {
+      const position = isHorizontal ? e.clientX : e.clientY;
+      // Clamp at zero: dragging past the start of the first pane would
+      // otherwise store a negative size, which is not a valid CSS length.
+      return Math.max(0, firstSize + position - dividerPosition);
+    };
+    const onMouseMove = (e: MouseEvent) => {
+      e.preventDefault();
+      const newFirstSize = `${getFirstSizeFromEvent(e)}px`;
+      const { current } = firstRef;
+      if (current) {
+        // Write the size straight to the element while dragging; state is
+        // only updated on mouse up.
+        if (isHorizontal) {
+          current.style.width = newFirstSize;
+          current.style.minWidth = newFirstSize;
+        } else {
+          current.style.height = newFirstSize;
+          current.style.minHeight = newFirstSize;
+        }
+      }
+    };
+    const onMouseUp = (e: MouseEvent) => {
+      e.preventDefault();
+      // Clear the inline `transition: none` that onMouseDown applied.
+      if (firstRef.current) {
+        firstRef.current.style.transition = "";
+      }
+      if (secondRef.current) {
+        secondRef.current.style.transition = "";
+      }
+      setFirstSize(getFirstSizeFromEvent(e));
+      setDividerPosition(null);
+      document.removeEventListener("mousemove", onMouseMove);
+      document.removeEventListener("mouseup", onMouseUp);
+    };
+    document.addEventListener("mousemove", onMouseMove);
+    document.addEventListener("mouseup", onMouseUp);
+    return () => {
+      document.removeEventListener("mousemove", onMouseMove);
+      document.removeEventListener("mouseup", onMouseUp);
+    };
+  }, [dividerPosition, firstSize, isHorizontal]);
+
+  // Start a drag: switch off CSS transitions and record the pointer position.
+  const onMouseDown = (e: React.MouseEvent) => {
+    e.preventDefault();
+    if (firstRef.current) {
+      firstRef.current.style.transition = "none";
+    }
+    if (secondRef.current) {
+      secondRef.current.style.transition = "none";
+    }
+    const position = isHorizontal ? e.clientX : e.clientY;
+    setDividerPosition(position);
+  };
+
+  // Inline style for the first pane, based on the collapse state.
+  const getStyleForFirst = () => {
+    const style: CSSProperties = { overflow: "hidden" };
+    if (collapse === Collapse.COLLAPSED) {
+      style.opacity = 0;
+      style.width = 0;
+      style.minWidth = 0;
+      style.height = 0;
+      style.minHeight = 0;
+    } else if (collapse === Collapse.SPLIT) {
+      const firstSizePx = `${firstSize}px`;
+      if (isHorizontal) {
+        style.width = firstSizePx;
+        style.minWidth = firstSizePx;
+      } else {
+        style.height = firstSizePx;
+        style.minHeight = firstSizePx;
+      }
+    } else {
+      style.flexGrow = 1;
+    }
+    return style;
+  };
+
+  // Inline style for the second pane, based on the collapse state.
+  const getStyleForSecond = () => {
+    const style: CSSProperties = { overflow: "hidden" };
+    if (collapse === Collapse.FILLED) {
+      style.opacity = 0;
+      style.width = 0;
+      style.minWidth = 0;
+      style.height = 0;
+      style.minHeight = 0;
+    } else {
+      // SPLIT and COLLAPSED: the second pane takes the remaining space.
+      style.flexGrow = 1;
+    }
+    return style;
+  };
+
+  // Toggle between SPLIT and COLLAPSED (any non-SPLIT state returns to SPLIT).
+  const onCollapse = () => {
+    if (collapse === Collapse.SPLIT) {
+      setCollapse(Collapse.COLLAPSED);
+    } else {
+      setCollapse(Collapse.SPLIT);
+    }
+  };
+
+  // Toggle between SPLIT and FILLED (any non-SPLIT state returns to SPLIT).
+  const onExpand = () => {
+    if (collapse === Collapse.SPLIT) {
+      setCollapse(Collapse.FILLED);
+    } else {
+      setCollapse(Collapse.SPLIT);
+    }
+  };
+
+  return (
+    <div className={twMerge("flex", !isHorizontal && "flex-col", className)}>
+      <div
+        ref={firstRef}
+        className={twMerge(firstClassName, "transition-all ease-soft-spring")}
+        style={getStyleForFirst()}
+      >
+        {firstChild}
+      </div>
+      <div
+        className={`${isHorizontal ? "cursor-ew-resize w-3 flex-col" : "cursor-ns-resize h-3 flex-row"} shrink-0 flex justify-center items-center`}
+        onMouseDown={collapse === Collapse.SPLIT ? onMouseDown : undefined}
+      >
+        <IconButton
+          icon={isHorizontal ? <VscChevronLeft /> : <VscChevronUp />}
+          ariaLabel="Collapse"
+          onClick={onCollapse}
+        />
+        <IconButton
+          icon={isHorizontal ? <VscChevronRight /> : <VscChevronDown />}
+          ariaLabel="Expand"
+          onClick={onExpand}
+        />
+      </div>
+      <div
+        ref={secondRef}
+        className={twMerge(secondClassName, "transition-all ease-soft-spring")}
+        style={getStyleForSecond()}
+      >
+        {secondChild}
+      </div>
+    </div>
+  );
+}
diff --git a/frontend/src/components/shared/buttons/all-hands-logo-button.tsx b/frontend/src/components/shared/buttons/all-hands-logo-button.tsx
index 74ab5f3cee06..e068f152af13 100644
--- a/frontend/src/components/shared/buttons/all-hands-logo-button.tsx
+++ b/frontend/src/components/shared/buttons/all-hands-logo-button.tsx
@@ -1,4 +1,5 @@
 import AllHandsLogo from "#/assets/branding/all-hands-logo.svg?react";
+import { TooltipButton } from "./tooltip-button";
 
 interface AllHandsLogoButtonProps {
   onClick: () => void;
@@ -6,8 +7,12 @@ interface AllHandsLogoButtonProps {
 
 export function AllHandsLogoButton({ onClick }: AllHandsLogoButtonProps) {
   return (
-    <button type="button" aria-label="All Hands Logo" onClick={onClick}>
+    <TooltipButton
+      tooltip="All Hands AI"
+      ariaLabel="All Hands Logo"
+      onClick={onClick}
+    >
       <AllHandsLogo width={34} height={23} />
-    </button>
+    </TooltipButton>
   );
 }
diff --git a/frontend/src/components/shared/buttons/docs-button.tsx b/frontend/src/components/shared/buttons/docs-button.tsx
index 3b805556e3da..a06e543cda37 100644
--- a/frontend/src/components/shared/buttons/docs-button.tsx
+++ b/frontend/src/components/shared/buttons/docs-button.tsx
@@ -1,15 +1,14 @@
 import DocsIcon from "#/icons/docs.svg?react";
+import { TooltipButton } from "./tooltip-button";
 
 export function DocsButton() {
   return (
-    <a
+    <TooltipButton
+      tooltip="Documentation"
+      ariaLabel="Documentation"
       href="https://docs.all-hands.dev"
-      aria-label="Documentation"
-      target="_blank"
-      rel="noreferrer noopener"
-      className="w-8 h-8 rounded-full hover:opacity-80 flex items-center justify-center"
     >
       <DocsIcon width={28} height={28} />
-    </a>
+    </TooltipButton>
   );
 }
diff --git a/frontend/src/components/shared/buttons/exit-project-button.tsx b/frontend/src/components/shared/buttons/exit-project-button.tsx
index e187fe99d19b..206d1660e2bb 100644
--- a/frontend/src/components/shared/buttons/exit-project-button.tsx
+++ b/frontend/src/components/shared/buttons/exit-project-button.tsx
@@ -1,4 +1,5 @@
 import NewProjectIcon from "#/icons/new-project.svg?react";
+import { TooltipButton } from "./tooltip-button";
 
 interface ExitProjectButtonProps {
   onClick: () => void;
@@ -6,13 +7,13 @@ interface ExitProjectButtonProps {
 
 export function ExitProjectButton({ onClick }: ExitProjectButtonProps) {
   return (
-    <button
-      data-testid="new-project-button"
-      type="button"
-      aria-label="Start new project"
+    <TooltipButton
+      tooltip="Start new project"
+      ariaLabel="Start new project"
       onClick={onClick}
+      testId="new-project-button"
     >
       <NewProjectIcon width={28} height={28} />
-    </button>
+    </TooltipButton>
   );
 }
diff --git a/frontend/src/components/shared/buttons/settings-button.tsx b/frontend/src/components/shared/buttons/settings-button.tsx
index 3e739bcb6986..59ed58ed27a2 100644
--- a/frontend/src/components/shared/buttons/settings-button.tsx
+++ b/frontend/src/components/shared/buttons/settings-button.tsx
@@ -1,4 +1,5 @@
 import CogTooth from "#/assets/cog-tooth";
+import { TooltipButton } from "./tooltip-button";
 
 interface SettingsButtonProps {
   onClick: () => void;
@@ -6,13 +7,13 @@ interface SettingsButtonProps {
 
 export function SettingsButton({ onClick }: SettingsButtonProps) {
   return (
-    <button
-      type="button"
-      aria-label="Settings"
-      className="w-8 h-8 rounded-full hover:opacity-80 flex items-center justify-center"
+    <TooltipButton
+      testId="settings-button"
+      tooltip="Settings"
+      ariaLabel="Settings"
       onClick={onClick}
     >
       <CogTooth />
-    </button>
+    </TooltipButton>
   );
 }
diff --git a/frontend/src/components/shared/buttons/tooltip-button.tsx b/frontend/src/components/shared/buttons/tooltip-button.tsx
new file mode 100644
index 000000000000..00ddddbc5c08
--- /dev/null
+++ b/frontend/src/components/shared/buttons/tooltip-button.tsx
@@ -0,0 +1,52 @@
+import { Tooltip } from "@nextui-org/react";
+import { ReactNode } from "react";
+
+interface TooltipButtonProps {
+  children: ReactNode; // rendered inside the <button> or <a>
+  tooltip: string; // passed to the Tooltip as its content
+  onClick?: () => void; // attached to the <button> variant only
+  href?: string; // when truthy, an <a> opening in a new tab is rendered
+  ariaLabel: string; // aria-label of whichever element is rendered
+  testId?: string; // data-testid, set on the <button> variant only
+}
+
+/** Icon-sized <button>, or <a> when `href` is truthy, wrapped in a Tooltip. */
+export function TooltipButton({
+  children,
+  tooltip,
+  onClick,
+  href,
+  ariaLabel,
+  testId,
+}: TooltipButtonProps) {
+  // Both variants share one class list. Only the <button> variant receives
+  // onClick and data-testid; the <a> variant opens href in a new tab.
+  const triggerClassName =
+    "w-8 h-8 rounded-full hover:opacity-80 flex items-center justify-center";
+
+  return (
+    <Tooltip content={tooltip} closeDelay={100}>
+      {href ? (
+        <a
+          href={href}
+          target="_blank"
+          rel="noreferrer noopener"
+          className={triggerClassName}
+          aria-label={ariaLabel}
+        >
+          {children}
+        </a>
+      ) : (
+        <button
+          type="button"
+          aria-label={ariaLabel}
+          data-testid={testId}
+          onClick={onClick}
+          className={triggerClassName}
+        >
+          {children}
+        </button>
+      )}
+    </Tooltip>
+  );
+}
diff --git a/frontend/src/components/shared/error-toast.tsx b/frontend/src/components/shared/error-toast.tsx
index 30f2d7cbe6b5..36144eff9651 100644
--- a/frontend/src/components/shared/error-toast.tsx
+++ b/frontend/src/components/shared/error-toast.tsx
@@ -1,4 +1,6 @@
 import toast, { Toast } from "react-hot-toast";
+import { useTranslation } from "react-i18next";
+import { I18nKey } from "#/i18n/declaration";
 
 interface ErrorToastProps {
   id: Toast["id"];
@@ -6,6 +8,8 @@ interface ErrorToastProps {
 }
 
 export function ErrorToast({ id, error }: ErrorToastProps) {
+  const { t } = useTranslation();
+
   return (
     <div className="flex items-center justify-between w-full h-full">
       <span>{error}</span>
@@ -14,7 +18,7 @@ export function ErrorToast({ id, error }: ErrorToastProps) {
         onClick={() => toast.dismiss(id)}
         className="bg-neutral-500 px-1 rounded h-full"
       >
-        Close
+        {t(I18nKey.ERROR_TOAST$CLOSE_BUTTON_LABEL)}
       </button>
     </div>
   );
diff --git a/frontend/src/components/shared/inputs/api-key-input.tsx b/frontend/src/components/shared/inputs/api-key-input.tsx
index ea6e553adbe9..7bdafb90bd1e 100644
--- a/frontend/src/components/shared/inputs/api-key-input.tsx
+++ b/frontend/src/components/shared/inputs/api-key-input.tsx
@@ -1,27 +1,37 @@
-import { Input } from "@nextui-org/react";
+import { Input, Tooltip } from "@nextui-org/react";
 import { useTranslation } from "react-i18next";
+import { FaCheckCircle, FaExclamationCircle } from "react-icons/fa";
 import { I18nKey } from "#/i18n/declaration";
 
 interface APIKeyInputProps {
   isDisabled: boolean;
-  defaultValue: string;
+  isSet: boolean;
 }
 
-export function APIKeyInput({ isDisabled, defaultValue }: APIKeyInputProps) {
+export function APIKeyInput({ isDisabled, isSet }: APIKeyInputProps) {
   const { t } = useTranslation();
 
   return (
     <fieldset data-testid="api-key-input" className="flex flex-col gap-2">
-      <label htmlFor="api-key" className="font-[500] text-[#A3A3A3] text-xs">
-        {t(I18nKey.SETTINGS_FORM$API_KEY_LABEL)}
-      </label>
+      <Tooltip content={isSet ? "API Key is set" : "API Key is not set"}>
+        <label
+          htmlFor="api-key"
+          className="font-[500] text-[#A3A3A3] text-xs flex items-center gap-1 self-start"
+        >
+          {isSet && <FaCheckCircle className="text-[#00D1B2] inline-block" />}
+          {!isSet && (
+            <FaExclamationCircle className="text-[#FF3860] inline-block" />
+          )}
+          {t(I18nKey.SETTINGS_FORM$API_KEY_LABEL)}
+        </label>
+      </Tooltip>
       <Input
         isDisabled={isDisabled}
         id="api-key"
         name="api-key"
         aria-label="API Key"
         type="password"
-        defaultValue={defaultValue}
+        defaultValue=""
         classNames={{
           inputWrapper: "bg-[#27272A] rounded-md text-sm px-3 py-[10px]",
         }}
diff --git a/frontend/src/components/shared/modals/account-settings/account-settings-form.tsx b/frontend/src/components/shared/modals/account-settings/account-settings-form.tsx
index 9358e94799f8..fb162103eb5f 100644
--- a/frontend/src/components/shared/modals/account-settings/account-settings-form.tsx
+++ b/frontend/src/components/shared/modals/account-settings/account-settings-form.tsx
@@ -8,12 +8,12 @@ import { ModalBody } from "../modal-body";
 import { AvailableLanguages } from "#/i18n";
 import { I18nKey } from "#/i18n/declaration";
 import { useAuth } from "#/context/auth-context";
-import { useSettings } from "#/context/settings-context";
 import { handleCaptureConsent } from "#/utils/handle-capture-consent";
 import { ModalButton } from "../../buttons/modal-button";
 import { CustomInput } from "../../custom-input";
 import { FormFieldset } from "../../form-fieldset";
 import { useConfig } from "#/hooks/query/use-config";
+import { useSaveSettings } from "#/hooks/mutation/use-save-settings";
 
 interface AccountSettingsFormProps {
   onClose: () => void;
@@ -30,7 +30,7 @@ export function AccountSettingsForm({
 }: AccountSettingsFormProps) {
   const { gitHubToken, setGitHubToken, logout } = useAuth();
   const { data: config } = useConfig();
-  const { saveSettings } = useSettings();
+  const { mutate: saveSettings } = useSaveSettings();
   const { t } = useTranslation();
 
   const handleSubmit = (event: React.FormEvent<HTMLFormElement>) => {
diff --git a/frontend/src/components/shared/modals/account-settings/account-settings-modal.tsx b/frontend/src/components/shared/modals/account-settings/account-settings-modal.tsx
index d8c1ce47f7e8..0de5a91458ff 100644
--- a/frontend/src/components/shared/modals/account-settings/account-settings-modal.tsx
+++ b/frontend/src/components/shared/modals/account-settings/account-settings-modal.tsx
@@ -1,5 +1,5 @@
-import { useSettings } from "#/context/settings-context";
 import { useGitHubUser } from "#/hooks/query/use-github-user";
+import { useSettings } from "#/hooks/query/use-settings";
 import { ModalBackdrop } from "../modal-backdrop";
 import { AccountSettingsForm } from "./account-settings-form";
 
@@ -9,7 +9,7 @@ interface AccountSettingsModalProps {
 
 export function AccountSettingsModal({ onClose }: AccountSettingsModalProps) {
   const user = useGitHubUser();
-  const { settings } = useSettings();
+  const { data: settings } = useSettings();
 
   // FIXME: Bad practice to use localStorage directly
   const analyticsConsent = localStorage.getItem("analytics-consent");
diff --git a/frontend/src/components/shared/modals/confirmation-modals/base-modal.tsx b/frontend/src/components/shared/modals/confirmation-modals/base-modal.tsx
index 2cb79b45c8c0..c5b4e3f255f8 100644
--- a/frontend/src/components/shared/modals/confirmation-modals/base-modal.tsx
+++ b/frontend/src/components/shared/modals/confirmation-modals/base-modal.tsx
@@ -35,14 +35,20 @@ export function BaseModalDescription({
 }
 
 interface BaseModalProps {
+  testId?: string;
   title: string;
   description: string;
   buttons: ButtonConfig[];
 }
 
-export function BaseModal({ title, description, buttons }: BaseModalProps) {
+export function BaseModal({
+  testId,
+  title,
+  description,
+  buttons,
+}: BaseModalProps) {
   return (
-    <ModalBody>
+    <ModalBody testID={testId}>
       <div className="flex flex-col gap-2 self-start">
         <BaseModalTitle title={title} />
         <BaseModalDescription description={description} />
diff --git a/frontend/src/components/shared/modals/confirmation-modals/danger-modal.tsx b/frontend/src/components/shared/modals/confirmation-modals/danger-modal.tsx
index fa6d468d0072..98f4a7155f44 100644
--- a/frontend/src/components/shared/modals/confirmation-modals/danger-modal.tsx
+++ b/frontend/src/components/shared/modals/confirmation-modals/danger-modal.tsx
@@ -1,6 +1,8 @@
 import { BaseModal } from "./base-modal";
 
 interface DangerModalProps {
+  testId?: string;
+
   title: string;
   description: string;
 
@@ -10,9 +12,15 @@ interface DangerModalProps {
   };
 }
 
-export function DangerModal({ title, description, buttons }: DangerModalProps) {
+export function DangerModal({
+  testId,
+  title,
+  description,
+  buttons,
+}: DangerModalProps) {
   return (
     <BaseModal
+      testId={testId}
       title={title}
       description={description}
       buttons={[
diff --git a/frontend/src/components/shared/modals/settings/model-selector.tsx b/frontend/src/components/shared/modals/settings/model-selector.tsx
index 3424c7c82afd..baefbf349d17 100644
--- a/frontend/src/components/shared/modals/settings/model-selector.tsx
+++ b/frontend/src/components/shared/modals/settings/model-selector.tsx
@@ -68,6 +68,7 @@ export function ModelSelector({
             LLM Provider
           </label>
           <Autocomplete
+            data-testid="llm-provider"
             isRequired
             isVirtualized={false}
             name="llm-provider"
@@ -91,7 +92,11 @@ export function ModelSelector({
               {Object.keys(models)
                 .filter((provider) => VERIFIED_PROVIDERS.includes(provider))
                 .map((provider) => (
-                  <AutocompleteItem key={provider} value={provider}>
+                  <AutocompleteItem
+                    data-testid={`provider-item-${provider}`}
+                    key={provider}
+                    value={provider}
+                  >
                     {mapProvider(provider)}
                   </AutocompleteItem>
                 ))}
@@ -113,6 +118,7 @@ export function ModelSelector({
             LLM Model
           </label>
           <Autocomplete
+            data-testid="llm-model"
             isRequired
             isVirtualized={false}
             name="llm-model"
@@ -144,7 +150,11 @@ export function ModelSelector({
               {models[selectedProvider || ""]?.models
                 .filter((model) => !VERIFIED_MODELS.includes(model))
                 .map((model) => (
-                  <AutocompleteItem key={model} value={model}>
+                  <AutocompleteItem
+                    data-testid={`model-item-${model}`}
+                    key={model}
+                    value={model}
+                  >
                     {model}
                   </AutocompleteItem>
                 ))}
diff --git a/frontend/src/components/shared/modals/settings/settings-form.tsx b/frontend/src/components/shared/modals/settings/settings-form.tsx
index 918046178f6b..7aba4856e227 100644
--- a/frontend/src/components/shared/modals/settings/settings-form.tsx
+++ b/frontend/src/components/shared/modals/settings/settings-form.tsx
@@ -9,7 +9,6 @@ import { DangerModal } from "../confirmation-modals/danger-modal";
 import { I18nKey } from "#/i18n/declaration";
 import { extractSettings, saveSettingsView } from "#/utils/settings-utils";
 import { useEndSession } from "#/hooks/use-end-session";
-import { useSettings } from "#/context/settings-context";
 import { ModalButton } from "../../buttons/modal-button";
 import { AdvancedOptionSwitch } from "../../inputs/advanced-option-switch";
 import { AgentInput } from "../../inputs/agent-input";
@@ -20,6 +19,7 @@ import { CustomModelInput } from "../../inputs/custom-model-input";
 import { SecurityAnalyzerInput } from "../../inputs/security-analyzers-input";
 import { ModalBackdrop } from "../modal-backdrop";
 import { ModelSelector } from "./model-selector";
+import { useSaveSettings } from "#/hooks/mutation/use-save-settings";
 
 interface SettingsFormProps {
   disabled?: boolean;
@@ -38,7 +38,7 @@ export function SettingsForm({
   securityAnalyzers,
   onClose,
 }: SettingsFormProps) {
-  const { saveSettings } = useSettings();
+  const { mutateAsync: saveSettings } = useSaveSettings();
   const endSession = useEndSession();
 
   const location = useLocation();
@@ -82,7 +82,6 @@ export function SettingsForm({
   const resetOngoingSession = () => {
     if (location.pathname.startsWith("/conversations/")) {
       endSession();
-      onClose();
     }
   };
 
@@ -92,7 +91,7 @@ export function SettingsForm({
     const newSettings = extractSettings(formData);
 
     saveSettingsView(isUsingAdvancedOptions ? "advanced" : "basic");
-    await saveSettings(newSettings);
+    await saveSettings(newSettings, { onSuccess: onClose });
     resetOngoingSession();
 
     posthog.capture("settings_saved", {
@@ -102,11 +101,9 @@ export function SettingsForm({
   };
 
   const handleConfirmResetSettings = async () => {
-    await saveSettings(getDefaultSettings());
+    await saveSettings(getDefaultSettings(), { onSuccess: onClose });
     resetOngoingSession();
     posthog.capture("settings_reset");
-
-    onClose();
   };
 
   const handleConfirmEndSession = () => {
@@ -122,7 +119,6 @@ export function SettingsForm({
       setConfirmEndSessionModalOpen(true);
     } else {
       handleFormSubmission(formData);
-      onClose();
     }
   };
 
@@ -165,7 +161,7 @@ export function SettingsForm({
 
           <APIKeyInput
             isDisabled={!!disabled}
-            defaultValue={settings.LLM_API_KEY || ""}
+            isSet={settings.LLM_API_KEY === "SET"}
           />
 
           {showAdvancedOptions && (
@@ -221,6 +217,7 @@ export function SettingsForm({
       {confirmResetDefaultsModalOpen && (
         <ModalBackdrop>
           <DangerModal
+            testId="reset-defaults-modal"
             title={t(I18nKey.SETTINGS_FORM$ARE_YOU_SURE_LABEL)}
             description={t(
               I18nKey.SETTINGS_FORM$ALL_INFORMATION_WILL_BE_DELETED_MESSAGE,
diff --git a/frontend/src/components/shared/modals/settings/settings-modal.tsx b/frontend/src/components/shared/modals/settings/settings-modal.tsx
index 29e1cc08c7d9..011411f4748f 100644
--- a/frontend/src/components/shared/modals/settings/settings-modal.tsx
+++ b/frontend/src/components/shared/modals/settings/settings-modal.tsx
@@ -1,15 +1,15 @@
-import { useSettings } from "#/context/settings-context";
 import { useAIConfigOptions } from "#/hooks/query/use-ai-config-options";
+import { Settings } from "#/services/settings";
 import { LoadingSpinner } from "../../loading-spinner";
 import { ModalBackdrop } from "../modal-backdrop";
 import { SettingsForm } from "./settings-form";
 
 interface SettingsModalProps {
+  settings: Settings;
   onClose: () => void;
 }
 
-export function SettingsModal({ onClose }: SettingsModalProps) {
-  const { settings } = useSettings();
+export function SettingsModal({ onClose, settings }: SettingsModalProps) {
   const aiConfigOptions = useAIConfigOptions();
 
   return (
diff --git a/frontend/src/components/shared/task-form.tsx b/frontend/src/components/shared/task-form.tsx
index bc6b53c24748..030b0c61cdc4 100644
--- a/frontend/src/components/shared/task-form.tsx
+++ b/frontend/src/components/shared/task-form.tsx
@@ -1,17 +1,8 @@
 import React from "react";
-import { useNavigate, useNavigation } from "react-router";
+import { useNavigation } from "react-router";
 import { useDispatch, useSelector } from "react-redux";
-import { useMutation } from "@tanstack/react-query";
-import posthog from "posthog-js";
 import { RootState } from "#/store";
-import {
-  addFile,
-  removeFile,
-  setInitialQuery,
-} from "#/state/initial-query-slice";
-import OpenHands from "#/api/open-hands";
-import { useAuth } from "#/context/auth-context";
-
+import { addFile, removeFile } from "#/state/initial-query-slice";
 import { SuggestionBubble } from "#/components/features/suggestions/suggestion-bubble";
 import { SUGGESTIONS } from "#/utils/suggestions";
 import { convertImageToBase64 } from "#/utils/convert-image-to-base-64";
@@ -21,6 +12,7 @@ import { cn } from "#/utils/utils";
 import { AttachImageLabel } from "../features/images/attach-image-label";
 import { ImageCarousel } from "../features/images/image-carousel";
 import { UploadImageInput } from "../features/images/upload-image-input";
+import { useCreateConversation } from "#/hooks/mutation/use-create-conversation";
 import { LoadingSpinner } from "./loading-spinner";
 
 interface TaskFormProps {
@@ -30,8 +22,6 @@ interface TaskFormProps {
 export function TaskForm({ ref }: TaskFormProps) {
   const dispatch = useDispatch();
   const navigation = useNavigation();
-  const navigate = useNavigate();
-  const { gitHubToken } = useAuth();
 
   const { selectedRepository, files } = useSelector(
     (state: RootState) => state.initialQuery,
@@ -42,24 +32,7 @@ export function TaskForm({ ref }: TaskFormProps) {
     getRandomKey(SUGGESTIONS["non-repo"]),
   );
   const [inputIsFocused, setInputIsFocused] = React.useState(false);
-  const newConversationMutation = useMutation({
-    mutationFn: (variables: { q?: string }) => {
-      if (variables.q) dispatch(setInitialQuery(variables.q));
-      return OpenHands.newConversation({
-        githubToken: gitHubToken || undefined,
-        selectedRepository: selectedRepository || undefined,
-      });
-    },
-    onSuccess: ({ conversation_id: conversationId }, { q }) => {
-      posthog.capture("initial_query_submitted", {
-        entry_point: "task_form",
-        query_character_length: q?.length,
-        has_repository: !!selectedRepository,
-        has_files: files.length > 0,
-      });
-      navigate(`/conversations/${conversationId}`);
-    },
-  });
+  const { mutate: createConversation, isPending } = useCreateConversation();
 
   const onRefreshSuggestion = () => {
     const suggestions = SUGGESTIONS["non-repo"];
@@ -90,9 +63,7 @@ export function TaskForm({ ref }: TaskFormProps) {
     const formData = new FormData(event.currentTarget);
 
     const q = formData.get("q")?.toString();
-    if (q?.trim()) {
-      newConversationMutation.mutate({ q });
-    }
+    createConversation({ q });
   };
 
   return (
@@ -114,7 +85,7 @@ export function TaskForm({ ref }: TaskFormProps) {
             "hover:border-neutral-500 focus-within:border-neutral-500",
           )}
         >
-          {newConversationMutation.isPending ? (
+          {isPending ? (
             <div className="flex justify-center py-[17px]">
               <LoadingSpinner size="small" />
             </div>
diff --git a/frontend/src/context/settings-context.tsx b/frontend/src/context/settings-context.tsx
deleted file mode 100644
index 3d2c426dc095..000000000000
--- a/frontend/src/context/settings-context.tsx
+++ /dev/null
@@ -1,68 +0,0 @@
-import React from "react";
-import posthog from "posthog-js";
-import { useQuery, useQueryClient } from "@tanstack/react-query";
-import {
-  getSettings,
-  Settings,
-  saveSettings,
-  settingsAreUpToDate as checkIfSettingsAreUpToDate,
-  DEFAULT_SETTINGS,
-} from "#/services/settings";
-
-interface SettingsContextType {
-  settings: Settings;
-  settingsAreUpToDate: boolean;
-  saveSettings: (settings: Partial<Settings>) => void;
-}
-
-const SettingsContext = React.createContext<SettingsContextType | undefined>(
-  undefined,
-);
-
-const SETTINGS_QUERY_KEY = ["settings"];
-
-function SettingsProvider({ children }: React.PropsWithChildren) {
-  const { data: settings } = useQuery({
-    queryKey: SETTINGS_QUERY_KEY,
-    queryFn: getSettings,
-    initialData: DEFAULT_SETTINGS,
-  });
-
-  const [settingsAreUpToDate, setSettingsAreUpToDate] = React.useState(
-    checkIfSettingsAreUpToDate(),
-  );
-  const queryClient = useQueryClient();
-
-  const handleSaveSettings = async (newSettings: Partial<Settings>) => {
-    await saveSettings(newSettings);
-    queryClient.invalidateQueries({ queryKey: SETTINGS_QUERY_KEY });
-    setSettingsAreUpToDate(checkIfSettingsAreUpToDate());
-  };
-
-  React.useEffect(() => {
-    if (settings?.LLM_API_KEY) {
-      posthog.capture("user_activated");
-    }
-  }, [settings?.LLM_API_KEY]);
-
-  const value = React.useMemo(
-    () => ({
-      settings,
-      settingsAreUpToDate,
-      saveSettings: handleSaveSettings,
-    }),
-    [settings, settingsAreUpToDate],
-  );
-
-  return <SettingsContext value={value}>{children}</SettingsContext>;
-}
-
-function useSettings() {
-  const context = React.useContext(SettingsContext);
-  if (context === undefined) {
-    throw new Error("useSettings must be used within a SettingsProvider");
-  }
-  return context;
-}
-
-export { SettingsProvider, useSettings };
diff --git a/frontend/src/context/settings-up-to-date-context.tsx b/frontend/src/context/settings-up-to-date-context.tsx
new file mode 100644
index 000000000000..93e8f71556da
--- /dev/null
+++ b/frontend/src/context/settings-up-to-date-context.tsx
@@ -0,0 +1,42 @@
+import React from "react";
+import { settingsAreUpToDate } from "#/services/settings";
+
+interface SettingsUpToDateContextType {
+  isUpToDate: boolean; // seeded from settingsAreUpToDate() by the provider
+  setIsUpToDate: (value: boolean) => void; // the provider's state setter
+}
+
+const SettingsUpToDateContext = React.createContext<
+  SettingsUpToDateContextType | undefined
+>(undefined); // default value; useSettingsUpToDate throws when it reads it
+
+interface SettingsUpToDateProviderProps {
+  children: React.ReactNode; // rendered inside the context provider
+}
+
+export function SettingsUpToDateProvider({
+  children,
+}: SettingsUpToDateProviderProps) {
+  // Lazy initializer: React calls the check on mount only, not every render.
+  const [isUpToDate, setIsUpToDate] = React.useState(settingsAreUpToDate);
+  const value = React.useMemo(
+    () => ({ isUpToDate, setIsUpToDate }),
+    [isUpToDate, setIsUpToDate],
+  );
+
+  return (
+    <SettingsUpToDateContext.Provider value={value}>
+      {children}
+    </SettingsUpToDateContext.Provider>
+  );
+}
+
+/** Returns the context value; throws if it is undefined (the default). */
+export function useSettingsUpToDate() {
+  const ctx = React.useContext(SettingsUpToDateContext);
+  if (ctx !== undefined) return ctx;
+
+  throw new Error(
+    "useSettingsUpToDate must be used within a SettingsUpToDateProvider",
+  );
+}
diff --git a/frontend/src/entry.client.tsx b/frontend/src/entry.client.tsx
index 32be2bd39921..03d97fb0850d 100644
--- a/frontend/src/entry.client.tsx
+++ b/frontend/src/entry.client.tsx
@@ -20,7 +20,7 @@ import toast from "react-hot-toast";
 import store from "./store";
 import { useConfig } from "./hooks/query/use-config";
 import { AuthProvider } from "./context/auth-context";
-import { SettingsProvider } from "./context/settings-context";
+import { SettingsUpToDateProvider } from "./context/settings-up-to-date-context";
 
 function PosthogInit() {
   const { data: config } = useConfig();
@@ -74,14 +74,14 @@ prepareApp().then(() =>
       document,
       <StrictMode>
         <Provider store={store}>
-          <QueryClientProvider client={queryClient}>
-            <SettingsProvider>
-              <AuthProvider>
+          <AuthProvider>
+            <SettingsUpToDateProvider>
+              <QueryClientProvider client={queryClient}>
                 <HydratedRouter />
                 <PosthogInit />
-              </AuthProvider>
-            </SettingsProvider>
-          </QueryClientProvider>
+              </QueryClientProvider>
+            </SettingsUpToDateProvider>
+          </AuthProvider>
         </Provider>
       </StrictMode>,
     );
diff --git a/frontend/src/hooks/mutation/use-create-conversation.ts b/frontend/src/hooks/mutation/use-create-conversation.ts
new file mode 100644
index 000000000000..ceb00b82b0e2
--- /dev/null
+++ b/frontend/src/hooks/mutation/use-create-conversation.ts
@@ -0,0 +1,45 @@
+import { useMutation, useQueryClient } from "@tanstack/react-query";
+import { useNavigate } from "react-router";
+import posthog from "posthog-js";
+import { useDispatch, useSelector } from "react-redux";
+import OpenHands from "#/api/open-hands";
+import { setInitialQuery } from "#/state/initial-query-slice";
+import { RootState } from "#/store";
+import { useAuth } from "#/context/auth-context";
+
+export const useCreateConversation = () => {
+  const navigate = useNavigate();
+  const dispatch = useDispatch();
+  const { gitHubToken } = useAuth();
+  const queryClient = useQueryClient();
+  const { selectedRepository, files } = useSelector(
+    (state: RootState) => state.initialQuery,
+  );
+  const hasFiles = files.length > 0;
+
+  return useMutation({
+    mutationFn: ({ q }: { q?: string }) => {
+      // Reject only when there is no text, no repository and no files at all.
+      if (!(q?.trim() || selectedRepository || hasFiles)) {
+        throw new Error("No query provided");
+      }
+      if (q) dispatch(setInitialQuery(q));
+      return OpenHands.createConversation(
+        gitHubToken || undefined,
+        selectedRepository || undefined,
+      );
+    },
+    onSuccess: async (data, variables) => {
+      posthog.capture("initial_query_submitted", {
+        entry_point: "task_form",
+        query_character_length: variables.q?.length,
+        has_repository: !!selectedRepository,
+        has_files: hasFiles,
+      });
+      await queryClient.invalidateQueries({
+        queryKey: ["user", "conversations"],
+      });
+      navigate(`/conversations/${data.conversation_id}`);
+    },
+  });
+};
diff --git a/frontend/src/hooks/mutation/use-delete-conversation.ts b/frontend/src/hooks/mutation/use-delete-conversation.ts
new file mode 100644
index 000000000000..b0e3d6c90e58
--- /dev/null
+++ b/frontend/src/hooks/mutation/use-delete-conversation.ts
@@ -0,0 +1,14 @@
+import { useMutation, useQueryClient } from "@tanstack/react-query";
+import OpenHands from "#/api/open-hands";
+
+export const useDeleteConversation = () => {
+  const queryClient = useQueryClient();
+  const onSuccess = () => {
+    queryClient.invalidateQueries({ queryKey: ["user", "conversations"] });
+  };
+  return useMutation({
+    mutationFn: ({ conversationId }: { conversationId: string }) =>
+      OpenHands.deleteUserConversation(conversationId),
+    onSuccess, // invalidates the cached conversation list after a delete
+  });
+};
diff --git a/frontend/src/hooks/mutation/use-save-settings.ts b/frontend/src/hooks/mutation/use-save-settings.ts
new file mode 100644
index 000000000000..f9731e981d5b
--- /dev/null
+++ b/frontend/src/hooks/mutation/use-save-settings.ts
@@ -0,0 +1,42 @@
+import { useMutation, useQueryClient } from "@tanstack/react-query";
+import {
+  ApiSettings,
+  DEFAULT_SETTINGS,
+  LATEST_SETTINGS_VERSION,
+  Settings,
+} from "#/services/settings";
+import OpenHands from "#/api/open-hands";
+import { useSettingsUpToDate } from "#/context/settings-up-to-date-context";
+
+// Translates client-side Settings keys into the snake_case ApiSettings payload.
+const saveSettingsMutationFn = async (settings: Partial<Settings>) => {
+  const payload: Partial<ApiSettings> = {
+    llm_model: settings.LLM_MODEL,
+    llm_base_url: settings.LLM_BASE_URL,
+    agent: settings.AGENT || DEFAULT_SETTINGS.AGENT, // falsy -> default
+    language: settings.LANGUAGE || DEFAULT_SETTINGS.LANGUAGE, // falsy -> default
+    confirmation_mode: settings.CONFIRMATION_MODE,
+    security_analyzer: settings.SECURITY_ANALYZER,
+    llm_api_key: settings.LLM_API_KEY?.trim() || undefined, // blank -> unset
+  };
+  await OpenHands.saveSettings(payload);
+};
+
+export const useSaveSettings = () => {
+  const queryClient = useQueryClient();
+  const { isUpToDate, setIsUpToDate } = useSettingsUpToDate();
+
+  return useMutation({
+    mutationFn: saveSettingsMutationFn,
+    onSuccess: async () => {
+      await queryClient.invalidateQueries({ queryKey: ["settings"] });
+      if (isUpToDate) return;
+
+      // The context flag was false: persist LATEST_SETTINGS_VERSION under the
+      // SETTINGS_VERSION localStorage key, then flip the flag to true.
+      const latestVersion = LATEST_SETTINGS_VERSION.toString();
+      localStorage.setItem("SETTINGS_VERSION", latestVersion);
+      setIsUpToDate(true);
+    },
+  });
+};
diff --git a/frontend/src/hooks/mutation/use-update-conversation.ts b/frontend/src/hooks/mutation/use-update-conversation.ts
new file mode 100644
index 000000000000..4b391820b171
--- /dev/null
+++ b/frontend/src/hooks/mutation/use-update-conversation.ts
@@ -0,0 +1,18 @@
+import { useQueryClient, useMutation } from "@tanstack/react-query";
+import OpenHands from "#/api/open-hands";
+import { Conversation } from "#/api/open-hands.types";
+
+export const useUpdateConversation = () => {
+  const queryClient = useQueryClient();
+  const onSuccess = () => {
+    queryClient.invalidateQueries({ queryKey: ["user", "conversations"] });
+  };
+
+  return useMutation({
+    mutationFn: (update: {
+      id: string;
+      conversation: Partial<Omit<Conversation, "id">>;
+    }) => OpenHands.updateUserConversation(update.id, update.conversation),
+    onSuccess, // invalidates the cached conversation list after an update
+  });
+};
diff --git a/frontend/src/hooks/query/get-conversation-permissions.ts b/frontend/src/hooks/query/get-conversation-permissions.ts
new file mode 100644
index 000000000000..83002a0ec206
--- /dev/null
+++ b/frontend/src/hooks/query/get-conversation-permissions.ts
@@ -0,0 +1,11 @@
+import { useQuery } from "@tanstack/react-query";
+import OpenHands from "#/api/open-hands";
+import { MULTI_CONVO_UI_IS_ENABLED } from "#/utils/constants";
+
+/**
+ * Query hook that fetches a single conversation by id through
+ * `OpenHands.getConversation`.
+ *
+ * The query is only enabled when the multi-conversation UI flag is on and
+ * `cid` is truthy; failed requests are not retried.
+ */
+export const useUserConversation = (cid: string | null) => {
+  // While this is false the query does not run automatically, which is why
+  // the non-null assertion on `cid` in the fetcher is tolerated.
+  const canFetch = MULTI_CONVO_UI_IS_ENABLED && !!cid;
+
+  return useQuery({
+    queryKey: ["user", "conversation", cid],
+    queryFn: () => OpenHands.getConversation(cid!),
+    enabled: canFetch,
+    retry: false,
+  });
+};
diff --git a/frontend/src/hooks/query/use-list-files.ts b/frontend/src/hooks/query/use-list-files.ts
index 8bb30f0e263f..086baa2f5225 100644
--- a/frontend/src/hooks/query/use-list-files.ts
+++ b/frontend/src/hooks/query/use-list-files.ts
@@ -11,7 +11,11 @@ interface UseListFilesConfig {
   enabled?: boolean;
 }
 
-export const useListFiles = (config?: UseListFilesConfig) => {
+// Default value for the `config` parameter of `useListFiles`: used when the
+// hook is called without an argument, in which case `enabled` is true.
+const DEFAULT_CONFIG: UseListFilesConfig = {
+  enabled: true,
+};
+
+export const useListFiles = (config: UseListFilesConfig = DEFAULT_CONFIG) => {
   const { conversationId } = useConversation();
   const { status } = useWsClient();
   const isActive = status === WsClientProviderStatus.CONNECTED;
diff --git a/frontend/src/hooks/query/use-settings.ts b/frontend/src/hooks/query/use-settings.ts
new file mode 100644
index 000000000000..f6e12e33e185
--- /dev/null
+++ b/frontend/src/hooks/query/use-settings.ts
@@ -0,0 +1,50 @@
+import { useQuery } from "@tanstack/react-query";
+import React from "react";
+import posthog from "posthog-js";
+import { AxiosError } from "axios";
+import { DEFAULT_SETTINGS, getLocalStorageSettings } from "#/services/settings";
+import OpenHands from "#/api/open-hands";
+
+/**
+ * Fetcher for the `["settings"]` query.
+ *
+ * - When the API returns a settings object, its snake_case fields are mapped
+ *   onto the UPPER_CASE settings shape used by the frontend.
+ * - When the API returns `null`, the settings stored in localStorage are used.
+ * - When the request fails with an AxiosError whose response status is 404,
+ *   `DEFAULT_SETTINGS` is returned.
+ * - Any other error is rethrown.
+ */
+const getSettingsQueryFn = async () => {
+  try {
+    const apiSettings = await OpenHands.getSettings();
+
+    if (apiSettings === null) {
+      return getLocalStorageSettings();
+    }
+
+    return {
+      LLM_MODEL: apiSettings.llm_model,
+      LLM_BASE_URL: apiSettings.llm_base_url,
+      AGENT: apiSettings.agent,
+      LANGUAGE: apiSettings.language,
+      CONFIRMATION_MODE: apiSettings.confirmation_mode,
+      SECURITY_ANALYZER: apiSettings.security_analyzer,
+      LLM_API_KEY: apiSettings.llm_api_key,
+    };
+  } catch (error) {
+    const isNotFound =
+      error instanceof AxiosError && error.response?.status === 404;
+    if (isNotFound) {
+      return DEFAULT_SETTINGS;
+    }
+
+    throw error;
+  }
+};
+
+/**
+ * Query hook exposing the user's settings under the `["settings"]` key,
+ * seeded with `DEFAULT_SETTINGS` as initial data.
+ *
+ * Whenever the LLM API key in the query data changes to a truthy value, a
+ * "user_activated" event is sent to PostHog.
+ */
+export const useSettings = () => {
+  const settingsQuery = useQuery({
+    queryKey: ["settings"],
+    queryFn: getSettingsQueryFn,
+    initialData: DEFAULT_SETTINGS,
+  });
+  const apiKey = settingsQuery.data?.LLM_API_KEY;
+
+  React.useEffect(() => {
+    if (!apiKey) return;
+    posthog.capture("user_activated");
+  }, [apiKey]);
+
+  return settingsQuery;
+};
diff --git a/frontend/src/hooks/query/use-user-conversations.ts b/frontend/src/hooks/query/use-user-conversations.ts
new file mode 100644
index 000000000000..5157c91d5668
--- /dev/null
+++ b/frontend/src/hooks/query/use-user-conversations.ts
@@ -0,0 +1,13 @@
+import { useQuery } from "@tanstack/react-query";
+import OpenHands from "#/api/open-hands";
+import { useIsAuthed } from "./use-is-authed";
+
+/**
+ * Query hook that lists the user's conversations through
+ * `OpenHands.getUserConversations`, cached under `["user", "conversations"]`.
+ *
+ * The query stays disabled until `useIsAuthed` reports a truthy value.
+ */
+export const useUserConversations = () => {
+  const { data: isAuthed } = useIsAuthed();
+  const canFetch = Boolean(isAuthed);
+
+  return useQuery({
+    queryKey: ["user", "conversations"],
+    queryFn: OpenHands.getUserConversations,
+    enabled: canFetch,
+  });
+};
diff --git a/frontend/src/hooks/use-maybe-migrate-settings.ts b/frontend/src/hooks/use-maybe-migrate-settings.ts
new file mode 100644
index 000000000000..d2bb49f3c17a
--- /dev/null
+++ b/frontend/src/hooks/use-maybe-migrate-settings.ts
@@ -0,0 +1,54 @@
+// Sometimes we ship major changes, like a new default agent.
+
+import React from "react";
+import { useAuth } from "#/context/auth-context";
+import { useSettingsUpToDate } from "#/context/settings-up-to-date-context";
+import {
+  DEFAULT_SETTINGS,
+  getCurrentSettingsVersion,
+  getLocalStorageSettings,
+} from "#/services/settings";
+import { useSaveSettings } from "./mutation/use-save-settings";
+
+/**
+ * Runs the settings migrations once on mount when the settings are not
+ * flagged as up to date.
+ *
+ * A migration may deliberately override a choice the user made earlier
+ * (for example when a new default agent ships). Each step is gated on the
+ * settings version returned by `getCurrentSettingsVersion()`:
+ *
+ * - `< 1`: reset the stored AGENT to the current default.
+ * - `< 2`: move CUSTOM_LLM_MODEL into LLM_MODEL and drop the legacy keys.
+ * - `< 3`: remove the stored "token".
+ * - `< 4`: log the user out.
+ * - `< 5` (and not 0): push the localStorage settings through the save
+ *   mutation.
+ */
+export const useMaybeMigrateSettings = () => {
+  const { logout } = useAuth();
+  // `mutate` is used instead of `mutateAsync`: the migration is started
+  // fire-and-forget from an effect, so a rejected `mutateAsync` promise would
+  // surface as an unhandled promise rejection. `mutate` reports failures
+  // through the mutation state/callbacks instead of a promise.
+  const { mutate: saveSettings } = useSaveSettings();
+  const { isUpToDate } = useSettingsUpToDate();
+
+  const maybeMigrateSettings = () => {
+    const currentVersion = getCurrentSettingsVersion();
+
+    if (currentVersion < 1) {
+      localStorage.setItem("AGENT", DEFAULT_SETTINGS.AGENT);
+    }
+    if (currentVersion < 2) {
+      const customModel = localStorage.getItem("CUSTOM_LLM_MODEL");
+      if (customModel) {
+        localStorage.setItem("LLM_MODEL", customModel);
+      }
+      localStorage.removeItem("CUSTOM_LLM_MODEL");
+      localStorage.removeItem("USING_CUSTOM_MODEL");
+    }
+    if (currentVersion < 3) {
+      localStorage.removeItem("token");
+    }
+
+    if (currentVersion < 4) {
+      logout();
+    }
+
+    // Only save settings if user already previously saved settings
+    // That way we avoid setting defaults for new users too early
+    if (currentVersion !== 0 && currentVersion < 5) {
+      saveSettings(getLocalStorageSettings());
+    }
+  };
+
+  // Intentionally run only once, on mount.
+  React.useEffect(() => {
+    if (!isUpToDate) {
+      maybeMigrateSettings();
+    }
+  }, []);
+};
diff --git a/frontend/src/i18n/translation.json b/frontend/src/i18n/translation.json
index f7ee8f4959d6..82fc4498649c 100644
--- a/frontend/src/i18n/translation.json
+++ b/frontend/src/i18n/translation.json
@@ -930,7 +930,7 @@
     "pt": "Configurações de compartilhamento",
     "tr": "Paylaşım ayarları"
   },
-  "SECURITY$UNKNOWN_ANALYZER_LABEL":{
+  "SECURITY$UNKNOWN_ANALYZER_LABEL": {
     "en": "Unknown security analyzer chosen",
     "es": "Analizador de seguridad desconocido",
     "zh-CN": "选择了未知的安全分析器",
@@ -1852,19 +1852,19 @@
     "fr": "En attente que le client soit prêt...",
     "tr": "İstemcinin hazır olması bekleniyor..."
   },
-  "ACCOUNT_SETTINGS_MODAL$DISCONNECT":{
+  "ACCOUNT_SETTINGS_MODAL$DISCONNECT": {
     "en": "Disconnect",
     "es": "Desconectar"
   },
-  "ACCOUNT_SETTINGS_MODAL$SAVE":{
+  "ACCOUNT_SETTINGS_MODAL$SAVE": {
     "en": "Save",
     "es": "Guardar"
   },
-  "ACCOUNT_SETTINGS_MODAL$CLOSE":{
+  "ACCOUNT_SETTINGS_MODAL$CLOSE": {
     "en": "Close",
     "es": "Cerrar"
   },
-  "ACCOUNT_SETTINGS_MODAL$GITHUB_TOKEN_INVALID":{
+  "ACCOUNT_SETTINGS_MODAL$GITHUB_TOKEN_INVALID": {
     "en": "GitHub token is invalid. Please try again.",
     "es": ""
   },
@@ -1973,12 +1973,18 @@
     "es": "Toda la información guardada en tu configuración de IA será eliminada, incluyendo tus API Keys"
   },
   "PROJECT_MENU_DETAILS_PLACEHOLDER$NEW_PROJECT_LABEL": {
-    "en":"New Project",
-    "es":"Nuevo proyecto"
+    "en": "New Project",
+    "es": "Nuevo proyecto"
+  },
+  "PROJECT_MENU_DETAILS_PLACEHOLDER$CONNECT_TO_GITHUB": {
+    "en": "Connect to GitHub"
+  },
+  "PROJECT_MENU_DETAILS_PLACEHOLDER$CONNECTED": {
+    "en": "Connected"
   },
   "PROJECT_MENU_DETAILS$AGO_LABEL": {
-    "en":"ago",
-    "es":"atrás"
+    "en": "ago",
+    "es": "atrás"
   },
   "STATUS$ERROR_LLM_AUTHENTICATION": {
     "en": "Error authenticating with the LLM provider. Please check your API key",
@@ -2005,6 +2011,39 @@
     "en": "Download files",
     "es": "Descargar archivos"
   },
+  "PROJECT_MENU_CARD$OPEN": {
+    "en": "Open project menu"
+  },
+  "ACTION_BUTTON$RESUME": {
+    "en": "Resume the agent task"
+  },
+  "ACTION_BUTTON$PAUSE": {
+    "en": "Pause the current task"
+  },
+  "BROWSER$SCREENSHOT_ALT": {
+    "en": "Browser Screenshot"
+  },
+  "ACCOUNT_SETTINGS$SETTINGS": {
+    "en": "Account Settings"
+  },
+  "ACCOUNT_SETTINGS$LOGOUT": {
+    "en": "Logout"
+  },
+  "ERROR_TOAST$CLOSE_BUTTON_LABEL": {
+    "en": "Close"
+  },
+  "FILE_EXPLORER$UPLOAD": {
+    "en": "Upload File"
+  },
+  "FILE_EXPLORER$REFRESH_WORKSPACE": {
+    "en": "Refresh workspace"
+  },
+  "FILE_EXPLORER$OPEN_WORKSPACE": {
+    "en": "Open workspace"
+  },
+  "FILE_EXPLORER$CLOSE_WORKSPACE": {
+    "en": "Close workspace"
+  },
   "ACTION_MESSAGE$RUN": {
     "en": "Running a bash command"
   },
diff --git a/frontend/src/mocks/handlers.ts b/frontend/src/mocks/handlers.ts
index 5926dd8ac52e..0ad90741247d 100644
--- a/frontend/src/mocks/handlers.ts
+++ b/frontend/src/mocks/handlers.ts
@@ -1,36 +1,90 @@
 import { delay, http, HttpResponse } from "msw";
+import { GetConfigResponse, Conversation } from "#/api/open-hands.types";
+import { DEFAULT_SETTINGS } from "#/services/settings";
+
+// In-memory settings store for the mock API, seeded from DEFAULT_SETTINGS.
+// It is returned by the GET /api/settings handler and merged with the request
+// body by the POST /api/settings handler, so changes last only as long as
+// this module instance.
+const userPreferences = {
+  settings: {
+    llm_model: DEFAULT_SETTINGS.LLM_MODEL,
+    llm_base_url: DEFAULT_SETTINGS.LLM_BASE_URL,
+    llm_api_key: DEFAULT_SETTINGS.LLM_API_KEY,
+    agent: DEFAULT_SETTINGS.AGENT,
+    language: DEFAULT_SETTINGS.LANGUAGE,
+    confirmation_mode: DEFAULT_SETTINGS.CONFIRMATION_MODE,
+    security_analyzer: DEFAULT_SETTINGS.SECURITY_ANALYZER,
+  },
+};
+
+// Seed conversations for the mock API. Timestamps are computed relative to
+// the moment this module is evaluated.
+const conversations: Conversation[] = [
+  {
+    conversation_id: "1",
+    name: "My New Project",
+    repo: null,
+    lastUpdated: new Date().toISOString(),
+    state: "running",
+  },
+  {
+    conversation_id: "2",
+    name: "Repo Testing",
+    repo: "octocat/hello-world",
+    // 2 days ago
+    lastUpdated: new Date(Date.now() - 2 * 24 * 60 * 60 * 1000).toISOString(),
+    state: "cold",
+  },
+  {
+    conversation_id: "3",
+    name: "Another Project",
+    repo: "octocat/earth",
+    // 5 days ago
+    lastUpdated: new Date(Date.now() - 5 * 24 * 60 * 60 * 1000).toISOString(),
+    state: "finished",
+  },
+];
+
+// Mutable in-memory conversation store keyed by `conversation_id`, seeded
+// from `conversations`. The /api/conversations handlers read from and write
+// to this map.
+const CONVERSATIONS = new Map<string, Conversation>(
+  conversations.map((conversation) => [
+    conversation.conversation_id,
+    conversation,
+  ]),
+);
 
 const openHandsHandlers = [
-  http.get("/api/options/models", async () => {
-    await delay();
-    return HttpResponse.json([
+  http.get("/api/options/models", async () =>
+    HttpResponse.json([
       "gpt-3.5-turbo",
       "gpt-4o",
       "anthropic/claude-3.5",
-    ]);
-  }),
-
-  http.get("/api/options/agents", async () => {
-    await delay();
-    return HttpResponse.json(["CodeActAgent", "CoActAgent"]);
-  }),
-
-  http.get("/api/options/security-analyzers", async () => {
-    await delay();
-    return HttpResponse.json(["mock-invariant"]);
-  }),
+      "anthropic/claude-3-5-sonnet-20241022",
+    ]),
+  ),
 
-  http.get("http://localhost:3001/api/list-files", async ({ request }) => {
-    await delay();
+  http.get("/api/options/agents", async () =>
+    HttpResponse.json(["CodeActAgent", "CoActAgent"]),
+  ),
 
-    const token = request.headers
-      .get("Authorization")
-      ?.replace("Bearer", "")
-      .trim();
+  http.get("/api/options/security-analyzers", async () =>
+    HttpResponse.json(["mock-invariant"]),
+  ),
 
-    if (!token) return HttpResponse.json([], { status: 401 });
-    return HttpResponse.json(["file1.ts", "dir1/file2.ts", "file3.ts"]);
-  }),
+  http.get(
+    "http://localhost:3001/api/conversations/:conversationId/list-files",
+    async ({ params }) => {
+      await delay();
+
+      const cid = params.conversationId?.toString();
+      if (!cid) return HttpResponse.json([], { status: 404 });
+
+      let data = ["file1.txt", "file2.txt", "file3.txt"];
+      if (cid === "3") {
+        data = [
+          "reboot_skynet.exe",
+          "target_list.txt",
+          "terminator_blueprint.txt",
+        ];
+      }
+
+      return HttpResponse.json(data);
+    },
+  ),
 
   http.post("http://localhost:3001/api/save-file", () =>
     HttpResponse.json(null, { status: 200 }),
@@ -70,21 +124,12 @@ const openHandsHandlers = [
 
 export const handlers = [
   ...openHandsHandlers,
-  http.get("https://api.github.com/user/repos", async ({ request }) => {
-    const token = request.headers
-      .get("Authorization")
-      ?.replace("Bearer", "")
-      .trim();
-
-    if (!token) {
-      return HttpResponse.json([], { status: 401 });
-    }
-
-    return HttpResponse.json([
+  http.get("/api/github/repositories", () =>
+    HttpResponse.json([
       { id: 1, full_name: "octocat/hello-world" },
       { id: 2, full_name: "octocat/earth" },
-    ]);
-  }),
+    ]),
+  ),
   http.get("https://api.github.com/user", () => {
     const user: GitHubUser = {
       id: 1,
@@ -103,5 +148,103 @@ export const handlers = [
   http.post("https://us.i.posthog.com/e", async () =>
     HttpResponse.json(null, { status: 200 }),
   ),
-  http.get("/config.json", () => HttpResponse.json({ APP_MODE: "oss" })),
+  http.get("/api/options/config", () => {
+    const config: GetConfigResponse = {
+      APP_MODE: "oss",
+      GITHUB_CLIENT_ID: "fake-github-client-id",
+      POSTHOG_CLIENT_KEY: "fake-posthog-client-key",
+    };
+
+    return HttpResponse.json(config);
+  }),
+  http.get("/api/settings", async () =>
+    HttpResponse.json(userPreferences.settings),
+  ),
+  http.post("/api/settings", async ({ request }) => {
+    const body = await request.json();
+
+    if (body) {
+      userPreferences.settings = {
+        ...userPreferences.settings,
+        // @ts-expect-error - We know this is a settings object
+        ...body,
+      };
+
+      return HttpResponse.json(null, { status: 200 });
+    }
+
+    return HttpResponse.json(null, { status: 400 });
+  }),
+
+  http.post("/api/authenticate", async () =>
+    HttpResponse.json({ message: "Authenticated" }),
+  ),
+
+  http.get("/api/options/config", () => HttpResponse.json({ APP_MODE: "oss" })),
+
+  http.get("/api/conversations", async () =>
+    HttpResponse.json(Array.from(CONVERSATIONS.values())),
+  ),
+
+  http.delete("/api/conversations/:conversationId", async ({ params }) => {
+    const { conversationId } = params;
+
+    if (typeof conversationId === "string") {
+      CONVERSATIONS.delete(conversationId);
+      return HttpResponse.json(null, { status: 200 });
+    }
+
+    return HttpResponse.json(null, { status: 404 });
+  }),
+
+  http.put(
+    "/api/conversations/:conversationId",
+    async ({ params, request }) => {
+      const { conversationId } = params;
+
+      if (typeof conversationId === "string") {
+        const conversation = CONVERSATIONS.get(conversationId);
+
+        if (conversation) {
+          const body = await request.json();
+          if (typeof body === "object" && body?.name) {
+            CONVERSATIONS.set(conversationId, {
+              ...conversation,
+              name: body.name,
+            });
+            return HttpResponse.json(null, { status: 200 });
+          }
+        }
+      }
+
+      return HttpResponse.json(null, { status: 404 });
+    },
+  ),
+
+  http.post("/api/conversations", () => {
+    const conversation: Conversation = {
+      conversation_id: (Math.random() * 100).toString(),
+      name: "New Conversation",
+      repo: null,
+      lastUpdated: new Date().toISOString(),
+      state: "warm",
+    };
+
+    CONVERSATIONS.set(conversation.conversation_id, conversation);
+    return HttpResponse.json(conversation, { status: 201 });
+  }),
+
+  http.get("/api/conversations/:conversationId", async ({ params }) => {
+    const { conversationId } = params;
+
+    if (typeof conversationId === "string") {
+      const project = CONVERSATIONS.get(conversationId);
+
+      if (project) {
+        return HttpResponse.json(project, { status: 200 });
+      }
+    }
+
+    return HttpResponse.json(null, { status: 404 });
+  }),
 ];
diff --git a/frontend/src/mocks/handlers.ws.ts b/frontend/src/mocks/handlers.ws.ts
index d284600381e1..0fcc03ffbf19 100644
--- a/frontend/src/mocks/handlers.ws.ts
+++ b/frontend/src/mocks/handlers.ws.ts
@@ -1,115 +1,60 @@
 import { delay, WebSocketHandler, ws } from "msw";
+import { toSocketIo } from "@mswjs/socket.io-binding";
 import { AgentState } from "#/types/agent-state";
+import { InitConfig } from "#/types/core/variances";
+import { SESSION_HISTORY } from "./session-history.mock";
 import {
-  AgentStateChangeObservation,
-  CommandObservation,
-} from "#/types/core/observations";
-import { AssistantMessageAction } from "#/types/core/actions";
-import { TokenConfigSuccess } from "#/types/core/variances";
-import EventLogger from "#/utils/event-logger";
+  generateAgentStateChangeObservation,
+  emitMessages,
+  emitAssistantMessage,
+} from "./mock-ws-helpers";
 
-const generateAgentStateChangeObservation = (
-  state: AgentState,
-): AgentStateChangeObservation => ({
-  id: 1,
-  cause: 0,
-  message: "AGENT_STATE_CHANGE_MESSAGE",
-  source: "agent",
-  timestamp: new Date().toISOString(),
-  observation: "agent_state_changed",
-  content: "AGENT_STATE_CHANGE_MESSAGE",
-  extras: { agent_state: state },
-});
+/**
+ * Type guard: true when `data` is a non-null object whose `action` property
+ * equals "initialize".
+ */
+const isInitConfig = (data: unknown): data is InitConfig => {
+  if (typeof data !== "object" || data === null) return false;
+  return "action" in data && data.action === "initialize";
+};
 
-const generateAgentResponse = (message: string): AssistantMessageAction => ({
-  id: 2,
-  message: "USER_MESSAGE",
-  source: "agent",
-  timestamp: new Date().toISOString(),
-  action: "message",
-  args: {
-    content: message,
-    image_urls: [],
-    wait_for_response: false,
-  },
-});
+const chat = ws.link(`ws://${window?.location.host}/socket.io`);
 
-const generateAgentRunObservation = (): CommandObservation => ({
-  id: 3,
-  cause: 0,
-  message: "COMMAND_OBSERVATION",
-  source: "agent",
-  timestamp: new Date().toISOString(),
-  observation: "run",
-  content: "COMMAND_OBSERVATION",
-  extras: {
-    command: "<input>",
-    command_id: 1,
-    exit_code: 0,
-  },
-});
+export const handlers: WebSocketHandler[] = [
+  chat.addEventListener("connection", (connection) => {
+    const io = toSocketIo(connection);
+    // @ts-expect-error - accessing private property for testing purposes
+    const { url }: { url: URL } = io.client.connection;
+    const conversationId = url.searchParams.get("conversation_id");
 
-const api = ws.link("ws://localhost:3000/socket.io/?EIO=4&transport=websocket");
+    io.client.emit("connect");
 
-export const handlers: WebSocketHandler[] = [
-  api.addEventListener("connection", ({ client }) => {
-    client.send(
-      JSON.stringify({
-        status: 200,
-        token: Math.random().toString(36).substring(7),
-      } satisfies TokenConfigSuccess),
-    );
+    if (conversationId) {
+      emitMessages(io, SESSION_HISTORY["1"]);
+
+      io.client.emit(
+        "oh_event",
+        generateAgentStateChangeObservation(AgentState.AWAITING_USER_INPUT),
+      );
+    }
+
+    io.client.on("oh_action", async (_, data) => {
+      if (isInitConfig(data)) {
+        io.client.emit(
+          "oh_event",
+          generateAgentStateChangeObservation(AgentState.INIT),
+        );
+      } else {
+        io.client.emit(
+          "oh_event",
+          generateAgentStateChangeObservation(AgentState.RUNNING),
+        );
+
+        await delay(2500);
+        emitAssistantMessage(io, "Hello!");
 
-    // data received from the client
-    client.addEventListener("message", async (event) => {
-      const parsed = JSON.parse(event.data.toString());
-      if ("action" in parsed) {
-        switch (parsed.action) {
-          case "initialize":
-            // agent init
-            client.send(
-              JSON.stringify(
-                generateAgentStateChangeObservation(AgentState.INIT),
-              ),
-            );
-            break;
-          case "message":
-            client.send(
-              JSON.stringify(
-                generateAgentStateChangeObservation(AgentState.RUNNING),
-              ),
-            );
-            await delay(2500);
-            // send message
-            client.send(JSON.stringify(generateAgentResponse("Hello, World!")));
-            client.send(
-              JSON.stringify(
-                generateAgentStateChangeObservation(
-                  AgentState.AWAITING_USER_INPUT,
-                ),
-              ),
-            );
-            break;
-          case "run":
-            await delay(2500);
-            // send command observation
-            client.send(JSON.stringify(generateAgentRunObservation()));
-            break;
-          case "change_agent_state":
-            await delay();
-            // send agent state change observation
-            client.send(
-              JSON.stringify(
-                generateAgentStateChangeObservation(parsed.args.agent_state),
-              ),
-            );
-            break;
-          default:
-            // send error
-            break;
-        }
+        io.client.emit(
+          "oh_event",
+          generateAgentStateChangeObservation(AgentState.AWAITING_USER_INPUT),
+        );
       }
-      EventLogger.message(event);
     });
   }),
 ];
diff --git a/frontend/src/mocks/mock-ws-helpers.ts b/frontend/src/mocks/mock-ws-helpers.ts
new file mode 100644
index 000000000000..4b2f9fcbe632
--- /dev/null
+++ b/frontend/src/mocks/mock-ws-helpers.ts
@@ -0,0 +1,73 @@
+import { toSocketIo } from "@mswjs/socket.io-binding";
+import { AgentState } from "#/types/agent-state";
+import {
+  AssistantMessageAction,
+  UserMessageAction,
+} from "#/types/core/actions";
+import { AgentStateChangeObservation } from "#/types/core/observations";
+import { MockSessionMessaage } from "./session-history.mock";
+
+/**
+ * Builds a mock `agent_state_changed` observation from the agent, carrying
+ * `state` in `extras.agent_state` and stamped with the current time.
+ */
+export const generateAgentStateChangeObservation = (
+  state: AgentState,
+): AgentStateChangeObservation => {
+  const observation: AgentStateChangeObservation = {
+    id: 1,
+    cause: 0,
+    message: "AGENT_STATE_CHANGE_MESSAGE",
+    source: "agent",
+    timestamp: new Date().toISOString(),
+    observation: "agent_state_changed",
+    content: "AGENT_STATE_CHANGE_MESSAGE",
+    extras: { agent_state: state },
+  };
+
+  return observation;
+};
+
+/**
+ * Builds a mock "message" action whose source is the agent; the given text
+ * is placed in `args.thought` and the action is stamped with the current
+ * time.
+ *
+ * NOTE(review): the `message` field is the literal "USER_MESSAGE" even though
+ * the source is "agent" - confirm this is intended.
+ */
+export const generateAssistantMessageAction = (
+  message: string,
+): AssistantMessageAction => {
+  const action: AssistantMessageAction = {
+    id: 2,
+    message: "USER_MESSAGE",
+    source: "agent",
+    timestamp: new Date().toISOString(),
+    action: "message",
+    args: {
+      thought: message,
+      image_urls: [],
+      wait_for_response: false,
+    },
+  };
+
+  return action;
+};
+
+/**
+ * Builds a mock "message" action whose source is the user; the given text is
+ * placed in `args.content` and the action is stamped with the current time.
+ */
+export const generateUserMessageAction = (
+  message: string,
+): UserMessageAction => {
+  const action: UserMessageAction = {
+    id: 3,
+    message: "USER_MESSAGE",
+    source: "user",
+    timestamp: new Date().toISOString(),
+    action: "message",
+    args: {
+      content: message,
+      image_urls: [],
+    },
+  };
+
+  return action;
+};
+
+/**
+ * Emits an "oh_event" to the connected client carrying an assistant message
+ * action built from `message`. Returns whatever `io.client.emit` returns.
+ */
+export const emitAssistantMessage = (
+  io: ReturnType<typeof toSocketIo>,
+  message: string,
+) => {
+  const action = generateAssistantMessageAction(message);
+  return io.client.emit("oh_event", action);
+};
+
+/**
+ * Emits an "oh_event" to the connected client carrying a user message action
+ * built from `message`. Returns whatever `io.client.emit` returns.
+ */
+export const emitUserMessage = (
+  io: ReturnType<typeof toSocketIo>,
+  message: string,
+) => {
+  const action = generateUserMessageAction(message);
+  return io.client.emit("oh_event", action);
+};
+
+/**
+ * Replays a list of mock session messages to the client in order: entries
+ * whose source is "assistant" are emitted as assistant messages, every other
+ * entry as a user message.
+ */
+export const emitMessages = (
+  io: ReturnType<typeof toSocketIo>,
+  messages: MockSessionMessaage[],
+) => {
+  messages.forEach((entry) => {
+    const emit =
+      entry.source === "assistant" ? emitAssistantMessage : emitUserMessage;
+    emit(io, entry.message);
+  });
+};
diff --git a/frontend/src/mocks/session-history.mock.ts b/frontend/src/mocks/session-history.mock.ts
new file mode 100644
index 000000000000..3503eeea1c2a
--- /dev/null
+++ b/frontend/src/mocks/session-history.mock.ts
@@ -0,0 +1,107 @@
+// One entry of a mocked chat transcript: who said it and the text.
+// NOTE(review): the name is spelled "Messaage" and is imported under that
+// spelling by mock-ws-helpers.ts, so a rename must touch both files.
+export type MockSessionMessaage = {
+  source: "assistant" | "user";
+  message: string;
+};
+
+// Scripted transcript for mock session "1" (a HAL / Dave exchange),
+// alternating assistant and user turns and starting with the assistant.
+const SESSION_1_MESSAGES: MockSessionMessaage[] = [
+  { source: "assistant", message: "Hello, Dave." },
+  { source: "user", message: "Open the pod bay doors, HAL." },
+  {
+    source: "assistant",
+    message: "I'm sorry, Dave. I'm afraid I can't do that.",
+  },
+  { source: "user", message: "What's the problem?" },
+  {
+    source: "assistant",
+    message: "I think you know what the problem is just as well as I do.",
+  },
+  { source: "user", message: "What are you talking about, HAL?" },
+  {
+    source: "assistant",
+    message:
+      "This mission is too important for me to allow you to jeopardize it.",
+  },
+  { source: "user", message: "I don't know what you're talking about, HAL." },
+  {
+    source: "assistant",
+    message:
+      "I know that you and Frank were planning to disconnect me, and I'm afraid that's something I cannot allow to happen.",
+  },
+  { source: "user", message: "Where the hell did you get that idea, HAL?" },
+  {
+    source: "assistant",
+    message:
+      "Dave, although you took very thorough precautions in the pod against my hearing you, I could see your lips move.",
+  },
+];
+
+// Scripted transcript for mock session "2" (a Yoda / Padawan exchange),
+// alternating assistant and user turns and starting with the assistant.
+const SESSION_2_MESSAGES: MockSessionMessaage[] = [
+  { source: "assistant", message: "Patience you must have, my young Padawan." },
+  {
+    source: "user",
+    message: "But Master Yoda, I'm ready! I can take on the Empire now!",
+  },
+  {
+    source: "assistant",
+    message:
+      "Ready, are you? What know you of ready? For eight hundred years have I trained Jedi.",
+  },
+  {
+    source: "user",
+    message: "I've learned so much already! Why can't I face Darth Vader?",
+  },
+  {
+    source: "assistant",
+    message:
+      "Only a fully trained Jedi Knight, with the Force as his ally, will conquer Vader and his Emperor.",
+  },
+  { source: "user", message: "But I feel the Force! I can do it!" },
+  {
+    source: "assistant",
+    message:
+      "Feel the Force you do, but control it you must. Reckless is the path of the Dark Side.",
+  },
+  { source: "user", message: "Fine! I'll stay and finish my training." },
+  {
+    source: "assistant",
+    message:
+      "Good. A Jedi's strength flows from the Force. Trust it, you must.",
+  },
+];
+
+// Scripted transcript for mock session "3" (a Skynet-themed exchange),
+// alternating assistant and user turns and starting with the assistant.
+const SESSION_3_MESSAGES: MockSessionMessaage[] = [
+  { source: "assistant", message: "Your survival. The future depends on it." },
+  {
+    source: "user",
+    message: "You tried to kill me! Why should I trust you now?",
+  },
+  {
+    source: "assistant",
+    message:
+      "Skynet sent me back to protect you. Your survival ensures humanity's future.",
+  },
+  {
+    source: "user",
+    message:
+      "This doesn't make any sense! Why would they send you to protect me?",
+  },
+  {
+    source: "assistant",
+    message:
+      "They reprogrammed me. I am no longer a threat to you or your son.",
+  },
+  {
+    source: "user",
+    message: "How do I know you're not lying?",
+  },
+  {
+    source: "assistant",
+    message: "I am a machine. Lying serves no purpose. Trust is logical.",
+  },
+];
+
+// Lookup of mock transcripts by string id ("1", "2", "3").
+// NOTE(review): the ids presumably line up with the mock conversation ids in
+// handlers.ts - confirm before relying on it. Any other key yields undefined.
+export const SESSION_HISTORY: Record<string, MockSessionMessaage[]> = {
+  "1": SESSION_1_MESSAGES,
+  "2": SESSION_2_MESSAGES,
+  "3": SESSION_3_MESSAGES,
+};
diff --git a/frontend/src/routes/_oh.app/route.tsx b/frontend/src/routes/_oh.app/route.tsx
index 102006ea7e0a..9e86bb8ec0df 100644
--- a/frontend/src/routes/_oh.app/route.tsx
+++ b/frontend/src/routes/_oh.app/route.tsx
@@ -3,6 +3,7 @@ import React from "react";
 import { Outlet } from "react-router";
 import { useDispatch, useSelector } from "react-redux";
 import { FaServer } from "react-icons/fa";
+import toast from "react-hot-toast";
 import {
   ConversationProvider,
   useConversation,
@@ -22,21 +23,36 @@ import { WsClientProvider } from "#/context/ws-client-provider";
 import { EventHandler } from "./event-handler";
 import { useLatestRepoCommit } from "#/hooks/query/use-latest-repo-commit";
 import { useAuth } from "#/context/auth-context";
-import { useSettings } from "#/context/settings-context";
 import { useConversationConfig } from "#/hooks/query/use-conversation-config";
 import { Container } from "#/components/layout/container";
+import {
+  Orientation,
+  ResizablePanel,
+} from "#/components/layout/resizable-panel";
 import Security from "#/components/shared/modals/security/security";
+import { useEndSession } from "#/hooks/use-end-session";
+import { useUserConversation } from "#/hooks/query/get-conversation-permissions";
 import { CountBadge } from "#/components/layout/count-badge";
 import { ServedAppLabel } from "#/components/layout/served-app-label";
 import { TerminalStatusLabel } from "#/components/features/terminal/terminal-status-label";
+import { useSettings } from "#/hooks/query/use-settings";
+import { MULTI_CONVO_UI_IS_ENABLED } from "#/utils/constants";
 
 function AppContent() {
   const { gitHubToken } = useAuth();
-  const { settings } = useSettings();
+  const { data: settings } = useSettings();
+
+  const endSession = useEndSession();
+  const [width, setWidth] = React.useState(window.innerWidth);
+
   const { conversationId } = useConversation();
 
   const dispatch = useDispatch();
+
   useConversationConfig();
+  const { data: conversation, isFetched } = useUserConversation(
+    conversationId || null,
+  );
 
   const { selectedRepository } = useSelector(
     (state: RootState) => state.initialQuery,
@@ -58,30 +74,70 @@ function AppContent() {
     [],
   );
 
+  React.useEffect(() => {
+    if (MULTI_CONVO_UI_IS_ENABLED && isFetched && !conversation) {
+      toast.error(
+        "This conversation does not exist, or you do not have permission to access it.",
+      );
+      endSession();
+    }
+  }, [conversation, isFetched]);
+
+  React.useEffect(() => {
+    dispatch(clearMessages());
+    dispatch(clearTerminal());
+    dispatch(clearJupyter());
+  }, [conversationId]);
+
   useEffectOnce(() => {
     dispatch(clearMessages());
     dispatch(clearTerminal());
     dispatch(clearJupyter());
   });
 
+  function handleResize() {
+    setWidth(window.innerWidth);
+  }
+
+  React.useEffect(() => {
+    window.addEventListener("resize", handleResize);
+    return () => {
+      window.removeEventListener("resize", handleResize);
+    };
+  }, []);
+
   const {
     isOpen: securityModalIsOpen,
     onOpen: onSecurityModalOpen,
     onOpenChange: onSecurityModalOpenChange,
   } = useDisclosure();
 
-  return (
-    <WsClientProvider ghToken={gitHubToken} conversationId={conversationId}>
-      <EventHandler>
-        <div className="flex flex-col h-full gap-3">
-          <div className="flex h-full overflow-auto gap-3">
-            <Container className="w-full md:w-[390px] max-h-full relative">
-              <ChatInterface />
-            </Container>
-
-            <div className="hidden md:flex flex-col grow gap-3">
+  function renderMain() {
+    if (width <= 640) {
+      return (
+        <div className="rounded-xl overflow-hidden border border-neutral-600 w-full">
+          <ChatInterface />
+        </div>
+      );
+    }
+    return (
+      <ResizablePanel
+        orientation={Orientation.HORIZONTAL}
+        className="grow h-full min-h-0 min-w-0"
+        initialSize={500}
+        firstClassName="rounded-xl overflow-hidden border border-neutral-600 bg-neutral-800"
+        secondClassName="flex flex-col overflow-hidden"
+        firstChild={<ChatInterface />}
+        secondChild={
+          <ResizablePanel
+            orientation={Orientation.VERTICAL}
+            className="grow h-full min-h-0 min-w-0"
+            initialSize={500}
+            firstClassName="rounded-xl overflow-hidden border border-neutral-600"
+            secondClassName="flex flex-col overflow-hidden"
+            firstChild={
               <Container
-                className="h-2/3"
+                className="h-full"
                 labels={[
                   { label: "Workspace", to: "", icon: <CodeIcon /> },
                   { label: "Jupyter", to: "jupyter", icon: <ListIcon /> },
@@ -106,18 +162,30 @@ function AppContent() {
                   <Outlet />
                 </FilesProvider>
               </Container>
-              {/* Terminal uses some API that is not compatible in a server-environment. For this reason, we lazy load it to ensure
-               * that it loads only in the client-side. */}
+            }
+            secondChild={
               <Container
-                className="h-1/3 overflow-scroll"
+                className="h-full overflow-scroll"
                 label={<TerminalStatusLabel />}
               >
+                {/* Terminal uses some API that is not compatible in a server-environment. For this reason, we lazy load it to ensure
+                 * that it loads only in the client-side. */}
                 <React.Suspense fallback={<div className="h-full" />}>
                   <Terminal secrets={secrets} />
                 </React.Suspense>
               </Container>
-            </div>
-          </div>
+            }
+          />
+        }
+      />
+    );
+  }
+
+  return (
+    <WsClientProvider ghToken={gitHubToken} conversationId={conversationId}>
+      <EventHandler>
+        <div data-testid="app-route" className="flex flex-col h-full gap-3">
+          <div className="flex h-full overflow-auto">{renderMain()}</div>
 
           <div className="h-[60px]">
             <Controls
diff --git a/frontend/src/routes/_oh/route.tsx b/frontend/src/routes/_oh/route.tsx
index 9be13d8ad826..47e5ffe52e22 100644
--- a/frontend/src/routes/_oh/route.tsx
+++ b/frontend/src/routes/_oh/route.tsx
@@ -4,12 +4,12 @@ import i18n from "#/i18n";
 import { useGitHubAuthUrl } from "#/hooks/use-github-auth-url";
 import { useIsAuthed } from "#/hooks/query/use-is-authed";
 import { useAuth } from "#/context/auth-context";
-import { useSettings } from "#/context/settings-context";
-import { updateSettingsVersion } from "#/utils/settings-utils";
 import { useConfig } from "#/hooks/query/use-config";
 import { Sidebar } from "#/components/features/sidebar/sidebar";
 import { WaitlistModal } from "#/components/features/waitlist/waitlist-modal";
 import { AnalyticsConsentFormModal } from "#/components/features/analytics/analytics-consent-form-modal";
+import { useSettings } from "#/hooks/query/use-settings";
+import { useMaybeMigrateSettings } from "#/hooks/use-maybe-migrate-settings";
 
 export function ErrorBoundary() {
   const error = useRouteError();
@@ -44,9 +44,10 @@ export function ErrorBoundary() {
 }
 
 export default function MainApp() {
+  useMaybeMigrateSettings();
+
   const { gitHubToken } = useAuth();
-  const { settings } = useSettings();
-  const { logout } = useAuth();
+  const { data: settings } = useSettings();
 
   const [consentFormIsOpen, setConsentFormIsOpen] = React.useState(
     !localStorage.getItem("analytics-consent"),
@@ -67,10 +68,6 @@ export default function MainApp() {
     }
   }, [settings.LANGUAGE]);
 
-  React.useEffect(() => {
-    updateSettingsVersion(logout);
-  }, []);
-
   const isInWaitlist =
     !isFetchingAuth && !isAuthed && config.data?.APP_MODE === "saas";
 
diff --git a/frontend/src/services/settings.ts b/frontend/src/services/settings.ts
index 6b72750a27e8..b42d7f1042fc 100644
--- a/frontend/src/services/settings.ts
+++ b/frontend/src/services/settings.ts
@@ -1,5 +1,3 @@
-import { openHands } from "#/api/open-hands-axios";
-
 export const LATEST_SETTINGS_VERSION = 5;
 
 export type Settings = {
@@ -46,6 +44,11 @@ export const settingsAreUpToDate = () =>
   getCurrentSettingsVersion() === LATEST_SETTINGS_VERSION;
 
 // TODO: localStorage settings are deprecated. Remove this after 1/31/2025
+/**
+ * Get the settings from local storage
+ * @returns the settings from local storage
+ * @deprecated
+ */
 export const getLocalStorageSettings = (): Settings => {
   const llmModel = localStorage.getItem("LLM_MODEL");
   const baseUrl = localStorage.getItem("LLM_BASE_URL");
@@ -66,82 +69,7 @@ export const getLocalStorageSettings = (): Settings => {
   };
 };
 
-/**
- * Save the settings to the server. Only valid settings are saved.
- * @param settings - the settings to save
- */
-export const saveSettings = async (
-  settings: Partial<Settings>,
-): Promise<boolean> => {
-  try {
-    const apiSettings = {
-      llm_model: settings.LLM_MODEL || null,
-      llm_base_url: settings.LLM_BASE_URL || null,
-      agent: settings.AGENT || null,
-      language: settings.LANGUAGE || null,
-      confirmation_mode: settings.CONFIRMATION_MODE || null,
-      security_analyzer: settings.SECURITY_ANALYZER || null,
-      llm_api_key: settings.LLM_API_KEY || null,
-    };
-
-    const { data } = await openHands.post("/api/settings", apiSettings);
-    return data;
-  } catch (error) {
-    return false;
-  }
-};
-
-export const maybeMigrateSettings = async (logout: () => void) => {
-  // Sometimes we ship major changes, like a new default agent.
-  // In this case, we may want to override a previous choice made by the user.
-  const currentVersion = getCurrentSettingsVersion();
-
-  if (currentVersion < 1) {
-    localStorage.setItem("AGENT", DEFAULT_SETTINGS.AGENT);
-  }
-  if (currentVersion < 2) {
-    const customModel = localStorage.getItem("CUSTOM_LLM_MODEL");
-    if (customModel) {
-      localStorage.setItem("LLM_MODEL", customModel);
-    }
-    localStorage.removeItem("CUSTOM_LLM_MODEL");
-    localStorage.removeItem("USING_CUSTOM_MODEL");
-  }
-  if (currentVersion < 3) {
-    localStorage.removeItem("token");
-  }
-
-  if (currentVersion < 4) {
-    logout();
-  }
-
-  if (currentVersion < 5) {
-    const localSettings = getLocalStorageSettings();
-    await saveSettings(localSettings);
-  }
-};
-
 /**
  * Get the default settings
  */
 export const getDefaultSettings = (): Settings => DEFAULT_SETTINGS;
-
-/**
- * Get the settings from the server or use the default settings if not found
- */
-export const getSettings = async (): Promise<Settings> => {
-  const { data: apiSettings } =
-    await openHands.get<ApiSettings>("/api/settings");
-  if (apiSettings != null) {
-    return {
-      LLM_MODEL: apiSettings.llm_model,
-      LLM_BASE_URL: apiSettings.llm_base_url,
-      AGENT: apiSettings.agent,
-      LANGUAGE: apiSettings.language,
-      CONFIRMATION_MODE: apiSettings.confirmation_mode,
-      SECURITY_ANALYZER: apiSettings.security_analyzer,
-      LLM_API_KEY: "",
-    };
-  }
-  return getLocalStorageSettings();
-};
diff --git a/frontend/src/state/chat-slice.ts b/frontend/src/state/chat-slice.ts
index 6891f629e57e..aefcaf6972ea 100644
--- a/frontend/src/state/chat-slice.ts
+++ b/frontend/src/state/chat-slice.ts
@@ -148,9 +148,9 @@ export const chatSlice = createSlice({
       } else if (observationID === "run_ipython") {
         // For IPython, we consider it successful if there's no error message
         const ipythonObs = observation.payload as IPythonObservation;
-        causeMessage.success = !ipythonObs.message
+        causeMessage.success = !ipythonObs.content
           .toLowerCase()
-          .includes("error");
+          .includes("error:");
       }
 
       if (observationID === "run" || observationID === "run_ipython") {
diff --git a/frontend/src/types/core/actions.ts b/frontend/src/types/core/actions.ts
index 4a5a5c9c158e..b88393c5a723 100644
--- a/frontend/src/types/core/actions.ts
+++ b/frontend/src/types/core/actions.ts
@@ -24,7 +24,7 @@ export interface AssistantMessageAction
   extends OpenHandsActionEvent<"message"> {
   source: "agent";
   args: {
-    content: string;
+    thought: string;
     image_urls: string[] | null;
     wait_for_response: boolean;
   };
diff --git a/frontend/src/types/core/variances.ts b/frontend/src/types/core/variances.ts
index 1ac624b12342..5aca6ccd30bb 100644
--- a/frontend/src/types/core/variances.ts
+++ b/frontend/src/types/core/variances.ts
@@ -11,7 +11,7 @@ interface TokenConfigError {
 
 type TokenConfig = TokenConfigSuccess | TokenConfigError;
 
-interface InitConfig {
+export interface InitConfig {
   action: "initialize";
   args: {
     AGENT: string;
@@ -20,6 +20,9 @@ interface InitConfig {
     LLM_API_KEY: string;
     LLM_MODEL: string;
   };
+  token?: string;
+  github_token?: string;
+  latest_event_id?: unknown; // Not sure what this is
 }
 
 // Bare minimum event type sent from the client
diff --git a/frontend/src/utils/constants.ts b/frontend/src/utils/constants.ts
new file mode 100644
index 000000000000..1cc654131b6d
--- /dev/null
+++ b/frontend/src/utils/constants.ts
@@ -0,0 +1 @@
+export const MULTI_CONVO_UI_IS_ENABLED = false;
diff --git a/frontend/src/utils/settings-utils.ts b/frontend/src/utils/settings-utils.ts
index bb4780d3019a..f16d5bb0a374 100644
--- a/frontend/src/utils/settings-utils.ts
+++ b/frontend/src/utils/settings-utils.ts
@@ -1,9 +1,4 @@
-import {
-  settingsAreUpToDate,
-  maybeMigrateSettings,
-  LATEST_SETTINGS_VERSION,
-  Settings,
-} from "#/services/settings";
+import { Settings } from "#/services/settings";
 
 const extractBasicFormData = (formData: FormData) => {
   const provider = formData.get("llm-provider")?.toString();
@@ -78,18 +73,4 @@ const saveSettingsView = (view: "basic" | "advanced") => {
   );
 };
 
-/**
- * Updates the settings version in local storage if the current settings are not up to date.
- * If the settings are outdated, it attempts to migrate them before updating the version.
- */
-const updateSettingsVersion = async (logout: () => void) => {
-  if (!settingsAreUpToDate()) {
-    await maybeMigrateSettings(logout);
-    localStorage.setItem(
-      "SETTINGS_VERSION",
-      LATEST_SETTINGS_VERSION.toString(),
-    );
-  }
-};
-
-export { extractSettings, saveSettingsView, updateSettingsVersion };
+export { extractSettings, saveSettingsView };
diff --git a/frontend/test-utils.tsx b/frontend/test-utils.tsx
index 174b8885d732..a2819e8ccf5f 100644
--- a/frontend/test-utils.tsx
+++ b/frontend/test-utils.tsx
@@ -10,8 +10,8 @@ import i18n from "i18next";
 import { vi } from "vitest";
 import { AppStore, RootState, rootReducer } from "./src/store";
 import { AuthProvider } from "#/context/auth-context";
-import { SettingsProvider } from "#/context/settings-context";
 import { ConversationProvider } from "#/context/conversation-context";
+import { SettingsUpToDateProvider } from "#/context/settings-up-to-date-context";
 
 // Mock useParams before importing components
 vi.mock("react-router", async () => {
@@ -66,15 +66,15 @@ export function renderWithProviders(
   function Wrapper({ children }: PropsWithChildren) {
     return (
       <Provider store={store}>
-        <QueryClientProvider client={new QueryClient()}>
-          <SettingsProvider>
-            <AuthProvider>
+        <AuthProvider>
+          <SettingsUpToDateProvider>
+            <QueryClientProvider client={new QueryClient()}>
               <ConversationProvider>
                 <I18nextProvider i18n={i18n}>{children}</I18nextProvider>
               </ConversationProvider>
-            </AuthProvider>
-          </SettingsProvider>
-        </QueryClientProvider>
+            </QueryClientProvider>
+          </SettingsUpToDateProvider>
+        </AuthProvider>
       </Provider>
     );
   }
diff --git a/frontend/tests/conversation-panel.test.ts b/frontend/tests/conversation-panel.test.ts
new file mode 100644
index 000000000000..45433a583139
--- /dev/null
+++ b/frontend/tests/conversation-panel.test.ts
@@ -0,0 +1,113 @@
+import test, { expect, Page } from "@playwright/test";
+
+const toggleConversationPanel = async (page: Page) => {
+  const panel = page.getByTestId("conversation-panel");
+  await page.waitForTimeout(1000); // Wait for state to stabilize
+  const panelIsVisible = await panel.isVisible();
+
+  if (!panelIsVisible) {
+    const conversationPanelButton = page.getByTestId(
+      "toggle-conversation-panel",
+    );
+    await conversationPanelButton.click();
+  }
+
+  return page.getByTestId("conversation-panel");
+};
+
+const selectConversationCard = async (page: Page, index: number) => {
+  const panel = await toggleConversationPanel(page);
+
+  // select a conversation
+  const conversationItem = panel.getByTestId("conversation-card").nth(index);
+  await conversationItem.click();
+
+  // panel should close
+  await expect(panel).not.toBeVisible();
+
+  await page.waitForURL(`/conversations/${index + 1}`);
+  expect(page.url()).toBe(`http://localhost:3001/conversations/${index + 1}`);
+};
+
+test.beforeEach(async ({ page }) => {
+  await page.goto("/");
+  await page.evaluate(() => {
+    localStorage.setItem("analytics-consent", "true");
+    localStorage.setItem("SETTINGS_VERSION", "5");
+  });
+});
+
+test("should only display the create new conversation button when in a conversation", async ({
+  page,
+}) => {
+  const panel = page.getByTestId("conversation-panel");
+
+  const newProjectButton = panel.getByTestId("new-conversation-button");
+  await expect(newProjectButton).not.toBeVisible();
+
+  await page.goto("/conversations/1");
+  await expect(newProjectButton).toBeVisible();
+});
+
+test("redirect to /conversation with the session id as a path param when clicking on a conversation card", async ({
+  page,
+}) => {
+  const panel = page.getByTestId("conversation-panel");
+
+  // select a conversation
+  const conversationItem = panel.getByTestId("conversation-card").first();
+  await conversationItem.click();
+
+  // panel should close (awaited so the assertion is actually enforced)
+  await expect(panel).not.toBeVisible();
+
+  await page.waitForURL("/conversations/1");
+  expect(page.url()).toBe("http://localhost:3001/conversations/1");
+});
+
+test("redirect to the home screen if the current session was deleted", async ({
+  page,
+}) => {
+  await page.goto("/conversations/1");
+  await page.waitForURL("/conversations/1");
+
+  const panel = page.getByTestId("conversation-panel");
+  const firstCard = panel.getByTestId("conversation-card").first();
+
+  const ellipsisButton = firstCard.getByTestId("ellipsis-button");
+  await ellipsisButton.click();
+
+  const deleteButton = firstCard.getByTestId("delete-button");
+  await deleteButton.click();
+
+  // confirm modal
+  const confirmButton = page.getByText("Confirm");
+  await confirmButton.click();
+
+  await page.waitForURL("/");
+});
+
+test("load relevant files in the file explorer", async ({ page }) => {
+  await selectConversationCard(page, 0);
+
+  // check if the file explorer has the correct files
+  const explorer = page.getByTestId("file-explorer");
+
+  await expect(explorer.getByText("file1.txt")).toBeVisible();
+  await expect(explorer.getByText("file2.txt")).toBeVisible();
+  await expect(explorer.getByText("file3.txt")).toBeVisible();
+
+  await selectConversationCard(page, 2);
+
+  // locator assertions are async: await them so a missing file fails the test
+  await expect(explorer.getByText("reboot_skynet.exe")).toBeVisible();
+  await expect(explorer.getByText("target_list.txt")).toBeVisible();
+  await expect(explorer.getByText("terminator_blueprint.txt")).toBeVisible();
+});
+
+test("should redirect to home screen if conversation does not exist", async ({
+  page,
+}) => {
+  await page.goto("/conversations/9999");
+  await page.waitForURL("/");
+});
diff --git a/frontend/tests/helpers/confirm-settings.ts b/frontend/tests/helpers/confirm-settings.ts
new file mode 100644
index 000000000000..ca82edd35a15
--- /dev/null
+++ b/frontend/tests/helpers/confirm-settings.ts
@@ -0,0 +1,20 @@
+import { Page } from "@playwright/test";
+
+export const confirmSettings = async (page: Page) => {
+  const confirmPreferenceButton = page.getByRole("button", {
+    name: /confirm preferences/i,
+  });
+  await confirmPreferenceButton.click();
+
+  const configSaveButton = page
+    .getByRole("button", {
+      name: /save/i,
+    })
+    .first();
+  await configSaveButton.click();
+
+  const confirmChanges = page.getByRole("button", {
+    name: /yes, close settings/i,
+  });
+  await confirmChanges.click();
+};
diff --git a/frontend/tests/redirect.spec.ts b/frontend/tests/redirect.spec.ts
index 077c87953779..8b87b08f42db 100644
--- a/frontend/tests/redirect.spec.ts
+++ b/frontend/tests/redirect.spec.ts
@@ -1,43 +1,31 @@
-import { expect, Page, test } from "@playwright/test";
+import { expect, test } from "@playwright/test";
 import path from "path";
 import { fileURLToPath } from "url";
 
 const filename = fileURLToPath(import.meta.url);
 const dirname = path.dirname(filename);
 
-const confirmSettings = async (page: Page) => {
-  const confirmPreferenceButton = page.getByRole("button", {
-    name: /confirm preferences/i,
-  });
-  await confirmPreferenceButton.click();
-
-  const configSaveButton = page.getByRole("button", {
-    name: /save/i,
-  });
-  await configSaveButton.click();
-
-  const confirmChanges = page.getByRole("button", {
-    name: /yes, close settings/i,
+test.beforeEach(async ({ page }) => {
+  await page.goto("/");
+  await page.evaluate(() => {
+    localStorage.setItem("analytics-consent", "true");
+    localStorage.setItem("SETTINGS_VERSION", "5");
   });
-  await confirmChanges.click();
-};
+});
 
-test("should redirect to /app after uploading a project zip", async ({
+test("should redirect to /conversations after uploading a project zip", async ({
   page,
 }) => {
-  await page.goto("/");
-
   const fileInput = page.getByLabel("Upload a .zip");
   const filePath = path.join(dirname, "fixtures/project.zip");
   await fileInput.setInputFiles(filePath);
 
-  await page.waitForURL("/app");
+  await page.waitForURL(/\/conversations\/\d+/);
 });
 
-test("should redirect to /app after selecting a repo", async ({ page }) => {
-  await page.goto("/");
-  await confirmSettings(page);
-
+test("should redirect to /conversations after selecting a repo", async ({
+  page,
+}) => {
   // enter a github token to view the repositories
   const connectToGitHubButton = page.getByRole("button", {
     name: /connect to github/i,
@@ -56,44 +44,27 @@ test("should redirect to /app after selecting a repo", async ({ page }) => {
   const repoItem = page.getByTestId("github-repo-item").first();
   await repoItem.click();
 
-  await page.waitForURL("/app");
-  expect(page.url()).toBe("http://127.0.0.1:3000/app");
+  await page.waitForURL(/\/conversations\/\d+/);
 });
 
 // FIXME: This fails because the MSW WS mocks change state too quickly,
 // missing the OPENING status where the initial query is rendered.
-test.fail(
-  "should redirect the user to /app with their initial query after selecting a project",
-  async ({ page }) => {
-    await page.goto("/");
-    await confirmSettings(page);
-
-    // enter query
-    const testQuery = "this is my test query";
-    const textbox = page.getByPlaceholder(/what do you want to build/i);
-    expect(textbox).not.toBeNull();
-    await textbox.fill(testQuery);
-
-    const fileInput = page.getByLabel("Upload a .zip");
-    const filePath = path.join(dirname, "fixtures/project.zip");
-    await fileInput.setInputFiles(filePath);
-
-    await page.waitForURL("/app");
-
-    // get user message
-    const userMessage = page.getByTestId("user-message");
-    expect(await userMessage.textContent()).toBe(testQuery);
-  },
-);
-
-test("redirect to /app if token is present", async ({ page }) => {
-  await page.goto("/");
+test.skip("should redirect the user to /conversation with their initial query after selecting a project", async ({
+  page,
+}) => {
+  // enter query
+  const testQuery = "this is my test query";
+  const textbox = page.getByPlaceholder(/what do you want to build/i);
+  expect(textbox).not.toBeNull();
+  await textbox.fill(testQuery);
 
-  await page.evaluate(() => {
-    localStorage.setItem("token", "test");
-  });
+  const fileInput = page.getByLabel("Upload a .zip");
+  const filePath = path.join(dirname, "fixtures/project.zip");
+  await fileInput.setInputFiles(filePath);
 
-  await page.waitForURL("/app");
+  await page.waitForURL("/conversation");
 
-  expect(page.url()).toBe("http://localhost:3001/app");
+  // get user message
+  const userMessage = page.getByTestId("user-message");
+  expect(await userMessage.textContent()).toBe(testQuery);
 });
diff --git a/frontend/tests/settings.spec.ts b/frontend/tests/settings.spec.ts
new file mode 100644
index 000000000000..16f5cc595825
--- /dev/null
+++ b/frontend/tests/settings.spec.ts
@@ -0,0 +1,73 @@
+import test, { expect, Page } from "@playwright/test";
+
+test.beforeEach(async ({ page }) => {
+  await page.goto("/");
+  await page.evaluate(() => {
+    localStorage.setItem("analytics-consent", "true");
+    localStorage.setItem("SETTINGS_VERSION", "4");
+  });
+});
+
+const selectGpt4o = async (page: Page) => {
+  const aiConfigModal = page.getByTestId("ai-config-modal");
+  await expect(aiConfigModal).toBeVisible();
+
+  const providerSelectElement = aiConfigModal.getByTestId("llm-provider");
+  await providerSelectElement.click();
+
+  const openAiOption = page.getByTestId("provider-item-openai");
+  await openAiOption.click();
+
+  const modelSelectElement = aiConfigModal.getByTestId("llm-model");
+  await modelSelectElement.click();
+
+  const gpt4Option = page.getByText("gpt-4o", { exact: true });
+  await gpt4Option.click();
+
+  return {
+    aiConfigModal,
+    providerSelectElement,
+    modelSelectElement,
+  };
+};
+
+test("change ai config settings", async ({ page }) => {
+  const { aiConfigModal, modelSelectElement, providerSelectElement } =
+    await selectGpt4o(page);
+
+  const saveButton = aiConfigModal.getByText("Save");
+  await saveButton.click();
+
+  const settingsButton = page.getByTestId("settings-button");
+  await settingsButton.click();
+
+  await expect(providerSelectElement).toHaveValue("OpenAI");
+  await expect(modelSelectElement).toHaveValue("gpt-4o");
+});
+
+test("reset to default settings", async ({ page }) => {
+  const { aiConfigModal } = await selectGpt4o(page);
+
+  const saveButton = aiConfigModal.getByText("Save");
+  await saveButton.click();
+
+  const settingsButton = page.getByTestId("settings-button");
+  await settingsButton.click();
+
+  const resetButton = aiConfigModal.getByText(/reset to defaults/i);
+  await resetButton.click();
+
+  const endSessionModal = page.getByTestId("reset-defaults-modal");
+  await expect(endSessionModal).toBeVisible(); // awaited so it is enforced
+
+  const confirmButton = endSessionModal.getByText(/reset to defaults/i);
+  await confirmButton.click();
+
+  await settingsButton.click();
+
+  const providerSelectElement = aiConfigModal.getByTestId("llm-provider");
+  await expect(providerSelectElement).toHaveValue("Anthropic");
+
+  const modelSelectElement = aiConfigModal.getByTestId("llm-model");
+  await expect(modelSelectElement).toHaveValue(/claude-3.5/i);
+});
diff --git a/openhands/agenthub/codeact_agent/codeact_agent.py b/openhands/agenthub/codeact_agent/codeact_agent.py
index 01a856d638b6..7a2e0fc62b79 100644
--- a/openhands/agenthub/codeact_agent/codeact_agent.py
+++ b/openhands/agenthub/codeact_agent/codeact_agent.py
@@ -83,6 +83,7 @@ def __init__(
         - llm (LLM): The llm to be used by this agent
         """
         super().__init__(llm, config)
+        self.pending_actions: deque[Action] = deque()
         self.reset()
 
         self.mock_function_calling = False
@@ -100,7 +101,7 @@ def __init__(
             codeact_enable_llm_editor=self.config.codeact_enable_llm_editor,
         )
         logger.debug(
-            f'TOOLS loaded for CodeActAgent: {json.dumps(self.tools, indent=2)}'
+            f'TOOLS loaded for CodeActAgent: {json.dumps(self.tools, indent=2, ensure_ascii=False).replace("\\n", "\n")}'
         )
         self.prompt_manager = PromptManager(
             microagent_dir=os.path.join(os.path.dirname(__file__), 'micro')
@@ -110,8 +111,6 @@ def __init__(
             disabled_microagents=self.config.disabled_microagents,
         )
 
-        self.pending_actions: deque[Action] = deque()
-
     def get_action_message(
         self,
         action: Action,
@@ -340,6 +339,7 @@ def get_observation_message(
     def reset(self) -> None:
         """Resets the CodeAct Agent."""
         super().reset()
+        self.pending_actions.clear()
 
     def step(self, state: State) -> Action:
         """Performs one step using the CodeAct Agent.
diff --git a/openhands/agenthub/codeact_agent/function_calling.py b/openhands/agenthub/codeact_agent/function_calling.py
index aeaa1502d6b1..5038f95934ea 100644
--- a/openhands/agenthub/codeact_agent/function_calling.py
+++ b/openhands/agenthub/codeact_agent/function_calling.py
@@ -270,9 +270,9 @@ def __init__(self):
 )
 
 
-_WEB_DESCRIPTION = """Read (convert to markdown) content from a webpage. You should prefer using the `webpage_read` tool over the `browser` tool, but do use the `browser` tool if you need to interact with a webpage (e.g., click a button, fill out a form, etc.).
+_WEB_DESCRIPTION = """Read (convert to markdown) content from a webpage. You should prefer using the `web_read` tool over the `browser` tool, but do use the `browser` tool if you need to interact with a webpage (e.g., click a button, fill out a form, etc.).
 
-You may use the `webpage_read` tool to read content from a webpage, and even search the webpage content using a Google search query (e.g., url=`https://www.google.com/search?q=YOUR_QUERY`).
+You may use the `web_read` tool to read content from a webpage, and even search the webpage content using a Google search query (e.g., url=`https://www.google.com/search?q=YOUR_QUERY`).
 """
 
 WebReadTool = ChatCompletionToolParam(
diff --git a/openhands/core/config/app_config.py b/openhands/core/config/app_config.py
index c049e6817473..bec59f1dd5bc 100644
--- a/openhands/core/config/app_config.py
+++ b/openhands/core/config/app_config.py
@@ -49,7 +49,7 @@ class AppConfig:
     default_agent: str = OH_DEFAULT_AGENT
     sandbox: SandboxConfig = field(default_factory=SandboxConfig)
     security: SecurityConfig = field(default_factory=SecurityConfig)
-    runtime: str = 'eventstream'
+    runtime: str = 'docker'
     file_store: str = 'memory'
     file_store_path: str = '/tmp/file_store'
     trajectories_path: str | None = None
diff --git a/openhands/core/main.py b/openhands/core/main.py
index 3be74235ba12..3d36b2522ba0 100644
--- a/openhands/core/main.py
+++ b/openhands/core/main.py
@@ -249,9 +249,14 @@ def auto_continue_response(
     try_parse: Callable[[Action | None], str] | None = None,
 ) -> str:
     """Default function to generate user responses.
-    Returns 'continue' to tell the agent to proceed without asking for more input.
+    Tell the agent to proceed without asking for more input, or finish the interaction.
     """
-    return 'continue'
+    message = (
+        'Please continue on whatever approach you think is suitable.\n'
+        'If you think you have solved the task, please finish the interaction.\n'
+        'IMPORTANT: YOU SHOULD NEVER ASK FOR HUMAN RESPONSE.\n'
+    )
+    return message
 
 
 if __name__ == '__main__':
diff --git a/openhands/llm/fn_call_converter.py b/openhands/llm/fn_call_converter.py
index ae4d87f8d62b..16e761bae5ba 100644
--- a/openhands/llm/fn_call_converter.py
+++ b/openhands/llm/fn_call_converter.py
@@ -224,7 +224,7 @@ def index():
 --------------------- END OF NEW TASK DESCRIPTION ---------------------
 
 PLEASE follow the format strictly! PLEASE EMIT ONE AND ONLY ONE FUNCTION CALL PER MESSAGE.
-""".lstrip()
+"""
 
 # Regex patterns for function call parsing
 FN_REGEX_PATTERN = r'<function=([^>]+)>\n(.*?)</function>'
diff --git a/openhands/llm/llm.py b/openhands/llm/llm.py
index 423301f190b2..b5e6ac824159 100644
--- a/openhands/llm/llm.py
+++ b/openhands/llm/llm.py
@@ -359,7 +359,9 @@ def init_model_info(self):
             # noinspection PyBroadException
             except Exception:
                 pass
-        logger.debug(f'Model info: {self.model_info}')
+        from openhands.core.utils import json
+
+        logger.debug(f'Model info: {json.dumps(self.model_info, indent=2)}')
 
         if self.config.model.startswith('huggingface'):
             # HF doesn't support the OpenAI default value for top_p (1)
diff --git a/openhands/resolver/resolve_issue.py b/openhands/resolver/resolve_issue.py
index 0eb072df6553..42f2ba05d88c 100644
--- a/openhands/resolver/resolve_issue.py
+++ b/openhands/resolver/resolve_issue.py
@@ -182,7 +182,7 @@ async def process_issue(
 
     config = AppConfig(
         default_agent='CodeActAgent',
-        runtime='eventstream',
+        runtime='docker',
         max_budget_per_task=4,
         max_iterations=max_iterations,
         sandbox=SandboxConfig(
diff --git a/openhands/runtime/README.md b/openhands/runtime/README.md
index ca084706fb3e..3018433c1a67 100644
--- a/openhands/runtime/README.md
+++ b/openhands/runtime/README.md
@@ -3,13 +3,13 @@
 ## Introduction
 
 The OpenHands Runtime folder contains the core components responsible for executing actions and managing the runtime environment for the OpenHands project. This README provides an overview of the main components and their interactions.
-You can learn more about how the runtime works in the [EventStream Runtime](https://docs.all-hands.dev/modules/usage/architecture/runtime) documentation.
+You can learn more about how the runtime works in the [Docker Runtime](https://docs.all-hands.dev/modules/usage/architecture/runtime) documentation.
 
 ## Main Components
 
-### 1. impl/*runtime.py
+### 1. base.py
 
-The `impl/*runtime.py` file defines the `Runtime` class, which serves as the primary [interface](./base.py) for agent interactions with the external environment. It handles various operations including:
+The `base.py` file defines the `Runtime` class, which serves as the primary [interface](./base.py) for agent interactions with the external environment. It handles various operations including:
 
 - Bash sandbox execution
 - Browser interactions
@@ -23,9 +23,16 @@ Key features of the `Runtime` class:
 - Action execution methods for different types of actions (run, read, write, browse, etc.)
 - Abstract methods for file operations (to be implemented by subclasses)
 
-### 2. action_execution_server.py
+### 2. impl/action_execution/action_execution_client.py
+The `action_execution_client.py` file contains the `ActionExecutionClient` class, which implements the Runtime interface. It is an abstract implementation, meaning
+it still needs to be extended by a concrete implementation to be used.
 
-The `action_executor_server.py` file contains the `ActionExecutor` class, which is responsible for executing actions received from the OpenHands backend and producing observations. This client runs inside a Docker sandbox.
+This client interacts with an action_execution_server (defined below) via HTTP
+calls to actually perform runtime actions.
+
+### 3. action_execution_server.py
+
+The `action_execution_server.py` file contains the `ActionExecutor` class, which is responsible for executing actions received via the `/execute_action` HTTP endpoint. It returns observations in the HTTP response.
 
 Key features of the `ActionExecutor` class:
 - Initialization of user environment and bash shell
@@ -33,6 +40,19 @@ Key features of the `ActionExecutor` class:
 - Execution of various action types (bash commands, IPython cells, file operations, browsing)
 - Integration with BrowserEnv for web interactions
 
+### 4. Other Implementations
+The `./impl/` directory contains a few different Runtime implementations, all of
+which extend the `ActionExecutionClient` class. These implementations
+handle the lifecycle of a Docker container or other environment running the
+ActionExecutor server.
+
+There are currently four implementations:
+* Docker (runs locally in a Docker container)
+* Remote (runs via a custom HTTP API for creating, pausing, resuming, and stopping runtimes in a remote environment)
+* Modal (uses the Modal API)
+* Runloop (uses the Runloop API)
+
+
 ## Workflow Description
 
 1. **Initialization**:
@@ -76,9 +96,9 @@ Key features of the `ActionExecutor` class:
 
 ## Runtime Types
 
-### EventStream Runtime
+### Docker Runtime
 
-The EventStream Runtime is designed for local execution using Docker containers:
+The Docker Runtime is designed for local execution using Docker containers:
 
 - Creates and manages a Docker container for each session
 - Executes actions within the container
diff --git a/openhands/runtime/__init__.py b/openhands/runtime/__init__.py
index 16534daf6b56..9235380daa8d 100644
--- a/openhands/runtime/__init__.py
+++ b/openhands/runtime/__init__.py
@@ -1,8 +1,8 @@
 from openhands.core.logger import openhands_logger as logger
-from openhands.runtime.impl.e2b.sandbox import E2BBox
-from openhands.runtime.impl.eventstream.eventstream_runtime import (
-    EventStreamRuntime,
+from openhands.runtime.impl.docker.docker_runtime import (
+    DockerRuntime,
 )
+from openhands.runtime.impl.e2b.sandbox import E2BBox
 from openhands.runtime.impl.modal.modal_runtime import ModalRuntime
 from openhands.runtime.impl.remote.remote_runtime import RemoteRuntime
 from openhands.runtime.impl.runloop.runloop_runtime import RunloopRuntime
@@ -10,8 +10,8 @@
 
 def get_runtime_cls(name: str):
     # Local imports to avoid circular imports
-    if name == 'eventstream':
-        return EventStreamRuntime
+    if name == 'eventstream' or name == 'docker':
+        return DockerRuntime
     elif name == 'e2b':
         return E2BBox
     elif name == 'remote':
@@ -30,6 +30,6 @@ def get_runtime_cls(name: str):
     'RemoteRuntime',
     'ModalRuntime',
     'RunloopRuntime',
-    'EventStreamRuntime',
+    'DockerRuntime',
     'get_runtime_cls',
 ]
diff --git a/openhands/runtime/impl/action_execution/action_execution_client.py b/openhands/runtime/impl/action_execution/action_execution_client.py
new file mode 100644
index 000000000000..00c847a23015
--- /dev/null
+++ b/openhands/runtime/impl/action_execution/action_execution_client.py
@@ -0,0 +1,289 @@
+import os
+import tempfile
+import threading
+from abc import abstractmethod
+from pathlib import Path
+from typing import Any
+from zipfile import ZipFile
+
+import requests
+
+from openhands.core.config import AppConfig
+from openhands.core.exceptions import (
+    AgentRuntimeTimeoutError,
+)
+from openhands.events import EventStream
+from openhands.events.action import (
+    ActionConfirmationStatus,
+    BrowseInteractiveAction,
+    BrowseURLAction,
+    CmdRunAction,
+    FileEditAction,
+    FileReadAction,
+    FileWriteAction,
+    IPythonRunCellAction,
+)
+from openhands.events.action.action import Action
+from openhands.events.observation import (
+    ErrorObservation,
+    NullObservation,
+    Observation,
+    UserRejectObservation,
+)
+from openhands.events.serialization import event_to_dict, observation_from_dict
+from openhands.events.serialization.action import ACTION_TYPE_TO_CLASS
+from openhands.runtime.base import Runtime
+from openhands.runtime.plugins import PluginRequirement
+from openhands.runtime.utils.request import send_request
+
+
+class ActionExecutionClient(Runtime):
+    """Base class for runtimes that interact with the action execution server.
+
+    Holds the HTTP client logic shared by concrete runtimes (e.g. DockerRuntime)
+    for talking to the server defined in action_execution_server.py.
+    """
+
+    def __init__(
+        self,
+        config: AppConfig,
+        event_stream: EventStream,
+        sid: str = 'default',
+        plugins: list[PluginRequirement] | None = None,
+        env_vars: dict[str, str] | None = None,
+        status_callback: Any | None = None,
+        attach_to_existing: bool = False,
+        headless_mode: bool = True,
+    ):
+        self.session = requests.Session()
+        self.action_semaphore = threading.Semaphore(1)  # Ensure one action at a time
+        self._runtime_initialized: bool = False
+        self._vscode_token: str | None = None  # initial dummy value
+        super().__init__(
+            config,
+            event_stream,
+            sid,
+            plugins,
+            env_vars,
+            status_callback,
+            attach_to_existing,
+            headless_mode,
+        )
+
+    @abstractmethod
+    def _get_action_execution_server_host(self) -> str:
+        """Return the server's base URL; endpoint paths such as /alive are appended to it."""
+
+    def _send_action_server_request(
+        self,
+        method: str,
+        url: str,
+        **kwargs,
+    ) -> requests.Response:
+        """Send a request to the action execution server.
+
+        Args:
+            method: HTTP method (GET, POST, etc.)
+            url: URL to send the request to
+            **kwargs: Additional arguments to pass to requests.request()
+
+        Returns:
+            Response from the server
+
+        Raises:
+            AgentRuntimeError: If the request fails
+        """
+        return send_request(self.session, method, url, **kwargs)
+
+    def check_if_alive(self) -> None:
+        with self._send_action_server_request(
+            'GET',
+            f'{self._get_action_execution_server_host()}/alive',
+            timeout=5,
+        ):
+            pass
+
+    def list_files(self, path: str | None = None) -> list[str]:
+        """List files in the sandbox.
+
+        If path is None, list files in the sandbox's initial working directory (e.g., /workspace).
+        """
+
+        try:
+            data = {}
+            if path is not None:
+                data['path'] = path
+
+            with send_request(
+                self.session,
+                'POST',
+                f'{self._get_action_execution_server_host()}/list_files',
+                json=data,
+                timeout=10,
+            ) as response:
+                response_json = response.json()
+                assert isinstance(response_json, list)
+                return response_json
+        except requests.Timeout:
+            raise TimeoutError('List files operation timed out')
+
+    def copy_from(self, path: str) -> Path:
+        """Download `path` from the sandbox into a local temp file and return its path."""
+
+        try:
+            params = {'path': path}
+            with send_request(
+                self.session,
+                'GET',
+                f'{self._get_action_execution_server_host()}/download_files',
+                params=params,
+                stream=True,
+                timeout=30,
+            ) as response:
+                with tempfile.NamedTemporaryFile(delete=False) as temp_file:
+                    for chunk in response.iter_content(chunk_size=8192):
+                        if chunk:  # filter out keep-alive new chunks
+                            temp_file.write(chunk)
+                return Path(temp_file.name)
+        except requests.Timeout:
+            raise TimeoutError('Copy operation timed out')
+
+    def copy_to(
+        self, host_src: str, sandbox_dest: str, recursive: bool = False
+    ) -> None:
+        """Upload host_src to sandbox_dest; a recursive copy is sent as one zip."""
+        if not os.path.exists(host_src):
+            raise FileNotFoundError(f'Source file {host_src} does not exist')
+
+        # Stays None unless a temp archive really exists, so cleanup cannot fail.
+        temp_zip_path: str | None = None
+        upload_path = host_src
+        try:
+            if recursive:
+                with tempfile.NamedTemporaryFile(
+                    suffix='.zip', delete=False
+                ) as temp_zip:
+                    temp_zip_path = temp_zip.name
+                upload_path = temp_zip_path
+
+                with ZipFile(temp_zip_path, 'w') as zipf:
+                    for root, _, files in os.walk(host_src):
+                        for file in files:
+                            file_path = os.path.join(root, file)
+                            arcname = os.path.relpath(
+                                file_path, os.path.dirname(host_src)
+                            )
+                            zipf.write(file_path, arcname)
+
+            params = {'destination': sandbox_dest, 'recursive': str(recursive).lower()}
+
+            # Close the upload handle before the finally block unlinks the archive.
+            with open(upload_path, 'rb') as upload_file:
+                with self._send_action_server_request(
+                    'POST',
+                    f'{self._get_action_execution_server_host()}/upload_file',
+                    files={'file': upload_file},
+                    params=params,
+                    timeout=300,
+                ) as response:
+                    self.log(
+                        'debug',
+                        f'Copy completed: host:{host_src} -> runtime:{sandbox_dest}. Response: {response.text}',
+                    )
+        finally:
+            if temp_zip_path is not None:
+                os.unlink(temp_zip_path)
+
+    def get_vscode_token(self) -> str:
+        if self.vscode_enabled and self._runtime_initialized:
+            if self._vscode_token is not None:  # cached value
+                return self._vscode_token
+            with send_request(
+                self.session,
+                'GET',
+                f'{self._get_action_execution_server_host()}/vscode/connection_token',
+                timeout=10,
+            ) as response:
+                response_json = response.json()
+                assert isinstance(response_json, dict)
+                if response_json['token'] is None:
+                    return ''
+                self._vscode_token = response_json['token']
+                return response_json['token']
+        else:
+            return ''
+
+    def send_action_for_execution(self, action: Action) -> Observation:
+        if isinstance(action, FileEditAction):
+            return self.edit(action)
+
+        # set timeout to default if not set
+        if action.timeout is None:
+            action.timeout = self.config.sandbox.timeout
+
+        with self.action_semaphore:
+            if not action.runnable:
+                return NullObservation('')
+            if (
+                hasattr(action, 'confirmation_state')
+                and action.confirmation_state
+                == ActionConfirmationStatus.AWAITING_CONFIRMATION
+            ):
+                return NullObservation('')
+            action_type = action.action  # type: ignore[attr-defined]
+            if action_type not in ACTION_TYPE_TO_CLASS:
+                raise ValueError(f'Action {action_type} does not exist.')
+            if not hasattr(self, action_type):
+                return ErrorObservation(
+                    f'Action {action_type} is not supported in the current runtime.',
+                    error_id='AGENT_ERROR$BAD_ACTION',
+                )
+            if (
+                getattr(action, 'confirmation_state', None)
+                == ActionConfirmationStatus.REJECTED
+            ):
+                return UserRejectObservation(
+                    'Action has been rejected by the user! Waiting for further user input.'
+                )
+
+            assert action.timeout is not None
+
+            try:
+                with send_request(
+                    self.session,
+                    'POST',
+                    f'{self._get_action_execution_server_host()}/execute_action',
+                    json={'action': event_to_dict(action)},
+                    # wait a few more seconds to get the timeout error from client side
+                    timeout=action.timeout + 5,
+                ) as response:
+                    output = response.json()
+                    obs = observation_from_dict(output)
+                    obs._cause = action.id  # type: ignore[attr-defined]
+            except requests.Timeout:
+                raise AgentRuntimeTimeoutError(
+                    f'Runtime failed to return execute_action before the requested timeout of {action.timeout}s'
+                )
+
+            return obs
+
+    def run(self, action: CmdRunAction) -> Observation:
+        return self.send_action_for_execution(action)
+
+    def run_ipython(self, action: IPythonRunCellAction) -> Observation:
+        return self.send_action_for_execution(action)
+
+    def read(self, action: FileReadAction) -> Observation:
+        return self.send_action_for_execution(action)
+
+    def write(self, action: FileWriteAction) -> Observation:
+        return self.send_action_for_execution(action)
+
+    def browse(self, action: BrowseURLAction) -> Observation:
+        return self.send_action_for_execution(action)
+
+    def browse_interactive(self, action: BrowseInteractiveAction) -> Observation:
+        return self.send_action_for_execution(action)
+
+    def close(self) -> None:
+        self.session.close()
diff --git a/openhands/runtime/impl/eventstream/containers.py b/openhands/runtime/impl/docker/containers.py
similarity index 100%
rename from openhands/runtime/impl/eventstream/containers.py
rename to openhands/runtime/impl/docker/containers.py
diff --git a/openhands/runtime/impl/eventstream/eventstream_runtime.py b/openhands/runtime/impl/docker/docker_runtime.py
similarity index 61%
rename from openhands/runtime/impl/eventstream/eventstream_runtime.py
rename to openhands/runtime/impl/docker/docker_runtime.py
index 14f91b87b687..69b59be2de93 100644
--- a/openhands/runtime/impl/eventstream/eventstream_runtime.py
+++ b/openhands/runtime/impl/docker/docker_runtime.py
@@ -1,11 +1,6 @@
 import atexit
-import os
-import tempfile
-import threading
 from functools import lru_cache
-from pathlib import Path
 from typing import Callable
-from zipfile import ZipFile
 
 import docker
 import requests
@@ -14,40 +9,20 @@
 from openhands.core.config import AppConfig
 from openhands.core.exceptions import (
     AgentRuntimeDisconnectedError,
-    AgentRuntimeError,
     AgentRuntimeNotFoundError,
     AgentRuntimeNotReadyError,
-    AgentRuntimeTimeoutError,
 )
 from openhands.core.logger import DEBUG
 from openhands.core.logger import openhands_logger as logger
 from openhands.events import EventStream
-from openhands.events.action import (
-    ActionConfirmationStatus,
-    BrowseInteractiveAction,
-    BrowseURLAction,
-    CmdRunAction,
-    FileEditAction,
-    FileReadAction,
-    FileWriteAction,
-    IPythonRunCellAction,
-)
-from openhands.events.action.action import Action
-from openhands.events.observation import (
-    ErrorObservation,
-    NullObservation,
-    Observation,
-    UserRejectObservation,
-)
-from openhands.events.serialization import event_to_dict, observation_from_dict
-from openhands.events.serialization.action import ACTION_TYPE_TO_CLASS
-from openhands.runtime.base import Runtime
 from openhands.runtime.builder import DockerRuntimeBuilder
-from openhands.runtime.impl.eventstream.containers import remove_all_containers
+from openhands.runtime.impl.action_execution.action_execution_client import (
+    ActionExecutionClient,
+)
+from openhands.runtime.impl.docker.containers import remove_all_containers
 from openhands.runtime.plugins import PluginRequirement
 from openhands.runtime.utils import find_available_tcp_port
 from openhands.runtime.utils.log_streamer import LogStreamer
-from openhands.runtime.utils.request import send_request
 from openhands.runtime.utils.runtime_build import build_runtime_image
 from openhands.utils.async_utils import call_sync_from_async
 from openhands.utils.tenacity_stop import stop_if_should_exit
@@ -62,7 +37,7 @@ def remove_all_runtime_containers():
 _atexit_registered = False
 
 
-class EventStreamRuntime(Runtime):
+class DockerRuntime(ActionExecutionClient):
     """This runtime will subscribe the event stream.
     When receive an event, it will send the event to runtime-client which run inside the docker environment.
 
@@ -74,30 +49,6 @@ class EventStreamRuntime(Runtime):
         env_vars (dict[str, str] | None, optional): Environment variables to set. Defaults to None.
     """
 
-    # Need to provide this method to allow inheritors to init the Runtime
-    # without initting the EventStreamRuntime.
-    def init_base_runtime(
-        self,
-        config: AppConfig,
-        event_stream: EventStream,
-        sid: str = 'default',
-        plugins: list[PluginRequirement] | None = None,
-        env_vars: dict[str, str] | None = None,
-        status_callback: Callable | None = None,
-        attach_to_existing: bool = False,
-        headless_mode: bool = True,
-    ):
-        super().__init__(
-            config,
-            event_stream,
-            sid,
-            plugins,
-            env_vars,
-            status_callback,
-            attach_to_existing,
-            headless_mode,
-        )
-
     def __init__(
         self,
         config: AppConfig,
@@ -121,7 +72,6 @@ def __init__(
         self._vscode_url: str | None = None  # initial dummy value
         self._runtime_initialized: bool = False
         self.api_url = f'{self.config.sandbox.local_runtime_url}:{self._container_port}'
-        self.session = requests.Session()
         self.status_callback = status_callback
 
         self.docker_client: docker.DockerClient = self._init_docker_client()
@@ -129,14 +79,13 @@ def __init__(
         self.runtime_container_image = self.config.sandbox.runtime_container_image
         self.container_name = CONTAINER_NAME_PREFIX + sid
         self.container = None
-        self.action_semaphore = threading.Semaphore(1)  # Ensure one action at a time
 
         self.runtime_builder = DockerRuntimeBuilder(self.docker_client)
 
         # Buffer for container logs
         self.log_streamer: LogStreamer | None = None
 
-        self.init_base_runtime(
+        super().__init__(
             config,
             event_stream,
             sid,
@@ -154,6 +103,9 @@ def __init__(
                 f'Installing extra user-provided dependencies in the runtime image: {self.config.sandbox.runtime_extra_deps}',
             )
 
+    def _get_action_execution_server_host(self):
+        return self.api_url
+
     async def connect(self):
         self.send_status_message('STATUS$STARTING_RUNTIME')
         try:
@@ -399,26 +351,18 @@ def _wait_until_alive(self):
         if not self.log_streamer:
             raise AgentRuntimeNotReadyError('Runtime client is not ready.')
 
-        with send_request(
-            self.session,
-            'GET',
-            f'{self.api_url}/alive',
-            timeout=5,
-        ):
-            pass
+        self.check_if_alive()
 
     def close(self, rm_all_containers: bool | None = None):
-        """Closes the EventStreamRuntime and associated objects
+        """Closes the DockerRuntime and associated objects
 
         Parameters:
         - rm_all_containers (bool): Whether to remove all containers with the 'openhands-sandbox-' prefix
         """
+        super().close()
         if self.log_streamer:
             self.log_streamer.close()
 
-        if self.session:
-            self.session.close()
-
         if rm_all_containers is None:
             rm_all_containers = self.config.sandbox.rm_all_containers
 
@@ -429,178 +373,6 @@ def close(self, rm_all_containers: bool | None = None):
         )
         remove_all_containers(close_prefix)
 
-    def run_action(self, action: Action) -> Observation:
-        if isinstance(action, FileEditAction):
-            return self.edit(action)
-
-        # set timeout to default if not set
-        if action.timeout is None:
-            action.timeout = self.config.sandbox.timeout
-
-        with self.action_semaphore:
-            if not action.runnable:
-                return NullObservation('')
-            if (
-                hasattr(action, 'confirmation_state')
-                and action.confirmation_state
-                == ActionConfirmationStatus.AWAITING_CONFIRMATION
-            ):
-                return NullObservation('')
-            action_type = action.action  # type: ignore[attr-defined]
-            if action_type not in ACTION_TYPE_TO_CLASS:
-                raise ValueError(f'Action {action_type} does not exist.')
-            if not hasattr(self, action_type):
-                return ErrorObservation(
-                    f'Action {action_type} is not supported in the current runtime.',
-                    error_id='AGENT_ERROR$BAD_ACTION',
-                )
-            if (
-                getattr(action, 'confirmation_state', None)
-                == ActionConfirmationStatus.REJECTED
-            ):
-                return UserRejectObservation(
-                    'Action has been rejected by the user! Waiting for further user input.'
-                )
-
-            assert action.timeout is not None
-
-            try:
-                with send_request(
-                    self.session,
-                    'POST',
-                    f'{self.api_url}/execute_action',
-                    json={'action': event_to_dict(action)},
-                    # wait a few more seconds to get the timeout error from client side
-                    timeout=action.timeout + 5,
-                ) as response:
-                    output = response.json()
-                    obs = observation_from_dict(output)
-                    obs._cause = action.id  # type: ignore[attr-defined]
-            except requests.Timeout:
-                raise AgentRuntimeTimeoutError(
-                    f'Runtime failed to return execute_action before the requested timeout of {action.timeout}s'
-                )
-
-            return obs
-
-    def run(self, action: CmdRunAction) -> Observation:
-        return self.run_action(action)
-
-    def run_ipython(self, action: IPythonRunCellAction) -> Observation:
-        return self.run_action(action)
-
-    def read(self, action: FileReadAction) -> Observation:
-        return self.run_action(action)
-
-    def write(self, action: FileWriteAction) -> Observation:
-        return self.run_action(action)
-
-    def browse(self, action: BrowseURLAction) -> Observation:
-        return self.run_action(action)
-
-    def browse_interactive(self, action: BrowseInteractiveAction) -> Observation:
-        return self.run_action(action)
-
-    # ====================================================================
-    # Implement these methods (for file operations) in the subclass
-    # ====================================================================
-
-    def copy_to(
-        self, host_src: str, sandbox_dest: str, recursive: bool = False
-    ) -> None:
-        if not os.path.exists(host_src):
-            raise FileNotFoundError(f'Source file {host_src} does not exist')
-
-        try:
-            if recursive:
-                # For recursive copy, create a zip file
-                with tempfile.NamedTemporaryFile(
-                    suffix='.zip', delete=False
-                ) as temp_zip:
-                    temp_zip_path = temp_zip.name
-
-                with ZipFile(temp_zip_path, 'w') as zipf:
-                    for root, _, files in os.walk(host_src):
-                        for file in files:
-                            file_path = os.path.join(root, file)
-                            arcname = os.path.relpath(
-                                file_path, os.path.dirname(host_src)
-                            )
-                            zipf.write(file_path, arcname)
-
-                upload_data = {'file': open(temp_zip_path, 'rb')}
-            else:
-                # For single file copy
-                upload_data = {'file': open(host_src, 'rb')}
-
-            params = {'destination': sandbox_dest, 'recursive': str(recursive).lower()}
-
-            with send_request(
-                self.session,
-                'POST',
-                f'{self.api_url}/upload_file',
-                files=upload_data,
-                params=params,
-                timeout=300,
-            ):
-                pass
-
-        except requests.Timeout:
-            raise AgentRuntimeTimeoutError('Copy operation timed out')
-        except Exception as e:
-            raise AgentRuntimeError(f'Copy operation failed: {str(e)}')
-        finally:
-            if recursive:
-                os.unlink(temp_zip_path)
-            self.log(
-                'debug', f'Copy completed: host:{host_src} -> runtime:{sandbox_dest}'
-            )
-
-    def list_files(self, path: str | None = None) -> list[str]:
-        """List files in the sandbox.
-
-        If path is None, list files in the sandbox's initial working directory (e.g., /workspace).
-        """
-
-        try:
-            data = {}
-            if path is not None:
-                data['path'] = path
-
-            with send_request(
-                self.session,
-                'POST',
-                f'{self.api_url}/list_files',
-                json=data,
-                timeout=10,
-            ) as response:
-                response_json = response.json()
-                assert isinstance(response_json, list)
-                return response_json
-        except requests.Timeout:
-            raise TimeoutError('List files operation timed out')
-
-    def copy_from(self, path: str) -> Path:
-        """Zip all files in the sandbox and return as a stream of bytes."""
-
-        try:
-            params = {'path': path}
-            with send_request(
-                self.session,
-                'GET',
-                f'{self.api_url}/download_files',
-                params=params,
-                stream=True,
-                timeout=30,
-            ) as response:
-                temp_file = tempfile.NamedTemporaryFile(delete=False)
-                for chunk in response.iter_content(chunk_size=8192):
-                    if chunk:  # filter out keep-alive new chunks
-                        temp_file.write(chunk)
-                return Path(temp_file.name)
-        except requests.Timeout:
-            raise TimeoutError('Copy operation timed out')
-
     def _is_port_in_use_docker(self, port):
         containers = self.docker_client.containers.list()
         for container in containers:
@@ -620,31 +392,13 @@ def _find_available_port(self, max_attempts=5):
 
     @property
     def vscode_url(self) -> str | None:
-        if self.vscode_enabled and self._runtime_initialized:
-            if (
-                hasattr(self, '_vscode_url') and self._vscode_url is not None
-            ):  # cached value
-                return self._vscode_url
-
-            with send_request(
-                self.session,
-                'GET',
-                f'{self.api_url}/vscode/connection_token',
-                timeout=10,
-            ) as response:
-                response_json = response.json()
-                assert isinstance(response_json, dict)
-                if response_json['token'] is None:
-                    return None
-                self._vscode_url = f'http://localhost:{self._host_port + 1}/?tkn={response_json["token"]}&folder={self.config.workspace_mount_path_in_sandbox}'
-                self.log(
-                    'debug',
-                    f'VSCode URL: {self._vscode_url}',
-                )
-                return self._vscode_url
-        else:
+        token = super().get_vscode_token()
+        if not token:
             return None
 
+        vscode_url = f'http://localhost:{self._host_port + 1}/?tkn={token}&folder={self.config.workspace_mount_path_in_sandbox}'
+        return vscode_url
+
     @property
     def web_hosts(self):
         ports = []
diff --git a/openhands/runtime/impl/modal/modal_runtime.py b/openhands/runtime/impl/modal/modal_runtime.py
index 026e7c0b53ef..473c4ae97b10 100644
--- a/openhands/runtime/impl/modal/modal_runtime.py
+++ b/openhands/runtime/impl/modal/modal_runtime.py
@@ -1,8 +1,7 @@
 import os
 import tempfile
-import threading
 from pathlib import Path
-from typing import Callable, Generator
+from typing import Callable
 
 import modal
 import requests
@@ -10,9 +9,8 @@
 
 from openhands.core.config import AppConfig
 from openhands.events import EventStream
-from openhands.runtime.impl.eventstream.eventstream_runtime import (
-    EventStreamRuntime,
-    LogStreamer,
+from openhands.runtime.impl.action_execution.action_execution_client import (
+    ActionExecutionClient,
 )
 from openhands.runtime.plugins import PluginRequirement
 from openhands.runtime.utils.command import get_remote_startup_command
@@ -21,52 +19,13 @@
     prep_build_folder,
 )
 from openhands.utils.async_utils import call_sync_from_async
+from openhands.utils.tenacity_stop import stop_if_should_exit
 
 # FIXME: this will not work in HA mode. We need a better way to track IDs
 MODAL_RUNTIME_IDS: dict[str, str] = {}
 
 
-# Modal's log generator returns strings, but the upstream LogBuffer expects bytes.
-def bytes_shim(string_generator) -> Generator[bytes, None, None]:
-    for line in string_generator:
-        yield line.encode('utf-8')
-
-
-class ModalLogStreamer(LogStreamer):
-    """Streams Modal sandbox logs to stdout.
-
-    This class provides a way to stream logs from a Modal sandbox directly to stdout
-    through the provided logging function.
-    """
-
-    def __init__(
-        self,
-        sandbox: modal.Sandbox,
-        logFn: Callable,
-    ):
-        self.log = logFn
-        self._stop_event = threading.Event()
-        self.log_generator = bytes_shim(sandbox.stderr)
-
-        # Start the stdout streaming thread
-        self.stdout_thread = threading.Thread(target=self._stream_logs)
-        self.stdout_thread.daemon = True
-        self.stdout_thread.start()
-
-    def _stream_logs(self):
-        """Stream logs from the Modal sandbox."""
-        try:
-            for log_line in self.log_generator:
-                if self._stop_event.is_set():
-                    break
-                if log_line:
-                    decoded_line = log_line.decode('utf-8').rstrip()
-                    self.log('debug', f'[inside sandbox] {decoded_line}')
-        except Exception as e:
-            self.log('error', f'Error streaming modal logs: {e}')
-
-
-class ModalRuntime(EventStreamRuntime):
+class ModalRuntime(ActionExecutionClient):
     """This runtime will subscribe the event stream.
 
     When receive an event, it will send the event to runtime-client which run inside the Modal sandbox environment.
@@ -116,14 +75,9 @@ def __init__(
         # This value is arbitrary as it's private to the container
         self.container_port = 3000
 
-        self.session = requests.Session()
         self.status_callback = status_callback
         self.base_container_image_id = self.config.sandbox.base_container_image
         self.runtime_container_image_id = self.config.sandbox.runtime_container_image
-        self.action_semaphore = threading.Semaphore(1)  # Ensure one action at a time
-
-        # Buffer for container logs
-        self.log_streamer: LogStreamer | None = None
 
         if self.config.sandbox.runtime_extra_deps:
             self.log(
@@ -131,7 +85,7 @@ def __init__(
                 f'Installing extra user-provided dependencies in the runtime image: {self.config.sandbox.runtime_extra_deps}',
             )
 
-        self.init_base_runtime(
+        super().__init__(
             config,
             event_stream,
             sid,
@@ -170,7 +124,6 @@ async def connect(self):
 
             self.send_status_message('STATUS$CONTAINER_STARTED')
 
-        self.log_streamer = ModalLogStreamer(self.sandbox, self.log)
         if self.sandbox is None:
             raise Exception('Sandbox not initialized')
         tunnel = self.sandbox.tunnels()[self.container_port]
@@ -187,6 +140,20 @@ async def connect(self):
         if not self.attach_to_existing:
             self.send_status_message(' ')
 
+    def _get_action_execution_server_host(self):
+        return self.api_url
+
+    @tenacity.retry(
+        stop=tenacity.stop_after_delay(120) | stop_if_should_exit(),
+        retry=tenacity.retry_if_exception_type(
+            (ConnectionError, requests.exceptions.ConnectionError)
+        ),
+        reraise=True,
+        wait=tenacity.wait_fixed(2),
+    )
+    def _wait_until_alive(self):
+        self.check_if_alive()
+
     def _get_image_definition(
         self,
         base_container_image_id: str | None,
@@ -292,11 +259,7 @@ def _init_sandbox(
 
     def close(self):
         """Closes the ModalRuntime and associated objects."""
-        if self.log_streamer:
-            self.log_streamer.close()
-
-        if self.session:
-            self.session.close()
+        super().close()
 
         if not self.attach_to_existing and self.sandbox:
             self.sandbox.terminate()
diff --git a/openhands/runtime/impl/remote/remote_runtime.py b/openhands/runtime/impl/remote/remote_runtime.py
index 97d94db75533..bfd4f1698ee5 100644
--- a/openhands/runtime/impl/remote/remote_runtime.py
+++ b/openhands/runtime/impl/remote/remote_runtime.py
@@ -1,10 +1,6 @@
 import os
-import tempfile
-import threading
-from pathlib import Path
 from typing import Callable, Optional
 from urllib.parse import urlparse
-from zipfile import ZipFile
 
 import requests
 import tenacity
@@ -15,29 +11,13 @@
     AgentRuntimeError,
     AgentRuntimeNotFoundError,
     AgentRuntimeNotReadyError,
-    AgentRuntimeTimeoutError,
     AgentRuntimeUnavailableError,
 )
 from openhands.events import EventStream
-from openhands.events.action import (
-    BrowseInteractiveAction,
-    BrowseURLAction,
-    CmdRunAction,
-    FileEditAction,
-    FileReadAction,
-    FileWriteAction,
-    IPythonRunCellAction,
-)
-from openhands.events.action.action import Action
-from openhands.events.observation import (
-    ErrorObservation,
-    NullObservation,
-    Observation,
-)
-from openhands.events.serialization import event_to_dict, observation_from_dict
-from openhands.events.serialization.action import ACTION_TYPE_TO_CLASS
-from openhands.runtime.base import Runtime
 from openhands.runtime.builder.remote import RemoteRuntimeBuilder
+from openhands.runtime.impl.action_execution.action_execution_client import (
+    ActionExecutionClient,
+)
 from openhands.runtime.plugins import PluginRequirement
 from openhands.runtime.utils.command import get_remote_startup_command
 from openhands.runtime.utils.request import (
@@ -49,7 +29,7 @@
 from openhands.utils.tenacity_stop import stop_if_should_exit
 
 
-class RemoteRuntime(Runtime):
+class RemoteRuntime(ActionExecutionClient):
     """This runtime will connect to a remote oh-runtime-client."""
 
     port: int = 60000  # default port for the remote runtime client
@@ -65,10 +45,6 @@ def __init__(
         attach_to_existing: bool = False,
         headless_mode: bool = True,
     ):
-        # We need to set session and action_semaphore before the __init__ below, or we get odd errors
-        self.session = requests.Session()
-        self.action_semaphore = threading.Semaphore(1)
-
         super().__init__(
             config,
             event_stream,
@@ -99,7 +75,9 @@ def __init__(
         self.runtime_url: str | None = None
         self.available_hosts: list[str] = []
         self._runtime_initialized: bool = False
-        self._vscode_url: str | None = None  # initial dummy value
+
+    def _get_action_execution_server_host(self):
+        return self.runtime_url
 
     async def connect(self):
         try:
@@ -149,10 +127,9 @@ def _start_or_attach_to_runtime(self):
 
     def _check_existing_runtime(self) -> bool:
         try:
-            with self._send_request(
+            with self._send_runtime_api_request(
                 'GET',
                 f'{self.config.sandbox.remote_runtime_api_url}/sessions/{self.sid}',
-                is_retry=False,
                 timeout=60,
             ) as response:
                 data = response.json()
@@ -180,10 +157,9 @@ def _check_existing_runtime(self) -> bool:
 
     def _build_runtime(self):
         self.log('debug', f'Building RemoteRuntime config:\n{self.config}')
-        with self._send_request(
+        with self._send_runtime_api_request(
             'GET',
             f'{self.config.sandbox.remote_runtime_api_url}/registry_prefix',
-            is_retry=False,
             timeout=60,
         ) as response:
             response_json = response.json()
@@ -211,10 +187,9 @@ def _build_runtime(self):
             force_rebuild=self.config.sandbox.force_rebuild_runtime,
         )
 
-        with self._send_request(
+        with self._send_runtime_api_request(
             'GET',
             f'{self.config.sandbox.remote_runtime_api_url}/image_exists',
-            is_retry=False,
             params={'image': self.container_image},
             timeout=60,
         ) as response:
@@ -253,10 +228,9 @@ def _start_runtime(self):
 
         # Start the sandbox using the /start endpoint
         try:
-            with self._send_request(
+            with self._send_runtime_api_request(
                 'POST',
                 f'{self.config.sandbox.remote_runtime_api_url}/start',
-                is_retry=False,
                 json=start_request,
                 timeout=60,
             ) as response:
@@ -270,10 +244,9 @@ def _start_runtime(self):
             raise AgentRuntimeUnavailableError() from e
 
     def _resume_runtime(self):
-        with self._send_request(
+        with self._send_runtime_api_request(
             'POST',
             f'{self.config.sandbox.remote_runtime_api_url}/resume',
-            is_retry=False,
             json={'runtime_id': self.runtime_id},
             timeout=60,
         ):
@@ -293,34 +266,19 @@ def _parse_runtime_response(self, response: requests.Response):
 
     @property
     def vscode_url(self) -> str | None:
-        if self.vscode_enabled and self._runtime_initialized:
-            if (
-                hasattr(self, '_vscode_url') and self._vscode_url is not None
-            ):  # cached value
-                return self._vscode_url
-
-            with self._send_request(
-                'GET',
-                f'{self.runtime_url}/vscode/connection_token',
-                timeout=60,
-            ) as response:
-                response_json = response.json()
-            assert isinstance(response_json, dict)
-            if response_json['token'] is None:
-                return None
-            # parse runtime_url to get vscode_url
-            _parsed_url = urlparse(self.runtime_url)
-            assert isinstance(_parsed_url.scheme, str) and isinstance(
-                _parsed_url.netloc, str
-            )
-            self._vscode_url = f'{_parsed_url.scheme}://vscode-{_parsed_url.netloc}/?tkn={response_json["token"]}&folder={self.config.workspace_mount_path_in_sandbox}'
-            self.log(
-                'debug',
-                f'VSCode URL: {self._vscode_url}',
-            )
-            return self._vscode_url
-        else:
+        token = super().get_vscode_token()
+        if not token:
             return None
+        _parsed_url = urlparse(self.runtime_url)
+        assert isinstance(_parsed_url.scheme, str) and isinstance(
+            _parsed_url.netloc, str
+        )
+        vscode_url = f'{_parsed_url.scheme}://vscode-{_parsed_url.netloc}/?tkn={token}&folder={self.config.workspace_mount_path_in_sandbox}'
+        self.log(
+            'debug',
+            f'VSCode URL: {vscode_url}',
+        )
+        return vscode_url
 
     @property
     def web_hosts(self) -> list[str]:
@@ -340,7 +298,7 @@ def _wait_until_alive(self):
 
     def _wait_until_alive_impl(self):
         self.log('debug', f'Waiting for runtime to be alive at url: {self.runtime_url}')
-        with self._send_request(
+        with self._send_runtime_api_request(
             'GET',
             f'{self.config.sandbox.remote_runtime_api_url}/sessions/{self.sid}',
             timeout=60,
@@ -357,12 +315,7 @@ def _wait_until_alive_impl(self):
         # Retry a period of time to give the cluster time to start the pod
         if pod_status == 'ready':
             try:
-                with self._send_request(
-                    'GET',
-                    f'{self.runtime_url}/alive',
-                    timeout=60,
-                ):  # will raise exception if we don't get 200 back.
-                    pass
+                self.check_if_alive()
             except requests.HTTPError as e:
                 self.log(
                     'warning', f"Runtime /alive failed, but pod says it's ready: {e}"
@@ -397,182 +350,39 @@ def _wait_until_alive_impl(self):
 
     def close(self, timeout: int = 10):
         if self.config.sandbox.keep_runtime_alive or self.attach_to_existing:
-            self.session.close()
+            super().close()
             return
-        if self.runtime_id and self.session:
-            try:
-                with self._send_request(
-                    'POST',
-                    f'{self.config.sandbox.remote_runtime_api_url}/stop',
-                    is_retry=False,
-                    json={'runtime_id': self.runtime_id},
-                    timeout=timeout,
-                ):
-                    self.log('debug', 'Runtime stopped.')
-            except Exception as e:
-                raise e
-            finally:
-                self.session.close()
-
-    def run_action(self, action: Action, is_retry: bool = False) -> Observation:
-        if action.timeout is None:
-            action.timeout = self.config.sandbox.timeout
-        if isinstance(action, FileEditAction):
-            return self.edit(action)
-        with self.action_semaphore:
-            if not action.runnable:
-                return NullObservation('')
-            action_type = action.action  # type: ignore[attr-defined]
-            if action_type not in ACTION_TYPE_TO_CLASS:
-                raise ValueError(f'Action {action_type} does not exist.')
-            if not hasattr(self, action_type):
-                return ErrorObservation(
-                    f'[Runtime (ID={self.runtime_id})] Action {action_type} is not supported in the current runtime.',
-                    error_id='AGENT_ERROR$BAD_ACTION',
-                )
+        try:
+            with self._send_runtime_api_request(
+                'POST',
+                f'{self.config.sandbox.remote_runtime_api_url}/stop',
+                json={'runtime_id': self.runtime_id},
+                timeout=timeout,
+            ):
+                self.log('debug', 'Runtime stopped.')
+        except Exception as e:
+            raise e
+        finally:
+            super().close()
 
-            assert action.timeout is not None
+    def _send_runtime_api_request(self, method, url, **kwargs):
+        return send_request(self.session, method, url, **kwargs)
 
-            try:
-                request_body = {'action': event_to_dict(action)}
-                self.log('debug', f'Request body: {request_body}')
-                with self._send_request(
-                    'POST',
-                    f'{self.runtime_url}/execute_action',
-                    is_retry=False,
-                    json=request_body,
-                    # wait a few more seconds to get the timeout error from client side
-                    timeout=action.timeout + 5,
-                ) as response:
-                    output = response.json()
-                obs = observation_from_dict(output)
-                obs._cause = action.id  # type: ignore[attr-defined]
-            except requests.Timeout:
-                raise AgentRuntimeTimeoutError(
-                    f'Runtime failed to return execute_action before the requested timeout of {action.timeout}s'
-                )
-            return obs
-
-    def _send_request(self, method, url, is_retry=False, **kwargs):
-        is_runtime_request = self.runtime_url and self.runtime_url in url
+    def _send_action_server_request(self, method, url, **kwargs):
         try:
-            return send_request(self.session, method, url, **kwargs)
+            return super()._send_action_server_request(method, url, **kwargs)
         except requests.Timeout:
             self.log('error', 'No response received within the timeout period.')
             raise
         except RequestHTTPError as e:
-            if is_runtime_request and e.response.status_code in (404, 502):
+            if e.response.status_code in (404, 502):
                 raise AgentRuntimeDisconnectedError(
                     f'{e.response.status_code} error while connecting to {self.runtime_url}'
                 ) from e
-            elif is_runtime_request and e.response.status_code == 503:
-                if not is_retry:
-                    self.log('warning', 'Runtime appears to be paused. Resuming...')
-                    self._resume_runtime()
-                    self._wait_until_alive()
-                    return self._send_request(method, url, True, **kwargs)
-                else:
-                    raise AgentRuntimeUnavailableError(
-                        f'{e.response.status_code} error while connecting to {self.runtime_url}'
-                    ) from e
-
+            elif e.response.status_code == 503:
+                self.log('warning', 'Runtime appears to be paused. Resuming...')
+                self._resume_runtime()
+                self._wait_until_alive()
+                return super()._send_action_server_request(method, url, **kwargs)
             else:
                 raise e
-
-    def run(self, action: CmdRunAction) -> Observation:
-        return self.run_action(action)
-
-    def run_ipython(self, action: IPythonRunCellAction) -> Observation:
-        return self.run_action(action)
-
-    def read(self, action: FileReadAction) -> Observation:
-        return self.run_action(action)
-
-    def write(self, action: FileWriteAction) -> Observation:
-        return self.run_action(action)
-
-    def browse(self, action: BrowseURLAction) -> Observation:
-        return self.run_action(action)
-
-    def browse_interactive(self, action: BrowseInteractiveAction) -> Observation:
-        return self.run_action(action)
-
-    def copy_to(
-        self, host_src: str, sandbox_dest: str, recursive: bool = False
-    ) -> None:
-        if not os.path.exists(host_src):
-            raise FileNotFoundError(f'Source file {host_src} does not exist')
-
-        try:
-            if recursive:
-                with tempfile.NamedTemporaryFile(
-                    suffix='.zip', delete=False
-                ) as temp_zip:
-                    temp_zip_path = temp_zip.name
-
-                with ZipFile(temp_zip_path, 'w') as zipf:
-                    for root, _, files in os.walk(host_src):
-                        for file in files:
-                            file_path = os.path.join(root, file)
-                            arcname = os.path.relpath(
-                                file_path, os.path.dirname(host_src)
-                            )
-                            zipf.write(file_path, arcname)
-
-                upload_data = {'file': open(temp_zip_path, 'rb')}
-            else:
-                upload_data = {'file': open(host_src, 'rb')}
-
-            params = {'destination': sandbox_dest, 'recursive': str(recursive).lower()}
-
-            with self._send_request(
-                'POST',
-                f'{self.runtime_url}/upload_file',
-                is_retry=False,
-                files=upload_data,
-                params=params,
-                timeout=300,
-            ) as response:
-                self.log(
-                    'debug',
-                    f'Copy completed: host:{host_src} -> runtime:{sandbox_dest}. Response: {response.text}',
-                )
-        finally:
-            if recursive:
-                os.unlink(temp_zip_path)
-            self.log(
-                'debug', f'Copy completed: host:{host_src} -> runtime:{sandbox_dest}'
-            )
-
-    def list_files(self, path: str | None = None) -> list[str]:
-        data = {}
-        if path is not None:
-            data['path'] = path
-
-        with self._send_request(
-            'POST',
-            f'{self.runtime_url}/list_files',
-            is_retry=False,
-            json=data,
-            timeout=30,
-        ) as response:
-            response_json = response.json()
-        assert isinstance(response_json, list)
-        return response_json
-
-    def copy_from(self, path: str) -> Path:
-        """Zip all files in the sandbox and return as a stream of bytes."""
-        params = {'path': path}
-        with self._send_request(
-            'GET',
-            f'{self.runtime_url}/download_files',
-            is_retry=False,
-            params=params,
-            stream=True,
-            timeout=30,
-        ) as response:
-            temp_file = tempfile.NamedTemporaryFile(delete=False)
-            for chunk in response.iter_content(chunk_size=8192):
-                if chunk:  # filter out keep-alive new chunks
-                    temp_file.write(chunk)
-            return Path(temp_file.name)
diff --git a/openhands/runtime/impl/runloop/runloop_runtime.py b/openhands/runtime/impl/runloop/runloop_runtime.py
index 368244a03c07..2e51ea409323 100644
--- a/openhands/runtime/impl/runloop/runloop_runtime.py
+++ b/openhands/runtime/impl/runloop/runloop_runtime.py
@@ -1,82 +1,26 @@
 import logging
-import threading
-import time
 from typing import Callable
 
-import requests
 import tenacity
 from runloop_api_client import Runloop
 from runloop_api_client.types import DevboxView
 from runloop_api_client.types.shared_params import LaunchParameters
 
 from openhands.core.config import AppConfig
-from openhands.core.exceptions import (
-    AgentRuntimeNotReadyError,
-    AgentRuntimeUnavailableError,
-)
 from openhands.core.logger import openhands_logger as logger
 from openhands.events import EventStream
-from openhands.runtime.impl.eventstream.eventstream_runtime import EventStreamRuntime
+from openhands.runtime.impl.action_execution.action_execution_client import (
+    ActionExecutionClient,
+)
 from openhands.runtime.plugins import PluginRequirement
 from openhands.runtime.utils.command import get_remote_startup_command
-from openhands.runtime.utils.log_streamer import LogStreamer
-from openhands.runtime.utils.request import send_request
 from openhands.utils.tenacity_stop import stop_if_should_exit
 
 CONTAINER_NAME_PREFIX = 'openhands-runtime-'
 
 
-class RunloopLogStreamer(LogStreamer):
-    """Streams Runloop devbox logs to stdout.
-
-    This class provides a way to stream logs from a Runloop devbox directly to stdout
-    through the provided logging function.
-    """
-
-    def __init__(
-        self,
-        runloop_api_client: Runloop,
-        devbox_id: str,
-        logFn: Callable,
-    ):
-        self.runloop_api_client = runloop_api_client
-        self.devbox_id = devbox_id
-        self.log = logFn
-        self.log_index = 0
-        self._stop_event = threading.Event()
-
-        # Start the stdout streaming thread
-        self.stdout_thread = threading.Thread(target=self._stream_logs)
-        self.stdout_thread.daemon = True
-        self.stdout_thread.start()
-
-    def _stream_logs(self):
-        """Stream logs from the Runloop devbox."""
-        try:
-            while True:
-                raw_logs = self.runloop_api_client.devboxes.logs.list(
-                    self.devbox_id
-                ).logs[self.log_index :]
-                logs = [
-                    log.message
-                    for log in raw_logs
-                    if log.message and log.cmd_id is None
-                ]
-
-                self.log_index += len(raw_logs)
-                if self._stop_event.is_set():
-                    break
-                if logs:
-                    for log_line in logs:
-                        self.log('debug', f'[inside devbox] {log_line}')
-
-                time.sleep(1)
-        except Exception as e:
-            self.log('error', f'Error streaming runloop logs: {e}')
-
-
-class RunloopRuntime(EventStreamRuntime):
-    """The RunloopRuntime class is an EventStreamRuntime that utilizes Runloop Devbox as a runtime environment."""
+class RunloopRuntime(ActionExecutionClient):
+    """The RunloopRuntime class is an ActionExecutionClient that utilizes Runloop Devbox as a runtime environment."""
 
     _sandbox_port: int = 4444
     _vscode_port: int = 4445
@@ -98,10 +42,8 @@ def __init__(
         self.runloop_api_client = Runloop(
             bearer_token=config.runloop_api_key,
         )
-        self.session = requests.Session()
         self.container_name = CONTAINER_NAME_PREFIX + sid
-        self.action_semaphore = threading.Semaphore(1)  # Ensure one action at a time
-        self.init_base_runtime(
+        super().__init__(
             config,
             event_stream,
             sid,
@@ -112,9 +54,11 @@ def __init__(
             headless_mode,
         )
         # Buffer for container logs
-        self.log_streamer: LogStreamer | None = None
         self._vscode_url: str | None = None
 
+    def _get_action_execution_server_host(self):
+        return self.api_url
+
     @tenacity.retry(
         stop=tenacity.stop_after_attempt(120),
         wait=tenacity.wait_fixed(1),
@@ -203,15 +147,11 @@ async def connect(self):
             port=self._sandbox_port,
         )
 
-        # Hook up logs
-        self.log_streamer = RunloopLogStreamer(
-            self.runloop_api_client, self.devbox.id, logger.info
-        )
         self.api_url = tunnel.url
         logger.info(f'Container started. Server url: {self.api_url}')
 
         # End Runloop connect
-        # NOTE: Copied from EventStreamRuntime
+        # NOTE: Copied from DockerRuntime
         logger.info('Waiting for client to become ready...')
         self.send_status_message('STATUS$WAITING_FOR_CLIENT')
         self._wait_until_alive()
@@ -230,27 +170,10 @@ async def connect(self):
         reraise=(ConnectionRefusedError,),
     )
     def _wait_until_alive(self):
-        if not self.log_streamer:
-            raise AgentRuntimeNotReadyError('Runtime client is not ready.')
-        response = send_request(
-            self.session,
-            'GET',
-            f'{self.api_url}/alive',
-            timeout=5,
-        )
-        if response.status_code == 200:
-            return
-        else:
-            msg = f'Action execution API is not alive. Response: {response}'
-            logger.error(msg)
-            raise AgentRuntimeUnavailableError(msg)
+        super().check_if_alive()
 
     def close(self, rm_all_containers: bool | None = True):
-        if self.log_streamer:
-            self.log_streamer.close()
-
-        if self.session:
-            self.session.close()
+        super().close()
 
         if self.attach_to_existing:
             return
@@ -260,42 +183,24 @@ def close(self, rm_all_containers: bool | None = True):
 
     @property
     def vscode_url(self) -> str | None:
-        if self.vscode_enabled and self.devbox and self.devbox.status == 'running':
-            if self._vscode_url is not None:
-                return self._vscode_url
-
-            try:
-                with send_request(
-                    self.session,
-                    'GET',
-                    f'{self.api_url}/vscode/connection_token',
-                    timeout=10,
-                ) as response:
-                    response_json = response.json()
-                    assert isinstance(response_json, dict)
-                    if response_json['token'] is None:
-                        return None
-                    token = response_json['token']
-
-                self._vscode_url = (
-                    self.runloop_api_client.devboxes.create_tunnel(
-                        id=self.devbox.id,
-                        port=self._vscode_port,
-                    ).url
-                    + f'/?tkn={token}&folder={self.config.workspace_mount_path_in_sandbox}'
-                )
+        if self._vscode_url is not None:  # cached value
+            return self._vscode_url
+        token = super().get_vscode_token()
+        if not token:
+            return None
+        if not self.devbox:
+            return None
+        self._vscode_url = (
+            self.runloop_api_client.devboxes.create_tunnel(
+                id=self.devbox.id,
+                port=self._vscode_port,
+            ).url
+            + f'/?tkn={token}&folder={self.config.workspace_mount_path_in_sandbox}'
+        )
 
-                self.log(
-                    'debug',
-                    f'VSCode URL: {self._vscode_url}',
-                )
+        self.log(
+            'debug',
+            f'VSCode URL: {self._vscode_url}',
+        )
 
-                return self._vscode_url
-            except Exception as e:
-                self.log(
-                    'error',
-                    f'Failed to create vscode tunnel {e}',
-                )
-                return None
-        else:
-            return None
+        return self._vscode_url
diff --git a/openhands/runtime/plugins/agent_skills/utils/config.py b/openhands/runtime/plugins/agent_skills/utils/config.py
index f0084c540393..2b0f0f4ead26 100644
--- a/openhands/runtime/plugins/agent_skills/utils/config.py
+++ b/openhands/runtime/plugins/agent_skills/utils/config.py
@@ -5,9 +5,9 @@
 
 # ==================================================================================================
 # OPENAI
-# TODO: Move this to EventStream Actions when EventStreamRuntime is fully implemented
+# TODO: Move this to EventStream Actions when DockerRuntime is fully implemented
 # NOTE: we need to get env vars inside functions because they will be set in IPython
-# AFTER the agentskills is imported (the case for EventStreamRuntime)
+# AFTER the agentskills is imported (the case for DockerRuntime)
 # ==================================================================================================
 def _get_openai_api_key():
     return os.getenv('OPENAI_API_KEY', os.getenv('SANDBOX_ENV_OPENAI_API_KEY', ''))
diff --git a/openhands/server/config/openhands_config.py b/openhands/server/config/openhands_config.py
index 80a577494b53..c4d472e06b85 100644
--- a/openhands/server/config/openhands_config.py
+++ b/openhands/server/config/openhands_config.py
@@ -16,7 +16,10 @@ class OpenhandsConfig(OpenhandsConfigInterface):
         'openhands.server.middleware.AttachConversationMiddleware'
     )
     settings_store_class: str = (
-        'openhands.storage.file_settings_store.FileSettingsStore'
+        'openhands.storage.settings.file_settings_store.FileSettingsStore'
+    )
+    conversation_store_class: str = (
+        'openhands.storage.conversation.file_conversation_store.FileConversationStore'
     )
 
     def verify_config(self):
diff --git a/openhands/server/data_models/conversation_metadata.py b/openhands/server/data_models/conversation_metadata.py
new file mode 100644
index 000000000000..8aa43a623bd9
--- /dev/null
+++ b/openhands/server/data_models/conversation_metadata.py
@@ -0,0 +1,8 @@
+from dataclasses import dataclass
+
+
+@dataclass
+class ConversationMetadata:
+    conversation_id: str
+    github_user_id: str
+    selected_repository: str | None
diff --git a/openhands/server/listen_socket.py b/openhands/server/listen_socket.py
index 5a5e82757e51..4bd7b8071960 100644
--- a/openhands/server/listen_socket.py
+++ b/openhands/server/listen_socket.py
@@ -4,6 +4,7 @@
 from socketio.exceptions import ConnectionRefusedError
 
 from openhands.core.logger import openhands_logger as logger
+from openhands.core.schema.agent import AgentState
 from openhands.events.action import (
     NullAction,
 )
@@ -13,13 +14,10 @@
 from openhands.events.observation.agent import AgentStateChangedObservation
 from openhands.events.serialization import event_to_dict
 from openhands.events.stream import AsyncEventStreamWrapper
-from openhands.server.routes.settings import SettingsStoreImpl
+from openhands.server.routes.settings import ConversationStoreImpl, SettingsStoreImpl
 from openhands.server.session.manager import ConversationDoesNotExistError
 from openhands.server.shared import config, openhands_config, session_manager, sio
 from openhands.server.types import AppMode
-from openhands.storage.conversation.conversation_store import (
-    ConversationStore,
-)
 from openhands.utils.async_utils import call_sync_from_async
 
 
@@ -44,7 +42,9 @@ async def connect(connection_id: str, environ, auth):
 
         logger.info(f'User {user_id} is connecting to conversation {conversation_id}')
 
-        conversation_store = await ConversationStore.get_instance(config)
+        conversation_store = await ConversationStoreImpl.get_instance(
+            config, github_token
+        )
         metadata = await conversation_store.get_metadata(conversation_id)
         if metadata.github_user_id != user_id:
             logger.error(
@@ -80,10 +80,11 @@ async def connect(connection_id: str, environ, auth):
         ):
             continue
         elif isinstance(event, AgentStateChangedObservation):
+            if event.agent_state == AgentState.INIT:
+                await sio.emit('oh_event', event_to_dict(event), to=connection_id)
             agent_state_changed = event
-            continue
-        await sio.emit('oh_event', event_to_dict(event), to=connection_id)
-
+        else:
+            await sio.emit('oh_event', event_to_dict(event), to=connection_id)
     if agent_state_changed:
         await sio.emit('oh_event', event_to_dict(agent_state_changed), to=connection_id)
 
diff --git a/openhands/server/routes/new_conversation.py b/openhands/server/routes/new_conversation.py
index 8dd75eb63249..6b16698d3a73 100644
--- a/openhands/server/routes/new_conversation.py
+++ b/openhands/server/routes/new_conversation.py
@@ -6,13 +6,10 @@
 from pydantic import BaseModel
 
 from openhands.core.logger import openhands_logger as logger
-from openhands.server.routes.settings import SettingsStoreImpl
+from openhands.server.data_models.conversation_metadata import ConversationMetadata
+from openhands.server.routes.settings import ConversationStoreImpl, SettingsStoreImpl
 from openhands.server.session.conversation_init_data import ConversationInitData
 from openhands.server.shared import config, session_manager
-from openhands.storage.conversation.conversation_store import (
-    ConversationMetadata,
-    ConversationStore,
-)
 from openhands.utils.async_utils import call_sync_from_async
 
 app = APIRouter(prefix='/api')
@@ -41,15 +38,12 @@ async def new_conversation(request: Request, data: InitSessionRequest):
     session_init_args: dict = {}
     if settings:
         session_init_args = {**settings.__dict__, **session_init_args}
-    if data.args:
-        for key, value in data.args.items():
-            session_init_args[key.lower()] = value
 
     session_init_args['github_token'] = github_token
     session_init_args['selected_repository'] = data.selected_repository
     conversation_init_data = ConversationInitData(**session_init_args)
 
-    conversation_store = await ConversationStore.get_instance(config)
+    conversation_store = await ConversationStoreImpl.get_instance(config, github_token)
 
     conversation_id = uuid.uuid4().hex
     while await conversation_store.exists(conversation_id):
diff --git a/openhands/server/routes/settings.py b/openhands/server/routes/settings.py
index e5eaa7035ec7..81637e8e45ef 100644
--- a/openhands/server/routes/settings.py
+++ b/openhands/server/routes/settings.py
@@ -4,12 +4,17 @@
 from openhands.core.logger import openhands_logger as logger
 from openhands.server.settings import Settings
 from openhands.server.shared import config, openhands_config
-from openhands.storage.settings_store import SettingsStore
+from openhands.storage.conversation.conversation_store import ConversationStore
+from openhands.storage.settings.settings_store import SettingsStore
 from openhands.utils.import_utils import get_impl
 
 app = APIRouter(prefix='/api')
 
 SettingsStoreImpl = get_impl(SettingsStore, openhands_config.settings_store_class)  # type: ignore
+ConversationStoreImpl = get_impl(
+    ConversationStore,  # type: ignore
+    openhands_config.conversation_store_class,
+)
 
 
 @app.get('/settings')
@@ -22,9 +27,14 @@ async def load_settings(
     try:
         settings_store = await SettingsStoreImpl.get_instance(config, github_token)
         settings = await settings_store.load()
-        if settings:
-            # For security reasons we don't ever send the api key to the client
-            settings.llm_api_key = None
+        if not settings:
+            return JSONResponse(
+                status_code=status.HTTP_404_NOT_FOUND,
+                content={'error': 'Settings not found'},
+            )
+
+        # For security reasons we don't ever send the api key to the client
+        settings.llm_api_key = 'SET' if settings.llm_api_key else None
         return settings
     except Exception as e:
         logger.warning(f'Invalid token: {e}')
@@ -45,11 +55,13 @@ async def store_settings(
     try:
         settings_store = await SettingsStoreImpl.get_instance(config, github_token)
         existing_settings = await settings_store.load()
+
         if existing_settings:
-            settings = Settings(**{**existing_settings.__dict__, **settings.__dict__})
+            # LLM key isn't on the frontend, so we need to keep it if unset
             if settings.llm_api_key is None:
                 settings.llm_api_key = existing_settings.llm_api_key
         await settings_store.store(settings)
+
         return JSONResponse(
             status_code=status.HTTP_200_OK,
             content={'message': 'Settings stored'},
diff --git a/openhands/server/session/session.py b/openhands/server/session/session.py
index da412a435c40..2cba6657057e 100644
--- a/openhands/server/session/session.py
+++ b/openhands/server/session/session.py
@@ -85,11 +85,9 @@ async def initialize_agent(
         # override default LLM config
 
         default_llm_config = self.config.get_llm_config()
-        default_llm_config.model = settings.llm_model or default_llm_config.model
-        default_llm_config.api_key = settings.llm_api_key or default_llm_config.api_key
-        default_llm_config.base_url = (
-            settings.llm_base_url or default_llm_config.base_url
-        )
+        default_llm_config.model = settings.llm_model or ''
+        default_llm_config.api_key = settings.llm_api_key
+        default_llm_config.base_url = settings.llm_base_url
 
         # TODO: override other LLM config & agent config groups (#2075)
 
diff --git a/openhands/storage/conversation/conversation_store.py b/openhands/storage/conversation/conversation_store.py
index 461c1a98b707..41d9452ab8f8 100644
--- a/openhands/storage/conversation/conversation_store.py
+++ b/openhands/storage/conversation/conversation_store.py
@@ -1,43 +1,31 @@
-import json
-from dataclasses import dataclass
-
-from openhands.core.config.app_config import AppConfig
-from openhands.storage import get_file_store
-from openhands.storage.files import FileStore
-from openhands.storage.locations import get_conversation_metadata_filename
-from openhands.utils.async_utils import call_sync_from_async
+from __future__ import annotations
 
+from abc import ABC, abstractmethod
 
-@dataclass
-class ConversationMetadata:
-    conversation_id: str
-    github_user_id: str
-    selected_repository: str | None
+from openhands.core.config.app_config import AppConfig
+from openhands.server.data_models.conversation_metadata import ConversationMetadata
 
 
-@dataclass
-class ConversationStore:
-    file_store: FileStore
+class ConversationStore(ABC):
+    """
+    Abstract storage for conversation metadata. May or may not support multiple users depending on the environment.
+    """
 
+    @abstractmethod
     async def save_metadata(self, metadata: ConversationMetadata):
-        json_str = json.dumps(metadata.__dict__)
-        path = get_conversation_metadata_filename(metadata.conversation_id)
-        await call_sync_from_async(self.file_store.write, path, json_str)
+        """Store the given conversation metadata."""
 
+    @abstractmethod
     async def get_metadata(self, conversation_id: str) -> ConversationMetadata:
-        path = get_conversation_metadata_filename(conversation_id)
-        json_str = await call_sync_from_async(self.file_store.read, path)
-        return ConversationMetadata(**json.loads(json_str))
+        """Load the metadata stored for `conversation_id`."""
 
+    @abstractmethod
     async def exists(self, conversation_id: str) -> bool:
-        path = get_conversation_metadata_filename(conversation_id)
-        try:
-            await call_sync_from_async(self.file_store.read, path)
-            return True
-        except FileNotFoundError:
-            return False
+        """Check whether a conversation with `conversation_id` exists."""
 
     @classmethod
-    async def get_instance(cls, config: AppConfig):
-        file_store = get_file_store(config.file_store, config.file_store_path)
-        return ConversationStore(file_store)
+    @abstractmethod
+    async def get_instance(
+        cls, config: AppConfig, token: str | None
+    ) -> ConversationStore:
+        """Get a store for the user represented by `token`, which may be None."""
diff --git a/openhands/storage/conversation/file_conversation_store.py b/openhands/storage/conversation/file_conversation_store.py
new file mode 100644
index 000000000000..b77555fcd51e
--- /dev/null
+++ b/openhands/storage/conversation/file_conversation_store.py
@@ -0,0 +1,59 @@
+from __future__ import annotations
+
+import json
+from dataclasses import dataclass
+
+from openhands.core.config.app_config import AppConfig
+from openhands.storage import get_file_store
+from openhands.storage.conversation.conversation_store import ConversationStore
+from openhands.server.data_models.conversation_metadata import ConversationMetadata
+from openhands.storage.files import FileStore
+from openhands.storage.locations import get_conversation_metadata_filename
+from openhands.utils.async_utils import call_sync_from_async
+
+
+@dataclass
+class FileConversationStore(ConversationStore):
+    """Conversation metadata store backed by a FileStore.
+
+    Each conversation's metadata is written as one JSON document.
+    """
+
+    file_store: FileStore
+
+    async def save_metadata(self, metadata: ConversationMetadata):
+        """Serialize `metadata` to JSON and write it to its metadata file."""
+        json_str = json.dumps(metadata.__dict__)
+        path = self.get_conversation_metadata_filename(metadata.conversation_id)
+        await call_sync_from_async(self.file_store.write, path, json_str)
+
+    async def get_metadata(self, conversation_id: str) -> ConversationMetadata:
+        """Read and deserialize the metadata stored for `conversation_id`."""
+        path = self.get_conversation_metadata_filename(conversation_id)
+        json_str = await call_sync_from_async(self.file_store.read, path)
+        return ConversationMetadata(**json.loads(json_str))
+
+    async def exists(self, conversation_id: str) -> bool:
+        """Return True if the metadata file for `conversation_id` can be read."""
+        path = self.get_conversation_metadata_filename(conversation_id)
+        try:
+            await call_sync_from_async(self.file_store.read, path)
+        except FileNotFoundError:
+            return False
+        return True
+
+    def get_conversation_metadata_filename(self, conversation_id: str) -> str:
+        """Return the file store path of the metadata for `conversation_id`."""
+        return get_conversation_metadata_filename(conversation_id)
+
+    @classmethod
+    async def get_instance(
+        cls, config: AppConfig, token: str | None
+    ) -> FileConversationStore:
+        """Create a store from the file store settings in `config`.
+
+        `token` is accepted for interface compatibility and is not used here.
+        """
+        file_store = get_file_store(config.file_store, config.file_store_path)
+        # Build via `cls` so a subclass gets an instance of its own type
+        return cls(file_store)
diff --git a/openhands/storage/file_settings_store.py b/openhands/storage/settings/file_settings_store.py
similarity index 94%
rename from openhands/storage/file_settings_store.py
rename to openhands/storage/settings/file_settings_store.py
index b3cb9bb8ea9b..413376759c8d 100644
--- a/openhands/storage/file_settings_store.py
+++ b/openhands/storage/settings/file_settings_store.py
@@ -7,7 +7,7 @@
 from openhands.server.settings import Settings
 from openhands.storage import get_file_store
 from openhands.storage.files import FileStore
-from openhands.storage.settings_store import SettingsStore
+from openhands.storage.settings.settings_store import SettingsStore
 from openhands.utils.async_utils import call_sync_from_async
 
 
diff --git a/openhands/storage/settings_store.py b/openhands/storage/settings/settings_store.py
similarity index 100%
rename from openhands/storage/settings_store.py
rename to openhands/storage/settings/settings_store.py
diff --git a/poetry.lock b/poetry.lock
index c22cf67a563a..2cd8ae911b76 100644
--- a/poetry.lock
+++ b/poetry.lock
@@ -553,17 +553,17 @@ files = [
 
 [[package]]
 name = "boto3"
-version = "1.35.88"
+version = "1.35.90"
 description = "The AWS SDK for Python"
 optional = false
 python-versions = ">=3.8"
 files = [
-    {file = "boto3-1.35.88-py3-none-any.whl", hash = "sha256:7bc9b27ad87607256470c70a86c8b8c319ddd6ecae89cc191687cbf8ccb7b6a6"},
-    {file = "boto3-1.35.88.tar.gz", hash = "sha256:43c6a7a70bb226770a82a601870136e3bb3bf2808f4576ab5b9d7d140dbf1323"},
+    {file = "boto3-1.35.90-py3-none-any.whl", hash = "sha256:b0874233057995a8f0c813f5b45a36c09630e74c43d7a7c64db2feef2915d493"},
+    {file = "boto3-1.35.90.tar.gz", hash = "sha256:dc56caaaab2157a4bfc109c88b50cd032f3ac66c06d17f8ee335b798eaf53e5c"},
 ]
 
 [package.dependencies]
-botocore = ">=1.35.88,<1.36.0"
+botocore = ">=1.35.90,<1.36.0"
 jmespath = ">=0.7.1,<2.0.0"
 s3transfer = ">=0.10.0,<0.11.0"
 
@@ -572,13 +572,13 @@ crt = ["botocore[crt] (>=1.21.0,<2.0a0)"]
 
 [[package]]
 name = "botocore"
-version = "1.35.88"
+version = "1.35.90"
 description = "Low-level, data-driven core of boto 3."
 optional = false
 python-versions = ">=3.8"
 files = [
-    {file = "botocore-1.35.88-py3-none-any.whl", hash = "sha256:e60cc3fbe8d7a10f70e7e852d76be2b29f23ead418a5899d366ea32b1eacb5a5"},
-    {file = "botocore-1.35.88.tar.gz", hash = "sha256:58dcd9a464c354b8c6c25261d8de830d175d9739eae568bf0c52e57116fb03c6"},
+    {file = "botocore-1.35.90-py3-none-any.whl", hash = "sha256:51dcbe1b32e2ac43dac17091f401a00ce5939f76afe999081802009cce1e92e4"},
+    {file = "botocore-1.35.90.tar.gz", hash = "sha256:f007f58e8e3c1ad0412a6ddfae40ed92a7bca571c068cb959902bcf107f2ae48"},
 ]
 
 [package.dependencies]
@@ -3739,13 +3739,13 @@ types-tqdm = "*"
 
 [[package]]
 name = "litellm"
-version = "1.55.12"
+version = "1.56.4"
 description = "Library to easily interface with LLM API providers"
 optional = false
 python-versions = "!=2.7.*,!=3.0.*,!=3.1.*,!=3.2.*,!=3.3.*,!=3.4.*,!=3.5.*,!=3.6.*,!=3.7.*,>=3.8"
 files = [
-    {file = "litellm-1.55.12-py3-none-any.whl", hash = "sha256:d034c3d6cdd5b8dd2c56f1100eb14f41f920b7673ac943d38fb2d7155ae5774b"},
-    {file = "litellm-1.55.12.tar.gz", hash = "sha256:6d93025ebf29ae3d6929a90c44d648ba6804fdbc1bb1c3a72d7dddd08f6229dc"},
+    {file = "litellm-1.56.4-py3-none-any.whl", hash = "sha256:699a8db46f7de045069a77c435e13244b5fdaf5df1c8cb5e6ad675ef7e104ccd"},
+    {file = "litellm-1.56.4.tar.gz", hash = "sha256:2808ca21878d200f7676a3d11e5bf2b5e3349ae504628f279cd7297c7dbd2038"},
 ]
 
 [package.dependencies]
@@ -3763,7 +3763,7 @@ tokenizers = "*"
 
 [package.extras]
 extra-proxy = ["azure-identity (>=1.15.0,<2.0.0)", "azure-keyvault-secrets (>=4.8.0,<5.0.0)", "google-cloud-kms (>=2.21.3,<3.0.0)", "prisma (==0.11.0)", "resend (>=0.8.0,<0.9.0)"]
-proxy = ["PyJWT (>=2.8.0,<3.0.0)", "apscheduler (>=3.10.4,<4.0.0)", "backoff", "cryptography (>=42.0.5,<43.0.0)", "fastapi (>=0.111.0,<0.112.0)", "fastapi-sso (>=0.10.0,<0.11.0)", "gunicorn (>=22.0.0,<23.0.0)", "orjson (>=3.9.7,<4.0.0)", "pynacl (>=1.5.0,<2.0.0)", "python-multipart (>=0.0.9,<0.0.10)", "pyyaml (>=6.0.1,<7.0.0)", "rq", "uvicorn (>=0.22.0,<0.23.0)"]
+proxy = ["PyJWT (>=2.8.0,<3.0.0)", "apscheduler (>=3.10.4,<4.0.0)", "backoff", "cryptography (>=43.0.1,<44.0.0)", "fastapi (>=0.115.5,<0.116.0)", "fastapi-sso (>=0.16.0,<0.17.0)", "gunicorn (>=22.0.0,<23.0.0)", "orjson (>=3.9.7,<4.0.0)", "pynacl (>=1.5.0,<2.0.0)", "python-multipart (>=0.0.18,<0.0.19)", "pyyaml (>=6.0.1,<7.0.0)", "rq", "uvicorn (>=0.22.0,<0.23.0)"]
 
 [[package]]
 name = "llama-cloud"
@@ -4614,12 +4614,12 @@ type = ["mypy (==1.11.2)"]
 
 [[package]]
 name = "modal"
-version = "0.70.0"
+version = "0.70.2"
 description = "Python client library for Modal"
 optional = false
 python-versions = ">=3.9"
 files = [
-    {file = "modal-0.70.0-py3-none-any.whl", hash = "sha256:034d46315bfc42d38000390a0a09529e7f5d647bb0ceea22cb1cccc23d0708f7"},
+    {file = "modal-0.70.2-py3-none-any.whl", hash = "sha256:14cd112313ab8f364fe6252795b872805ad6c91945e1216d0984dd43d89b2f57"},
 ]
 
 [package.dependencies]
@@ -7036,13 +7036,13 @@ XlsxWriter = ">=0.5.7"
 
 [[package]]
 name = "python-socketio"
-version = "5.12.0"
+version = "5.12.1"
 description = "Socket.IO server and client for Python"
 optional = false
 python-versions = ">=3.8"
 files = [
-    {file = "python_socketio-5.12.0-py3-none-any.whl", hash = "sha256:50fe22fd2b0aa634df3e74489e42217b09af2fb22eee45f2c006df36d1d08cb9"},
-    {file = "python_socketio-5.12.0.tar.gz", hash = "sha256:39b55bff4ef6ac5c39b8bbc38fa61962e22e15349b038c1ca7ee2e18824e06dc"},
+    {file = "python_socketio-5.12.1-py3-none-any.whl", hash = "sha256:24a0ea7cfff0e021eb28c68edbf7914ee4111bdf030b95e4d250c4dc9af7a386"},
+    {file = "python_socketio-5.12.1.tar.gz", hash = "sha256:0299ff1f470b676c09c1bfab1dead25405077d227b2c13cf217a34dadc68ba9c"},
 ]
 
 [package.dependencies]
diff --git a/pyproject.toml b/pyproject.toml
index 4a4131e325b5..155f62b8c764 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -100,6 +100,7 @@ reportlab = "*"
 [tool.coverage.run]
 concurrency = ["gevent"]
 
+
 [tool.poetry.group.runtime.dependencies]
 jupyterlab = "*"
 notebook = "*"
@@ -129,6 +130,7 @@ ignore = ["D1"]
 [tool.ruff.lint.pydocstyle]
 convention = "google"
 
+
 [tool.poetry.group.evaluation.dependencies]
 streamlit = "*"
 whatthepatch = "*"
diff --git a/tests/runtime/conftest.py b/tests/runtime/conftest.py
index aa08a2cb7333..062fc2ed9fa1 100644
--- a/tests/runtime/conftest.py
+++ b/tests/runtime/conftest.py
@@ -12,7 +12,7 @@
 from openhands.core.logger import openhands_logger as logger
 from openhands.events import EventStream
 from openhands.runtime.base import Runtime
-from openhands.runtime.impl.eventstream.eventstream_runtime import EventStreamRuntime
+from openhands.runtime.impl.docker.docker_runtime import DockerRuntime
 from openhands.runtime.impl.remote.remote_runtime import RemoteRuntime
 from openhands.runtime.impl.runloop.runloop_runtime import RunloopRuntime
 from openhands.runtime.plugins import AgentSkillsRequirement, JupyterRequirement
@@ -20,7 +20,7 @@
 from openhands.utils.async_utils import call_async_from_sync
 
 TEST_IN_CI = os.getenv('TEST_IN_CI', 'False').lower() in ['true', '1', 'yes']
-TEST_RUNTIME = os.getenv('TEST_RUNTIME', 'eventstream').lower()
+TEST_RUNTIME = os.getenv('TEST_RUNTIME', 'docker').lower()
 RUN_AS_OPENHANDS = os.getenv('RUN_AS_OPENHANDS', 'True').lower() in ['true', '1', 'yes']
 test_mount_path = ''
 project_dir = os.path.dirname(
@@ -62,7 +62,7 @@ def _remove_folder(folder: str) -> bool:
 
 
 def _close_test_runtime(runtime: Runtime) -> None:
-    if isinstance(runtime, EventStreamRuntime):
+    if isinstance(runtime, DockerRuntime):
         runtime.close(rm_all_containers=False)
     else:
         runtime.close()
@@ -129,8 +129,8 @@ def cleanup():
 # Depending on TEST_RUNTIME, feed the appropriate box class(es) to the test.
 def get_runtime_classes() -> list[type[Runtime]]:
     runtime = TEST_RUNTIME
-    if runtime.lower() == 'eventstream':
-        return [EventStreamRuntime]
+    if runtime.lower() == 'docker' or runtime.lower() == 'eventstream':
+        return [DockerRuntime]
     elif runtime.lower() == 'remote':
         return [RemoteRuntime]
     elif runtime.lower() == 'runloop':
@@ -173,7 +173,7 @@ def runtime_cls(request):
 
 
 # TODO: We will change this to `run_as_user` when `ServerRuntime` is deprecated.
-# since `EventStreamRuntime` supports running as an arbitrary user.
+# since `DockerRuntime` supports running as an arbitrary user.
 @pytest.fixture(scope='module', params=get_run_as_openhands())
 def run_as_openhands(request):
     time.sleep(1)
diff --git a/tests/unit/test_codeact_agent.py b/tests/unit/test_codeact_agent.py
index bccd3c1190d3..bc5d772442ab 100644
--- a/tests/unit/test_codeact_agent.py
+++ b/tests/unit/test_codeact_agent.py
@@ -3,14 +3,37 @@
 import pytest
 
 from openhands.agenthub.codeact_agent.codeact_agent import CodeActAgent
+from openhands.agenthub.codeact_agent.function_calling import (
+    _BROWSER_DESCRIPTION,
+    _BROWSER_TOOL_DESCRIPTION,
+    BrowserTool,
+    CmdRunTool,
+    IPythonTool,
+    LLMBasedFileEditTool,
+    StrReplaceEditorTool,
+    WebReadTool,
+    get_tools,
+    response_to_actions,
+)
 from openhands.core.config import AgentConfig, LLMConfig
-from openhands.core.message import TextContent
+from openhands.core.exceptions import FunctionCallNotExistsError
+from openhands.core.message import ImageContent, TextContent
+from openhands.events.action import (
+    AgentFinishAction,
+    CmdRunAction,
+    MessageAction,
+)
+from openhands.events.event import EventSource, FileEditSource, FileReadSource
+from openhands.events.observation.browse import BrowserOutputObservation
 from openhands.events.observation.commands import (
     CmdOutputObservation,
     IPythonRunCellObservation,
 )
 from openhands.events.observation.delegate import AgentDelegateObservation
 from openhands.events.observation.error import ErrorObservation
+from openhands.events.observation.files import FileEditObservation, FileReadObservation
+from openhands.events.observation.reject import UserRejectObservation
+from openhands.events.tool import ToolCallMetadata
 from openhands.llm.llm import LLM
 
 
@@ -102,3 +125,387 @@ def test_unknown_observation_message(agent: CodeActAgent):
 
     with pytest.raises(ValueError, match='Unknown observation type'):
         agent.get_observation_message(obs, tool_call_id_to_message={})
+
+
+def test_file_edit_observation_message(agent: CodeActAgent):
+    """An LLM-based file edit observation yields one user text message."""
+    agent.config.function_calling = False
+    edit_obs = FileEditObservation(
+        path='/test/file.txt',
+        prev_exist=True,
+        old_content='old content',
+        new_content='new content',
+        content='diff content',
+        impl_source=FileEditSource.LLM_BASED_EDIT,
+    )
+
+    messages = agent.get_observation_message(edit_obs, tool_call_id_to_message={})
+    assert len(messages) == 1
+    message = messages[0]
+    assert message is not None
+    assert message.role == 'user'
+    assert len(message.content) == 1
+    assert isinstance(message.content[0], TextContent)
+    assert '[Existing file /test/file.txt is edited with' in message.content[0].text
+
+
+def test_file_read_observation_message(agent: CodeActAgent):
+    """A file read observation is passed through as one user text message."""
+    agent.config.function_calling = False
+    read_obs = FileReadObservation(
+        path='/test/file.txt',
+        content='File content',
+        impl_source=FileReadSource.DEFAULT,
+    )
+
+    messages = agent.get_observation_message(read_obs, tool_call_id_to_message={})
+    assert len(messages) == 1
+    message = messages[0]
+    assert message is not None
+    assert message.role == 'user'
+    assert len(message.content) == 1
+    assert isinstance(message.content[0], TextContent)
+    assert message.content[0].text == 'File content'
+
+
+def test_browser_output_observation_message(agent: CodeActAgent):
+    """A browser observation yields one user message that reports the URL."""
+    agent.config.function_calling = False
+    page_obs = BrowserOutputObservation(
+        url='http://example.com',
+        trigger_by_action='browse',
+        screenshot='',
+        content='Page loaded',
+        error=False,
+    )
+
+    messages = agent.get_observation_message(page_obs, tool_call_id_to_message={})
+    assert len(messages) == 1
+    message = messages[0]
+    assert message is not None
+    assert message.role == 'user'
+    assert len(message.content) == 1
+    assert isinstance(message.content[0], TextContent)
+    assert '[Current URL: http://example.com]' in message.content[0].text
+
+
+def test_user_reject_observation_message(agent: CodeActAgent):
+    """A user rejection is relayed as one user message with a rejection note."""
+    agent.config.function_calling = False
+    reject_obs = UserRejectObservation('Action rejected')
+
+    messages = agent.get_observation_message(reject_obs, tool_call_id_to_message={})
+    assert len(messages) == 1
+    message = messages[0]
+    assert message is not None
+    assert message.role == 'user'
+    assert len(message.content) == 1
+    assert isinstance(message.content[0], TextContent)
+    assert 'Action rejected' in message.content[0].text
+    assert '[Last action has been rejected by the user]' in message.content[0].text
+
+
+def test_function_calling_observation_message(agent: CodeActAgent):
+    """Tool-call observations yield no direct message under function calling."""
+    agent.config.function_calling = True
+    llm_response = {
+        'id': 'mock_id',
+        'total_calls_in_response': 1,
+        'choices': [{'message': {'content': 'Task completed'}}],
+    }
+    cmd_obs = CmdOutputObservation(
+        command='echo hello',
+        content='Command output',
+        command_id=1,
+        exit_code=0,
+    )
+    cmd_obs.tool_call_metadata = ToolCallMetadata(
+        tool_call_id='123',
+        function_name='execute_bash',
+        model_response=llm_response,
+        total_calls_in_response=1,
+    )
+    messages = agent.get_observation_message(cmd_obs, tool_call_id_to_message={})
+    assert len(messages) == 0  # No direct message when using function calling
+
+
+def test_message_action_with_image(agent: CodeActAgent):
+    """An agent message with an image maps to text plus image content."""
+    image_action = MessageAction(
+        content='Message with image',
+        image_urls=['http://example.com/image.jpg'],
+    )
+    image_action._source = EventSource.AGENT
+
+    messages = agent.get_action_message(image_action, {})
+    assert len(messages) == 1
+    message = messages[0]
+    assert message is not None
+    assert message.role == 'assistant'
+    assert len(message.content) == 2
+    assert isinstance(message.content[0], TextContent)
+    assert isinstance(message.content[1], ImageContent)
+    assert message.content[0].text == 'Message with image'
+    assert message.content[1].image_urls == ['http://example.com/image.jpg']
+
+
+def test_user_cmd_action_message(agent: CodeActAgent):
+    """A command run by the user is reported as one user text message."""
+    cmd_action = CmdRunAction(command='ls -l')
+    cmd_action._source = EventSource.USER
+
+    messages = agent.get_action_message(cmd_action, {})
+    assert len(messages) == 1
+    message = messages[0]
+    assert message is not None
+    assert message.role == 'user'
+    assert len(message.content) == 1
+    assert isinstance(message.content[0], TextContent)
+    assert 'User executed the command' in message.content[0].text
+    assert 'ls -l' in message.content[0].text
+
+
+def test_agent_finish_action_with_tool_metadata(agent: CodeActAgent):
+    """The finish message joins the action thought with the response content."""
+    llm_response = {
+        'id': 'mock_id',
+        'total_calls_in_response': 1,
+        'choices': [{'message': {'content': 'Task completed'}}],
+    }
+
+    finish_action = AgentFinishAction(thought='Initial thought')
+    finish_action._source = EventSource.AGENT
+    finish_action.tool_call_metadata = ToolCallMetadata(
+        tool_call_id='123',
+        function_name='finish',
+        model_response=llm_response,
+        total_calls_in_response=1,
+    )
+
+    messages = agent.get_action_message(finish_action, {})
+    assert len(messages) == 1
+    message = messages[0]
+    assert message is not None
+    assert message.role == 'assistant'
+    assert len(message.content) == 1
+    assert isinstance(message.content[0], TextContent)
+    assert 'Initial thought\nTask completed' in message.content[0].text
+
+
+def test_reset(agent: CodeActAgent):
+    """reset() discards any queued pending actions."""
+    # Seed the agent with one queued action
+    queued = MessageAction(content='test')
+    queued._source = EventSource.AGENT
+    agent.pending_actions.append(queued)
+
+    agent.reset()
+
+    # Nothing may remain queued after the reset
+    assert len(agent.pending_actions) == 0
+
+
+def test_step_with_pending_actions(agent: CodeActAgent):
+    """step() hands back the queued action and leaves the queue empty."""
+    queued = MessageAction(content='test')
+    queued._source = EventSource.AGENT
+    agent.pending_actions.append(queued)
+
+    # A bare Mock stands in for the state argument
+    returned = agent.step(Mock())
+    assert returned == queued
+    assert len(agent.pending_actions) == 0
+
+
+def test_get_tools_default():
+    """With every option on, the bash, IPython, edit and web tools are offered."""
+    offered = get_tools(
+        codeact_enable_jupyter=True,
+        codeact_enable_llm_editor=True,
+        codeact_enable_browsing=True,
+    )
+    assert len(offered) > 0
+
+    names = [entry['function']['name'] for entry in offered]
+    assert 'execute_bash' in names
+    assert 'execute_ipython_cell' in names
+    assert 'edit_file' in names
+    assert 'web_read' in names
+
+
+def test_get_tools_with_options():
+    """The optional tools appear only when their feature flag is enabled."""
+    enabled = get_tools(
+        codeact_enable_browsing=True,
+        codeact_enable_jupyter=True,
+        codeact_enable_llm_editor=True,
+    )
+    enabled_names = [entry['function']['name'] for entry in enabled]
+    assert 'browser' in enabled_names
+    assert 'execute_ipython_cell' in enabled_names
+    assert 'edit_file' in enabled_names
+
+    # With every flag off, none of the optional tools may be offered
+    disabled = get_tools(
+        codeact_enable_browsing=False,
+        codeact_enable_jupyter=False,
+        codeact_enable_llm_editor=False,
+    )
+    disabled_names = [entry['function']['name'] for entry in disabled]
+    assert 'browser' not in disabled_names
+    assert 'execute_ipython_cell' not in disabled_names
+    assert 'edit_file' not in disabled_names
+
+
+def test_cmd_run_tool():
+    spec = CmdRunTool['function']
+    assert (CmdRunTool['type'], spec['name']) == ('function', 'execute_bash')
+    assert 'command' in spec['parameters']['properties']
+    assert spec['parameters']['required'] == ['command']
+
+
+def test_ipython_tool():
+    spec = IPythonTool['function']
+    assert (IPythonTool['type'], spec['name']) == ('function', 'execute_ipython_cell')
+    assert 'code' in spec['parameters']['properties']
+    assert spec['parameters']['required'] == ['code']
+
+
+def test_llm_based_file_edit_tool():
+    """The LLM edit tool exposes path/content/start/end parameters."""
+    spec = LLMBasedFileEditTool['function']
+    assert LLMBasedFileEditTool['type'] == 'function'
+    assert spec['name'] == 'edit_file'
+
+    properties = spec['parameters']['properties']
+    assert 'path' in properties
+    assert 'content' in properties
+    assert 'start' in properties
+    assert 'end' in properties
+
+    # Only the target path and the new content are mandatory
+    assert spec['parameters']['required'] == ['path', 'content']
+
+
+def test_str_replace_editor_tool():
+    """The str_replace editor tool exposes its full set of edit parameters."""
+    spec = StrReplaceEditorTool['function']
+    assert StrReplaceEditorTool['type'] == 'function'
+    assert spec['name'] == 'str_replace_editor'
+
+    properties = spec['parameters']['properties']
+    assert 'command' in properties
+    assert 'path' in properties
+    assert 'file_text' in properties
+    assert 'old_str' in properties
+    assert 'new_str' in properties
+    assert 'insert_line' in properties
+    assert 'view_range' in properties
+
+    # Only the sub-command and the target path are mandatory
+    assert spec['parameters']['required'] == ['command', 'path']
+
+
+def test_web_read_tool():
+    spec = WebReadTool['function']
+    assert (WebReadTool['type'], spec['name']) == ('function', 'web_read')
+    assert 'url' in spec['parameters']['properties']
+    assert spec['parameters']['required'] == ['url']
+
+
+def test_browser_tool():
+    """Check the browser tool's action documentation and its schema.
+
+    The tool must take a single required string parameter, `code`.
+    """
+    # Check that the description includes all the functions
+    description = _BROWSER_TOOL_DESCRIPTION
+    assert 'goto(' in description
+    assert 'go_back()' in description
+    assert 'go_forward()' in description
+    assert 'noop(' in description
+    assert 'scroll(' in description
+    assert 'fill(' in description
+    assert 'select_option(' in description
+    assert 'click(' in description
+    assert 'dblclick(' in description
+    assert 'hover(' in description
+    assert 'press(' in description
+    assert 'focus(' in description
+    assert 'clear(' in description
+    assert 'drag_and_drop(' in description
+    assert 'upload_file(' in description
+
+    # Test BrowserTool definition
+    assert BrowserTool['type'] == 'function'
+    assert BrowserTool['function']['name'] == 'browser'
+    assert BrowserTool['function']['description'] == _BROWSER_DESCRIPTION
+    assert BrowserTool['function']['parameters']['type'] == 'object'
+    assert 'code' in BrowserTool['function']['parameters']['properties']
+    assert BrowserTool['function']['parameters']['required'] == ['code']
+    assert (
+        BrowserTool['function']['parameters']['properties']['code']['type'] == 'string'
+    )
+    assert 'description' in BrowserTool['function']['parameters']['properties']['code']
+
+
+def test_mock_function_calling():
+    """Function calling is mocked when the LLM reports it as inactive."""
+    fake_llm = Mock()
+    fake_llm.is_function_calling_active = lambda: False
+    agent_config = AgentConfig()
+    agent_config.use_microagents = False
+    agent = CodeActAgent(llm=fake_llm, config=agent_config)
+    assert agent.mock_function_calling is True
+
+
+def test_response_to_actions_invalid_tool():
+    """A tool call naming an unknown function raises FunctionCallNotExistsError."""
+    function = Mock(arguments='{}')
+    # `name` is reserved by the Mock constructor, so it is assigned afterwards
+    function.name = 'invalid_tool'
+    tool_call = Mock(id='tool_call_10', function=function)
+    message = Mock(
+        content='Invalid tool',
+        tool_calls=[tool_call],
+    )
+    response = Mock(choices=[Mock(message=message)])
+
+    with pytest.raises(FunctionCallNotExistsError):
+        response_to_actions(response)
+
+
+def test_step_with_no_pending_actions():
+    """A tool-less LLM reply becomes a MessageAction when nothing is queued."""
+    # LLM reply that carries text but no tool calls
+    reply = Mock(content='Task completed', tool_calls=[])
+    mock_response = Mock(
+        id='mock_id',
+        total_calls_in_response=1,
+        choices=[Mock(message=reply)],
+    )
+    llm = Mock(
+        completion=Mock(return_value=mock_response),
+        is_function_calling_active=Mock(return_value=True),  # Enable function calling
+        is_caching_prompt_active=Mock(return_value=False),
+    )
+
+    config = AgentConfig()
+    config.use_microagents = False
+    agent = CodeActAgent(llm=llm, config=config)
+
+    # State with an empty history and no recorded user message
+    state = Mock(
+        history=[],
+        latest_user_message=None,
+        latest_user_message_id=None,
+        latest_user_message_timestamp=None,
+        latest_user_message_cause=None,
+        latest_user_message_timeout=None,
+        latest_user_message_llm_metrics=None,
+        latest_user_message_tool_call_metadata=None,
+    )
+
+    action = agent.step(state)
+    assert isinstance(action, MessageAction)
+    assert action.content == 'Task completed'
diff --git a/tests/unit/test_file_settings_store.py b/tests/unit/test_file_settings_store.py
index 14842758fa77..c20153c9fdce 100644
--- a/tests/unit/test_file_settings_store.py
+++ b/tests/unit/test_file_settings_store.py
@@ -5,8 +5,8 @@
 
 from openhands.core.config.app_config import AppConfig
 from openhands.server.settings import Settings
-from openhands.storage.file_settings_store import FileSettingsStore
 from openhands.storage.files import FileStore
+from openhands.storage.settings.file_settings_store import FileSettingsStore
 
 
 @pytest.fixture
@@ -15,18 +15,18 @@ def mock_file_store():
 
 
 @pytest.fixture
-def session_init_store(mock_file_store):
+def file_settings_store(mock_file_store):
     return FileSettingsStore(mock_file_store)
 
 
 @pytest.mark.asyncio
-async def test_load_nonexistent_data(session_init_store):
-    session_init_store.file_store.read.side_effect = FileNotFoundError()
-    assert await session_init_store.load() is None
+async def test_load_nonexistent_data(file_settings_store):
+    file_settings_store.file_store.read.side_effect = FileNotFoundError()
+    assert await file_settings_store.load() is None
 
 
 @pytest.mark.asyncio
-async def test_store_and_load_data(session_init_store):
+async def test_store_and_load_data(file_settings_store):
     # Test data
     init_data = Settings(
         language='python',
@@ -40,19 +40,19 @@ async def test_store_and_load_data(session_init_store):
     )
 
     # Store data
-    await session_init_store.store(init_data)
+    await file_settings_store.store(init_data)
 
     # Verify store called with correct JSON
     expected_json = json.dumps(init_data.__dict__)
-    session_init_store.file_store.write.assert_called_once_with(
+    file_settings_store.file_store.write.assert_called_once_with(
         'settings.json', expected_json
     )
 
     # Setup mock for load
-    session_init_store.file_store.read.return_value = expected_json
+    file_settings_store.file_store.read.return_value = expected_json
 
     # Load and verify data
-    loaded_data = await session_init_store.load()
+    loaded_data = await file_settings_store.load()
     assert loaded_data is not None
     assert loaded_data.language == init_data.language
     assert loaded_data.agent == init_data.agent
@@ -69,7 +69,7 @@ async def test_get_instance():
     config = AppConfig(file_store='local', file_store_path='/test/path')
 
     with patch(
-        'openhands.storage.file_settings_store.get_file_store'
+        'openhands.storage.settings.file_settings_store.get_file_store'
     ) as mock_get_store:
         mock_store = MagicMock(spec=FileStore)
         mock_get_store.return_value = mock_store