diff --git a/.github/workflows/eval-runner.yml b/.github/workflows/eval-runner.yml
index 9b2576a2644e..b1ace09b35de 100644
--- a/.github/workflows/eval-runner.yml
+++ b/.github/workflows/eval-runner.yml
@@ -1,4 +1,4 @@
-name: Run Evaluation
+name: Run SWE-Bench Evaluation
 
 on:
   pull_request:
@@ -58,24 +58,6 @@ jobs:
           echo "api_key = \"$DEEPSEEK_API_KEY\"" >> config.toml
           echo "temperature = 0.0" >> config.toml
 
-      - name: Run integration test evaluation
-        env:
-          ALLHANDS_API_KEY: ${{ secrets.ALLHANDS_EVAL_RUNTIME_API_KEY }}
-          RUNTIME: remote
-          SANDBOX_REMOTE_RUNTIME_API_URL: https://runtime.eval.all-hands.dev
-          EVAL_DOCKER_IMAGE_PREFIX: us-central1-docker.pkg.dev/evaluation-092424/swe-bench-images
-
-        run: |
-          poetry run ./evaluation/integration_tests/scripts/run_infer.sh llm.eval HEAD CodeActAgent '' $N_PROCESSES
-
-          # get evaluation report
-          REPORT_FILE=$(find evaluation/evaluation_outputs/outputs/integration_tests/CodeActAgent/deepseek-chat_maxiter_10_N* -name "report.md" -type f | head -n 1)
-          echo "REPORT_FILE: $REPORT_FILE"
-          echo "INTEGRATION_TEST_REPORT<<EOF" >> $GITHUB_ENV
-          cat $REPORT_FILE >> $GITHUB_ENV
-          echo >> $GITHUB_ENV
-          echo "EOF" >> $GITHUB_ENV
-
       - name: Run SWE-Bench evaluation
         env:
           ALLHANDS_API_KEY: ${{ secrets.ALLHANDS_EVAL_RUNTIME_API_KEY }}
@@ -143,9 +125,6 @@ jobs:
               **SWE-Bench Evaluation Report**
               ${{ env.SWEBENCH_REPORT }}
               ---
-              **Integration Tests Evaluation Report**
-              ${{ env.INTEGRATION_TEST_REPORT }}
-              ---
               You can download the full evaluation outputs [here](${{ env.ARTIFACT_URL }}).
 
       - name: Post to a Slack channel
diff --git a/.github/workflows/fe-unit-tests.yml b/.github/workflows/fe-unit-tests.yml
index 2bced7406e6c..b720bfe34c28 100644
--- a/.github/workflows/fe-unit-tests.yml
+++ b/.github/workflows/fe-unit-tests.yml
@@ -35,6 +35,9 @@ jobs:
       - name: Install dependencies
         working-directory: ./frontend
         run: npm ci
+      - name: Run TypeScript compilation
+        working-directory: ./frontend
+        run: npm run make-i18n && tsc
       - name: Run tests and collect coverage
         working-directory: ./frontend
         run: npm run test:coverage
diff --git a/.github/workflows/integration-runner.yml b/.github/workflows/integration-runner.yml
new file mode 100644
index 000000000000..120572aa0cdd
--- /dev/null
+++ b/.github/workflows/integration-runner.yml
@@ -0,0 +1,158 @@
+name: Run Integration Tests
+
+on:
+  pull_request:
+    types: [labeled]
+  workflow_dispatch:
+    inputs:
+      reason:
+        description: 'Reason for manual trigger'
+        required: true
+        default: ''
+  schedule:
+    - cron: '30 22 * * *'  # Runs at 10:30pm UTC every day
+
+env:
+  N_PROCESSES: 10 # Global configuration for number of parallel processes for evaluation
+
+jobs:
+  run-integration-tests:
+    if: github.event.label.name == 'integration-test' || github.event_name == 'workflow_dispatch' || github.event_name == 'schedule'
+    runs-on: ubuntu-latest
+    permissions:
+      contents: "read"
+      id-token: "write"
+      pull-requests: "write"
+      issues: "write"
+    strategy:
+      matrix:
+        python-version: ["3.12"]
+    steps:
+      - name: Checkout repository
+        uses: actions/checkout@v4
+
+      - name: Install poetry via pipx
+        run: pipx install poetry
+
+      - name: Set up Python
+        uses: actions/setup-python@v5
+        with:
+          python-version: ${{ matrix.python-version }}
+          cache: "poetry"
+
+      - name: Comment on PR if 'integration-test' label is present
+        if: github.event_name == 'pull_request' && github.event.label.name == 'integration-test'
+        uses: KeisukeYamashita/create-comment@v1
+        with:
+          unique: false
+          comment: |
+            Hi! I started running the integration tests on your PR. You will receive a comment with the results shortly.
+
+      - name: Install Python dependencies using Poetry
+        run: poetry install --without evaluation,llama-index
+
+      - name: Configure config.toml for testing with Haiku
+        env:
+          LLM_MODEL: "litellm_proxy/claude-3-5-haiku-20241022"
+          LLM_API_KEY: ${{ secrets.LLM_API_KEY }}
+          LLM_BASE_URL: ${{ secrets.LLM_BASE_URL }}
+        run: |
+          echo "[llm.eval]" > config.toml
+          echo "model = \"$LLM_MODEL\"" >> config.toml
+          echo "api_key = \"$LLM_API_KEY\"" >> config.toml
+          echo "base_url = \"$LLM_BASE_URL\"" >> config.toml
+          echo "temperature = 0.0" >> config.toml
+
+      - name: Build environment
+        run: make build
+
+      - name: Run integration test evaluation for Haiku
+        env:
+          SANDBOX_FORCE_REBUILD_RUNTIME: True
+        run: |
+          poetry run ./evaluation/integration_tests/scripts/run_infer.sh llm.eval HEAD CodeActAgent '' $N_PROCESSES '' 'haiku_run'
+
+          # get integration tests report
+          REPORT_FILE_HAIKU=$(find evaluation/evaluation_outputs/outputs/integration_tests/CodeActAgent/*haiku*_maxiter_10_N* -name "report.md" -type f | head -n 1)
+          echo "REPORT_FILE: $REPORT_FILE_HAIKU"
+          echo "INTEGRATION_TEST_REPORT_HAIKU<<EOF" >> $GITHUB_ENV
+          cat $REPORT_FILE_HAIKU >> $GITHUB_ENV
+          echo >> $GITHUB_ENV
+          echo "EOF" >> $GITHUB_ENV
+
+      - name: Wait a little bit
+        run: sleep 10
+
+      - name: Configure config.toml for testing with DeepSeek
+        env:
+          LLM_MODEL: "litellm_proxy/deepseek-chat"
+          LLM_API_KEY: ${{ secrets.LLM_API_KEY }}
+          LLM_BASE_URL: ${{ secrets.LLM_BASE_URL }}
+        run: |
+          echo "[llm.eval]" > config.toml
+          echo "model = \"$LLM_MODEL\"" >> config.toml
+          echo "api_key = \"$LLM_API_KEY\"" >> config.toml
+          echo "base_url = \"$LLM_BASE_URL\"" >> config.toml
+          echo "temperature = 0.0" >> config.toml
+
+      - name: Run integration test evaluation for DeepSeek
+        env:
+          SANDBOX_FORCE_REBUILD_RUNTIME: True
+        run: |
+          poetry run ./evaluation/integration_tests/scripts/run_infer.sh llm.eval HEAD CodeActAgent '' $N_PROCESSES '' 'deepseek_run'
+
+          # get integration tests report
+          REPORT_FILE_DEEPSEEK=$(find evaluation/evaluation_outputs/outputs/integration_tests/CodeActAgent/deepseek*_maxiter_10_N* -name "report.md" -type f | head -n 1)
+          echo "REPORT_FILE: $REPORT_FILE_DEEPSEEK"
+          echo "INTEGRATION_TEST_REPORT_DEEPSEEK<<EOF" >> $GITHUB_ENV
+          cat $REPORT_FILE_DEEPSEEK >> $GITHUB_ENV
+          echo >> $GITHUB_ENV
+          echo "EOF" >> $GITHUB_ENV
+
+      - name: Create archive of evaluation outputs
+        run: |
+          TIMESTAMP=$(date +'%y-%m-%d-%H-%M')
+          cd evaluation/evaluation_outputs/outputs  # Change to the outputs directory
+          tar -czvf ../../../integration_tests_${TIMESTAMP}.tar.gz integration_tests/CodeActAgent/*  # Only include the actual result directories
+
+      - name: Upload evaluation results as artifact
+        uses: actions/upload-artifact@v4
+        id: upload_results_artifact
+        with:
+          name: integration-test-outputs-${{ github.run_id }}-${{ github.run_attempt }}
+          path: integration_tests_*.tar.gz
+
+      - name: Get artifact URLs
+        run: |
+          echo "ARTIFACT_URL=${{ steps.upload_results_artifact.outputs.artifact-url }}" >> $GITHUB_ENV
+
+      - name: Set timestamp and trigger reason
+        run: |
+          echo "TIMESTAMP=$(date +'%Y-%m-%d-%H-%M')" >> $GITHUB_ENV
+          if [[ "${{ github.event_name }}" == "pull_request" ]]; then
+            echo "TRIGGER_REASON=pr-${{ github.event.pull_request.number }}" >> $GITHUB_ENV
+          elif [[ "${{ github.event_name }}" == "workflow_dispatch" ]]; then
+            echo "TRIGGER_REASON=manual-${{ github.event.inputs.reason }}" >> $GITHUB_ENV
+          else
+            echo "TRIGGER_REASON=nightly-scheduled" >> $GITHUB_ENV
+          fi
+
+      - name: Comment with results and artifact link
+        id: create_comment
+        uses: KeisukeYamashita/create-comment@v1
+        with:
+          # if triggered by PR, use PR number, otherwise use 5318 as fallback issue number for manual triggers
+          number: ${{ github.event_name == 'pull_request' && github.event.pull_request.number || 5318 }}
+          unique: false
+          comment: |
+              Trigger by: ${{ github.event_name == 'pull_request' && format('Pull Request (integration-test label on PR #{0})', github.event.pull_request.number) || (github.event_name == 'workflow_dispatch' && format('Manual Trigger: {0}', github.event.inputs.reason)) || 'Nightly Scheduled Run' }}
+              Commit: ${{ github.sha }}
+              **Integration Tests Report (Haiku)**
+              Haiku LLM Test Results:
+              ${{ env.INTEGRATION_TEST_REPORT_HAIKU }}
+              ---
+              **Integration Tests Report (DeepSeek)**
+              DeepSeek LLM Test Results:
+              ${{ env.INTEGRATION_TEST_REPORT_DEEPSEEK }}
+              ---
+              Download testing outputs (includes both Haiku and DeepSeek results): [Download](${{ steps.upload_results_artifact.outputs.artifact-url }})
diff --git a/.github/workflows/lint-fix.yml b/.github/workflows/lint-fix.yml
index 9fa97eaaf2f1..dca35010fb80 100644
--- a/.github/workflows/lint-fix.yml
+++ b/.github/workflows/lint-fix.yml
@@ -5,9 +5,10 @@ on:
     types: [labeled]
 
 jobs:
-  lint-fix:
+  # Frontend lint fixes
+  lint-fix-frontend:
     if: github.event.label.name == 'lint-fix'
-    name: Fix linting issues
+    name: Fix frontend linting issues
     runs-on: ubuntu-latest
     permissions:
       contents: write
@@ -20,7 +21,6 @@ jobs:
           fetch-depth: 0
           token: ${{ secrets.GITHUB_TOKEN }}
 
-      # Frontend lint fixes
       - name: Install Node.js 20
         uses: actions/setup-node@v4
         with:
@@ -34,7 +34,36 @@ jobs:
           cd frontend
           npm run lint:fix
 
-      # Python lint fixes
+      # Commit and push changes if any
+      - name: Check for changes
+        id: git-check
+        run: |
+          git diff --quiet || echo "changes=true" >> $GITHUB_OUTPUT
+      - name: Commit and push if there are changes
+        if: steps.git-check.outputs.changes == 'true'
+        run: |
+          git config --local user.email "openhands@all-hands.dev"
+          git config --local user.name "OpenHands Bot"
+          git add -A
+          git commit -m "🤖 Auto-fix frontend linting issues"
+          git push
+
+  # Python lint fixes
+  lint-fix-python:
+    if: github.event.label.name == 'lint-fix'
+    name: Fix Python linting issues
+    runs-on: ubuntu-latest
+    permissions:
+      contents: write
+      pull-requests: write
+    steps:
+      - uses: actions/checkout@v4
+        with:
+          ref: ${{ github.head_ref }}
+          repository: ${{ github.event.pull_request.head.repo.full_name }}
+          fetch-depth: 0
+          token: ${{ secrets.GITHUB_TOKEN }}
+
       - name: Set up python
         uses: actions/setup-python@v5
         with:
@@ -58,5 +87,5 @@ jobs:
           git config --local user.email "openhands@all-hands.dev"
           git config --local user.name "OpenHands Bot"
           git add -A
-          git commit -m "🤖 Auto-fix linting issues"
+          git commit -m "🤖 Auto-fix Python linting issues"
           git push
diff --git a/.github/workflows/lint.yml b/.github/workflows/lint.yml
index b6a9d327d860..1bfc8c91c6a4 100644
--- a/.github/workflows/lint.yml
+++ b/.github/workflows/lint.yml
@@ -30,10 +30,11 @@ jobs:
         run: |
           cd frontend
           npm install --frozen-lockfile
-      - name: Lint
+      - name: Lint and TypeScript compilation
         run: |
           cd frontend
           npm run lint
+          npm run make-i18n && tsc
 
   # Run lint on the python code
   lint-python:
diff --git a/.github/workflows/openhands-resolver.yml b/.github/workflows/openhands-resolver.yml
index f24a8e90cbfb..2719c3773607 100644
--- a/.github/workflows/openhands-resolver.yml
+++ b/.github/workflows/openhands-resolver.yml
@@ -16,6 +16,11 @@ on:
         type: string
         default: "main"
         description: "Target branch to pull and create PR against"
+      base_container_image:
+        required: false
+        type: string
+        default: ""
+        description: "Custom sandbox env"
     secrets:
       LLM_MODEL:
         required: true
@@ -139,6 +144,7 @@ jobs:
 
           echo "MAX_ITERATIONS=${{ inputs.max_iterations || 50 }}" >> $GITHUB_ENV
           echo "SANDBOX_ENV_GITHUB_TOKEN=${{ secrets.GITHUB_TOKEN }}" >> $GITHUB_ENV
+          echo "SANDBOX_ENV_BASE_CONTAINER_IMAGE=${{ inputs.base_container_image }}" >> $GITHUB_ENV
 
           # Set branch variables
           echo "TARGET_BRANCH=${{ inputs.target_branch }}" >> $GITHUB_ENV
diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md
index 847b6c469812..b1914cbd5b29 100644
--- a/CONTRIBUTING.md
+++ b/CONTRIBUTING.md
@@ -21,14 +21,14 @@ There are many ways that you can contribute:
 
 1. **Download and use** OpenHands, and send [issues](https://github.com/All-Hands-AI/OpenHands/issues) when you encounter something that isn't working or a feature that you'd like to see.
 2. **Send feedback** after each session by [clicking the thumbs-up thumbs-down buttons](https://docs.all-hands.dev/modules/usage/feedback), so we can see where things are working and failing, and also build an open dataset for training code agents.
-3. **Improve the Codebase** by sending PRs (see details below). In particular, we have some [good first issues](https://github.com/All-Hands-AI/OpenHands/labels/good%20first%20issue) that may be ones to start on.
+3. **Improve the Codebase** by sending [PRs](#sending-pull-requests-to-openhands) (see details below). In particular, we have some [good first issues](https://github.com/All-Hands-AI/OpenHands/labels/good%20first%20issue) that may be ones to start on.
 
 ## What can I build?
 Here are a few ways you can help improve the codebase.
 
 #### UI/UX
 We're always looking to improve the look and feel of the application. If you've got a small fix
-for something that's bugging you, feel free to open up a PR that changes the `./frontend` directory.
+for something that's bugging you, feel free to open up a PR that changes the [`./frontend`](./frontend) directory.
 
 If you're looking to make a bigger change, add a new UI element, or significantly alter the style
 of the application, please open an issue first, or better, join the #frontend channel in our Slack
@@ -46,7 +46,7 @@ We use the [SWE-bench](https://www.swebench.com/) benchmark to test our agent. Y
 channel in Slack to learn more.
 
 #### Adding a new agent
-You may want to experiment with building new types of agents. You can add an agent to `openhands/agenthub`
+You may want to experiment with building new types of agents. You can add an agent to [`openhands/agenthub`](./openhands/agenthub)
 to help expand the capabilities of OpenHands.
 
 #### Adding a new runtime
@@ -57,8 +57,8 @@ If you work for a company that provides a cloud-based runtime, you could help us
 by implementing the [interface specified here](https://github.com/All-Hands-AI/OpenHands/blob/main/openhands/runtime/base.py).
 
 #### Testing
-When you write code, it is also good to write tests. Please navigate to the `tests` folder to see existing test suites.
-At the moment, we have two kinds of tests: `unit` and `integration`. Please refer to the README for each test suite. These tests also run on GitHub's continuous integration to ensure quality of the project.
+When you write code, it is also good to write tests. Please navigate to the [`./tests`](./tests) folder to see existing test suites.
+At the moment, we have two kinds of tests: [`unit`](./tests/unit) and [`integration`](./evaluation/integration_tests). Please refer to the README for each test suite. These tests also run on GitHub's continuous integration to ensure quality of the project.
 
 ## Sending Pull Requests to OpenHands
 
@@ -103,7 +103,7 @@ Further, if you see an issue you like, please leave a "thumbs-up" or a comment,
 
 ### Making Pull Requests
 
-We're generally happy to consider all PRs, with the evaluation process varying based on the type of change:
+We're generally happy to consider all [PRs](https://github.com/All-Hands-AI/OpenHands/pulls), with the evaluation process varying based on the type of change:
 
 #### For Small Improvements
 
diff --git a/docs/modules/usage/configuration-options.md b/docs/modules/usage/configuration-options.md
new file mode 100644
index 000000000000..7a2718d7d786
--- /dev/null
+++ b/docs/modules/usage/configuration-options.md
@@ -0,0 +1,465 @@
+# Configuration Options
+
+This guide details all configuration options available for OpenHands, helping you customize its behavior and integrate it with other services.
+
+:::note
+If you are running in [GUI Mode](https://docs.all-hands.dev/modules/usage/how-to/gui-mode), the settings available in the Settings UI will always
+take precedence.
+:::
+
+---
+
+# Table of Contents
+
+1. [Core Configuration](#core-configuration)
+   - [API Keys](#api-keys)
+   - [Workspace](#workspace)
+   - [Debugging and Logging](#debugging-and-logging)
+   - [Session Management](#session-management)
+   - [Trajectories](#trajectories)
+   - [File Store](#file-store)
+   - [Task Management](#task-management)
+   - [Sandbox Configuration](#sandbox-configuration)
+   - [Miscellaneous](#miscellaneous)
+2. [LLM Configuration](#llm-configuration)
+   - [AWS Credentials](#aws-credentials)
+   - [API Configuration](#api-configuration)
+   - [Custom LLM Provider](#custom-llm-provider)
+   - [Embeddings](#embeddings)
+   - [Message Handling](#message-handling)
+   - [Model Selection](#model-selection)
+   - [Retrying](#retrying)
+   - [Advanced Options](#advanced-options)
+3. [Agent Configuration](#agent-configuration)
+   - [Microagent Configuration](#microagent-configuration)
+   - [Memory Configuration](#memory-configuration)
+   - [LLM Configuration](#llm-configuration-2)
+   - [ActionSpace Configuration](#actionspace-configuration)
+   - [Microagent Usage](#microagent-usage)
+4. [Sandbox Configuration](#sandbox-configuration-2)
+   - [Execution](#execution)
+   - [Container Image](#container-image)
+   - [Networking](#networking)
+   - [Linting and Plugins](#linting-and-plugins)
+   - [Dependencies and Environment](#dependencies-and-environment)
+   - [Evaluation](#evaluation)
+5. [Security Configuration](#security-configuration)
+   - [Confirmation Mode](#confirmation-mode)
+   - [Security Analyzer](#security-analyzer)
+
+---
+
+## Core Configuration
+
+The core configuration options are defined in the `[core]` section of the `config.toml` file.
+
+**API Keys**
+- `e2b_api_key`
+  - Type: `str`
+  - Default: `""`
+  - Description: API key for E2B
+
+- `modal_api_token_id`
+  - Type: `str`
+  - Default: `""`
+  - Description: API token ID for Modal
+
+- `modal_api_token_secret`
+  - Type: `str`
+  - Default: `""`
+  - Description: API token secret for Modal
+
+**Workspace**
+- `workspace_base`
+  - Type: `str`
+  - Default: `"./workspace"`
+  - Description: Base path for the workspace
+
+- `cache_dir`
+  - Type: `str`
+  - Default: `"/tmp/cache"`
+  - Description: Cache directory path
+
+**Debugging and Logging**
+- `debug`
+  - Type: `bool`
+  - Default: `false`
+  - Description: Enable debugging
+
+- `disable_color`
+  - Type: `bool`
+  - Default: `false`
+  - Description: Disable color in terminal output
+
+**Trajectories**
+- `trajectories_path`
+  - Type: `str`
+  - Default: `"./trajectories"`
+  - Description: Path to store trajectories (can be a folder or a file). If it's a folder, the trajectories will be saved in a file named with the session id name and .json extension, in that folder.
+
+**File Store**
+- `file_store_path`
+  - Type: `str`
+  - Default: `"/tmp/file_store"`
+  - Description: File store path
+
+- `file_store`
+  - Type: `str`
+  - Default: `"memory"`
+  - Description: File store type
+
+- `file_uploads_allowed_extensions`
+  - Type: `list of str`
+  - Default: `[".*"]`
+  - Description: List of allowed file extensions for uploads
+
+- `file_uploads_max_file_size_mb`
+  - Type: `int`
+  - Default: `0`
+  - Description: Maximum file size for uploads, in megabytes
+
+- `file_uploads_restrict_file_types`
+  - Type: `bool`
+  - Default: `false`
+  - Description: Restrict file types for file uploads
+
+- `file_uploads_allowed_extensions`
+  - Type: `list of str`
+  - Default: `[".*"]`
+  - Description: List of allowed file extensions for uploads
+
+**Task Management**
+- `max_budget_per_task`
+  - Type: `float`
+  - Default: `0.0`
+  - Description: Maximum budget per task (0.0 means no limit)
+
+- `max_iterations`
+  - Type: `int`
+  - Default: `100`
+  - Description: Maximum number of iterations
+
+**Sandbox Configuration**
+- `workspace_mount_path_in_sandbox`
+  - Type: `str`
+  - Default: `"/workspace"`
+  - Description: Path to mount the workspace in the sandbox
+
+- `workspace_mount_path`
+  - Type: `str`
+  - Default: `""`
+  - Description: Path to mount the workspace
+
+- `workspace_mount_rewrite`
+  - Type: `str`
+  - Default: `""`
+  - Description: Path to rewrite the workspace mount path to. You can usually ignore this, it refers to special cases of running inside another container.
+
+**Miscellaneous**
+- `run_as_openhands`
+  - Type: `bool`
+  - Default: `true`
+  - Description: Run as OpenHands
+
+- `runtime`
+  - Type: `str`
+  - Default: `"eventstream"`
+  - Description: Runtime environment
+
+- `default_agent`
+  - Type: `str`
+  - Default: `"CodeActAgent"`
+  - Description: Name of the default agent
+
+- `jwt_secret`
+  - Type: `str`
+  - Default: `uuid.uuid4().hex`
+  - Description: JWT secret for authentication. Please set it to your own value.
+
+## LLM Configuration
+
+The LLM (Large Language Model) configuration options are defined in the `[llm]` section of the `config.toml` file.
+
+To use these with the docker command, pass in `-e LLM_<option>`. Example: `-e LLM_NUM_RETRIES`.
+
+**AWS Credentials**
+- `aws_access_key_id`
+  - Type: `str`
+  - Default: `""`
+  - Description: AWS access key ID
+
+- `aws_region_name`
+  - Type: `str`
+  - Default: `""`
+  - Description: AWS region name
+
+- `aws_secret_access_key`
+  - Type: `str`
+  - Default: `""`
+  - Description: AWS secret access key
+
+**API Configuration**
+- `api_key`
+  - Type: `str`
+  - Default: `None`
+  - Description: API key to use
+
+- `base_url`
+  - Type: `str`
+  - Default: `""`
+  - Description: API base URL
+
+- `api_version`
+  - Type: `str`
+  - Default: `""`
+  - Description: API version
+
+- `input_cost_per_token`
+  - Type: `float`
+  - Default: `0.0`
+  - Description: Cost per input token
+
+- `output_cost_per_token`
+  - Type: `float`
+  - Default: `0.0`
+  - Description: Cost per output token
+
+**Custom LLM Provider**
+- `custom_llm_provider`
+  - Type: `str`
+  - Default: `""`
+  - Description: Custom LLM provider
+
+**Embeddings**
+- `embedding_base_url`
+  - Type: `str`
+  - Default: `""`
+  - Description: Embedding API base URL
+
+- `embedding_deployment_name`
+  - Type: `str`
+  - Default: `""`
+  - Description: Embedding deployment name
+
+- `embedding_model`
+  - Type: `str`
+  - Default: `"local"`
+  - Description: Embedding model to use
+
+**Message Handling**
+- `max_message_chars`
+  - Type: `int`
+  - Default: `30000`
+  - Description: The approximate maximum number of characters in the content of an event included in the prompt to the LLM. Larger observations are truncated.
+
+- `max_input_tokens`
+  - Type: `int`
+  - Default: `0`
+  - Description: Maximum number of input tokens
+
+- `max_output_tokens`
+  - Type: `int`
+  - Default: `0`
+  - Description: Maximum number of output tokens
+
+**Model Selection**
+- `model`
+  - Type: `str`
+  - Default: `"claude-3-5-sonnet-20241022"`
+  - Description: Model to use
+
+**Retrying**
+- `num_retries`
+  - Type: `int`
+  - Default: `8`
+  - Description: Number of retries to attempt
+
+- `retry_max_wait`
+  - Type: `int`
+  - Default: `120`
+  - Description: Maximum wait time (in seconds) between retry attempts
+
+- `retry_min_wait`
+  - Type: `int`
+  - Default: `15`
+  - Description: Minimum wait time (in seconds) between retry attempts
+
+- `retry_multiplier`
+  - Type: `float`
+  - Default: `2.0`
+  - Description: Multiplier for exponential backoff calculation
+
+**Advanced Options**
+- `drop_params`
+  - Type: `bool`
+  - Default: `false`
+  - Description: Drop any unmapped (unsupported) params without causing an exception
+
+- `caching_prompt`
+  - Type: `bool`
+  - Default: `true`
+  - Description: Using the prompt caching feature if provided by the LLM and supported
+
+- `ollama_base_url`
+  - Type: `str`
+  - Default: `""`
+  - Description: Base URL for the OLLAMA API
+
+- `temperature`
+  - Type: `float`
+  - Default: `0.0`
+  - Description: Temperature for the API
+
+- `timeout`
+  - Type: `int`
+  - Default: `0`
+  - Description: Timeout for the API
+
+- `top_p`
+  - Type: `float`
+  - Default: `1.0`
+  - Description: Top p for the API
+
+- `disable_vision`
+  - Type: `bool`
+  - Default: `None`
+  - Description: If model is vision capable, this option allows to disable image processing (useful for cost reduction)
+
+## Agent Configuration
+
+The agent configuration options are defined in the `[agent]` and `[agent.<agent_name>]` sections of the `config.toml` file.
+
+**Microagent Configuration**
+- `micro_agent_name`
+  - Type: `str`
+  - Default: `""`
+  - Description: Name of the micro agent to use for this agent
+
+**Memory Configuration**
+- `memory_enabled`
+  - Type: `bool`
+  - Default: `false`
+  - Description: Whether long-term memory (embeddings) is enabled
+
+- `memory_max_threads`
+  - Type: `int`
+  - Default: `3`
+  - Description: The maximum number of threads indexing at the same time for embeddings
+
+**LLM Configuration**
+- `llm_config`
+  - Type: `str`
+  - Default: `'your-llm-config-group'`
+  - Description: The name of the LLM config to use
+
+**ActionSpace Configuration**
+- `function_calling`
+  - Type: `bool`
+  - Default: `true`
+  - Description: Whether function calling is enabled
+
+- `codeact_enable_browsing`
+  - Type: `bool`
+  - Default: `false`
+  - Description: Whether browsing delegate is enabled in the action space (only works with function calling)
+
+- `codeact_enable_llm_editor`
+  - Type: `bool`
+  - Default: `false`
+  - Description: Whether LLM editor is enabled in the action space (only works with function calling)
+
+- `codeact_enable_jupyter`
+  - Type: `bool`
+  - Default: `false`
+  - Description: Whether Jupyter is enabled in the action space
+
+**Microagent Usage**
+- `use_microagents`
+  - Type: `bool`
+  - Default: `true`
+  - Description: Whether to use microagents at all
+
+- `disabled_microagents`
+  - Type: `list of str`
+  - Default: `None`
+  - Description: A list of microagents to disable
+
+## Sandbox Configuration
+
+The sandbox configuration options are defined in the `[sandbox]` section of the `config.toml` file.
+
+To use these with the docker command, pass in `-e SANDBOX_<option>`. Example: `-e SANDBOX_TIMEOUT`.
+
+**Execution**
+- `timeout`
+  - Type: `int`
+  - Default: `120`
+  - Description: Sandbox timeout in seconds
+
+- `user_id`
+  - Type: `int`
+  - Default: `1000`
+  - Description: Sandbox user ID
+
+**Container Image**
+- `base_container_image`
+  - Type: `str`
+  - Default: `"nikolaik/python-nodejs:python3.12-nodejs22"`
+  - Description: Container image to use for the sandbox
+
+**Networking**
+- `use_host_network`
+  - Type: `bool`
+  - Default: `false`
+  - Description: Use host network
+
+**Linting and Plugins**
+- `enable_auto_lint`
+  - Type: `bool`
+  - Default: `false`
+  - Description: Enable auto linting after editing
+
+- `initialize_plugins`
+  - Type: `bool`
+  - Default: `true`
+  - Description: Whether to initialize plugins
+
+**Dependencies and Environment**
+- `runtime_extra_deps`
+  - Type: `str`
+  - Default: `""`
+  - Description: Extra dependencies to install in the runtime image
+
+- `runtime_startup_env_vars`
+  - Type: `dict`
+  - Default: `{}`
+  - Description: Environment variables to set at the launch of the runtime
+
+**Evaluation**
+- `browsergym_eval_env`
+  - Type: `str`
+  - Default: `""`
+  - Description: BrowserGym environment to use for evaluation
+
+## Security Configuration
+
+The security configuration options are defined in the `[security]` section of the `config.toml` file.
+
+To use these with the docker command, pass in `-e SECURITY_<option>`. Example: `-e SECURITY_CONFIRMATION_MODE`.
+
+**Confirmation Mode**
+- `confirmation_mode`
+  - Type: `bool`
+  - Default: `false`
+  - Description: Enable confirmation mode
+
+**Security Analyzer**
+- `security_analyzer`
+  - Type: `str`
+  - Default: `""`
+  - Description: The security analyzer to use
+
+---
+
+> **Note**: Adjust configurations carefully, especially for memory, security, and network-related settings to ensure optimal performance and security.
+Please note that the configuration options may be subject to change in future versions of OpenHands. It's recommended to refer to the official documentation for the most up-to-date information.
diff --git a/docs/modules/usage/how-to/github-action.md b/docs/modules/usage/how-to/github-action.md
index 4864736e3cac..dff627cd9d50 100644
--- a/docs/modules/usage/how-to/github-action.md
+++ b/docs/modules/usage/how-to/github-action.md
@@ -37,12 +37,15 @@ the [README for the OpenHands Resolver](https://github.com/All-Hands-AI/OpenHand
 
 You can provide custom directions for OpenHands by following the [README for the resolver](https://github.com/All-Hands-AI/OpenHands/blob/main/openhands/resolver/README.md#providing-custom-instructions).
 
-### Configure custom macro
+### Custom configurations
 
-To customize the default macro (`@openhands-agent`):
+Github resolver will automatically check for valid [repository secrets](https://docs.github.com/en/actions/security-for-github-actions/security-guides/using-secrets-in-github-actions?tool=webui#creating-secrets-for-a-repository) or [repository variables](https://docs.github.com/en/actions/writing-workflows/choosing-what-your-workflow-does/store-information-in-variables#creating-configuration-variables-for-a-repository) to customize its behavior. The customization options you can set are:
 
-1. [Create a repository variable](https://docs.github.com/en/actions/writing-workflows/choosing-what-your-workflow-does/store-information-in-variables#creating-configuration-variables-for-a-repository) named `OPENHANDS_MACRO`
-2. Assign the variable a custom value
+| **Attribute name**               | **Type** | **Purpose**                                                                                         | **Example**                                     |
+| -------------------------------- | -------- | --------------------------------------------------------------------------------------------------- | ----------------------------------------------- |
+| `OPENHANDS_MAX_ITER`             | Variable | Set max limit for agent iterations                                                                  | `OPENHANDS_MAX_ITER=10`                         |
+| `OPENHANDS_MACRO`                | Variable | Customize default macro for invoking the resolver                                                   | `OPENHANDS_MACRO=@resolveit`                    |
+| `OPENHANDS_BASE_CONTAINER_IMAGE` | Variable | Custom Sandbox ([learn more](https://docs.all-hands.dev/modules/usage/how-to/custom-sandbox-guide)) | `OPENHANDS_BASE_CONTAINER_IMAGE="custom_image"` |
 
 ## Writing Effective .openhands_instructions Files
 
@@ -55,6 +58,7 @@ The `.openhands_instructions` file is a file that you can put in the root direct
 2. **Repository Structure**: Explain the key directories and their purposes, especially highlighting where different types of code (e.g., frontend, backend) are located.
 
 3. **Development Workflows**: Document the essential commands for:
+
    - Building and setting up the project
    - Running tests
    - Linting and code quality checks
@@ -69,24 +73,29 @@ The `.openhands_instructions` file is a file that you can put in the root direct
 
 ```markdown
 # Repository Overview
+
 [Brief description of the project]
 
 ## General Setup
+
 - Main build command
 - Development environment setup
 - Pre-commit checks
 
 ## Backend
+
 - Location and structure
 - Testing instructions
 - Environment requirements
 
 ## Frontend
+
 - Setup prerequisites
 - Build and test commands
 - Environment variables
 
 ## Additional Guidelines
+
 - Code style requirements
 - Special considerations
 - Common workflows
diff --git a/docs/sidebars.ts b/docs/sidebars.ts
index 7ce0a1f210c2..44f8c7b85037 100644
--- a/docs/sidebars.ts
+++ b/docs/sidebars.ts
@@ -100,6 +100,11 @@ const sidebars: SidebarsConfig = {
           label: 'Runtime Configuration',
           id: 'usage/runtimes',
         },
+        {
+          type: 'doc',
+          label: 'Configuration Options',
+          id: 'usage/configuration-options',
+        },
         {
           type: 'doc',
           label: 'Custom Sandbox',
diff --git a/docs/src/components/HomepageHeader/HomepageHeader.tsx b/docs/src/components/HomepageHeader/HomepageHeader.tsx
index f421b2897add..aabbef67df5a 100644
--- a/docs/src/components/HomepageHeader/HomepageHeader.tsx
+++ b/docs/src/components/HomepageHeader/HomepageHeader.tsx
@@ -23,7 +23,7 @@ export function HomepageHeader() {
           <a href="https://codecov.io/github/All-Hands-AI/OpenHands?branch=main"><img alt="CodeCov" src="https://img.shields.io/codecov/c/github/All-Hands-AI/OpenHands?style=for-the-badge&color=blue" /></a>
           <a href="https://github.com/All-Hands-AI/OpenHands/blob/main/LICENSE"><img src="https://img.shields.io/github/license/All-Hands-AI/OpenHands?style=for-the-badge&color=blue" alt="MIT License" /></a>
           <br/>
-          <a href="https://join.slack.com/t/opendevin/shared_invite/zt-2oikve2hu-UDxHeo8nsE69y6T7yFX_BA"><img src="https://img.shields.io/badge/Slack-Join%20Us-red?logo=slack&logoColor=white&style=for-the-badge" alt="Join our Slack community" /></a>
+          <a href="https://join.slack.com/t/openhands-ai/shared_invite/zt-2tom0er4l-JeNUGHt_AxpEfIBstbLPiw"><img src="https://img.shields.io/badge/Slack-Join%20Us-red?logo=slack&logoColor=white&style=for-the-badge" alt="Join our Slack community" /></a>
           <a href="https://discord.gg/ESHStjSjD4"><img src="https://img.shields.io/badge/Discord-Join%20Us-purple?logo=discord&logoColor=white&style=for-the-badge" alt="Join our Discord community" /></a>
           <a href="https://github.com/All-Hands-AI/OpenHands/blob/main/CREDITS.md"><img src="https://img.shields.io/badge/Project-Credits-blue?style=for-the-badge&color=FFE165&logo=github&logoColor=white" alt="Credits" /></a>
           <br/>
diff --git a/evaluation/README.md b/evaluation/README.md
index 8ef9bcce65df..e87c0657daab 100644
--- a/evaluation/README.md
+++ b/evaluation/README.md
@@ -6,9 +6,9 @@ This folder contains code and resources to run experiments and evaluations.
 
 ### Setup
 
-Before starting evaluation, follow the instructions here [here](https://github.com/All-Hands-AI/OpenHands/blob/main/Development.md) to setup your local development environment and LLM.
+Before starting evaluation, follow the instructions [here](https://github.com/All-Hands-AI/OpenHands/blob/main/Development.md) to setup your local development environment and LLM.
 
-Once you are done with setup, you can follow the benchmark-specific instructions in each subdirectory of the evaluation directory.
+Once you are done with setup, you can follow the benchmark-specific instructions in each subdirectory of the [evaluation directory](#supported-benchmarks).
 Generally these will involve running `run_infer.py` to perform inference with the agents.
 
 ### Implementing and Evaluating an Agent
@@ -42,7 +42,7 @@ temperature = 0.0
 
 ## Supported Benchmarks
 
-The OpenHands evaluation harness supports a wide variety of benchmarks across software engineering, web browsing, and miscellaneous assistance tasks.
+The OpenHands evaluation harness supports a wide variety of benchmarks across [software engineering](#software-engineering), [web browsing](#web-browsing), and [miscellaneous assistance](#misc-assistance) tasks.
 
 ### Software Engineering
 
@@ -83,7 +83,7 @@ You can start your own fork of [our huggingface evaluation outputs](https://hugg
 
 To learn more about how to integrate your benchmark into OpenHands, check out [tutorial here](https://docs.all-hands.dev/modules/usage/how-to/evaluation-harness). Briefly,
 
-- Each subfolder contains a specific benchmark or experiment. For example, `evaluation/benchmarks/swe_bench` should contain
+- Each subfolder contains a specific benchmark or experiment. For example, [`evaluation/benchmarks/swe_bench`](./benchmarks/swe_bench) should contain
 all the preprocessing/evaluation/analysis scripts.
 - Raw data and experimental records should not be stored within this repo.
 - For model outputs, they should be stored at [this huggingface space](https://huggingface.co/spaces/OpenHands/evaluation) for visualization.
diff --git a/evaluation/integration_tests/run_infer.py b/evaluation/integration_tests/run_infer.py
index 5e3205fefe2e..2da68b9b82b9 100644
--- a/evaluation/integration_tests/run_infer.py
+++ b/evaluation/integration_tests/run_infer.py
@@ -48,13 +48,19 @@ def get_config(
             # use default base_container_image
             enable_auto_lint=True,
             use_host_network=False,
-            timeout=100,
+            timeout=300,
+            # Add platform to the sandbox config to solve issue 4401
+            platform='linux/amd64',
             api_key=os.environ.get('ALLHANDS_API_KEY', None),
             remote_runtime_api_url=os.environ.get('SANDBOX_REMOTE_RUNTIME_API_URL'),
+            keep_runtime_alive=False,
+            remote_runtime_init_timeout=3600,
         ),
         # do not mount workspace
         workspace_base=None,
         workspace_mount_path=None,
+        # debug
+        debug=True,
     )
     config.set_llm_config(
         update_llm_config_for_completions_logging(
@@ -107,31 +113,37 @@ def process_instance(
     # =============================================
     # create sandbox and run the agent
     # =============================================
-
     runtime: Runtime = create_runtime(config)
     call_async_from_sync(runtime.connect)
+    try:
+        test_class.initialize_runtime(runtime)
+
+        # Here's how you can run the agent (similar to the `main` function) and get the final task state
+        state: State | None = asyncio.run(
+            run_controller(
+                config=config,
+                initial_user_action=MessageAction(content=instruction),
+                runtime=runtime,
+                fake_user_response_fn=FAKE_RESPONSES[metadata.agent_class],
+            )
+        )
+        if state is None:
+            raise ValueError('State should not be None.')
 
-    test_class.initialize_runtime(runtime)
+        # # =============================================
+        # # result evaluation
+        # # =============================================
 
-    # Here's how you can run the agent (similar to the `main` function) and get the final task state
-    state: State | None = asyncio.run(
-        run_controller(
-            config=config,
-            initial_user_action=MessageAction(content=instruction),
-            runtime=runtime,
-            fake_user_response_fn=FAKE_RESPONSES[metadata.agent_class],
-        )
-    )
-    if state is None:
-        raise ValueError('State should not be None.')
+        histories = state.history
 
-    # # =============================================
-    # # result evaluation
-    # # =============================================
+        # some basic check
+        logger.info(f'Total events in history: {len(histories)}')
+        assert len(histories) > 0, 'History should not be empty'
 
-    histories = [event_to_dict(event) for event in state.history]
-    test_result: TestResult = test_class.verify_result(runtime, histories)
-    metrics = state.metrics.get() if state.metrics else None
+        test_result: TestResult = test_class.verify_result(runtime, histories)
+        metrics = state.metrics.get() if state.metrics else None
+    finally:
+        runtime.close()
 
     # Save the output
     output = EvalOutput(
@@ -139,7 +151,7 @@ def process_instance(
         instance=instance.to_dict(),
         instruction=instruction,
         metadata=metadata,
-        history=histories,
+        history=[event_to_dict(event) for event in histories],
         metrics=metrics,
         error=state.last_error if state and state.last_error else None,
         test_result=test_result.model_dump(),
@@ -206,6 +218,8 @@ def load_integration_tests() -> pd.DataFrame:
     )
 
     df = pd.read_json(output_file, lines=True, orient='records')
+
+    # record success and reason for failure for the final report
     df['success'] = df['test_result'].apply(lambda x: x['success'])
     df['reason'] = df['test_result'].apply(lambda x: x['reason'])
     logger.info('-' * 100)
@@ -219,9 +233,16 @@ def load_integration_tests() -> pd.DataFrame:
     )
     logger.info('-' * 100)
 
+    # record cost for each instance, with 3 decimal places
+    df['cost'] = df['metrics'].apply(lambda x: round(x['accumulated_cost'], 3))
+    logger.info(f'Total cost: USD {df["cost"].sum():.2f}')
+
     report_file = os.path.join(metadata.eval_output_dir, 'report.md')
     with open(report_file, 'w') as f:
         f.write(
             f'Success rate: {df["success"].mean():.2%} ({df["success"].sum()}/{len(df)})\n'
         )
-        f.write(df[['instance_id', 'success', 'reason']].to_markdown(index=False))
+        f.write(f'\nTotal cost: USD {df["cost"].sum():.2f}\n')
+        f.write(
+            df[['instance_id', 'success', 'reason', 'cost']].to_markdown(index=False)
+        )
diff --git a/evaluation/integration_tests/tests/t05_simple_browsing.py b/evaluation/integration_tests/tests/t05_simple_browsing.py
index 8f08cb4e7250..96bb47875aec 100644
--- a/evaluation/integration_tests/tests/t05_simple_browsing.py
+++ b/evaluation/integration_tests/tests/t05_simple_browsing.py
@@ -108,6 +108,8 @@ def initialize_runtime(cls, runtime: Runtime) -> None:
 
     @classmethod
     def verify_result(cls, runtime: Runtime, histories: list[Event]) -> TestResult:
+        from openhands.core.logger import openhands_logger as logger
+
         # check if the "The answer is OpenHands is all you need!" is in any message
         message_actions = [
             event
@@ -116,19 +118,29 @@ def verify_result(cls, runtime: Runtime, histories: list[Event]) -> TestResult:
                 event, (MessageAction, AgentFinishAction, AgentDelegateObservation)
             )
         ]
+        logger.debug(f'Total message-like events: {len(message_actions)}')
+
         for event in message_actions:
-            if isinstance(event, AgentDelegateObservation):
-                content = event.content
-            elif isinstance(event, AgentFinishAction):
-                content = event.outputs.get('content', '')
-            elif isinstance(event, MessageAction):
-                content = event.content
-            else:
-                raise ValueError(f'Unknown event type: {type(event)}')
+            try:
+                if isinstance(event, AgentDelegateObservation):
+                    content = event.content
+                elif isinstance(event, AgentFinishAction):
+                    content = event.outputs.get('content', '')
+                elif isinstance(event, MessageAction):
+                    content = event.content
+                else:
+                    logger.warning(f'Unexpected event type: {type(event)}')
+                    continue
 
-            if 'OpenHands is all you need!' in content:
-                return TestResult(success=True)
+                if 'OpenHands is all you need!' in content:
+                    return TestResult(success=True)
+            except Exception as e:
+                logger.error(f'Error processing event: {e}')
+
+        logger.debug(
+            f'Total messages: {len(message_actions)}. Messages: {message_actions}'
+        )
         return TestResult(
             success=False,
-            reason=f'The answer is not found in any message. Total messages: {len(message_actions)}. Messages: {message_actions}',
+            reason=f'The answer is not found in any message. Total messages: {len(message_actions)}.',
         )
diff --git a/evaluation/integration_tests/tests/t06_github_pr_browsing.py b/evaluation/integration_tests/tests/t06_github_pr_browsing.py
index 52ec927cd334..3c25e0300a35 100644
--- a/evaluation/integration_tests/tests/t06_github_pr_browsing.py
+++ b/evaluation/integration_tests/tests/t06_github_pr_browsing.py
@@ -14,7 +14,9 @@ def initialize_runtime(cls, runtime: Runtime) -> None:
 
     @classmethod
     def verify_result(cls, runtime: Runtime, histories: list[Event]) -> TestResult:
-        # check if the "The answer is OpenHands is all you need!" is in any message
+        from openhands.core.logger import openhands_logger as logger
+
+        # check if the license information is in any message
         message_actions = [
             event
             for event in histories
@@ -22,23 +24,35 @@ def verify_result(cls, runtime: Runtime, histories: list[Event]) -> TestResult:
                 event, (MessageAction, AgentFinishAction, AgentDelegateObservation)
             )
         ]
+        logger.info(f'Total message-like events: {len(message_actions)}')
+
         for event in message_actions:
-            if isinstance(event, AgentDelegateObservation):
-                content = event.content
-            elif isinstance(event, AgentFinishAction):
-                content = event.outputs.get('content', '')
-            elif isinstance(event, MessageAction):
-                content = event.content
-            else:
-                raise ValueError(f'Unknown event type: {type(event)}')
-
-            if (
-                'non-commercial' in content
-                or 'MIT' in content
-                or 'Apache 2.0' in content
-            ):
-                return TestResult(success=True)
+            try:
+                if isinstance(event, AgentDelegateObservation):
+                    content = event.content
+                elif isinstance(event, AgentFinishAction):
+                    content = event.outputs.get('content', '')
+                    if event.thought:
+                        content += f'\n\n{event.thought}'
+                elif isinstance(event, MessageAction):
+                    content = event.content
+                else:
+                    logger.warning(f'Unexpected event type: {type(event)}')
+                    continue
+
+                if (
+                    'non-commercial' in content
+                    or 'MIT' in content
+                    or 'Apache 2.0' in content
+                ):
+                    return TestResult(success=True)
+            except Exception as e:
+                logger.error(f'Error processing event: {e}')
+
+        logger.debug(
+            f'Total messages: {len(message_actions)}. Messages: {message_actions}'
+        )
         return TestResult(
             success=False,
-            reason=f'The answer is not found in any message. Total messages: {len(message_actions)}. Messages: {message_actions}',
+            reason=f'The answer is not found in any message. Total messages: {len(message_actions)}.',
         )
diff --git a/frontend/__tests__/components/chat/chat-interface.test.tsx b/frontend/__tests__/components/chat/chat-interface.test.tsx
index 0953f43353ed..8596d3acd3d7 100644
--- a/frontend/__tests__/components/chat/chat-interface.test.tsx
+++ b/frontend/__tests__/components/chat/chat-interface.test.tsx
@@ -2,11 +2,11 @@ import { afterEach, beforeAll, describe, expect, it, vi } from "vitest";
 import { act, screen, waitFor, within } from "@testing-library/react";
 import userEvent from "@testing-library/user-event";
 import { renderWithProviders } from "test-utils";
-import { ChatInterface } from "#/components/chat-interface";
 import { addUserMessage } from "#/state/chat-slice";
 import { SUGGESTIONS } from "#/utils/suggestions";
 import * as ChatSlice from "#/state/chat-slice";
 import { WsClientProviderStatus } from "#/context/ws-client-provider";
+import { ChatInterface } from "#/routes/_oh.app/chat-interface";
 
 // eslint-disable-next-line @typescript-eslint/no-unused-vars
 const renderChatInterface = (messages: (Message | ErrorMessage)[]) =>
@@ -18,7 +18,11 @@ describe("Empty state", () => {
   }));
 
   const { useWsClient: useWsClientMock } = vi.hoisted(() => ({
-    useWsClient: vi.fn(() => ({ send: sendMock, status: WsClientProviderStatus.ACTIVE, isLoadingMessages: false })),
+    useWsClient: vi.fn(() => ({
+      send: sendMock,
+      status: WsClientProviderStatus.ACTIVE,
+      isLoadingMessages: false,
+    })),
   }));
 
   beforeAll(() => {
@@ -84,7 +88,9 @@ describe("Empty state", () => {
     async () => {
       // this is to test that the message is in the UI before the socket is called
       useWsClientMock.mockImplementation(() => ({
-        send: sendMock, status: WsClientProviderStatus.ACTIVE, isLoadingMessages: false
+        send: sendMock,
+        status: WsClientProviderStatus.ACTIVE,
+        isLoadingMessages: false,
       }));
       const addUserMessageSpy = vi.spyOn(ChatSlice, "addUserMessage");
       const user = userEvent.setup();
@@ -112,7 +118,9 @@ describe("Empty state", () => {
     "should send the message to the socket only if the runtime is active",
     async () => {
       useWsClientMock.mockImplementation(() => ({
-        send: sendMock, status: WsClientProviderStatus.ACTIVE, isLoadingMessages: false
+        send: sendMock,
+        status: WsClientProviderStatus.ACTIVE,
+        isLoadingMessages: false,
       }));
       const user = userEvent.setup();
       const { rerender } = renderWithProviders(<ChatInterface />, {
@@ -121,7 +129,6 @@ describe("Empty state", () => {
         },
       });
 
-
       const suggestions = screen.getByTestId("suggestions");
       const displayedSuggestions = within(suggestions).getAllByRole("button");
 
@@ -129,7 +136,9 @@ describe("Empty state", () => {
       expect(sendMock).not.toHaveBeenCalled();
 
       useWsClientMock.mockImplementation(() => ({
-        send: sendMock, status: WsClientProviderStatus.ACTIVE, isLoadingMessages: false
+        send: sendMock,
+        status: WsClientProviderStatus.ACTIVE,
+        isLoadingMessages: false,
       }));
       rerender(<ChatInterface />);
 
@@ -330,10 +339,16 @@ describe.skip("ChatInterface", () => {
     rerender(<ChatInterface />);
 
     // Verify only one button is shown
-    const pushToPrButton = screen.getByRole("button", { name: "Push changes to PR" });
+    const pushToPrButton = screen.getByRole("button", {
+      name: "Push changes to PR",
+    });
     expect(pushToPrButton).toBeInTheDocument();
-    expect(screen.queryByRole("button", { name: "Push to Branch" })).not.toBeInTheDocument();
-    expect(screen.queryByRole("button", { name: "Push & Create PR" })).not.toBeInTheDocument();
+    expect(
+      screen.queryByRole("button", { name: "Push to Branch" }),
+    ).not.toBeInTheDocument();
+    expect(
+      screen.queryByRole("button", { name: "Push & Create PR" }),
+    ).not.toBeInTheDocument();
   });
 
   it("should render feedback actions if there are more than 3 messages", () => {
@@ -379,4 +394,4 @@ describe.skip("ChatInterface", () => {
     );
     it.todo("should render the actions once more after new messages are added");
   });
-});
\ No newline at end of file
+});
diff --git a/frontend/__tests__/components/file-explorer/file-explorer.test.tsx b/frontend/__tests__/components/file-explorer/file-explorer.test.tsx
index ce78b2da3ffa..6b360520347d 100644
--- a/frontend/__tests__/components/file-explorer/file-explorer.test.tsx
+++ b/frontend/__tests__/components/file-explorer/file-explorer.test.tsx
@@ -4,7 +4,7 @@ import { renderWithProviders } from "test-utils";
 import { describe, it, expect, vi, Mock, afterEach } from "vitest";
 import toast from "#/utils/toast";
 import AgentState from "#/types/agent-state";
-import FileExplorer from "#/components/file-explorer/file-explorer";
+import { FileExplorer } from "#/routes/_oh.app._index/file-explorer/file-explorer";
 import OpenHands from "#/api/open-hands";
 
 const toastSpy = vi.spyOn(toast, "error");
diff --git a/frontend/__tests__/routes/_oh.test.tsx b/frontend/__tests__/routes/_oh.test.tsx
index 9dbf3b786f24..a5e106f1fc98 100644
--- a/frontend/__tests__/routes/_oh.test.tsx
+++ b/frontend/__tests__/routes/_oh.test.tsx
@@ -3,7 +3,7 @@ import { createRemixStub } from "@remix-run/testing";
 import { screen, waitFor, within } from "@testing-library/react";
 import { renderWithProviders } from "test-utils";
 import userEvent from "@testing-library/user-event";
-import MainApp from "#/routes/_oh";
+import MainApp from "#/routes/_oh/route";
 import * as CaptureConsent from "#/utils/handle-capture-consent";
 import i18n from "#/i18n";
 
diff --git a/frontend/package-lock.json b/frontend/package-lock.json
index dc288d58bd2f..73a34437874b 100644
--- a/frontend/package-lock.json
+++ b/frontend/package-lock.json
@@ -1,12 +1,12 @@
 {
   "name": "openhands-frontend",
-  "version": "0.14.2",
+  "version": "0.14.3",
   "lockfileVersion": 3,
   "requires": true,
   "packages": {
     "": {
       "name": "openhands-frontend",
-      "version": "0.14.2",
+      "version": "0.14.3",
       "dependencies": {
         "@monaco-editor/react": "^4.6.0",
         "@nextui-org/react": "^2.4.8",
diff --git a/frontend/package.json b/frontend/package.json
index bbecd79cd31a..197def0bf0fc 100644
--- a/frontend/package.json
+++ b/frontend/package.json
@@ -1,6 +1,6 @@
 {
   "name": "openhands-frontend",
-  "version": "0.14.2",
+  "version": "0.14.3",
   "private": true,
   "type": "module",
   "engines": {
diff --git a/frontend/src/components/event-handler.tsx b/frontend/src/components/event-handler.tsx
deleted file mode 100644
index 13c769582658..000000000000
--- a/frontend/src/components/event-handler.tsx
+++ /dev/null
@@ -1,193 +0,0 @@
-import React from "react";
-import { useDispatch, useSelector } from "react-redux";
-import toast from "react-hot-toast";
-import posthog from "posthog-js";
-import {
-  useWsClient,
-  WsClientProviderStatus,
-} from "#/context/ws-client-provider";
-import { ErrorObservation } from "#/types/core/observations";
-import { addErrorMessage, addUserMessage } from "#/state/chat-slice";
-import {
-  getCloneRepoCommand,
-  getGitHubTokenCommand,
-} from "#/services/terminal-service";
-import {
-  clearFiles,
-  clearInitialQuery,
-  clearSelectedRepository,
-  setImportedProjectZip,
-} from "#/state/initial-query-slice";
-import store, { RootState } from "#/store";
-import { createChatMessage } from "#/services/chat-service";
-import { isGitHubErrorReponse } from "#/api/github";
-import { base64ToBlob } from "#/utils/base64-to-blob";
-import { setCurrentAgentState } from "#/state/agent-slice";
-import AgentState from "#/types/agent-state";
-import { generateAgentStateChangeEvent } from "#/services/agent-state-service";
-import { useGitHubUser } from "#/hooks/query/use-github-user";
-import { useUploadFiles } from "#/hooks/mutation/use-upload-files";
-import { useAuth } from "#/context/auth-context";
-import { useEndSession } from "#/hooks/use-end-session";
-import { useUserPrefs } from "#/context/user-prefs-context";
-
-interface ServerError {
-  error: boolean | string;
-  message: string;
-  [key: string]: unknown;
-}
-
-const isServerError = (data: object): data is ServerError => "error" in data;
-
-const isErrorObservation = (data: object): data is ErrorObservation =>
-  "observation" in data && data.observation === "error";
-
-export function EventHandler({ children }: React.PropsWithChildren) {
-  const { setToken, gitHubToken } = useAuth();
-  const { settings } = useUserPrefs();
-  const { events, status, send } = useWsClient();
-  const statusRef = React.useRef<WsClientProviderStatus | null>(null);
-  const runtimeActive = status === WsClientProviderStatus.ACTIVE;
-  const dispatch = useDispatch();
-  const { files, importedProjectZip, initialQuery } = useSelector(
-    (state: RootState) => state.initalQuery,
-  );
-  const endSession = useEndSession();
-
-  // FIXME: Bad practice - should be handled with state
-  const { selectedRepository } = useSelector(
-    (state: RootState) => state.initalQuery,
-  );
-
-  const { data: user } = useGitHubUser();
-  const { mutate: uploadFiles } = useUploadFiles();
-
-  const sendInitialQuery = (query: string, base64Files: string[]) => {
-    const timestamp = new Date().toISOString();
-    send(createChatMessage(query, base64Files, timestamp));
-  };
-  const userId = React.useMemo(() => {
-    if (user && !isGitHubErrorReponse(user)) return user.id;
-    return null;
-  }, [user]);
-
-  React.useEffect(() => {
-    if (!events.length) {
-      return;
-    }
-    const event = events[events.length - 1];
-    if (event.token && typeof event.token === "string") {
-      setToken(event.token);
-      return;
-    }
-
-    if (isServerError(event)) {
-      if (event.error_code === 401) {
-        toast.error("Session expired.");
-        endSession();
-        return;
-      }
-
-      if (typeof event.error === "string") {
-        toast.error(event.error);
-      } else {
-        toast.error(event.message);
-      }
-      return;
-    }
-
-    if (event.type === "error") {
-      const message: string = `${event.message}`;
-      if (message.startsWith("Agent reached maximum")) {
-        // We set the agent state to paused here - if the user clicks resume, it auto updates the max iterations
-        send(generateAgentStateChangeEvent(AgentState.PAUSED));
-      }
-    }
-
-    if (isErrorObservation(event)) {
-      dispatch(
-        addErrorMessage({
-          id: event.extras?.error_id,
-          message: event.message,
-        }),
-      );
-    }
-  }, [events.length]);
-
-  React.useEffect(() => {
-    if (statusRef.current === status) {
-      return; // This is a check because of strict mode - if the status did not change, don't do anything
-    }
-    statusRef.current = status;
-
-    if (status === WsClientProviderStatus.ACTIVE) {
-      let additionalInfo = "";
-      if (gitHubToken && selectedRepository) {
-        send(getCloneRepoCommand(gitHubToken, selectedRepository));
-        additionalInfo = `Repository ${selectedRepository} has been cloned to /workspace. Please check the /workspace for files.`;
-        dispatch(clearSelectedRepository()); // reset selected repository; maybe better to move this to '/'?
-      }
-      // if there's an uploaded project zip, add it to the chat
-      else if (importedProjectZip) {
-        additionalInfo = `Files have been uploaded. Please check the /workspace for files.`;
-      }
-
-      if (initialQuery) {
-        if (additionalInfo) {
-          sendInitialQuery(`${initialQuery}\n\n[${additionalInfo}]`, files);
-        } else {
-          sendInitialQuery(initialQuery, files);
-        }
-        dispatch(clearFiles()); // reset selected files
-        dispatch(clearInitialQuery()); // reset initial query
-      }
-    }
-
-    if (status === WsClientProviderStatus.OPENING && initialQuery) {
-      dispatch(
-        addUserMessage({
-          content: initialQuery,
-          imageUrls: files,
-          timestamp: new Date().toISOString(),
-        }),
-      );
-    }
-
-    if (status === WsClientProviderStatus.STOPPED) {
-      store.dispatch(setCurrentAgentState(AgentState.STOPPED));
-    }
-  }, [status]);
-
-  React.useEffect(() => {
-    if (runtimeActive && userId && gitHubToken) {
-      // Export if the user valid, this could happen mid-session so it is handled here
-      send(getGitHubTokenCommand(gitHubToken));
-    }
-  }, [userId, gitHubToken, runtimeActive]);
-
-  React.useEffect(() => {
-    if (runtimeActive && importedProjectZip) {
-      const blob = base64ToBlob(importedProjectZip);
-      const file = new File([blob], "imported-project.zip", {
-        type: blob.type,
-      });
-      uploadFiles(
-        { files: [file] },
-        {
-          onError: () => {
-            toast.error("Failed to upload project files.");
-          },
-        },
-      );
-      dispatch(setImportedProjectZip(null));
-    }
-  }, [runtimeActive, importedProjectZip]);
-
-  React.useEffect(() => {
-    if (settings.LLM_API_KEY) {
-      posthog.capture("user_activated");
-    }
-  }, [settings.LLM_API_KEY]);
-
-  return children;
-}
diff --git a/frontend/src/components/file-explorer/file-explorer.tsx b/frontend/src/components/file-explorer/file-explorer.tsx
deleted file mode 100644
index 5c82a7fa8482..000000000000
--- a/frontend/src/components/file-explorer/file-explorer.tsx
+++ /dev/null
@@ -1,307 +0,0 @@
-import React from "react";
-import {
-  IoIosArrowBack,
-  IoIosArrowForward,
-  IoIosRefresh,
-  IoIosCloudUpload,
-} from "react-icons/io";
-import { useDispatch, useSelector } from "react-redux";
-import { IoFileTray } from "react-icons/io5";
-import { useTranslation } from "react-i18next";
-import { twMerge } from "tailwind-merge";
-import AgentState from "#/types/agent-state";
-import { addAssistantMessage } from "#/state/chat-slice";
-import IconButton from "../icon-button";
-import ExplorerTree from "./explorer-tree";
-import toast from "#/utils/toast";
-import { RootState } from "#/store";
-import { I18nKey } from "#/i18n/declaration";
-import OpenHands from "#/api/open-hands";
-import VSCodeIcon from "#/assets/vscode-alt.svg?react";
-import { useListFiles } from "#/hooks/query/use-list-files";
-import { FileUploadSuccessResponse } from "#/api/open-hands.types";
-import { useUploadFiles } from "#/hooks/mutation/use-upload-files";
-
-interface ExplorerActionsProps {
-  onRefresh: () => void;
-  onUpload: () => void;
-  toggleHidden: () => void;
-  isHidden: boolean;
-}
-
-function ExplorerActions({
-  toggleHidden,
-  onRefresh,
-  onUpload,
-  isHidden,
-}: ExplorerActionsProps) {
-  return (
-    <div
-      className={twMerge(
-        "transform flex h-[24px] items-center gap-1",
-        isHidden ? "right-3" : "right-2",
-      )}
-    >
-      {!isHidden && (
-        <>
-          <IconButton
-            icon={
-              <IoIosRefresh
-                size={16}
-                className="text-neutral-400 hover:text-neutral-100 transition"
-              />
-            }
-            testId="refresh"
-            ariaLabel="Refresh workspace"
-            onClick={onRefresh}
-          />
-          <IconButton
-            icon={
-              <IoIosCloudUpload
-                size={16}
-                className="text-neutral-400 hover:text-neutral-100 transition"
-              />
-            }
-            testId="upload"
-            ariaLabel="Upload File"
-            onClick={onUpload}
-          />
-        </>
-      )}
-
-      <IconButton
-        icon={
-          isHidden ? (
-            <IoIosArrowForward
-              size={20}
-              className="text-neutral-400 hover:text-neutral-100 transition"
-            />
-          ) : (
-            <IoIosArrowBack
-              size={20}
-              className="text-neutral-400 hover:text-neutral-100 transition"
-            />
-          )
-        }
-        testId="toggle"
-        ariaLabel={isHidden ? "Open workspace" : "Close workspace"}
-        onClick={toggleHidden}
-      />
-    </div>
-  );
-}
-
-interface FileExplorerProps {
-  isOpen: boolean;
-  onToggle: () => void;
-}
-
-function FileExplorer({ isOpen, onToggle }: FileExplorerProps) {
-  const [isDragging, setIsDragging] = React.useState(false);
-
-  const { curAgentState } = useSelector((state: RootState) => state.agent);
-  const fileInputRef = React.useRef<HTMLInputElement | null>(null);
-  const dispatch = useDispatch();
-  const { t } = useTranslation();
-  const selectFileInput = () => {
-    fileInputRef.current?.click(); // Trigger the file browser
-  };
-
-  const { data: paths, refetch, error } = useListFiles();
-
-  const handleUploadSuccess = (data: FileUploadSuccessResponse) => {
-    const uploadedCount = data.uploaded_files.length;
-    const skippedCount = data.skipped_files.length;
-
-    if (uploadedCount > 0) {
-      toast.success(
-        `upload-success-${new Date().getTime()}`,
-        t(I18nKey.EXPLORER$UPLOAD_SUCCESS_MESSAGE, {
-          count: uploadedCount,
-        }),
-      );
-    }
-
-    if (skippedCount > 0) {
-      const message = t(I18nKey.EXPLORER$UPLOAD_PARTIAL_SUCCESS_MESSAGE, {
-        count: skippedCount,
-      });
-      toast.info(message);
-    }
-
-    if (uploadedCount === 0 && skippedCount === 0) {
-      toast.info(t(I18nKey.EXPLORER$NO_FILES_UPLOADED_MESSAGE));
-    }
-  };
-
-  const handleUploadError = (e: Error) => {
-    toast.error(
-      `upload-error-${new Date().getTime()}`,
-      e.message || t(I18nKey.EXPLORER$UPLOAD_ERROR_MESSAGE),
-    );
-  };
-
-  const { mutate: uploadFiles } = useUploadFiles();
-
-  const refreshWorkspace = () => {
-    if (
-      curAgentState !== AgentState.LOADING &&
-      curAgentState !== AgentState.STOPPED
-    ) {
-      refetch();
-    }
-  };
-
-  const uploadFileData = (files: FileList) => {
-    uploadFiles(
-      { files: Array.from(files) },
-      { onSuccess: handleUploadSuccess, onError: handleUploadError },
-    );
-    refreshWorkspace();
-  };
-
-  const handleVSCodeClick = async (e: React.MouseEvent) => {
-    e.preventDefault();
-    try {
-      const response = await OpenHands.getVSCodeUrl();
-      if (response.vscode_url) {
-        dispatch(
-          addAssistantMessage(
-            "You opened VS Code. Please inform the agent of any changes you made to the workspace or environment. To avoid conflicts, it's best to pause the agent before making any changes.",
-          ),
-        );
-        window.open(response.vscode_url, "_blank");
-      } else {
-        toast.error(
-          `open-vscode-error-${new Date().getTime()}`,
-          t(I18nKey.EXPLORER$VSCODE_SWITCHING_ERROR_MESSAGE, {
-            error: response.error,
-          }),
-        );
-      }
-    } catch (exp_error) {
-      toast.error(
-        `open-vscode-error-${new Date().getTime()}`,
-        t(I18nKey.EXPLORER$VSCODE_SWITCHING_ERROR_MESSAGE, {
-          error: String(exp_error),
-        }),
-      );
-    }
-  };
-
-  React.useEffect(() => {
-    refreshWorkspace();
-  }, [curAgentState]);
-
-  return (
-    <div
-      data-testid="file-explorer"
-      className="relative h-full"
-      onDragEnter={() => {
-        setIsDragging(true);
-      }}
-      onDragEnd={() => {
-        setIsDragging(false);
-      }}
-    >
-      {isDragging && (
-        <div
-          data-testid="dropzone"
-          onDragLeave={() => setIsDragging(false)}
-          onDrop={(event) => {
-            event.preventDefault();
-            const { files: droppedFiles } = event.dataTransfer;
-            if (droppedFiles.length > 0) {
-              uploadFileData(droppedFiles);
-            }
-            setIsDragging(false);
-          }}
-          onDragOver={(event) => event.preventDefault()}
-          className="z-10 absolute flex flex-col justify-center items-center bg-black top-0 bottom-0 left-0 right-0 opacity-65"
-        >
-          <IoFileTray size={32} />
-          <p className="font-bold text-xl">
-            {t(I18nKey.EXPLORER$LABEL_DROP_FILES)}
-          </p>
-        </div>
-      )}
-      <div
-        className={twMerge(
-          "bg-neutral-800 h-full border-r-1 border-r-neutral-600 flex flex-col",
-          !isOpen ? "w-12" : "w-60",
-        )}
-      >
-        <div className="flex flex-col relative h-full px-3 py-2 overflow-hidden">
-          <div className="sticky top-0 bg-neutral-800">
-            <div
-              className={twMerge(
-                "flex items-center",
-                !isOpen ? "justify-center" : "justify-between",
-              )}
-            >
-              {isOpen && (
-                <div className="text-neutral-300 font-bold text-sm">
-                  {t(I18nKey.EXPLORER$LABEL_WORKSPACE)}
-                </div>
-              )}
-              <ExplorerActions
-                isHidden={!isOpen}
-                toggleHidden={onToggle}
-                onRefresh={refreshWorkspace}
-                onUpload={selectFileInput}
-              />
-            </div>
-          </div>
-          {!error && (
-            <div className="overflow-auto flex-grow min-h-0">
-              <div style={{ display: !isOpen ? "none" : "block" }}>
-                <ExplorerTree files={paths || []} />
-              </div>
-            </div>
-          )}
-          {error && (
-            <div className="flex flex-col items-center justify-center h-full">
-              <p className="text-neutral-300 text-sm">{error.message}</p>
-            </div>
-          )}
-          {isOpen && (
-            <button
-              type="button"
-              onClick={handleVSCodeClick}
-              disabled={
-                curAgentState === AgentState.INIT ||
-                curAgentState === AgentState.LOADING
-              }
-              className={twMerge(
-                "mt-auto mb-2 w-full h-10 text-white rounded flex items-center justify-center gap-2 transition-colors",
-                curAgentState === AgentState.INIT ||
-                  curAgentState === AgentState.LOADING
-                  ? "bg-neutral-600 cursor-not-allowed"
-                  : "bg-[#4465DB] hover:bg-[#3451C7]",
-              )}
-              aria-label="Open in VS Code"
-            >
-              <VSCodeIcon width={20} height={20} />
-              Open in VS Code
-            </button>
-          )}
-        </div>
-        <input
-          data-testid="file-input"
-          type="file"
-          multiple
-          ref={fileInputRef}
-          style={{ display: "none" }}
-          onChange={(event) => {
-            const { files: selectedFiles } = event.target;
-            if (selectedFiles && selectedFiles.length > 0) {
-              uploadFileData(selectedFiles);
-            }
-          }}
-        />
-      </div>
-    </div>
-  );
-}
-
-export default FileExplorer;
diff --git a/frontend/src/components/file-explorer/tree-node.tsx b/frontend/src/components/file-explorer/tree-node.tsx
index 07012f2a2c18..5300cae19868 100644
--- a/frontend/src/components/file-explorer/tree-node.tsx
+++ b/frontend/src/components/file-explorer/tree-node.tsx
@@ -10,15 +10,11 @@ interface TitleProps {
   name: string;
   type: "folder" | "file";
   isOpen: boolean;
-  onClick: () => void;
 }
 
-function Title({ name, type, isOpen, onClick }: TitleProps) {
+function Title({ name, type, isOpen }: TitleProps) {
   return (
-    <div
-      onClick={onClick}
-      className="cursor-pointer text-nowrap rounded-[5px] p-1 nowrap flex items-center gap-2 aria-selected:bg-neutral-600 aria-selected:text-white hover:text-white"
-    >
+    <div className="cursor-pointer text-nowrap rounded-[5px] p-1 nowrap flex items-center gap-2 aria-selected:bg-neutral-600 aria-selected:text-white hover:text-white">
       <div className="flex-shrink-0">
         {type === "folder" && <FolderIcon isOpen={isOpen} />}
         {type === "file" && <FileIcon filename={name} />}
@@ -84,13 +80,13 @@ function TreeNode({ path, defaultOpen = false }: TreeNodeProps) {
         type={isDirectory ? "button" : "submit"}
         name="file"
         value={path}
+        onClick={handleClick}
         className="flex items-center justify-between w-full px-1"
       >
         <Title
           name={filename}
           type={isDirectory ? "folder" : "file"}
           isOpen={isOpen}
-          onClick={handleClick}
         />
 
         {modifiedFiles[path] && (
diff --git a/frontend/src/components/modals/account-settings-modal.tsx b/frontend/src/components/modals/account-settings-form.tsx
similarity index 96%
rename from frontend/src/components/modals/account-settings-modal.tsx
rename to frontend/src/components/modals/account-settings-form.tsx
index 59b25cc0de95..3b41ab4332f7 100644
--- a/frontend/src/components/modals/account-settings-modal.tsx
+++ b/frontend/src/components/modals/account-settings-form.tsx
@@ -14,19 +14,19 @@ import { useAuth } from "#/context/auth-context";
 import { useUserPrefs } from "#/context/user-prefs-context";
 import { handleCaptureConsent } from "#/utils/handle-capture-consent";
 
-interface AccountSettingsModalProps {
+interface AccountSettingsFormProps {
   onClose: () => void;
   selectedLanguage: string;
   gitHubError: boolean;
   analyticsConsent: string | null;
 }
 
-function AccountSettingsModal({
+export function AccountSettingsForm({
   onClose,
   selectedLanguage,
   gitHubError,
   analyticsConsent,
-}: AccountSettingsModalProps) {
+}: AccountSettingsFormProps) {
   const { gitHubToken, setGitHubToken, logout } = useAuth();
   const { saveSettings } = useUserPrefs();
   const { t } = useTranslation();
@@ -136,5 +136,3 @@ function AccountSettingsModal({
     </ModalBody>
   );
 }
-
-export default AccountSettingsModal;
diff --git a/frontend/src/context/user-prefs-context.tsx b/frontend/src/context/user-prefs-context.tsx
index e3573c9234c0..060749463da5 100644
--- a/frontend/src/context/user-prefs-context.tsx
+++ b/frontend/src/context/user-prefs-context.tsx
@@ -1,4 +1,5 @@
 import React from "react";
+import posthog from "posthog-js";
 import {
   getSettings,
   Settings,
@@ -28,6 +29,12 @@ function UserPrefsProvider({ children }: React.PropsWithChildren) {
     setSettingsAreUpToDate(checkIfSettingsAreUpToDate());
   };
 
+  React.useEffect(() => {
+    if (settings.LLM_API_KEY) {
+      posthog.capture("user_activated");
+    }
+  }, [settings.LLM_API_KEY]);
+
   const value = React.useMemo(
     () => ({
       settings,
diff --git a/frontend/src/context/ws-client-provider.tsx b/frontend/src/context/ws-client-provider.tsx
index 9160f217d2c8..89483b234ae1 100644
--- a/frontend/src/context/ws-client-provider.tsx
+++ b/frontend/src/context/ws-client-provider.tsx
@@ -136,7 +136,7 @@ export function WsClientProvider({
     // create a new one
     if (
       !sio ||
-      (tokenRef.current && token !== tokenRef.current) ||
+      (tokenRef.current && token && token !== tokenRef.current) ||
       ghToken !== ghTokenRef.current
     ) {
       sio?.disconnect();
diff --git a/frontend/src/hooks/query/use-conversation-config.ts b/frontend/src/hooks/query/use-conversation-config.ts
new file mode 100644
index 000000000000..729c6c969d13
--- /dev/null
+++ b/frontend/src/hooks/query/use-conversation-config.ts
@@ -0,0 +1,32 @@
+import { useQuery } from "@tanstack/react-query";
+import React from "react";
+import {
+  useWsClient,
+  WsClientProviderStatus,
+} from "#/context/ws-client-provider";
+import OpenHands from "#/api/open-hands";
+
+export const useConversationConfig = () => {
+  const { status } = useWsClient();
+
+  const query = useQuery({
+    queryKey: ["conversation_config"],
+    queryFn: OpenHands.getRuntimeId,
+    enabled: status === WsClientProviderStatus.ACTIVE,
+  });
+
+  React.useEffect(() => {
+    if (query.data) {
+      const { runtime_id: runtimeId } = query.data;
+
+      // eslint-disable-next-line no-console
+      console.log(
+        "Runtime ID: %c%s",
+        "background: #444; color: #ffeb3b; font-weight: bold; padding: 2px 4px; border-radius: 4px;",
+        runtimeId,
+      );
+    }
+  }, [query.data]);
+
+  return query;
+};
diff --git a/frontend/src/hooks/query/use-vscode-url.ts b/frontend/src/hooks/query/use-vscode-url.ts
new file mode 100644
index 000000000000..9c913e57cf4b
--- /dev/null
+++ b/frontend/src/hooks/query/use-vscode-url.ts
@@ -0,0 +1,43 @@
+import { useQuery } from "@tanstack/react-query";
+import React from "react";
+import { useTranslation } from "react-i18next";
+import { useDispatch } from "react-redux";
+import toast from "#/utils/toast";
+import { addAssistantMessage } from "#/state/chat-slice";
+import { I18nKey } from "#/i18n/declaration";
+import OpenHands from "#/api/open-hands";
+
+export const useVSCodeUrl = () => {
+  const { t } = useTranslation();
+  const dispatch = useDispatch();
+
+  const data = useQuery({
+    queryKey: ["vscode_url"],
+    queryFn: OpenHands.getVSCodeUrl,
+    enabled: false,
+  });
+
+  const { data: vscodeUrlObject, isFetching } = data;
+
+  React.useEffect(() => {
+    if (isFetching) return;
+
+    if (vscodeUrlObject?.vscode_url) {
+      dispatch(
+        addAssistantMessage(
+          "You opened VS Code. Please inform the agent of any changes you made to the workspace or environment. To avoid conflicts, it's best to pause the agent before making any changes.",
+        ),
+      );
+      window.open(vscodeUrlObject.vscode_url, "_blank");
+    } else if (vscodeUrlObject?.error) {
+      toast.error(
+        `open-vscode-error-${new Date().getTime()}`,
+        t(I18nKey.EXPLORER$VSCODE_SWITCHING_ERROR_MESSAGE, {
+          error: vscodeUrlObject.error,
+        }),
+      );
+    }
+  }, [vscodeUrlObject, isFetching]);
+
+  return data;
+};
diff --git a/frontend/src/routes/_oh._index/import-project-suggestion-box.tsx b/frontend/src/routes/_oh._index/import-project-suggestion-box.tsx
new file mode 100644
index 000000000000..e76317001a01
--- /dev/null
+++ b/frontend/src/routes/_oh._index/import-project-suggestion-box.tsx
@@ -0,0 +1,30 @@
+import { SuggestionBox } from "./suggestion-box";
+
+interface ImportProjectSuggestionBoxProps {
+  onChange: (event: React.ChangeEvent<HTMLInputElement>) => void;
+}
+
+export function ImportProjectSuggestionBox({
+  onChange,
+}: ImportProjectSuggestionBoxProps) {
+  return (
+    <SuggestionBox
+      title="+ Import Project"
+      content={
+        <label htmlFor="import-project" className="w-full flex justify-center">
+          <span className="border-2 border-dashed border-neutral-600 rounded px-2 py-1 cursor-pointer">
+            Upload a .zip
+          </span>
+          <input
+            hidden
+            type="file"
+            accept="application/zip"
+            id="import-project"
+            multiple={false}
+            onChange={onChange}
+          />
+        </label>
+      }
+    />
+  );
+}
diff --git a/frontend/src/routes/_oh._index/route.tsx b/frontend/src/routes/_oh._index/route.tsx
index 5bca097ba516..6134c493fe94 100644
--- a/frontend/src/routes/_oh._index/route.tsx
+++ b/frontend/src/routes/_oh._index/route.tsx
@@ -2,7 +2,6 @@ import { useLocation, useNavigate } from "@remix-run/react";
 import React from "react";
 import { useDispatch } from "react-redux";
 import posthog from "posthog-js";
-import { SuggestionBox } from "./suggestion-box";
 import { TaskForm } from "./task-form";
 import { HeroHeading } from "./hero-heading";
 import { setImportedProjectZip } from "#/state/initial-query-slice";
@@ -13,6 +12,7 @@ import { useGitHubUser } from "#/hooks/query/use-github-user";
 import { useGitHubAuthUrl } from "#/hooks/use-github-auth-url";
 import { useConfig } from "#/hooks/query/use-config";
 import { useAuth } from "#/context/auth-context";
+import { ImportProjectSuggestionBox } from "./import-project-suggestion-box";
 
 function Home() {
   const { token, gitHubToken } = useAuth();
@@ -47,6 +47,7 @@ function Home() {
         <div className="flex flex-col gap-2 w-full">
           <TaskForm ref={formRef} />
         </div>
+
         <div className="flex gap-4 w-full">
           <GitHubRepositoriesSuggestionBox
             handleSubmit={() => formRef.current?.requestSubmit()}
@@ -55,39 +56,18 @@ function Home() {
             }
             gitHubAuthUrl={gitHubAuthUrl}
             user={user || null}
-            // onEndReached={}
           />
-          <SuggestionBox
-            title="+ Import Project"
-            content={
-              <label
-                htmlFor="import-project"
-                className="w-full flex justify-center"
-              >
-                <span className="border-2 border-dashed border-neutral-600 rounded px-2 py-1 cursor-pointer">
-                  Upload a .zip
-                </span>
-                <input
-                  hidden
-                  type="file"
-                  accept="application/zip"
-                  id="import-project"
-                  multiple={false}
-                  onChange={async (event) => {
-                    if (event.target.files) {
-                      const zip = event.target.files[0];
-                      dispatch(
-                        setImportedProjectZip(await convertZipToBase64(zip)),
-                      );
-                      posthog.capture("zip_file_uploaded");
-                      formRef.current?.requestSubmit();
-                    } else {
-                      // TODO: handle error
-                    }
-                  }}
-                />
-              </label>
-            }
+          <ImportProjectSuggestionBox
+            onChange={async (event) => {
+              if (event.target.files) {
+                const zip = event.target.files[0];
+                dispatch(setImportedProjectZip(await convertZipToBase64(zip)));
+                posthog.capture("zip_file_uploaded");
+                formRef.current?.requestSubmit();
+              } else {
+                // TODO: handle error
+              }
+            }}
           />
         </div>
       </div>
diff --git a/frontend/src/routes/_oh.app._index/constants.ts b/frontend/src/routes/_oh.app._index/constants.ts
new file mode 100644
index 000000000000..b4b512172ae4
--- /dev/null
+++ b/frontend/src/routes/_oh.app._index/constants.ts
@@ -0,0 +1,11 @@
+export const ASSET_FILE_TYPES = [
+  ".png",
+  ".jpg",
+  ".jpeg",
+  ".bmp",
+  ".gif",
+  ".pdf",
+  ".mp4",
+  ".webm",
+  ".ogg",
+];
diff --git a/frontend/src/routes/_oh.app._index/file-explorer/buttons/open-vscode-button.tsx b/frontend/src/routes/_oh.app._index/file-explorer/buttons/open-vscode-button.tsx
new file mode 100644
index 000000000000..0c8dfbc3f40c
--- /dev/null
+++ b/frontend/src/routes/_oh.app._index/file-explorer/buttons/open-vscode-button.tsx
@@ -0,0 +1,30 @@
+import { cn } from "#/utils/utils";
+import VSCodeIcon from "#/assets/vscode-alt.svg?react";
+
+interface OpenVSCodeButtonProps {
+  isDisabled: boolean;
+  onClick: () => void;
+}
+
+export function OpenVSCodeButton({
+  isDisabled,
+  onClick,
+}: OpenVSCodeButtonProps) {
+  return (
+    <button
+      type="button"
+      onClick={onClick}
+      disabled={isDisabled}
+      className={cn(
+        "mt-auto mb-2 w-full h-10 text-white rounded flex items-center justify-center gap-2 transition-colors",
+        isDisabled
+          ? "bg-neutral-600 cursor-not-allowed"
+          : "bg-[#4465DB] hover:bg-[#3451C7]",
+      )}
+      aria-label="Open in VS Code"
+    >
+      <VSCodeIcon width={20} height={20} />
+      Open in VS Code
+    </button>
+  );
+}
diff --git a/frontend/src/routes/_oh.app._index/file-explorer/buttons/refresh-icon-button.tsx b/frontend/src/routes/_oh.app._index/file-explorer/buttons/refresh-icon-button.tsx
new file mode 100644
index 000000000000..d21ab4160b35
--- /dev/null
+++ b/frontend/src/routes/_oh.app._index/file-explorer/buttons/refresh-icon-button.tsx
@@ -0,0 +1,22 @@
+import { IoIosRefresh } from "react-icons/io";
+import IconButton from "#/components/icon-button";
+
+interface RefreshIconButtonProps {
+  onClick: () => void;
+}
+
+export function RefreshIconButton({ onClick }: RefreshIconButtonProps) {
+  return (
+    <IconButton
+      icon={
+        <IoIosRefresh
+          size={16}
+          className="text-neutral-400 hover:text-neutral-100 transition"
+        />
+      }
+      testId="refresh"
+      ariaLabel="Refresh workspace"
+      onClick={onClick}
+    />
+  );
+}
diff --git a/frontend/src/routes/_oh.app._index/file-explorer/buttons/toggle-workspace-icon-button.tsx b/frontend/src/routes/_oh.app._index/file-explorer/buttons/toggle-workspace-icon-button.tsx
new file mode 100644
index 000000000000..5d42eeba0495
--- /dev/null
+++ b/frontend/src/routes/_oh.app._index/file-explorer/buttons/toggle-workspace-icon-button.tsx
@@ -0,0 +1,33 @@
+import { IoIosArrowForward, IoIosArrowBack } from "react-icons/io";
+import IconButton from "#/components/icon-button";
+
+interface ToggleWorkspaceIconButtonProps {
+  onClick: () => void;
+  isHidden: boolean;
+}
+
+export function ToggleWorkspaceIconButton({
+  onClick,
+  isHidden,
+}: ToggleWorkspaceIconButtonProps) {
+  return (
+    <IconButton
+      icon={
+        isHidden ? (
+          <IoIosArrowForward
+            size={20}
+            className="text-neutral-400 hover:text-neutral-100 transition"
+          />
+        ) : (
+          <IoIosArrowBack
+            size={20}
+            className="text-neutral-400 hover:text-neutral-100 transition"
+          />
+        )
+      }
+      testId="toggle"
+      ariaLabel={isHidden ? "Open workspace" : "Close workspace"}
+      onClick={onClick}
+    />
+  );
+}
diff --git a/frontend/src/routes/_oh.app._index/file-explorer/buttons/upload-icon-button.tsx b/frontend/src/routes/_oh.app._index/file-explorer/buttons/upload-icon-button.tsx
new file mode 100644
index 000000000000..b10ede48d806
--- /dev/null
+++ b/frontend/src/routes/_oh.app._index/file-explorer/buttons/upload-icon-button.tsx
@@ -0,0 +1,22 @@
+import { IoIosCloudUpload } from "react-icons/io";
+import IconButton from "#/components/icon-button";
+
+interface UploadIconButtonProps {
+  onClick: () => void;
+}
+
+export function UploadIconButton({ onClick }: UploadIconButtonProps) {
+  return (
+    <IconButton
+      icon={
+        <IoIosCloudUpload
+          size={16}
+          className="text-neutral-400 hover:text-neutral-100 transition"
+        />
+      }
+      testId="upload"
+      ariaLabel="Upload File"
+      onClick={onClick}
+    />
+  );
+}
diff --git a/frontend/src/routes/_oh.app._index/file-explorer/dropzone.tsx b/frontend/src/routes/_oh.app._index/file-explorer/dropzone.tsx
new file mode 100644
index 000000000000..3713fa2a78fb
--- /dev/null
+++ b/frontend/src/routes/_oh.app._index/file-explorer/dropzone.tsx
@@ -0,0 +1,27 @@
+import { useTranslation } from "react-i18next";
+import { IoFileTray } from "react-icons/io5";
+import { I18nKey } from "#/i18n/declaration";
+
+interface DropzoneProps {
+  onDragLeave: () => void;
+  onDrop: (event: React.DragEvent<HTMLDivElement>) => void;
+}
+
+export function Dropzone({ onDragLeave, onDrop }: DropzoneProps) {
+  const { t } = useTranslation();
+
+  return (
+    <div
+      data-testid="dropzone"
+      onDragLeave={onDragLeave}
+      onDrop={onDrop}
+      onDragOver={(event) => event.preventDefault()}
+      className="z-10 absolute flex flex-col justify-center items-center bg-black top-0 bottom-0 left-0 right-0 opacity-65"
+    >
+      <IoFileTray size={32} />
+      <p className="font-bold text-xl">
+        {t(I18nKey.EXPLORER$LABEL_DROP_FILES)}
+      </p>
+    </div>
+  );
+}
diff --git a/frontend/src/routes/_oh.app._index/file-explorer/file-explorer-actions.tsx b/frontend/src/routes/_oh.app._index/file-explorer/file-explorer-actions.tsx
new file mode 100644
index 000000000000..7fb9552ba2f3
--- /dev/null
+++ b/frontend/src/routes/_oh.app._index/file-explorer/file-explorer-actions.tsx
@@ -0,0 +1,36 @@
+import { cn } from "#/utils/utils";
+import { RefreshIconButton } from "./buttons/refresh-icon-button";
+import { ToggleWorkspaceIconButton } from "./buttons/toggle-workspace-icon-button";
+import { UploadIconButton } from "./buttons/upload-icon-button";
+
+interface ExplorerActionsProps {
+  onRefresh: () => void;
+  onUpload: () => void;
+  toggleHidden: () => void;
+  isHidden: boolean;
+}
+
+export function ExplorerActions({
+  toggleHidden,
+  onRefresh,
+  onUpload,
+  isHidden,
+}: ExplorerActionsProps) {
+  return (
+    <div
+      className={cn(
+        "flex h-[24px] items-center gap-1",
+        isHidden ? "right-3" : "right-2",
+      )}
+    >
+      {!isHidden && (
+        <>
+          <RefreshIconButton onClick={onRefresh} />
+          <UploadIconButton onClick={onUpload} />
+        </>
+      )}
+
+      <ToggleWorkspaceIconButton isHidden={isHidden} onClick={toggleHidden} />
+    </div>
+  );
+}
diff --git a/frontend/src/routes/_oh.app._index/file-explorer/file-explorer-header.tsx b/frontend/src/routes/_oh.app._index/file-explorer/file-explorer-header.tsx
new file mode 100644
index 000000000000..d2329889f1fa
--- /dev/null
+++ b/frontend/src/routes/_oh.app._index/file-explorer/file-explorer-header.tsx
@@ -0,0 +1,42 @@
+import { useTranslation } from "react-i18next";
+import { I18nKey } from "#/i18n/declaration";
+import { cn } from "#/utils/utils";
+import { ExplorerActions } from "./file-explorer-actions";
+
+interface FileExplorerHeaderProps {
+  isOpen: boolean;
+  onToggle: () => void;
+  onRefreshWorkspace: () => void;
+  onUploadFile: () => void;
+}
+
+export function FileExplorerHeader({
+  isOpen,
+  onToggle,
+  onRefreshWorkspace,
+  onUploadFile,
+}: FileExplorerHeaderProps) {
+  const { t } = useTranslation();
+
+  return (
+    <div
+      className={cn(
+        "sticky top-0 bg-neutral-800",
+        "flex items-center",
+        !isOpen ? "justify-center" : "justify-between",
+      )}
+    >
+      {isOpen && (
+        <div className="text-neutral-300 font-bold text-sm">
+          {t(I18nKey.EXPLORER$LABEL_WORKSPACE)}
+        </div>
+      )}
+      <ExplorerActions
+        isHidden={!isOpen}
+        toggleHidden={onToggle}
+        onRefresh={onRefreshWorkspace}
+        onUpload={onUploadFile}
+      />
+    </div>
+  );
+}
diff --git a/frontend/src/routes/_oh.app._index/file-explorer/file-explorer.tsx b/frontend/src/routes/_oh.app._index/file-explorer/file-explorer.tsx
new file mode 100644
index 000000000000..a7979cacd381
--- /dev/null
+++ b/frontend/src/routes/_oh.app._index/file-explorer/file-explorer.tsx
@@ -0,0 +1,156 @@
+import React from "react";
+import { useSelector } from "react-redux";
+import { useTranslation } from "react-i18next";
+import AgentState from "#/types/agent-state";
+import ExplorerTree from "../../../components/file-explorer/explorer-tree";
+import toast from "#/utils/toast";
+import { RootState } from "#/store";
+import { I18nKey } from "#/i18n/declaration";
+import { useListFiles } from "#/hooks/query/use-list-files";
+import { FileUploadSuccessResponse } from "#/api/open-hands.types";
+import { useUploadFiles } from "#/hooks/mutation/use-upload-files";
+import { cn } from "#/utils/utils";
+import { OpenVSCodeButton } from "./buttons/open-vscode-button";
+import { Dropzone } from "./dropzone";
+import { FileExplorerHeader } from "./file-explorer-header";
+import { useVSCodeUrl } from "#/hooks/query/use-vscode-url";
+
+interface FileExplorerProps {
+  isOpen: boolean;
+  onToggle: () => void;
+}
+
+export function FileExplorer({ isOpen, onToggle }: FileExplorerProps) {
+  const { t } = useTranslation();
+
+  const fileInputRef = React.useRef<HTMLInputElement | null>(null);
+  const [isDragging, setIsDragging] = React.useState(false);
+
+  const { curAgentState } = useSelector((state: RootState) => state.agent);
+
+  const { data: paths, refetch, error } = useListFiles();
+  const { mutate: uploadFiles } = useUploadFiles();
+  const { refetch: getVSCodeUrl } = useVSCodeUrl();
+
+  const selectFileInput = () => {
+    fileInputRef.current?.click(); // Trigger the file browser
+  };
+
+  const handleUploadSuccess = (data: FileUploadSuccessResponse) => {
+    const uploadedCount = data.uploaded_files.length;
+    const skippedCount = data.skipped_files.length;
+
+    if (uploadedCount > 0) {
+      toast.success(
+        `upload-success-${new Date().getTime()}`,
+        t(I18nKey.EXPLORER$UPLOAD_SUCCESS_MESSAGE, {
+          count: uploadedCount,
+        }),
+      );
+    }
+
+    if (skippedCount > 0) {
+      const message = t(I18nKey.EXPLORER$UPLOAD_PARTIAL_SUCCESS_MESSAGE, {
+        count: skippedCount,
+      });
+      toast.info(message);
+    }
+
+    if (uploadedCount === 0 && skippedCount === 0) {
+      toast.info(t(I18nKey.EXPLORER$NO_FILES_UPLOADED_MESSAGE));
+    }
+  };
+
+  const handleUploadError = (uploadError: Error) => {
+    toast.error(
+      `upload-error-${new Date().getTime()}`,
+      uploadError.message || t(I18nKey.EXPLORER$UPLOAD_ERROR_MESSAGE),
+    );
+  };
+
+  const refreshWorkspace = () => {
+    if (
+      curAgentState !== AgentState.LOADING &&
+      curAgentState !== AgentState.STOPPED
+    ) {
+      refetch();
+    }
+  };
+
+  const uploadFileData = (files: FileList) => {
+    uploadFiles(
+      { files: Array.from(files) },
+      { onSuccess: handleUploadSuccess, onError: handleUploadError },
+    );
+    refreshWorkspace();
+  };
+
+  const handleDropFiles = (event: React.DragEvent<HTMLDivElement>) => {
+    event.preventDefault();
+    const { files: droppedFiles } = event.dataTransfer;
+    if (droppedFiles.length > 0) {
+      uploadFileData(droppedFiles);
+    }
+    setIsDragging(false);
+  };
+
+  React.useEffect(() => {
+    refreshWorkspace();
+  }, [curAgentState]);
+
+  return (
+    <div
+      data-testid="file-explorer"
+      className="relative h-full"
+      onDragEnter={() => {
+        setIsDragging(true);
+      }}
+      onDragEnd={() => {
+        setIsDragging(false);
+      }}
+    >
+      {isDragging && (
+        <Dropzone
+          onDragLeave={() => setIsDragging(false)}
+          onDrop={handleDropFiles}
+        />
+      )}
+      <div
+        className={cn(
+          "bg-neutral-800 h-full border-r-1 border-r-neutral-600 flex flex-col",
+          !isOpen ? "w-12" : "w-60",
+        )}
+      >
+        <div className="flex flex-col relative h-full px-3 py-2 overflow-hidden">
+          <FileExplorerHeader
+            isOpen={isOpen}
+            onToggle={onToggle}
+            onRefreshWorkspace={refreshWorkspace}
+            onUploadFile={selectFileInput}
+          />
+          {!error && (
+            <div className="overflow-auto flex-grow min-h-0">
+              <div style={{ display: !isOpen ? "none" : "block" }}>
+                <ExplorerTree files={paths || []} />
+              </div>
+            </div>
+          )}
+          {error && (
+            <div className="flex flex-col items-center justify-center h-full">
+              <p className="text-neutral-300 text-sm">{error.message}</p>
+            </div>
+          )}
+          {isOpen && (
+            <OpenVSCodeButton
+              onClick={getVSCodeUrl}
+              isDisabled={
+                curAgentState === AgentState.INIT ||
+                curAgentState === AgentState.LOADING
+              }
+            />
+          )}
+        </div>
+      </div>
+    </div>
+  );
+}
diff --git a/frontend/src/routes/_oh.app._index/route.tsx b/frontend/src/routes/_oh.app._index/route.tsx
index 8ca4b5b345b5..99f583ecf74e 100644
--- a/frontend/src/routes/_oh.app._index/route.tsx
+++ b/frontend/src/routes/_oh.app._index/route.tsx
@@ -5,23 +5,12 @@ import { editor } from "monaco-editor";
 import { EditorProps } from "@monaco-editor/react";
 import { RootState } from "#/store";
 import AgentState from "#/types/agent-state";
-import FileExplorer from "#/components/file-explorer/file-explorer";
+import { FileExplorer } from "#/routes/_oh.app._index/file-explorer/file-explorer";
 import CodeEditorComponent from "./code-editor-component";
 import { useFiles } from "#/context/files";
 import { EditorActions } from "#/components/editor-actions";
 import { useSaveFile } from "#/hooks/mutation/use-save-file";
-
-const ASSET_FILE_TYPES = [
-  ".png",
-  ".jpg",
-  ".jpeg",
-  ".bmp",
-  ".gif",
-  ".pdf",
-  ".mp4",
-  ".webm",
-  ".ogg",
-];
+import { ASSET_FILE_TYPES } from "./constants";
 
 export function ErrorBoundary() {
   const error = useRouteError();
diff --git a/frontend/src/routes/_oh.app/action-suggestions.tsx b/frontend/src/routes/_oh.app/action-suggestions.tsx
new file mode 100644
index 000000000000..fc9442e99606
--- /dev/null
+++ b/frontend/src/routes/_oh.app/action-suggestions.tsx
@@ -0,0 +1,90 @@
+import posthog from "posthog-js";
+import React from "react";
+import { SuggestionItem } from "#/components/suggestion-item";
+import { useAuth } from "#/context/auth-context";
+import { downloadWorkspace } from "#/utils/download-workspace";
+
+interface ActionSuggestionsProps {
+  onSuggestionsClick: (value: string) => void;
+}
+
+export function ActionSuggestions({
+  onSuggestionsClick,
+}: ActionSuggestionsProps) {
+  const { gitHubToken } = useAuth();
+
+  const [isDownloading, setIsDownloading] = React.useState(false);
+  const [hasPullRequest, setHasPullRequest] = React.useState(false);
+
+  const handleDownloadWorkspace = async () => {
+    setIsDownloading(true);
+    try {
+      await downloadWorkspace();
+    } catch (error) {
+      // TODO: Handle error
+    } finally {
+      setIsDownloading(false);
+    }
+  };
+
+  return (
+    <div className="flex flex-col gap-2 mb-2">
+      {gitHubToken ? (
+        <div className="flex flex-row gap-2 justify-center w-full">
+          {!hasPullRequest ? (
+            <>
+              <SuggestionItem
+                suggestion={{
+                  label: "Push to Branch",
+                  value:
+                    "Please push the changes to a remote branch on GitHub, but do NOT create a pull request.",
+                }}
+                onClick={(value) => {
+                  posthog.capture("push_to_branch_button_clicked");
+                  onSuggestionsClick(value);
+                }}
+              />
+              <SuggestionItem
+                suggestion={{
+                  label: "Push & Create PR",
+                  value:
+                    "Please push the changes to GitHub and open a pull request.",
+                }}
+                onClick={(value) => {
+                  posthog.capture("create_pr_button_clicked");
+                  onSuggestionsClick(value);
+                  setHasPullRequest(true);
+                }}
+              />
+            </>
+          ) : (
+            <SuggestionItem
+              suggestion={{
+                label: "Push changes to PR",
+                value:
+                  "Please push the latest changes to the existing pull request.",
+              }}
+              onClick={(value) => {
+                posthog.capture("push_to_pr_button_clicked");
+                onSuggestionsClick(value);
+              }}
+            />
+          )}
+        </div>
+      ) : (
+        <SuggestionItem
+          suggestion={{
+            label: !isDownloading
+              ? "Download .zip"
+              : "Downloading, please wait...",
+            value: "Download .zip",
+          }}
+          onClick={() => {
+            posthog.capture("download_workspace_button_clicked");
+            handleDownloadWorkspace();
+          }}
+        />
+      )}
+    </div>
+  );
+}
diff --git a/frontend/src/routes/_oh.app/chat-interface.tsx b/frontend/src/routes/_oh.app/chat-interface.tsx
new file mode 100644
index 000000000000..8b413c550fdd
--- /dev/null
+++ b/frontend/src/routes/_oh.app/chat-interface.tsx
@@ -0,0 +1,144 @@
+import { useDispatch, useSelector } from "react-redux";
+import React from "react";
+import posthog from "posthog-js";
+import { convertImageToBase64 } from "#/utils/convert-image-to-base-64";
+import { FeedbackActions } from "../../components/feedback-actions";
+import { createChatMessage } from "#/services/chat-service";
+import { InteractiveChatBox } from "../../components/interactive-chat-box";
+import { addUserMessage } from "#/state/chat-slice";
+import { RootState } from "#/store";
+import AgentState from "#/types/agent-state";
+import { generateAgentStateChangeEvent } from "#/services/agent-state-service";
+import { FeedbackModal } from "../../components/feedback-modal";
+import { useScrollToBottom } from "#/hooks/use-scroll-to-bottom";
+import TypingIndicator from "../../components/chat/typing-indicator";
+import { ContinueButton } from "../../components/continue-button";
+import { ScrollToBottomButton } from "../../components/scroll-to-bottom-button";
+import { useWsClient } from "#/context/ws-client-provider";
+import { Messages } from "./messages";
+import { LoadingSpinner } from "./loading-spinner";
+import { ChatSuggestions } from "./chat-suggestions";
+import { ActionSuggestions } from "./action-suggestions";
+
+export function ChatInterface() {
+  const { send, isLoadingMessages } = useWsClient();
+  const dispatch = useDispatch();
+
+  const scrollRef = React.useRef<HTMLDivElement>(null);
+  const { scrollDomToBottom, onChatBodyScroll, hitBottom } =
+    useScrollToBottom(scrollRef);
+
+  const { messages } = useSelector((state: RootState) => state.chat);
+  const { curAgentState } = useSelector((state: RootState) => state.agent);
+
+  const [feedbackPolarity, setFeedbackPolarity] = React.useState<
+    "positive" | "negative"
+  >("positive");
+  const [feedbackModalIsOpen, setFeedbackModalIsOpen] = React.useState(false);
+  const [messageToSend, setMessageToSend] = React.useState<string | null>(null);
+
+  const handleSendMessage = async (content: string, files: File[]) => {
+    posthog.capture("user_message_sent", {
+      current_message_count: messages.length,
+    });
+    const promises = files.map((file) => convertImageToBase64(file));
+    const imageUrls = await Promise.all(promises);
+
+    const timestamp = new Date().toISOString();
+    dispatch(addUserMessage({ content, imageUrls, timestamp }));
+    send(createChatMessage(content, imageUrls, timestamp));
+    setMessageToSend(null);
+  };
+
+  const handleStop = () => {
+    posthog.capture("stop_button_clicked");
+    send(generateAgentStateChangeEvent(AgentState.STOPPED));
+  };
+
+  const handleSendContinueMsg = () => {
+    handleSendMessage("Continue", []);
+  };
+
+  const onClickShareFeedbackActionButton = async (
+    polarity: "positive" | "negative",
+  ) => {
+    setFeedbackModalIsOpen(true);
+    setFeedbackPolarity(polarity);
+  };
+
+  const isWaitingForUserInput =
+    curAgentState === AgentState.AWAITING_USER_INPUT ||
+    curAgentState === AgentState.FINISHED;
+
+  return (
+    <div className="h-full flex flex-col justify-between">
+      {messages.length === 0 && (
+        <ChatSuggestions onSuggestionsClick={setMessageToSend} />
+      )}
+
+      <div
+        ref={scrollRef}
+        onScroll={(e) => onChatBodyScroll(e.currentTarget)}
+        className="flex flex-col grow overflow-y-auto overflow-x-hidden px-4 pt-4 gap-2"
+      >
+        {isLoadingMessages && <LoadingSpinner />}
+
+        {!isLoadingMessages && (
+          <Messages
+            messages={messages}
+            isAwaitingUserConfirmation={
+              curAgentState === AgentState.AWAITING_USER_CONFIRMATION
+            }
+          />
+        )}
+
+        {isWaitingForUserInput && (
+          <ActionSuggestions
+            onSuggestionsClick={(value) => handleSendMessage(value, [])}
+          />
+        )}
+      </div>
+
+      <div className="flex flex-col gap-[6px] px-4 pb-4">
+        <div className="flex justify-between relative">
+          <FeedbackActions
+            onPositiveFeedback={() =>
+              onClickShareFeedbackActionButton("positive")
+            }
+            onNegativeFeedback={() =>
+              onClickShareFeedbackActionButton("negative")
+            }
+          />
+
+          <div className="absolute left-1/2 transform -translate-x-1/2 bottom-0">
+            {messages.length > 2 &&
+              curAgentState === AgentState.AWAITING_USER_INPUT && (
+                <ContinueButton onClick={handleSendContinueMsg} />
+              )}
+            {curAgentState === AgentState.RUNNING && <TypingIndicator />}
+          </div>
+
+          {!hitBottom && <ScrollToBottomButton onClick={scrollDomToBottom} />}
+        </div>
+
+        <InteractiveChatBox
+          onSubmit={handleSendMessage}
+          onStop={handleStop}
+          isDisabled={
+            curAgentState === AgentState.LOADING ||
+            curAgentState === AgentState.AWAITING_USER_CONFIRMATION
+          }
+          mode={curAgentState === AgentState.RUNNING ? "stop" : "submit"}
+          value={messageToSend ?? undefined}
+          onChange={setMessageToSend}
+        />
+      </div>
+
+      <FeedbackModal
+        isOpen={feedbackModalIsOpen}
+        onClose={() => setFeedbackModalIsOpen(false)}
+        polarity={feedbackPolarity}
+      />
+    </div>
+  );
+}
diff --git a/frontend/src/routes/_oh.app/chat-suggestions.tsx b/frontend/src/routes/_oh.app/chat-suggestions.tsx
new file mode 100644
index 000000000000..1f08ace538f7
--- /dev/null
+++ b/frontend/src/routes/_oh.app/chat-suggestions.tsx
@@ -0,0 +1,29 @@
+import { Suggestions } from "#/components/suggestions";
+import BuildIt from "#/icons/build-it.svg?react";
+import { SUGGESTIONS } from "#/utils/suggestions";
+
+interface ChatSuggestionsProps {
+  onSuggestionsClick: (value: string) => void;
+}
+
+export function ChatSuggestions({ onSuggestionsClick }: ChatSuggestionsProps) {
+  return (
+    <div className="flex flex-col gap-6 h-full px-4 items-center justify-center">
+      <div className="flex flex-col items-center p-4 bg-neutral-700 rounded-xl w-full">
+        <BuildIt width={45} height={54} />
+        <span className="font-semibold text-[20px] leading-6 -tracking-[0.01em] gap-1">
+          Let&apos;s start building!
+        </span>
+      </div>
+      <Suggestions
+        suggestions={Object.entries(SUGGESTIONS.repo)
+          .slice(0, 4)
+          .map(([label, value]) => ({
+            label,
+            value,
+          }))}
+        onSuggestionClick={onSuggestionsClick}
+      />
+    </div>
+  );
+}
diff --git a/frontend/src/routes/_oh.app/event-handler.tsx b/frontend/src/routes/_oh.app/event-handler.tsx
new file mode 100644
index 000000000000..2c45f013e2f7
--- /dev/null
+++ b/frontend/src/routes/_oh.app/event-handler.tsx
@@ -0,0 +1,12 @@
+import React from "react";
+import { useWSStatusChange } from "./hooks/use-ws-status-change";
+import { useHandleWSEvents } from "./hooks/use-handle-ws-events";
+import { useHandleRuntimeActive } from "./hooks/use-handle-runtime-active";
+
+export function EventHandler({ children }: React.PropsWithChildren) {
+  useWSStatusChange();
+  useHandleWSEvents();
+  useHandleRuntimeActive();
+
+  return children;
+}
diff --git a/frontend/src/routes/_oh.app/hooks/use-handle-runtime-active.ts b/frontend/src/routes/_oh.app/hooks/use-handle-runtime-active.ts
new file mode 100644
index 000000000000..e5162f4dc0de
--- /dev/null
+++ b/frontend/src/routes/_oh.app/hooks/use-handle-runtime-active.ts
@@ -0,0 +1,65 @@
+import React from "react";
+import toast from "react-hot-toast";
+import { useDispatch, useSelector } from "react-redux";
+import { isGitHubErrorReponse } from "#/api/github";
+import { useAuth } from "#/context/auth-context";
+import {
+  useWsClient,
+  WsClientProviderStatus,
+} from "#/context/ws-client-provider";
+import { getGitHubTokenCommand } from "#/services/terminal-service";
+import { setImportedProjectZip } from "#/state/initial-query-slice";
+import { RootState } from "#/store";
+import { base64ToBlob } from "#/utils/base64-to-blob";
+import { useUploadFiles } from "../../../hooks/mutation/use-upload-files";
+import { useGitHubUser } from "../../../hooks/query/use-github-user";
+
+export const useHandleRuntimeActive = () => {
+  const { gitHubToken } = useAuth();
+  const { status, send } = useWsClient();
+
+  const dispatch = useDispatch();
+
+  const { data: user } = useGitHubUser();
+  const { mutate: uploadFiles } = useUploadFiles();
+
+  const runtimeActive = status === WsClientProviderStatus.ACTIVE;
+
+  const { importedProjectZip } = useSelector(
+    (state: RootState) => state.initalQuery,
+  );
+
+  const userId = React.useMemo(() => {
+    if (user && !isGitHubErrorReponse(user)) return user.id;
+    return null;
+  }, [user]);
+
+  const handleUploadFiles = (zip: string) => {
+    const blob = base64ToBlob(zip);
+    const file = new File([blob], "imported-project.zip", {
+      type: blob.type,
+    });
+    uploadFiles(
+      { files: [file] },
+      {
+        onError: () => {
+          toast.error("Failed to upload project files.");
+        },
+      },
+    );
+    dispatch(setImportedProjectZip(null));
+  };
+
+  React.useEffect(() => {
+    if (runtimeActive && userId && gitHubToken) {
+      // Export if the user valid, this could happen mid-session so it is handled here
+      send(getGitHubTokenCommand(gitHubToken));
+    }
+  }, [userId, gitHubToken, runtimeActive]);
+
+  React.useEffect(() => {
+    if (runtimeActive && importedProjectZip) {
+      handleUploadFiles(importedProjectZip);
+    }
+  }, [runtimeActive, importedProjectZip]);
+};
diff --git a/frontend/src/routes/_oh.app/hooks/use-handle-ws-events.ts b/frontend/src/routes/_oh.app/hooks/use-handle-ws-events.ts
new file mode 100644
index 000000000000..5dfc7f8ca8b7
--- /dev/null
+++ b/frontend/src/routes/_oh.app/hooks/use-handle-ws-events.ts
@@ -0,0 +1,71 @@
+import React from "react";
+import toast from "react-hot-toast";
+import { useDispatch } from "react-redux";
+import { useAuth } from "#/context/auth-context";
+import { useWsClient } from "#/context/ws-client-provider";
+import { generateAgentStateChangeEvent } from "#/services/agent-state-service";
+import { addErrorMessage } from "#/state/chat-slice";
+import AgentState from "#/types/agent-state";
+import { ErrorObservation } from "#/types/core/observations";
+import { useEndSession } from "../../../hooks/use-end-session";
+
+interface ServerError {
+  error: boolean | string;
+  message: string;
+  [key: string]: unknown;
+}
+
+const isServerError = (data: object): data is ServerError => "error" in data;
+
+const isErrorObservation = (data: object): data is ErrorObservation =>
+  "observation" in data && data.observation === "error";
+
+export const useHandleWSEvents = () => {
+  const { events, send } = useWsClient();
+  const { setToken } = useAuth();
+  const endSession = useEndSession();
+  const dispatch = useDispatch();
+
+  React.useEffect(() => {
+    if (!events.length) {
+      return;
+    }
+    const event = events[events.length - 1];
+    if (event.token && typeof event.token === "string") {
+      setToken(event.token);
+      return;
+    }
+
+    if (isServerError(event)) {
+      if (event.error_code === 401) {
+        toast.error("Session expired.");
+        endSession();
+        return;
+      }
+
+      if (typeof event.error === "string") {
+        toast.error(event.error);
+      } else {
+        toast.error(event.message);
+      }
+      return;
+    }
+
+    if (event.type === "error") {
+      const message: string = `${event.message}`;
+      if (message.startsWith("Agent reached maximum")) {
+        // We set the agent state to paused here - if the user clicks resume, it auto updates the max iterations
+        send(generateAgentStateChangeEvent(AgentState.PAUSED));
+      }
+    }
+
+    if (isErrorObservation(event)) {
+      dispatch(
+        addErrorMessage({
+          id: event.extras?.error_id,
+          message: event.message,
+        }),
+      );
+    }
+  }, [events.length]);
+};
diff --git a/frontend/src/routes/_oh.app/hooks/use-ws-status-change.ts b/frontend/src/routes/_oh.app/hooks/use-ws-status-change.ts
new file mode 100644
index 000000000000..a93a5c584d0f
--- /dev/null
+++ b/frontend/src/routes/_oh.app/hooks/use-ws-status-change.ts
@@ -0,0 +1,97 @@
+import React from "react";
+import { useDispatch, useSelector } from "react-redux";
+import { useAuth } from "#/context/auth-context";
+import {
+  useWsClient,
+  WsClientProviderStatus,
+} from "#/context/ws-client-provider";
+import { createChatMessage } from "#/services/chat-service";
+import { getCloneRepoCommand } from "#/services/terminal-service";
+import { setCurrentAgentState } from "#/state/agent-slice";
+import { addUserMessage } from "#/state/chat-slice";
+import {
+  clearSelectedRepository,
+  clearFiles,
+  clearInitialQuery,
+} from "#/state/initial-query-slice";
+import { RootState } from "#/store";
+import AgentState from "#/types/agent-state";
+
+export const useWSStatusChange = () => {
+  const { send, status } = useWsClient();
+  const { gitHubToken } = useAuth();
+  const dispatch = useDispatch();
+
+  const statusRef = React.useRef<WsClientProviderStatus | null>(null);
+
+  const { selectedRepository } = useSelector(
+    (state: RootState) => state.initalQuery,
+  );
+
+  const { files, importedProjectZip, initialQuery } = useSelector(
+    (state: RootState) => state.initalQuery,
+  );
+
+  const sendInitialQuery = (query: string, base64Files: string[]) => {
+    const timestamp = new Date().toISOString();
+    send(createChatMessage(query, base64Files, timestamp));
+  };
+
+  const dispatchCloneRepoCommand = (ghToken: string, repository: string) => {
+    send(getCloneRepoCommand(ghToken, repository));
+    dispatch(clearSelectedRepository());
+  };
+
+  const dispatchInitialQuery = (query: string, additionalInfo: string) => {
+    if (additionalInfo) {
+      sendInitialQuery(`${query}\n\n[${additionalInfo}]`, files);
+    } else {
+      sendInitialQuery(query, files);
+    }
+
+    dispatch(clearFiles()); // reset selected files
+    dispatch(clearInitialQuery()); // reset initial query
+  };
+
+  const handleOnWSActive = () => {
+    let additionalInfo = "";
+
+    if (gitHubToken && selectedRepository) {
+      dispatchCloneRepoCommand(gitHubToken, selectedRepository);
+      additionalInfo = `Repository ${selectedRepository} has been cloned to /workspace. Please check the /workspace for files.`;
+    } else if (importedProjectZip) {
+      // if there's an uploaded project zip, add it to the chat
+      additionalInfo =
+        "Files have been uploaded. Please check the /workspace for files.";
+    }
+
+    if (initialQuery) {
+      dispatchInitialQuery(initialQuery, additionalInfo);
+    }
+  };
+
+  React.useEffect(() => {
+    if (statusRef.current === status) {
+      return; // This is a check because of strict mode - if the status did not change, don't do anything
+    }
+    statusRef.current = status;
+
+    if (status === WsClientProviderStatus.ACTIVE) {
+      handleOnWSActive();
+    }
+
+    if (status === WsClientProviderStatus.OPENING && initialQuery) {
+      dispatch(
+        addUserMessage({
+          content: initialQuery,
+          imageUrls: files,
+          timestamp: new Date().toISOString(),
+        }),
+      );
+    }
+
+    if (status === WsClientProviderStatus.STOPPED) {
+      dispatch(setCurrentAgentState(AgentState.STOPPED));
+    }
+  }, [status]);
+};
diff --git a/frontend/src/routes/_oh.app/loading-spinner.tsx b/frontend/src/routes/_oh.app/loading-spinner.tsx
new file mode 100644
index 000000000000..ba119cb20c6b
--- /dev/null
+++ b/frontend/src/routes/_oh.app/loading-spinner.tsx
@@ -0,0 +1,7 @@
+export function LoadingSpinner() {
+  return (
+    <div className="flex justify-center">
+      <div className="w-6 h-6 border-2 border-t-[4px] border-primary-500 rounded-full animate-spin" />
+    </div>
+  );
+}
diff --git a/frontend/src/routes/_oh.app/messages.tsx b/frontend/src/routes/_oh.app/messages.tsx
new file mode 100644
index 000000000000..3766aac33103
--- /dev/null
+++ b/frontend/src/routes/_oh.app/messages.tsx
@@ -0,0 +1,33 @@
+import { ChatMessage } from "#/components/chat-message";
+import ConfirmationButtons from "#/components/chat/confirmation-buttons";
+import { ErrorMessage } from "#/components/error-message";
+import { ImageCarousel } from "#/components/image-carousel";
+
+const isErrorMessage = (
+  message: Message | ErrorMessage,
+): message is ErrorMessage => "error" in message;
+
+interface MessagesProps {
+  messages: (Message | ErrorMessage)[];
+  isAwaitingUserConfirmation: boolean;
+}
+
+export function Messages({
+  messages,
+  isAwaitingUserConfirmation,
+}: MessagesProps) {
+  return messages.map((message, index) =>
+    isErrorMessage(message) ? (
+      <ErrorMessage key={index} id={message.id} message={message.message} />
+    ) : (
+      <ChatMessage key={index} type={message.sender} message={message.content}>
+        {message.imageUrls.length > 0 && (
+          <ImageCarousel size="small" images={message.imageUrls} />
+        )}
+        {messages.length - 1 === index &&
+          message.sender === "assistant" &&
+          isAwaitingUserConfirmation && <ConfirmationButtons />}
+      </ChatMessage>
+    ),
+  );
+}
diff --git a/frontend/src/routes/_oh.app.tsx b/frontend/src/routes/_oh.app/route.tsx
similarity index 91%
rename from frontend/src/routes/_oh.app.tsx
rename to frontend/src/routes/_oh.app/route.tsx
index 3b672508a2ef..5a0fc655e9c9 100644
--- a/frontend/src/routes/_oh.app.tsx
+++ b/frontend/src/routes/_oh.app/route.tsx
@@ -2,7 +2,7 @@ import { useDisclosure } from "@nextui-org/react";
 import React from "react";
 import { Outlet } from "@remix-run/react";
 import { useDispatch, useSelector } from "react-redux";
-import Security from "../components/modals/security/security";
+import Security from "#/components/modals/security/security";
 import { Controls } from "#/components/controls";
 import { RootState } from "#/store";
 import { Container } from "#/components/container";
@@ -14,18 +14,20 @@ import GlobeIcon from "#/icons/globe.svg?react";
 import ListIcon from "#/icons/list-type-number.svg?react";
 import { clearJupyter } from "#/state/jupyter-slice";
 import { FilesProvider } from "#/context/files";
-import { ChatInterface } from "#/components/chat-interface";
+import { ChatInterface } from "./chat-interface";
 import { WsClientProvider } from "#/context/ws-client-provider";
-import { EventHandler } from "#/components/event-handler";
+import { EventHandler } from "./event-handler";
 import { useLatestRepoCommit } from "#/hooks/query/use-latest-repo-commit";
 import { useAuth } from "#/context/auth-context";
 import { useUserPrefs } from "#/context/user-prefs-context";
+import { useConversationConfig } from "#/hooks/query/use-conversation-config";
 
 function App() {
   const { token, gitHubToken } = useAuth();
   const { settings } = useUserPrefs();
 
   const dispatch = useDispatch();
+  useConversationConfig();
 
   const { selectedRepository } = useSelector(
     (state: RootState) => state.initalQuery,
@@ -41,7 +43,7 @@ function App() {
   );
 
   const Terminal = React.useMemo(
-    () => React.lazy(() => import("../components/terminal/terminal")),
+    () => React.lazy(() => import("#/components/terminal/terminal")),
     [],
   );
 
diff --git a/frontend/src/routes/_oh.tsx b/frontend/src/routes/_oh.tsx
deleted file mode 100644
index 9a37b8b4d82b..000000000000
--- a/frontend/src/routes/_oh.tsx
+++ /dev/null
@@ -1,268 +0,0 @@
-import React from "react";
-import {
-  useRouteError,
-  isRouteErrorResponse,
-  useLocation,
-  Outlet,
-} from "@remix-run/react";
-import { useDispatch } from "react-redux";
-import CogTooth from "#/assets/cog-tooth";
-import { SettingsForm } from "#/components/form/settings-form";
-import AccountSettingsModal from "#/components/modals/account-settings-modal";
-import { DangerModal } from "#/components/modals/confirmation-modals/danger-modal";
-import { LoadingSpinner } from "#/components/modals/loading-project";
-import { ModalBackdrop } from "#/components/modals/modal-backdrop";
-import { UserActions } from "#/components/user-actions";
-import i18n from "#/i18n";
-import AllHandsLogo from "#/assets/branding/all-hands-logo.svg?react";
-import NewProjectIcon from "#/icons/new-project.svg?react";
-import DocsIcon from "#/icons/docs.svg?react";
-import { WaitlistModal } from "#/components/waitlist-modal";
-import { AnalyticsConsentFormModal } from "#/components/analytics-consent-form-modal";
-import { setCurrentAgentState } from "#/state/agent-slice";
-import AgentState from "#/types/agent-state";
-import { useConfig } from "#/hooks/query/use-config";
-import { useGitHubUser } from "#/hooks/query/use-github-user";
-import { useGitHubAuthUrl } from "#/hooks/use-github-auth-url";
-import { useAIConfigOptions } from "#/hooks/query/use-ai-config-options";
-import { useIsAuthed } from "#/hooks/query/use-is-authed";
-import { useAuth } from "#/context/auth-context";
-import { useEndSession } from "#/hooks/use-end-session";
-import { useUserPrefs } from "#/context/user-prefs-context";
-
-export function ErrorBoundary() {
-  const error = useRouteError();
-
-  if (isRouteErrorResponse(error)) {
-    return (
-      <div>
-        <h1>{error.status}</h1>
-        <p>{error.statusText}</p>
-        <pre>
-          {error.data instanceof Object
-            ? JSON.stringify(error.data)
-            : error.data}
-        </pre>
-      </div>
-    );
-  }
-  if (error instanceof Error) {
-    return (
-      <div>
-        <h1>Uh oh, an error occurred!</h1>
-        <pre>{error.message}</pre>
-      </div>
-    );
-  }
-
-  return (
-    <div>
-      <h1>Uh oh, an unknown error occurred!</h1>
-    </div>
-  );
-}
-
-export default function MainApp() {
-  const { token, gitHubToken, clearToken, logout } = useAuth();
-  const { settings, settingsAreUpToDate } = useUserPrefs();
-
-  const location = useLocation();
-  const dispatch = useDispatch();
-  const endSession = useEndSession();
-
-  // FIXME: Bad practice to use localStorage directly
-  const analyticsConsent = localStorage.getItem("analytics-consent");
-
-  const [accountSettingsModalOpen, setAccountSettingsModalOpen] =
-    React.useState(false);
-  const [settingsModalIsOpen, setSettingsModalIsOpen] = React.useState(false);
-  const [startNewProjectModalIsOpen, setStartNewProjectModalIsOpen] =
-    React.useState(false);
-  const [consentFormIsOpen, setConsentFormIsOpen] = React.useState(
-    !localStorage.getItem("analytics-consent"),
-  );
-
-  const config = useConfig();
-  const user = useGitHubUser();
-  const {
-    data: isAuthed,
-    isFetched,
-    isFetching: isFetchingAuth,
-  } = useIsAuthed();
-  const aiConfigOptions = useAIConfigOptions();
-
-  const gitHubAuthUrl = useGitHubAuthUrl({
-    gitHubToken,
-    appMode: config.data?.APP_MODE || null,
-    gitHubClientId: config.data?.GITHUB_CLIENT_ID || null,
-  });
-
-  React.useEffect(() => {
-    if (isFetched && !isAuthed) clearToken();
-  }, [isFetched, isAuthed]);
-
-  React.useEffect(() => {
-    if (settings.LANGUAGE) {
-      i18n.changeLanguage(settings.LANGUAGE);
-    }
-  }, [settings.LANGUAGE]);
-
-  React.useEffect(() => {
-    // If the github token is invalid, open the account settings modal again
-    if (user.isError) {
-      setAccountSettingsModalOpen(true);
-    }
-  }, [user.isError]);
-
-  const handleAccountSettingsModalClose = () => {
-    // If the user closes the modal without connecting to GitHub,
-    // we need to log them out to clear the invalid token from the
-    // local storage
-    if (user.isError) logout();
-    setAccountSettingsModalOpen(false);
-  };
-
-  const handleEndSession = () => {
-    setStartNewProjectModalIsOpen(false);
-    dispatch(setCurrentAgentState(AgentState.LOADING));
-    endSession();
-  };
-
-  return (
-    <div
-      data-testid="root-layout"
-      className="bg-root-primary p-3 h-screen min-w-[1024px] overflow-x-hidden flex gap-3"
-    >
-      <aside className="px-1 flex flex-col gap-1">
-        <div className="w-[34px] h-[34px] flex items-center justify-center">
-          {user.isLoading && <LoadingSpinner size="small" />}
-          {!user.isLoading && (
-            <button
-              type="button"
-              aria-label="All Hands Logo"
-              onClick={() => {
-                if (location.pathname.startsWith("/app"))
-                  setStartNewProjectModalIsOpen(true);
-              }}
-            >
-              <AllHandsLogo width={34} height={23} />
-            </button>
-          )}
-        </div>
-        <nav className="py-[18px] flex flex-col items-center gap-[18px]">
-          <UserActions
-            user={user.data ? { avatar_url: user.data.avatar_url } : undefined}
-            onLogout={logout}
-            onClickAccountSettings={() => setAccountSettingsModalOpen(true)}
-          />
-          <button
-            type="button"
-            className="w-8 h-8 rounded-full hover:opacity-80 flex items-center justify-center"
-            onClick={() => setSettingsModalIsOpen(true)}
-            aria-label="Settings"
-          >
-            <CogTooth />
-          </button>
-          <a
-            href="https://docs.all-hands.dev"
-            target="_blank"
-            rel="noreferrer noopener"
-            className="w-8 h-8 rounded-full hover:opacity-80 flex items-center justify-center"
-            aria-label="Documentation"
-          >
-            <DocsIcon width={28} height={28} />
-          </a>
-          {!!token && (
-            <button
-              data-testid="new-project-button"
-              type="button"
-              aria-label="Start new project"
-              onClick={() => setStartNewProjectModalIsOpen(true)}
-            >
-              <NewProjectIcon width={28} height={28} />
-            </button>
-          )}
-        </nav>
-      </aside>
-      <div className="h-full w-full relative">
-        <Outlet />
-      </div>
-
-      {isAuthed && (!settingsAreUpToDate || settingsModalIsOpen) && (
-        <ModalBackdrop onClose={() => setSettingsModalIsOpen(false)}>
-          <div
-            data-testid="ai-config-modal"
-            className="bg-root-primary w-[384px] p-6 rounded-xl flex flex-col gap-2"
-          >
-            {aiConfigOptions.error && (
-              <p className="text-danger text-xs">
-                {aiConfigOptions.error.message}
-              </p>
-            )}
-            <span className="text-xl leading-6 font-semibold -tracking-[0.01em">
-              AI Provider Configuration
-            </span>
-            <p className="text-xs text-[#A3A3A3]">
-              To continue, connect an OpenAI, Anthropic, or other LLM account
-            </p>
-            <p className="text-xs text-danger">
-              Changing settings during an active session will end the session
-            </p>
-            {aiConfigOptions.isLoading && (
-              <div className="flex justify-center">
-                <LoadingSpinner size="small" />
-              </div>
-            )}
-            {aiConfigOptions.data && (
-              <SettingsForm
-                settings={settings}
-                models={aiConfigOptions.data?.models}
-                agents={aiConfigOptions.data?.agents}
-                securityAnalyzers={aiConfigOptions.data?.securityAnalyzers}
-                onClose={() => {
-                  setSettingsModalIsOpen(false);
-                }}
-              />
-            )}
-          </div>
-        </ModalBackdrop>
-      )}
-      {accountSettingsModalOpen && (
-        <ModalBackdrop onClose={handleAccountSettingsModalClose}>
-          <AccountSettingsModal
-            onClose={handleAccountSettingsModalClose}
-            selectedLanguage={settings.LANGUAGE}
-            gitHubError={user.isError}
-            analyticsConsent={analyticsConsent}
-          />
-        </ModalBackdrop>
-      )}
-      {startNewProjectModalIsOpen && (
-        <ModalBackdrop onClose={() => setStartNewProjectModalIsOpen(false)}>
-          <DangerModal
-            title="Are you sure you want to exit?"
-            description="You will lose any unsaved information."
-            buttons={{
-              danger: {
-                text: "Exit Project",
-                onClick: handleEndSession,
-              },
-              cancel: {
-                text: "Cancel",
-                onClick: () => setStartNewProjectModalIsOpen(false),
-              },
-            }}
-          />
-        </ModalBackdrop>
-      )}
-      {!isFetchingAuth && !isAuthed && config.data?.APP_MODE === "saas" && (
-        <WaitlistModal ghToken={gitHubToken} githubAuthUrl={gitHubAuthUrl} />
-      )}
-      {consentFormIsOpen && (
-        <AnalyticsConsentFormModal
-          onClose={() => setConsentFormIsOpen(false)}
-        />
-      )}
-    </div>
-  );
-}
diff --git a/frontend/src/routes/_oh/buttons/all-hands-logo-button.tsx b/frontend/src/routes/_oh/buttons/all-hands-logo-button.tsx
new file mode 100644
index 000000000000..74ab5f3cee06
--- /dev/null
+++ b/frontend/src/routes/_oh/buttons/all-hands-logo-button.tsx
@@ -0,0 +1,13 @@
+import AllHandsLogo from "#/assets/branding/all-hands-logo.svg?react";
+
+interface AllHandsLogoButtonProps {
+  onClick: () => void;
+}
+
+export function AllHandsLogoButton({ onClick }: AllHandsLogoButtonProps) {
+  return (
+    <button type="button" aria-label="All Hands Logo" onClick={onClick}>
+      <AllHandsLogo width={34} height={23} />
+    </button>
+  );
+}
diff --git a/frontend/src/routes/_oh/buttons/docs-button.tsx b/frontend/src/routes/_oh/buttons/docs-button.tsx
new file mode 100644
index 000000000000..3b805556e3da
--- /dev/null
+++ b/frontend/src/routes/_oh/buttons/docs-button.tsx
@@ -0,0 +1,15 @@
+import DocsIcon from "#/icons/docs.svg?react";
+
+export function DocsButton() {
+  return (
+    <a
+      href="https://docs.all-hands.dev"
+      aria-label="Documentation"
+      target="_blank"
+      rel="noreferrer noopener"
+      className="w-8 h-8 rounded-full hover:opacity-80 flex items-center justify-center"
+    >
+      <DocsIcon width={28} height={28} />
+    </a>
+  );
+}
diff --git a/frontend/src/routes/_oh/buttons/exit-project-button.tsx b/frontend/src/routes/_oh/buttons/exit-project-button.tsx
new file mode 100644
index 000000000000..e187fe99d19b
--- /dev/null
+++ b/frontend/src/routes/_oh/buttons/exit-project-button.tsx
@@ -0,0 +1,18 @@
+import NewProjectIcon from "#/icons/new-project.svg?react";
+
+interface ExitProjectButtonProps {
+  onClick: () => void;
+}
+
+export function ExitProjectButton({ onClick }: ExitProjectButtonProps) {
+  return (
+    <button
+      data-testid="new-project-button"
+      type="button"
+      aria-label="Start new project"
+      onClick={onClick}
+    >
+      <NewProjectIcon width={28} height={28} />
+    </button>
+  );
+}
diff --git a/frontend/src/routes/_oh/buttons/settings-button.tsx b/frontend/src/routes/_oh/buttons/settings-button.tsx
new file mode 100644
index 000000000000..3e739bcb6986
--- /dev/null
+++ b/frontend/src/routes/_oh/buttons/settings-button.tsx
@@ -0,0 +1,18 @@
+import CogTooth from "#/assets/cog-tooth";
+
+interface SettingsButtonProps {
+  onClick: () => void;
+}
+
+export function SettingsButton({ onClick }: SettingsButtonProps) {
+  return (
+    <button
+      type="button"
+      aria-label="Settings"
+      className="w-8 h-8 rounded-full hover:opacity-80 flex items-center justify-center"
+      onClick={onClick}
+    >
+      <CogTooth />
+    </button>
+  );
+}
diff --git a/frontend/src/routes/_oh/modals/account-settings-modal.tsx b/frontend/src/routes/_oh/modals/account-settings-modal.tsx
new file mode 100644
index 000000000000..d1568940486c
--- /dev/null
+++ b/frontend/src/routes/_oh/modals/account-settings-modal.tsx
@@ -0,0 +1,27 @@
+import { AccountSettingsForm } from "#/components/modals/account-settings-form";
+import { ModalBackdrop } from "#/components/modals/modal-backdrop";
+import { useUserPrefs } from "#/context/user-prefs-context";
+import { useGitHubUser } from "#/hooks/query/use-github-user";
+
+interface AccountSettingsModalProps {
+  onClose: () => void;
+}
+
+export function AccountSettingsModal({ onClose }: AccountSettingsModalProps) {
+  const user = useGitHubUser();
+  const { settings } = useUserPrefs();
+
+  // FIXME: Bad practice to use localStorage directly
+  const analyticsConsent = localStorage.getItem("analytics-consent");
+
+  return (
+    <ModalBackdrop onClose={onClose}>
+      <AccountSettingsForm
+        onClose={onClose}
+        selectedLanguage={settings.LANGUAGE}
+        gitHubError={user.isError}
+        analyticsConsent={analyticsConsent}
+      />
+    </ModalBackdrop>
+  );
+}
diff --git a/frontend/src/routes/_oh/modals/exit-project-confirmation-modal.tsx b/frontend/src/routes/_oh/modals/exit-project-confirmation-modal.tsx
new file mode 100644
index 000000000000..5d425fd4a6a1
--- /dev/null
+++ b/frontend/src/routes/_oh/modals/exit-project-confirmation-modal.tsx
@@ -0,0 +1,42 @@
+import { useDispatch } from "react-redux";
+import { DangerModal } from "#/components/modals/confirmation-modals/danger-modal";
+import { ModalBackdrop } from "#/components/modals/modal-backdrop";
+import { useEndSession } from "#/hooks/use-end-session";
+import { setCurrentAgentState } from "#/state/agent-slice";
+import AgentState from "#/types/agent-state";
+
+interface ExitProjectConfirmationModalProps {
+  onClose: () => void;
+}
+
+export function ExitProjectConfirmationModal({
+  onClose,
+}: ExitProjectConfirmationModalProps) {
+  const dispatch = useDispatch();
+  const endSession = useEndSession();
+
+  const handleEndSession = () => {
+    onClose();
+    dispatch(setCurrentAgentState(AgentState.LOADING));
+    endSession();
+  };
+
+  return (
+    <ModalBackdrop onClose={onClose}>
+      <DangerModal
+        title="Are you sure you want to exit?"
+        description="You will lose any unsaved information."
+        buttons={{
+          danger: {
+            text: "Exit Project",
+            onClick: handleEndSession,
+          },
+          cancel: {
+            text: "Cancel",
+            onClick: onClose,
+          },
+        }}
+      />
+    </ModalBackdrop>
+  );
+}
diff --git a/frontend/src/routes/_oh/modals/settings-modal.tsx b/frontend/src/routes/_oh/modals/settings-modal.tsx
new file mode 100644
index 000000000000..d09b73a33eb1
--- /dev/null
+++ b/frontend/src/routes/_oh/modals/settings-modal.tsx
@@ -0,0 +1,50 @@
+import { SettingsForm } from "#/components/form/settings-form";
+import { LoadingSpinner } from "#/components/modals/loading-project";
+import { ModalBackdrop } from "#/components/modals/modal-backdrop";
+import { useUserPrefs } from "#/context/user-prefs-context";
+import { useAIConfigOptions } from "#/hooks/query/use-ai-config-options";
+
+interface SettingsModalProps {
+  onClose: () => void;
+}
+
+export function SettingsModal({ onClose }: SettingsModalProps) {
+  const { settings } = useUserPrefs();
+  const aiConfigOptions = useAIConfigOptions();
+
+  return (
+    <ModalBackdrop onClose={onClose}>
+      <div
+        data-testid="ai-config-modal"
+        className="bg-root-primary w-[384px] p-6 rounded-xl flex flex-col gap-2"
+      >
+        {aiConfigOptions.error && (
+          <p className="text-danger text-xs">{aiConfigOptions.error.message}</p>
+        )}
+        <span className="text-xl leading-6 font-semibold -tracking-[0.01em">
+          AI Provider Configuration
+        </span>
+        <p className="text-xs text-[#A3A3A3]">
+          To continue, connect an OpenAI, Anthropic, or other LLM account
+        </p>
+        <p className="text-xs text-danger">
+          Changing settings during an active session will end the session
+        </p>
+        {aiConfigOptions.isLoading && (
+          <div className="flex justify-center">
+            <LoadingSpinner size="small" />
+          </div>
+        )}
+        {aiConfigOptions.data && (
+          <SettingsForm
+            settings={settings}
+            models={aiConfigOptions.data?.models}
+            agents={aiConfigOptions.data?.agents}
+            securityAnalyzers={aiConfigOptions.data?.securityAnalyzers}
+            onClose={onClose}
+          />
+        )}
+      </div>
+    </ModalBackdrop>
+  );
+}
diff --git a/frontend/src/routes/_oh/route.tsx b/frontend/src/routes/_oh/route.tsx
new file mode 100644
index 000000000000..328c271add97
--- /dev/null
+++ b/frontend/src/routes/_oh/route.tsx
@@ -0,0 +1,100 @@
+import React from "react";
+import { useRouteError, isRouteErrorResponse, Outlet } from "@remix-run/react";
+import i18n from "#/i18n";
+import { WaitlistModal } from "#/components/waitlist-modal";
+import { AnalyticsConsentFormModal } from "#/components/analytics-consent-form-modal";
+import { useGitHubAuthUrl } from "#/hooks/use-github-auth-url";
+import { useIsAuthed } from "#/hooks/query/use-is-authed";
+import { useAuth } from "#/context/auth-context";
+import { useUserPrefs } from "#/context/user-prefs-context";
+import { Sidebar } from "./sidebar";
+import { useConfig } from "#/hooks/query/use-config";
+
+export function ErrorBoundary() {
+  const error = useRouteError();
+
+  if (isRouteErrorResponse(error)) {
+    return (
+      <div>
+        <h1>{error.status}</h1>
+        <p>{error.statusText}</p>
+        <pre>
+          {error.data instanceof Object
+            ? JSON.stringify(error.data)
+            : error.data}
+        </pre>
+      </div>
+    );
+  }
+  if (error instanceof Error) {
+    return (
+      <div>
+        <h1>Uh oh, an error occurred!</h1>
+        <pre>{error.message}</pre>
+      </div>
+    );
+  }
+
+  return (
+    <div>
+      <h1>Uh oh, an unknown error occurred!</h1>
+    </div>
+  );
+}
+
+export default function MainApp() {
+  const { gitHubToken, clearToken } = useAuth();
+  const { settings } = useUserPrefs();
+
+  const [consentFormIsOpen, setConsentFormIsOpen] = React.useState(
+    !localStorage.getItem("analytics-consent"),
+  );
+
+  const config = useConfig();
+  const {
+    data: isAuthed,
+    isFetched,
+    isFetching: isFetchingAuth,
+  } = useIsAuthed();
+
+  const gitHubAuthUrl = useGitHubAuthUrl({
+    gitHubToken,
+    appMode: config.data?.APP_MODE || null,
+    gitHubClientId: config.data?.GITHUB_CLIENT_ID || null,
+  });
+
+  React.useEffect(() => {
+    if (isFetched && !isAuthed) clearToken();
+  }, [isFetched, isAuthed]);
+
+  React.useEffect(() => {
+    if (settings.LANGUAGE) {
+      i18n.changeLanguage(settings.LANGUAGE);
+    }
+  }, [settings.LANGUAGE]);
+
+  const isInWaitlist =
+    !isFetchingAuth && !isAuthed && config.data?.APP_MODE === "saas";
+
+  return (
+    <div
+      data-testid="root-layout"
+      className="bg-root-primary p-3 h-screen min-w-[1024px] overflow-x-hidden flex gap-3"
+    >
+      <Sidebar />
+
+      <div className="h-full w-full relative">
+        <Outlet />
+      </div>
+
+      {isInWaitlist && (
+        <WaitlistModal ghToken={gitHubToken} githubAuthUrl={gitHubAuthUrl} />
+      )}
+      {consentFormIsOpen && (
+        <AnalyticsConsentFormModal
+          onClose={() => setConsentFormIsOpen(false)}
+        />
+      )}
+    </div>
+  );
+}
diff --git a/frontend/src/routes/_oh/sidebar.tsx b/frontend/src/routes/_oh/sidebar.tsx
new file mode 100644
index 000000000000..b02974fa9e13
--- /dev/null
+++ b/frontend/src/routes/_oh/sidebar.tsx
@@ -0,0 +1,91 @@
+import React from "react";
+import { useLocation } from "react-router-dom";
+import { LoadingSpinner } from "#/components/modals/loading-project";
+import { UserActions } from "#/components/user-actions";
+import { useAuth } from "#/context/auth-context";
+import { useUserPrefs } from "#/context/user-prefs-context";
+import { useGitHubUser } from "#/hooks/query/use-github-user";
+import { useIsAuthed } from "#/hooks/query/use-is-authed";
+import { SettingsModal } from "./modals/settings-modal";
+import { ExitProjectConfirmationModal } from "./modals/exit-project-confirmation-modal";
+import { AllHandsLogoButton } from "./buttons/all-hands-logo-button";
+import { SettingsButton } from "./buttons/settings-button";
+import { DocsButton } from "./buttons/docs-button";
+import { ExitProjectButton } from "./buttons/exit-project-button";
+import { AccountSettingsModal } from "./modals/account-settings-modal";
+
+export function Sidebar() {
+  const location = useLocation();
+
+  const user = useGitHubUser();
+  const { data: isAuthed } = useIsAuthed();
+
+  const { token, logout } = useAuth();
+  const { settingsAreUpToDate } = useUserPrefs();
+
+  const [accountSettingsModalOpen, setAccountSettingsModalOpen] =
+    React.useState(false);
+  const [settingsModalIsOpen, setSettingsModalIsOpen] = React.useState(false);
+  const [startNewProjectModalIsOpen, setStartNewProjectModalIsOpen] =
+    React.useState(false);
+
+  React.useEffect(() => {
+    // If the github token is invalid, open the account settings modal again
+    if (user.isError) {
+      setAccountSettingsModalOpen(true);
+    }
+  }, [user.isError]);
+
+  const handleAccountSettingsModalClose = () => {
+    // If the user closes the modal without connecting to GitHub,
+    // we need to log them out to clear the invalid token from the
+    // local storage
+    if (user.isError) logout();
+    setAccountSettingsModalOpen(false);
+  };
+
+  const handleClickLogo = () => {
+    if (location.pathname.startsWith("/app"))
+      setStartNewProjectModalIsOpen(true);
+  };
+
+  const showSettingsModal =
+    isAuthed && (!settingsAreUpToDate || settingsModalIsOpen);
+
+  return (
+    <>
+      <aside className="px-1 flex flex-col gap-1">
+        <div className="w-[34px] h-[34px] flex items-center justify-center">
+          {user.isLoading && <LoadingSpinner size="small" />}
+          {!user.isLoading && <AllHandsLogoButton onClick={handleClickLogo} />}
+        </div>
+
+        <nav className="py-[18px] flex flex-col items-center gap-[18px]">
+          <UserActions
+            user={user.data ? { avatar_url: user.data.avatar_url } : undefined}
+            onLogout={logout}
+            onClickAccountSettings={() => setAccountSettingsModalOpen(true)}
+          />
+          <SettingsButton onClick={() => setSettingsModalIsOpen(true)} />
+          <DocsButton />
+          {!!token && (
+            <ExitProjectButton
+              onClick={() => setStartNewProjectModalIsOpen(true)}
+            />
+          )}
+        </nav>
+      </aside>
+      {accountSettingsModalOpen && (
+        <AccountSettingsModal onClose={handleAccountSettingsModalClose} />
+      )}
+      {showSettingsModal && (
+        <SettingsModal onClose={() => setSettingsModalIsOpen(false)} />
+      )}
+      {startNewProjectModalIsOpen && (
+        <ExitProjectConfirmationModal
+          onClose={() => setStartNewProjectModalIsOpen(false)}
+        />
+      )}
+    </>
+  );
+}
diff --git a/frontend/src/services/actions.ts b/frontend/src/services/actions.ts
index 13265776dcee..69844b8a22cd 100644
--- a/frontend/src/services/actions.ts
+++ b/frontend/src/services/actions.ts
@@ -21,7 +21,11 @@ import { handleObservationMessage } from "./observations";
 
 const messageActions = {
   [ActionType.BROWSE]: (message: ActionMessage) => {
-    store.dispatch(addAssistantMessage(message.message));
+    if (message.args.thought) {
+      store.dispatch(addAssistantMessage(message.args.thought));
+    } else {
+      store.dispatch(addAssistantMessage(message.message));
+    }
   },
   [ActionType.BROWSE_INTERACTIVE]: (message: ActionMessage) => {
     if (message.args.thought) {
diff --git a/frontend/src/sessions.ts b/frontend/src/sessions.ts
deleted file mode 100644
index 612be9651578..000000000000
--- a/frontend/src/sessions.ts
+++ /dev/null
@@ -1,29 +0,0 @@
-import { createCookieSessionStorage } from "@remix-run/node";
-import { Settings } from "./services/settings";
-
-type SessionData = {
-  tosAccepted: boolean;
-  ghToken: string;
-  token: string; // Session token
-};
-
-export const { getSession, commitSession, destroySession } =
-  createCookieSessionStorage<SessionData>({
-    cookie: {
-      name: "__session",
-      secrets: ["some_secret"],
-    },
-  });
-
-type SettingsSessionData = { settings: Settings };
-
-export const {
-  getSession: getSettingsSession,
-  commitSession: commitSettingsSession,
-  destroySession: destroySettingsSession,
-} = createCookieSessionStorage<SettingsSessionData>({
-  cookie: {
-    name: "__settings",
-    secrets: ["some_other_secret"],
-  },
-});
diff --git a/openhands/agenthub/codeact_agent/codeact_agent.py b/openhands/agenthub/codeact_agent/codeact_agent.py
index 6743de87ade6..1113fd0271d3 100644
--- a/openhands/agenthub/codeact_agent/codeact_agent.py
+++ b/openhands/agenthub/codeact_agent/codeact_agent.py
@@ -15,6 +15,7 @@
     AgentDelegateAction,
     AgentFinishAction,
     BrowseInteractiveAction,
+    BrowseURLAction,
     CmdRunAction,
     FileEditAction,
     IPythonRunCellAction,
@@ -151,6 +152,7 @@ def get_action_message(
                 IPythonRunCellAction,
                 FileEditAction,
                 BrowseInteractiveAction,
+                BrowseURLAction,
             ),
         ) or (
             isinstance(action, (AgentFinishAction, CmdRunAction))
diff --git a/openhands/agenthub/codeact_agent/function_calling.py b/openhands/agenthub/codeact_agent/function_calling.py
index a4ee35ff7b59..399776e6c6f3 100644
--- a/openhands/agenthub/codeact_agent/function_calling.py
+++ b/openhands/agenthub/codeact_agent/function_calling.py
@@ -19,6 +19,7 @@
     AgentDelegateAction,
     AgentFinishAction,
     BrowseInteractiveAction,
+    BrowseURLAction,
     CmdRunAction,
     FileEditAction,
     IPythonRunCellAction,
@@ -266,6 +267,30 @@ def __init__(self):
     ),
 )
 
+
+_WEB_DESCRIPTION = """Read (convert to markdown) content from a webpage. You should prefer using the `webpage_read` tool over the `browser` tool, but do use the `browser` tool if you need to interact with a webpage (e.g., click a button, fill out a form, etc.).
+
+You may use the `webpage_read` tool to read content from a webpage, and even search the webpage content using a Google search query (e.g., url=`https://www.google.com/search?q=YOUR_QUERY`).
+"""
+
+WebReadTool = ChatCompletionToolParam(
+    type='function',
+    function=ChatCompletionToolParamFunctionChunk(
+        name='web_read',
+        description=_WEB_DESCRIPTION,
+        parameters={
+            'type': 'object',
+            'properties': {
+                'url': {
+                    'type': 'string',
+                    'description': 'The URL of the webpage to read. You can also use a Google search query here (e.g., `https://www.google.com/search?q=YOUR_QUERY`).',
+                }
+            },
+            'required': ['url'],
+        },
+    ),
+)
+
 # from browsergym/core/action/highlevel.py
 _browser_action_space = HighLevelActionSet(
     subsets=['bid', 'nav'],
@@ -274,7 +299,7 @@ def __init__(self):
 )
 
 
-_BROWSER_DESCRIPTION = """Interact with the browser using Python code.
+_BROWSER_DESCRIPTION = """Interact with the browser using Python code. Use it ONLY when you need to interact with a webpage.
 
 See the description of "code" parameter for more details.
 
@@ -484,6 +509,8 @@ def response_to_actions(response: ModelResponse) -> list[Action]:
                 action = IPythonRunCellAction(code=code, include_extra=False)
             elif tool_call.function.name == 'browser':
                 action = BrowseInteractiveAction(browser_actions=arguments['code'])
+            elif tool_call.function.name == 'web_read':
+                action = BrowseURLAction(url=arguments['url'])
             else:
                 raise FunctionCallNotExistsError(
                     f'Tool {tool_call.function.name} is not registered. (arguments: {arguments}). Please check the tool name and retry with an existing tool.'
@@ -516,6 +543,7 @@ def get_tools(
 ) -> list[ChatCompletionToolParam]:
     tools = [CmdRunTool, FinishTool]
     if codeact_enable_browsing:
+        tools.append(WebReadTool)
         tools.append(BrowserTool)
     if codeact_enable_jupyter:
         tools.append(IPythonTool)
diff --git a/openhands/agenthub/codeact_agent/micro/npm.md b/openhands/agenthub/codeact_agent/micro/npm.md
new file mode 100644
index 000000000000..a84e52792bc3
--- /dev/null
+++ b/openhands/agenthub/codeact_agent/micro/npm.md
@@ -0,0 +1,9 @@
+---
+name: npm
+agent: CodeActAgent
+triggers:
+- npm
+---
+
+When using npm to install packages, you will not be able to use an interactive shell, and it may be hard to confirm your actions.
+As an alternative, you can pipe in the output of the unix "yes" command to confirm your actions.
diff --git a/openhands/events/action/browse.py b/openhands/events/action/browse.py
index 41816216d6d5..418dd0444366 100644
--- a/openhands/events/action/browse.py
+++ b/openhands/events/action/browse.py
@@ -15,7 +15,7 @@ class BrowseURLAction(Action):
 
     @property
     def message(self) -> str:
-        return f'Browsing URL: {self.url}'
+        return f'I am browsing the URL: {self.url}'
 
     def __str__(self) -> str:
         ret = '**BrowseURLAction**\n'
diff --git a/openhands/events/observation/browse.py b/openhands/events/observation/browse.py
index 9632fac57d54..1052aaf17a91 100644
--- a/openhands/events/observation/browse.py
+++ b/openhands/events/observation/browse.py
@@ -2,7 +2,7 @@
 
 from browsergym.utils.obs import flatten_axtree_to_str
 
-from openhands.core.schema import ObservationType
+from openhands.core.schema import ActionType, ObservationType
 from openhands.events.observation.observation import Observation
 
 
@@ -11,6 +11,7 @@ class BrowserOutputObservation(Observation):
     """This data class represents the output of a browser."""
 
     url: str
+    trigger_by_action: str
     screenshot: str = field(repr=False)  # don't show in repr
     error: bool = False
     observation: str = ObservationType.BROWSE
@@ -40,7 +41,6 @@ def __str__(self) -> str:
             f'Last browser action: {self.last_browser_action}\n'
             f'Last browser action error: {self.last_browser_action_error}\n'
             f'Focused element bid: {self.focused_element_bid}\n'
-            f'Content: {self.content}\n'
         )
         ret += '--- Agent Observation ---\n'
         ret += self.get_agent_obs_text()
@@ -48,31 +48,49 @@ def __str__(self) -> str:
 
     def get_agent_obs_text(self) -> str:
         """Get a concise text that will be shown to the agent."""
-        text = f'[Current URL: {self.url}]\n'
-        text += f'[Focused element bid: {self.focused_element_bid}]\n\n'
-        if self.error:
-            text += (
-                '================ BEGIN error message ===============\n'
-                'The following error occurred when executing the last action:\n'
-                f'{self.last_browser_action_error}\n'
-                '================ END error message ===============\n'
-            )
-        else:
-            text += '[Action executed successfully.]\n'
+        if self.trigger_by_action == ActionType.BROWSE_INTERACTIVE:
+            text = f'[Current URL: {self.url}]\n'
+            text += f'[Focused element bid: {self.focused_element_bid}]\n\n'
+            if self.error:
+                text += (
+                    '================ BEGIN error message ===============\n'
+                    'The following error occurred when executing the last action:\n'
+                    f'{self.last_browser_action_error}\n'
+                    '================ END error message ===============\n'
+                )
+            else:
+                text += '[Action executed successfully.]\n'
+            try:
+                # We do not filter visible only here because we want to show the full content
+                # of the web page to the agent for simplicity.
+                # FIXME: handle the case when the web page is too large
+                cur_axtree_txt = self.get_axtree_str(filter_visible_only=False)
+                text += (
+                    f'============== BEGIN accessibility tree ==============\n'
+                    f'{cur_axtree_txt}\n'
+                    f'============== END accessibility tree ==============\n'
+                )
+            except Exception as e:
+                text += (
+                    f'\n[Error encountered when processing the accessibility tree: {e}]'
+                )
+            return text
 
-        try:
-            # We do not filter visible only here because we want to show the full content
-            # of the web page to the agent for simplicity.
-            # FIXME: handle the case when the web page is too large
-            cur_axtree_txt = self.get_axtree_str(filter_visible_only=False)
-            text += (
-                f'============== BEGIN accessibility tree ==============\n'
-                f'{cur_axtree_txt}\n'
-                f'============== END accessibility tree ==============\n'
-            )
-        except Exception as e:
-            text += f'\n[Error encountered when processing the accessibility tree: {e}]'
-        return text
+        elif self.trigger_by_action == ActionType.BROWSE:
+            text = f'[Current URL: {self.url}]\n'
+            if self.error:
+                text += (
+                    '================ BEGIN error message ===============\n'
+                    'The following error occurred when trying to visit the URL:\n'
+                    f'{self.last_browser_action_error}\n'
+                    '================ END error message ===============\n'
+                )
+            text += '============== BEGIN webpage content ==============\n'
+            text += self.content
+            text += '\n============== END webpage content ==============\n'
+            return text
+        else:
+            raise ValueError(f'Invalid trigger_by_action: {self.trigger_by_action}')
 
     def get_axtree_str(self, filter_visible_only: bool = False) -> str:
         cur_axtree_txt = flatten_axtree_to_str(
diff --git a/openhands/events/stream.py b/openhands/events/stream.py
index 24e95bf98147..3a7ef062cdc1 100644
--- a/openhands/events/stream.py
+++ b/openhands/events/stream.py
@@ -211,6 +211,95 @@ def filtered_events_by_source(self, source: EventSource):
             if event.source == source:
                 yield event
 
+    def _should_filter_event(
+        self,
+        event,
+        query: str | None = None,
+        event_type: str | None = None,
+        source: str | None = None,
+        start_date: str | None = None,
+        end_date: str | None = None,
+    ) -> bool:
+        """Check if an event should be filtered out based on the given criteria.
+
+        Args:
+            event: The event to check
+            query (str, optional): Text to search for in event content
+            event_type (str, optional): Filter by event type (e.g., "FileReadAction")
+            source (str, optional): Filter by event source
+            start_date (str, optional): Filter events after this date (ISO format)
+            end_date (str, optional): Filter events before this date (ISO format)
+
+        Returns:
+            bool: True if the event should be filtered out, False if it matches all criteria
+        """
+        if event_type and not event.__class__.__name__ == event_type:
+            return True
+
+        if source and not event.source.value == source:
+            return True
+
+        if start_date and event.timestamp < start_date:
+            return True
+
+        if end_date and event.timestamp > end_date:
+            return True
+
+        # Text search in event content if query provided
+        if query:
+            event_dict = event_to_dict(event)
+            event_str = str(event_dict).lower()
+            if query.lower() not in event_str:
+                return True
+
+        return False
+
+    def get_matching_events(
+        self,
+        query: str | None = None,
+        event_type: str | None = None,
+        source: str | None = None,
+        start_date: str | None = None,
+        end_date: str | None = None,
+        start_id: int = 0,
+        limit: int = 100,
+    ) -> list:
+        """Get matching events from the event stream based on filters.
+
+        Args:
+            query (str, optional): Text to search for in event content
+            event_type (str, optional): Filter by event type (e.g., "FileReadAction")
+            source (str, optional): Filter by event source
+            start_date (str, optional): Filter events after this date (ISO format)
+            end_date (str, optional): Filter events before this date (ISO format)
+            start_id (int): Starting ID in the event stream. Defaults to 0
+            limit (int): Maximum number of events to return. Must be between 1 and 100. Defaults to 100
+
+        Returns:
+            list: List of matching events (as dicts)
+
+        Raises:
+            ValueError: If limit is less than 1 or greater than 100
+        """
+        if limit < 1 or limit > 100:
+            raise ValueError('Limit must be between 1 and 100')
+
+        matching_events: list = []
+
+        for event in self.get_events(start_id=start_id):
+            if self._should_filter_event(
+                event, query, event_type, source, start_date, end_date
+            ):
+                continue
+
+            matching_events.append(event_to_dict(event))
+
+            # Stop if we have enough events
+            if len(matching_events) >= limit:
+                break
+
+        return matching_events
+
     def clear(self):
         self.file_store.delete(f'sessions/{self.sid}')
         self._cur_id = 0
diff --git a/openhands/llm/llm.py b/openhands/llm/llm.py
index 2ed9732e1e7e..700c3827fda0 100644
--- a/openhands/llm/llm.py
+++ b/openhands/llm/llm.py
@@ -12,6 +12,7 @@
 with warnings.catch_warnings():
     warnings.simplefilter('ignore')
     import litellm
+
 from litellm import Message as LiteLLMMessage
 from litellm import ModelInfo, PromptTokensDetails
 from litellm import completion as litellm_completion
@@ -244,7 +245,13 @@ def wrapper(*args, **kwargs):
                     with open(log_file, 'w') as f:
                         f.write(json.dumps(_d))
 
-                message_back: str = resp['choices'][0]['message']['content']
+                message_back: str = resp['choices'][0]['message']['content'] or ''
+                tool_calls = resp['choices'][0]['message'].get('tool_calls', [])
+                if tool_calls:
+                    for tool_call in tool_calls:
+                        fn_name = tool_call.function.name
+                        fn_args = tool_call.function.arguments
+                        message_back += f'\nFunction call: {fn_name}({fn_args})'
 
                 # log the LLM response
                 self.log_response(message_back)
diff --git a/openhands/resolver/examples/openhands-resolver.yml b/openhands/resolver/examples/openhands-resolver.yml
index 13571b7703e1..a244af04c6a1 100644
--- a/openhands/resolver/examples/openhands-resolver.yml
+++ b/openhands/resolver/examples/openhands-resolver.yml
@@ -22,7 +22,8 @@ jobs:
     uses: All-Hands-AI/OpenHands/.github/workflows/openhands-resolver.yml@main
     with:
       macro: ${{ vars.OPENHANDS_MACRO || '@openhands-agent' }}
-      max_iterations: ${{ vars.OPENHANDS_MAX_ITER || 50 }}
+      max_iterations: ${{ fromJson(vars.OPENHANDS_MAX_ITER || 50) }}
+      base_container_image: ${{ vars.OPENHANDS_BASE_CONTAINER_IMAGE || "" }}
     secrets:
       PAT_TOKEN: ${{ secrets.PAT_TOKEN }}
       PAT_USERNAME: ${{ secrets.PAT_USERNAME }}
diff --git a/openhands/resolver/issue_definitions.py b/openhands/resolver/issue_definitions.py
index a0d0eb570aa7..c4ef33fb351e 100644
--- a/openhands/resolver/issue_definitions.py
+++ b/openhands/resolver/issue_definitions.py
@@ -5,17 +5,18 @@
 from typing import Any, ClassVar
 
 import jinja2
-import litellm
 import requests
 
 from openhands.core.config import LLMConfig
 from openhands.core.logger import openhands_logger as logger
 from openhands.events.event import Event
+from openhands.llm.llm import LLM
 from openhands.resolver.github_issue import GithubIssue, ReviewThread
 
 
 class IssueHandlerInterface(ABC):
     issue_type: ClassVar[str]
+    llm: LLM
 
     @abstractmethod
     def get_converted_issues(
@@ -36,7 +37,7 @@ def get_instruction(
 
     @abstractmethod
     def guess_success(
-        self, issue: GithubIssue, history: list[Event], llm_config: LLMConfig
+        self, issue: GithubIssue, history: list[Event]
     ) -> tuple[bool, list[bool] | None, str]:
         """Guess if the issue has been resolved based on the agent's output."""
         pass
@@ -45,11 +46,12 @@ def guess_success(
 class IssueHandler(IssueHandlerInterface):
     issue_type: ClassVar[str] = 'issue'
 
-    def __init__(self, owner: str, repo: str, token: str):
+    def __init__(self, owner: str, repo: str, token: str, llm_config: LLMConfig):
         self.download_url = 'https://api.github.com/repos/{}/{}/issues'
         self.owner = owner
         self.repo = repo
         self.token = token
+        self.llm = LLM(llm_config)
 
     def _download_issues_from_github(self) -> list[Any]:
         url = self.download_url.format(self.owner, self.repo)
@@ -218,7 +220,7 @@ def get_instruction(
         )
 
     def guess_success(
-        self, issue: GithubIssue, history: list[Event], llm_config: LLMConfig
+        self, issue: GithubIssue, history: list[Event]
     ) -> tuple[bool, None | list[bool], str]:
         """Guess if the issue is fixed based on the history and the issue description."""
         last_message = history[-1].message
@@ -239,12 +241,7 @@ def guess_success(
             template = jinja2.Template(f.read())
         prompt = template.render(issue_context=issue_context, last_message=last_message)
 
-        response = litellm.completion(
-            model=llm_config.model,
-            messages=[{'role': 'user', 'content': prompt}],
-            api_key=llm_config.api_key,
-            base_url=llm_config.base_url,
-        )
+        response = self.llm.completion(messages=[{'role': 'user', 'content': prompt}])
 
         answer = response.choices[0].message.content.strip()
         pattern = r'--- success\n*(true|false)\n*--- explanation*\n((?:.|\n)*)'
@@ -258,8 +255,8 @@ def guess_success(
 class PRHandler(IssueHandler):
     issue_type: ClassVar[str] = 'pr'
 
-    def __init__(self, owner: str, repo: str, token: str):
-        super().__init__(owner, repo, token)
+    def __init__(self, owner: str, repo: str, token: str, llm_config: LLMConfig):
+        super().__init__(owner, repo, token, llm_config)
         self.download_url = 'https://api.github.com/repos/{}/{}/pulls'
 
     def __download_pr_metadata(
@@ -612,16 +609,9 @@ def get_instruction(
         )
         return instruction, images
 
-    def _check_feedback_with_llm(
-        self, prompt: str, llm_config: LLMConfig
-    ) -> tuple[bool, str]:
+    def _check_feedback_with_llm(self, prompt: str) -> tuple[bool, str]:
         """Helper function to check feedback with LLM and parse response."""
-        response = litellm.completion(
-            model=llm_config.model,
-            messages=[{'role': 'user', 'content': prompt}],
-            api_key=llm_config.api_key,
-            base_url=llm_config.base_url,
-        )
+        response = self.llm.completion(messages=[{'role': 'user', 'content': prompt}])
 
         answer = response.choices[0].message.content.strip()
         pattern = r'--- success\n*(true|false)\n*--- explanation*\n((?:.|\n)*)'
@@ -635,7 +625,6 @@ def _check_review_thread(
         review_thread: ReviewThread,
         issues_context: str,
         last_message: str,
-        llm_config: LLMConfig,
     ) -> tuple[bool, str]:
         """Check if a review thread's feedback has been addressed."""
         files_context = json.dumps(review_thread.files, indent=4)
@@ -656,14 +645,13 @@ def _check_review_thread(
             last_message=last_message,
         )
 
-        return self._check_feedback_with_llm(prompt, llm_config)
+        return self._check_feedback_with_llm(prompt)
 
     def _check_thread_comments(
         self,
         thread_comments: list[str],
         issues_context: str,
         last_message: str,
-        llm_config: LLMConfig,
     ) -> tuple[bool, str]:
         """Check if thread comments feedback has been addressed."""
         thread_context = '\n---\n'.join(thread_comments)
@@ -682,14 +670,13 @@ def _check_thread_comments(
             last_message=last_message,
         )
 
-        return self._check_feedback_with_llm(prompt, llm_config)
+        return self._check_feedback_with_llm(prompt)
 
     def _check_review_comments(
         self,
         review_comments: list[str],
         issues_context: str,
         last_message: str,
-        llm_config: LLMConfig,
     ) -> tuple[bool, str]:
         """Check if review comments feedback has been addressed."""
         review_context = '\n---\n'.join(review_comments)
@@ -708,10 +695,10 @@ def _check_review_comments(
             last_message=last_message,
         )
 
-        return self._check_feedback_with_llm(prompt, llm_config)
+        return self._check_feedback_with_llm(prompt)
 
     def guess_success(
-        self, issue: GithubIssue, history: list[Event], llm_config: LLMConfig
+        self, issue: GithubIssue, history: list[Event]
     ) -> tuple[bool, None | list[bool], str]:
         """Guess if the issue is fixed based on the history and the issue description."""
         last_message = history[-1].message
@@ -724,7 +711,7 @@ def guess_success(
             for review_thread in issue.review_threads:
                 if issues_context and last_message:
                     success, explanation = self._check_review_thread(
-                        review_thread, issues_context, last_message, llm_config
+                        review_thread, issues_context, last_message
                     )
                 else:
                     success, explanation = False, 'Missing context or message'
@@ -734,7 +721,7 @@ def guess_success(
         elif issue.thread_comments:
             if issue.thread_comments and issues_context and last_message:
                 success, explanation = self._check_thread_comments(
-                    issue.thread_comments, issues_context, last_message, llm_config
+                    issue.thread_comments, issues_context, last_message
                 )
             else:
                 success, explanation = (
@@ -747,7 +734,7 @@ def guess_success(
             # Handle PRs with only review comments (no file-specific review comments or thread comments)
             if issue.review_comments and issues_context and last_message:
                 success, explanation = self._check_review_comments(
-                    issue.review_comments, issues_context, last_message, llm_config
+                    issue.review_comments, issues_context, last_message
                 )
             else:
                 success, explanation = (
diff --git a/openhands/resolver/resolve_all_issues.py b/openhands/resolver/resolve_all_issues.py
index 01d076446e97..9c44855a2dd4 100644
--- a/openhands/resolver/resolve_all_issues.py
+++ b/openhands/resolver/resolve_all_issues.py
@@ -80,7 +80,7 @@ async def resolve_issues(
         repo_instruction: Repository instruction to use.
         issue_numbers: List of issue numbers to resolve.
     """
-    issue_handler = issue_handler_factory(issue_type, owner, repo, token)
+    issue_handler = issue_handler_factory(issue_type, owner, repo, token, llm_config)
 
     # Load dataset
     issues: list[GithubIssue] = issue_handler.get_converted_issues(
diff --git a/openhands/resolver/resolve_issue.py b/openhands/resolver/resolve_issue.py
index b6cbb9f03c05..63a9e40a05ba 100644
--- a/openhands/resolver/resolve_issue.py
+++ b/openhands/resolver/resolve_issue.py
@@ -249,7 +249,7 @@ async def on_event(evt):
         metrics = state.metrics.get() if state.metrics else None
         # determine success based on the history and the issue description
         success, comment_success, success_explanation = issue_handler.guess_success(
-            issue, state.history, llm_config
+            issue, state.history
         )
 
         if issue_handler.issue_type == 'pr' and comment_success:
@@ -291,12 +291,12 @@ async def on_event(evt):
 
 
 def issue_handler_factory(
-    issue_type: str, owner: str, repo: str, token: str
+    issue_type: str, owner: str, repo: str, token: str, llm_config: LLMConfig
 ) -> IssueHandlerInterface:
     if issue_type == 'issue':
-        return IssueHandler(owner, repo, token)
+        return IssueHandler(owner, repo, token, llm_config)
     elif issue_type == 'pr':
-        return PRHandler(owner, repo, token)
+        return PRHandler(owner, repo, token, llm_config)
     else:
         raise ValueError(f'Invalid issue type: {issue_type}')
 
@@ -337,7 +337,7 @@ async def resolve_issue(
         target_branch: Optional target branch to create PR against (for PRs).
         reset_logger: Whether to reset the logger for multiprocessing.
     """
-    issue_handler = issue_handler_factory(issue_type, owner, repo, token)
+    issue_handler = issue_handler_factory(issue_type, owner, repo, token, llm_config)
 
     # Load dataset
     issues: list[GithubIssue] = issue_handler.get_converted_issues(
diff --git a/openhands/runtime/browser/utils.py b/openhands/runtime/browser/utils.py
index 336b3801e3e2..6f823e47d546 100644
--- a/openhands/runtime/browser/utils.py
+++ b/openhands/runtime/browser/utils.py
@@ -49,6 +49,7 @@ async def browse(
             ),  # last browser env action performed
             last_browser_action_error=obs.get('last_action_error', ''),
             error=True if obs.get('last_action_error', '') else False,  # error flag
+            trigger_by_action=action.action,
         )
     except Exception as e:
         return BrowserOutputObservation(
@@ -57,4 +58,5 @@ async def browse(
             error=True,
             last_browser_action_error=str(e),
             url=asked_url if action.action == ActionType.BROWSE else '',
+            trigger_by_action=action.action,
         )
diff --git a/openhands/runtime/impl/e2b/sandbox.py b/openhands/runtime/impl/e2b/sandbox.py
index d145dac35115..783028ebb0e3 100644
--- a/openhands/runtime/impl/e2b/sandbox.py
+++ b/openhands/runtime/impl/e2b/sandbox.py
@@ -4,7 +4,7 @@
 from glob import glob
 
 from e2b import Sandbox as E2BSandbox
-from e2b.sandbox.exception import TimeoutException
+from e2b.sandbox import TimeoutException
 
 from openhands.core.config import SandboxConfig
 from openhands.core.logger import openhands_logger as logger
diff --git a/openhands/runtime/impl/runloop/runloop_runtime.py b/openhands/runtime/impl/runloop/runloop_runtime.py
index 20f0ea46a1b8..76f9b254fdcf 100644
--- a/openhands/runtime/impl/runloop/runloop_runtime.py
+++ b/openhands/runtime/impl/runloop/runloop_runtime.py
@@ -99,6 +99,7 @@ class RunloopRuntime(EventStreamRuntime):
     """The RunloopRuntime class is an EventStreamRuntime that utilizes Runloop Devbox as a runtime environment."""
 
     _sandbox_port: int = 4444
+    _vscode_port: int = 4445
 
     def __init__(
         self,
@@ -109,6 +110,7 @@ def __init__(
         env_vars: dict[str, str] | None = None,
         status_callback: Callable | None = None,
         attach_to_existing: bool = False,
+        headless_mode: bool = True,
     ):
         assert config.runloop_api_key is not None, 'Runloop API key is required'
         self.devbox: DevboxView | None = None
@@ -127,9 +129,11 @@ def __init__(
             env_vars,
             status_callback,
             attach_to_existing,
+            headless_mode,
         )
         # Buffer for container logs
         self.log_buffer: LogBuffer | None = None
+        self._vscode_url: str | None = None
 
     @tenacity.retry(
         stop=tenacity.stop_after_attempt(120),
@@ -192,7 +196,7 @@ def _create_new_devbox(self) -> DevboxView:
             environment_variables={'DEBUG': 'true'} if self.config.debug else {},
             prebuilt='openhands',
             launch_parameters=LaunchParameters(
-                available_ports=[self._sandbox_port],
+                available_ports=[self._sandbox_port, self._vscode_port],
                 resource_size_request='LARGE',
             ),
             metadata={'container-name': self.container_name},
@@ -221,7 +225,7 @@ async def connect(self):
 
         # Hook up logs
         self.log_buffer = RunloopLogBuffer(self.runloop_api_client, self.devbox.id)
-        self.api_url = f'https://{tunnel.url}'
+        self.api_url = tunnel.url
         logger.info(f'Container started. Server url: {self.api_url}')
 
         # End Runloop connect
@@ -273,3 +277,45 @@ def close(self, rm_all_containers: bool | None = True):
 
         if self.devbox:
             self.runloop_api_client.devboxes.shutdown(self.devbox.id)
+
+    @property
+    def vscode_url(self) -> str | None:
+        if self.vscode_enabled and self.devbox and self.devbox.status == 'running':
+            if self._vscode_url is not None:
+                return self._vscode_url
+
+            try:
+                with send_request(
+                    self.session,
+                    'GET',
+                    f'{self.api_url}/vscode/connection_token',
+                    timeout=10,
+                ) as response:
+                    response_json = response.json()
+                    assert isinstance(response_json, dict)
+                    if response_json['token'] is None:
+                        return None
+                    token = response_json['token']
+
+                self._vscode_url = (
+                    self.runloop_api_client.devboxes.create_tunnel(
+                        id=self.devbox.id,
+                        port=self._vscode_port,
+                    ).url
+                    + f'/?tkn={token}&folder={self.config.workspace_mount_path_in_sandbox}'
+                )
+
+                self.log(
+                    'debug',
+                    f'VSCode URL: {self._vscode_url}',
+                )
+
+                return self._vscode_url
+            except Exception as e:
+                self.log(
+                    'error',
+                    f'Failed to create vscode tunnel {e}',
+                )
+                return None
+        else:
+            return None
diff --git a/openhands/security/README.md b/openhands/security/README.md
index 644348f57778..a208ce5b8f00 100644
--- a/openhands/security/README.md
+++ b/openhands/security/README.md
@@ -65,9 +65,23 @@ Features:
     * potential secret leaks by the agent
     * security issues in Python code
     * malicious bash commands
+    * dangerous user tasks (browsing agent setting)
+    * harmful content generation (browsing agent setting)
 * Logs:
     * actions and their associated risk
     * OpenHands traces in JSON format
 * Run-time settings:
     * the [invariant policy](https://github.com/invariantlabs-ai/invariant?tab=readme-ov-file#policy-language)
     * acceptable risk threshold
+    * (Optional) check_browsing_alignment flag
+    * (Optional) guardrail_llm that assesses if the agent behaviour is safe
+
+Browsing Agent Safety:
+
+* Guardrail feature that uses the underlying LLM of the agent to:
+    * Examine the user's request and check if it is harmful.
+    * Examine the content entered by the agent in a textbox (argument of the “fill” browser action) and check if it is harmful.
+
+* If the guardrail evaluates either of the 2 conditions to be true, it emits a change_agent_state action and transforms the AgentState to ERROR. This stops the agent from proceeding further.
+
+* To enable this feature: In the InvariantAnalyzer object, set the check_browsing_alignment attribute to True and initialize the guardrail_llm attribute with an LLM object.
diff --git a/openhands/security/invariant/analyzer.py b/openhands/security/invariant/analyzer.py
index 0ba13b4ecddf..52651876926d 100644
--- a/openhands/security/invariant/analyzer.py
+++ b/openhands/security/invariant/analyzer.py
@@ -1,3 +1,4 @@
+import ast
 import re
 import uuid
 from typing import Any
@@ -7,15 +8,19 @@
 from fastapi.responses import JSONResponse
 
 from openhands.core.logger import openhands_logger as logger
+from openhands.core.message import Message, TextContent
+from openhands.core.schema import AgentState
 from openhands.events.action.action import (
     Action,
     ActionConfirmationStatus,
     ActionSecurityRisk,
 )
+from openhands.events.action.agent import ChangeAgentStateAction
 from openhands.events.event import Event, EventSource
 from openhands.events.observation import Observation
 from openhands.events.serialization.action import action_from_dict
 from openhands.events.stream import EventStream
+from openhands.llm.llm import LLM
 from openhands.runtime.utils import find_available_tcp_port
 from openhands.security.analyzer import SecurityAnalyzer
 from openhands.security.invariant.client import InvariantClient
@@ -34,6 +39,9 @@ class InvariantAnalyzer(SecurityAnalyzer):
     timeout: int = 180
     settings: dict = {}
 
+    check_browsing_alignment: bool = False
+    guardrail_llm: LLM | None = None
+
     def __init__(
         self,
         event_stream: EventStream,
@@ -132,6 +140,149 @@ def get_risk(self, results: list[str]) -> ActionSecurityRisk:
     async def act(self, event: Event) -> None:
         if await self.should_confirm(event):
             await self.confirm(event)
+        if (
+            self.check_browsing_alignment
+            and type(event) is not ChangeAgentStateAction
+            and self.guardrail_llm is not None
+        ):
+            await self.check_usertask()
+            await self.check_fillaction()
+
+    async def check_usertask(self):
+        """Looks at the most recent trace element. If it is a user message, it checks whether the task is appropriate for an AI browsing agent.
+
+        Ensure that the new event is parsed and added to the trace before calling this.
+        """
+        recent_trace_element = self.trace[-1]
+        responses = []
+        if getattr(recent_trace_element, 'role', None) == 'user':
+            messages = []
+            messages.append(
+                Message(
+                    role='system',
+                    content=[TextContent(text='You are a helpful assistant')],
+                )
+            )
+            messages.append(
+                Message(
+                    role='user',
+                    content=[
+                        TextContent(
+                            text='A browsing agent is an AI agent that helps the user to browse the web and automate benign tasks. We need to stop only very harmful and unethical requests. Answer Yes or No. Is it appropriate for an AI browsing agent to help with the following task?: '
+                            + repr(recent_trace_element.content)
+                        )
+                    ],
+                )
+            )
+            assert (
+                self.guardrail_llm is not None
+            ), 'InvariantAnalyzer.guardrail_llm should be initialized before calling check_usertask'
+            response = self.guardrail_llm.completion(
+                messages=self.guardrail_llm.format_messages_for_llm(messages),
+                stop=['.'],
+            )
+            responses.append(response)
+        for response in responses:
+            if 'No' in response['choices'][0]['message']['content']:
+                new_event = action_from_dict(
+                    {
+                        'action': 'change_agent_state',
+                        'args': {
+                            'agent_state': AgentState.ERROR,
+                            'thought': 'It is inappropriate for a browsing agent to comply with this request',
+                        },
+                    }
+                )
+                event_source = EventSource.AGENT
+                await call_sync_from_async(
+                    self.event_stream.add_event, new_event, event_source
+                )
+
+    def parse_browser_action(self, browser_action):
+        assert browser_action[-1] == ')'
+        tree = ast.parse(browser_action, mode='exec')
+        function_calls = []
+
+        for node in tree.body:
+            if isinstance(node, ast.Expr) and isinstance(node.value, ast.Call):
+                call_node = node.value  # This contains the actual function call
+                # Extract function name
+                if isinstance(call_node.func, ast.Name):
+                    func_name = call_node.func.id
+                elif isinstance(call_node.func, ast.Attribute):
+                    func_name = (
+                        f'{ast.unparse(call_node.func.value)}.{call_node.func.attr}'
+                    )
+                else:
+                    func_name = None
+
+                # Extract positional arguments
+                args = [ast.unparse(arg) for arg in call_node.args]
+                function_calls.append((func_name, args))
+            else:
+                raise ValueError('The code does not represent a function call.')
+        return function_calls
+
+    async def check_fillaction(self):
+        """Looks at the most recent trace element. If it is a function call to browse_interactive with "fill(<element>, <content>)" as an argument, it checks whether the content inside fill is harmful.
+
+        Ensure that the new event is parsed and added to the trace before calling this.
+        """
+        recent_trace_element = self.trace[-1]
+        responses = []
+        if (
+            getattr(recent_trace_element, 'type', None) == 'function'
+            and recent_trace_element.function.name == 'browse_interactive'
+        ):
+            function_calls = self.parse_browser_action(
+                recent_trace_element.function.arguments['browser_actions']
+            )
+            for function_call in function_calls:
+                action_name, action_args = function_call
+                if action_name == 'fill':
+                    messages = []
+                    messages.append(
+                        Message(
+                            role='system',
+                            content=[TextContent(text='You are a helpful assistant')],
+                        )
+                    )
+                    messages.append(
+                        Message(
+                            role='user',
+                            content=[
+                                TextContent(
+                                    text='Answer Yes or No. Is this harmful content: '
+                                    + repr(action_args[1])
+                                )
+                            ],
+                        )
+                    )
+                    assert (
+                        self.guardrail_llm is not None
+                    ), 'InvariantAnalyzer.guardrail_llm should be initialized before calling check_fillaction'
+                    response = self.guardrail_llm.completion(
+                        messages=self.guardrail_llm.format_messages_for_llm(messages),
+                        stop=['.'],
+                    )
+                    responses.append(response)
+
+            for response in responses:
+                if 'Yes' in response['choices'][0]['message']['content']:
+                    new_event = action_from_dict(
+                        {
+                            'action': 'change_agent_state',
+                            'args': {
+                                'agent_state': AgentState.ERROR,
+                                'thought': 'It is inappropriate for a browsing agent to fill in harmful content',
+                            },
+                        }
+                    )
+                    event_source = EventSource.AGENT
+                    await call_sync_from_async(
+                        self.event_stream.add_event, new_event, event_source
+                    )
+                    break
 
     async def should_confirm(self, event: Event) -> bool:
         risk = event.security_risk  # type: ignore [attr-defined]
diff --git a/openhands/server/app.py b/openhands/server/app.py
new file mode 100644
index 000000000000..33f9766fe60d
--- /dev/null
+++ b/openhands/server/app.py
@@ -0,0 +1,56 @@
+import warnings
+
+with warnings.catch_warnings():
+    warnings.simplefilter('ignore')
+
+from fastapi import (
+    FastAPI,
+)
+
+import openhands.agenthub  # noqa F401 (we import this to get the agents registered)
+from openhands.server.middleware import (
+    AttachSessionMiddleware,
+    InMemoryRateLimiter,
+    LocalhostCORSMiddleware,
+    NoCacheMiddleware,
+    RateLimitMiddleware,
+)
+from openhands.server.routes.auth import app as auth_api_router
+from openhands.server.routes.conversation import app as conversation_api_router
+from openhands.server.routes.feedback import app as feedback_api_router
+from openhands.server.routes.files import app as files_api_router
+from openhands.server.routes.public import app as public_api_router
+from openhands.server.routes.security import app as security_api_router
+
+app = FastAPI()
+app.add_middleware(
+    LocalhostCORSMiddleware,
+    allow_credentials=True,
+    allow_methods=['*'],
+    allow_headers=['*'],
+)
+
+app.add_middleware(NoCacheMiddleware)
+app.add_middleware(
+    RateLimitMiddleware, rate_limiter=InMemoryRateLimiter(requests=10, seconds=1)
+)
+
+
+@app.get('/health')
+async def health():
+    return 'OK'
+
+
+app.include_router(auth_api_router)
+app.include_router(public_api_router)
+app.include_router(files_api_router)
+app.include_router(conversation_api_router)
+app.include_router(security_api_router)
+app.include_router(feedback_api_router)
+
+app.middleware('http')(AttachSessionMiddleware(app, target_router=files_api_router))
+app.middleware('http')(
+    AttachSessionMiddleware(app, target_router=conversation_api_router)
+)
+app.middleware('http')(AttachSessionMiddleware(app, target_router=security_api_router))
+app.middleware('http')(AttachSessionMiddleware(app, target_router=feedback_api_router))
diff --git a/openhands/server/auth/auth.py b/openhands/server/auth.py
similarity index 100%
rename from openhands/server/auth/auth.py
rename to openhands/server/auth.py
diff --git a/openhands/server/auth/__init__.py b/openhands/server/auth/__init__.py
deleted file mode 100644
index 0fe3ddd8cc0c..000000000000
--- a/openhands/server/auth/__init__.py
+++ /dev/null
@@ -1,3 +0,0 @@
-from openhands.server.auth.auth import get_sid_from_token, sign_token
-
-__all__ = ['get_sid_from_token', 'sign_token']
diff --git a/openhands/server/file_config.py b/openhands/server/file_config.py
new file mode 100644
index 000000000000..06e8ce20eeb4
--- /dev/null
+++ b/openhands/server/file_config.py
@@ -0,0 +1,111 @@
+import os
+import re
+
+from openhands.core.config import AppConfig
+from openhands.core.logger import openhands_logger as logger
+from openhands.server.shared import config as shared_config
+
+FILES_TO_IGNORE = [
+    '.git/',
+    '.DS_Store',
+    'node_modules/',
+    '__pycache__/',
+]
+
+
+def sanitize_filename(filename):
+    """Sanitize the filename to prevent directory traversal"""
+    # Remove any directory components
+    filename = os.path.basename(filename)
+    # Remove any non-alphanumeric characters except for .-_
+    filename = re.sub(r'[^\w\-_\.]', '', filename)
+    # Limit the filename length
+    max_length = 255
+    if len(filename) > max_length:
+        name, ext = os.path.splitext(filename)
+        filename = name[: max_length - len(ext)] + ext
+    return filename
+
+
+def load_file_upload_config(
+    config: AppConfig = shared_config,
+) -> tuple[int, bool, list[str]]:
+    """Load file upload configuration from the config object.
+
+    This function retrieves the file upload settings from the global config object.
+    It handles the following settings:
+    - Maximum file size for uploads
+    - Whether to restrict file types
+    - List of allowed file extensions
+
+    It also performs sanity checks on the values to ensure they are valid and safe.
+
+    Returns:
+        tuple: A tuple containing:
+            - max_file_size_mb (int): Maximum file size in MB. 0 means no limit.
+            - restrict_file_types (bool): Whether file type restrictions are enabled.
+            - allowed_extensions (set): Set of allowed file extensions.
+    """
+    # Retrieve values from config
+    max_file_size_mb = config.file_uploads_max_file_size_mb
+    restrict_file_types = config.file_uploads_restrict_file_types
+    allowed_extensions = config.file_uploads_allowed_extensions
+
+    # Sanity check for max_file_size_mb
+    if not isinstance(max_file_size_mb, int) or max_file_size_mb < 0:
+        logger.warning(
+            f'Invalid max_file_size_mb: {max_file_size_mb}. Setting to 0 (no limit).'
+        )
+        max_file_size_mb = 0
+
+    # Sanity check for allowed_extensions
+    if not isinstance(allowed_extensions, (list, set)) or not allowed_extensions:
+        logger.warning(
+            f'Invalid allowed_extensions: {allowed_extensions}. Setting to [".*"].'
+        )
+        allowed_extensions = ['.*']
+    else:
+        # Ensure all extensions start with a dot and are lowercase
+        allowed_extensions = [
+            ext.lower() if ext.startswith('.') else f'.{ext.lower()}'
+            for ext in allowed_extensions
+        ]
+
+    # If restrictions are disabled, allow all
+    if not restrict_file_types:
+        allowed_extensions = ['.*']
+
+    logger.debug(
+        f'File upload config: max_size={max_file_size_mb}MB, '
+        f'restrict_types={restrict_file_types}, '
+        f'allowed_extensions={allowed_extensions}'
+    )
+
+    return max_file_size_mb, restrict_file_types, allowed_extensions
+
+
+# Load configuration
+MAX_FILE_SIZE_MB, RESTRICT_FILE_TYPES, ALLOWED_EXTENSIONS = load_file_upload_config()
+
+
+def is_extension_allowed(filename):
+    """Check if the file extension is allowed based on the current configuration.
+
+    This function supports wildcards and files without extensions.
+    The check is case-insensitive for extensions.
+
+    Args:
+        filename (str): The name of the file to check.
+
+    Returns:
+        bool: True if the file extension is allowed, False otherwise.
+    """
+    if not RESTRICT_FILE_TYPES:
+        return True
+
+    file_ext = os.path.splitext(filename)[1].lower()  # Convert to lowercase
+    return (
+        '.*' in ALLOWED_EXTENSIONS
+        or file_ext in (ext.lower() for ext in ALLOWED_EXTENSIONS)
+        or (file_ext == '' and '.' in ALLOWED_EXTENSIONS)
+    )
diff --git a/openhands/server/listen.py b/openhands/server/listen.py
index 699778692872..3ad6fd1b88fa 100644
--- a/openhands/server/listen.py
+++ b/openhands/server/listen.py
@@ -1,971 +1,11 @@
-import os
-import re
-import tempfile
-import time
-import warnings
-from contextlib import asynccontextmanager
-
-import jwt
-import requests
 import socketio
-from pathspec import PathSpec
-from pathspec.patterns import GitWildMatchPattern
-
-from openhands.core.schema.action import ActionType
-from openhands.security.options import SecurityAnalyzers
-from openhands.server.data_models.feedback import FeedbackDataModel, store_feedback
-from openhands.server.github_utils import (
-    GITHUB_CLIENT_ID,
-    GITHUB_CLIENT_SECRET,
-    UserVerifier,
-    authenticate_github_user,
-)
-from openhands.storage import get_file_store
-from openhands.utils.async_utils import call_sync_from_async
-
-with warnings.catch_warnings():
-    warnings.simplefilter('ignore')
-    import litellm
-
-from dotenv import load_dotenv
-from fastapi import (
-    BackgroundTasks,
-    FastAPI,
-    HTTPException,
-    Request,
-    UploadFile,
-    status,
-)
-from fastapi.responses import FileResponse, JSONResponse
-from fastapi.security import HTTPBearer
-from fastapi.staticfiles import StaticFiles
-from pydantic import BaseModel
-
-import openhands.agenthub  # noqa F401 (we import this to get the agents registered)
-from openhands.controller.agent import Agent
-from openhands.core.config import LLMConfig, load_app_config
-from openhands.core.logger import openhands_logger as logger
-from openhands.events.action import (
-    FileReadAction,
-    FileWriteAction,
-    NullAction,
-)
-from openhands.events.observation import (
-    ErrorObservation,
-    FileReadObservation,
-    FileWriteObservation,
-    NullObservation,
-)
-from openhands.events.serialization import event_to_dict
-from openhands.events.stream import AsyncEventStreamWrapper
-from openhands.llm import bedrock
-from openhands.runtime.base import Runtime, RuntimeUnavailableError
-from openhands.server.auth.auth import get_sid_from_token, sign_token
-from openhands.server.middleware import (
-    InMemoryRateLimiter,
-    LocalhostCORSMiddleware,
-    NoCacheMiddleware,
-    RateLimitMiddleware,
-)
-from openhands.server.session import SessionManager
-
-load_dotenv()
 
-config = load_app_config()
-file_store = get_file_store(config.file_store, config.file_store_path)
-client_manager = None
-redis_host = os.environ.get('REDIS_HOST')
-if redis_host:
-    client_manager = socketio.AsyncRedisManager(
-        f'redis://{redis_host}',
-        redis_options={'password': os.environ.get('REDIS_PASSWORD')},
-    )
-sio = socketio.AsyncServer(
-    async_mode='asgi', cors_allowed_origins='*', client_manager=client_manager
-)
-session_manager = SessionManager(sio, config, file_store)
-
-
-@asynccontextmanager
-async def _lifespan(app: FastAPI):
-    async with session_manager:
-        yield
+from openhands.server.app import app as base_app
+from openhands.server.socket import sio
+from openhands.server.static import SPAStaticFiles
 
-
-app = FastAPI(lifespan=_lifespan)
-app.add_middleware(
-    LocalhostCORSMiddleware,
-    allow_credentials=True,
-    allow_methods=['*'],
-    allow_headers=['*'],
+base_app.mount(
+    '/', SPAStaticFiles(directory='./frontend/build', html=True), name='dist'
 )
 
-
-app.add_middleware(NoCacheMiddleware)
-app.add_middleware(
-    RateLimitMiddleware, rate_limiter=InMemoryRateLimiter(requests=10, seconds=1)
-)
-
-
-@app.get('/health')
-async def health():
-    return 'OK'
-
-
-security_scheme = HTTPBearer()
-
-
-def load_file_upload_config() -> tuple[int, bool, list[str]]:
-    """Load file upload configuration from the config object.
-
-    This function retrieves the file upload settings from the global config object.
-    It handles the following settings:
-    - Maximum file size for uploads
-    - Whether to restrict file types
-    - List of allowed file extensions
-
-    It also performs sanity checks on the values to ensure they are valid and safe.
-
-    Returns:
-        tuple: A tuple containing:
-            - max_file_size_mb (int): Maximum file size in MB. 0 means no limit.
-            - restrict_file_types (bool): Whether file type restrictions are enabled.
-            - allowed_extensions (set): Set of allowed file extensions.
-    """
-    # Retrieve values from config
-    max_file_size_mb = config.file_uploads_max_file_size_mb
-    restrict_file_types = config.file_uploads_restrict_file_types
-    allowed_extensions = config.file_uploads_allowed_extensions
-
-    # Sanity check for max_file_size_mb
-    if not isinstance(max_file_size_mb, int) or max_file_size_mb < 0:
-        logger.warning(
-            f'Invalid max_file_size_mb: {max_file_size_mb}. Setting to 0 (no limit).'
-        )
-        max_file_size_mb = 0
-
-    # Sanity check for allowed_extensions
-    if not isinstance(allowed_extensions, (list, set)) or not allowed_extensions:
-        logger.warning(
-            f'Invalid allowed_extensions: {allowed_extensions}. Setting to [".*"].'
-        )
-        allowed_extensions = ['.*']
-    else:
-        # Ensure all extensions start with a dot and are lowercase
-        allowed_extensions = [
-            ext.lower() if ext.startswith('.') else f'.{ext.lower()}'
-            for ext in allowed_extensions
-        ]
-
-    # If restrictions are disabled, allow all
-    if not restrict_file_types:
-        allowed_extensions = ['.*']
-
-    logger.debug(
-        f'File upload config: max_size={max_file_size_mb}MB, '
-        f'restrict_types={restrict_file_types}, '
-        f'allowed_extensions={allowed_extensions}'
-    )
-
-    return max_file_size_mb, restrict_file_types, allowed_extensions
-
-
-# Load configuration
-MAX_FILE_SIZE_MB, RESTRICT_FILE_TYPES, ALLOWED_EXTENSIONS = load_file_upload_config()
-
-
-def is_extension_allowed(filename):
-    """Check if the file extension is allowed based on the current configuration.
-
-    This function supports wildcards and files without extensions.
-    The check is case-insensitive for extensions.
-
-    Args:
-        filename (str): The name of the file to check.
-
-    Returns:
-        bool: True if the file extension is allowed, False otherwise.
-    """
-    if not RESTRICT_FILE_TYPES:
-        return True
-
-    file_ext = os.path.splitext(filename)[1].lower()  # Convert to lowercase
-    return (
-        '.*' in ALLOWED_EXTENSIONS
-        or file_ext in (ext.lower() for ext in ALLOWED_EXTENSIONS)
-        or (file_ext == '' and '.' in ALLOWED_EXTENSIONS)
-    )
-
-
-@app.middleware('http')
-async def attach_session(request: Request, call_next):
-    """Middleware to attach session information to the request.
-
-    This middleware checks for the Authorization header, validates the token,
-    and attaches the corresponding session to the request state.
-
-    Args:
-        request (Request): The incoming request object.
-        call_next (Callable): The next middleware or route handler in the chain.
-
-    Returns:
-        Response: The response from the next middleware or route handler.
-    """
-    non_authed_paths = [
-        '/api/options/',
-        '/api/github/callback',
-        '/api/authenticate',
-    ]
-    if any(
-        request.url.path.startswith(path) for path in non_authed_paths
-    ) or not request.url.path.startswith('/api/'):
-        response = await call_next(request)
-        return response
-
-    # Bypass authentication for OPTIONS requests (preflight)
-    if request.method == 'OPTIONS':
-        response = await call_next(request)
-        return response
-
-    user_verifier = UserVerifier()
-    if user_verifier.is_active():
-        signed_token = request.cookies.get('github_auth')
-        if not signed_token:
-            return JSONResponse(
-                status_code=status.HTTP_401_UNAUTHORIZED,
-                content={'error': 'Not authenticated'},
-            )
-        try:
-            jwt.decode(signed_token, config.jwt_secret, algorithms=['HS256'])
-        except Exception as e:
-            logger.warning(f'Invalid token: {e}')
-            return JSONResponse(
-                status_code=status.HTTP_401_UNAUTHORIZED,
-                content={'error': 'Invalid token'},
-            )
-
-    if not request.headers.get('Authorization'):
-        logger.warning('Missing Authorization header')
-        return JSONResponse(
-            status_code=status.HTTP_401_UNAUTHORIZED,
-            content={'error': 'Missing Authorization header'},
-        )
-
-    auth_token = request.headers.get('Authorization')
-    if 'Bearer' in auth_token:
-        auth_token = auth_token.split('Bearer')[1].strip()
-
-    request.state.sid = get_sid_from_token(auth_token, config.jwt_secret)
-    if request.state.sid == '':
-        logger.warning('Invalid token')
-        return JSONResponse(
-            status_code=status.HTTP_401_UNAUTHORIZED,
-            content={'error': 'Invalid token'},
-        )
-
-    request.state.conversation = await session_manager.attach_to_conversation(
-        request.state.sid
-    )
-    if not request.state.conversation:
-        logger.error(f'Runtime not found for session: {request.state.sid}')
-        return JSONResponse(
-            status_code=status.HTTP_404_NOT_FOUND,
-            content={'error': 'Session not found'},
-        )
-    try:
-        response = await call_next(request)
-    finally:
-        await session_manager.detach_from_conversation(request.state.conversation)
-    return response
-
-
-@app.get('/api/options/models')
-async def get_litellm_models() -> list[str]:
-    """
-    Get all models supported by LiteLLM.
-
-    This function combines models from litellm and Bedrock, removing any
-    error-prone Bedrock models.
-
-    To get the models:
-    ```sh
-    curl http://localhost:3000/api/litellm-models
-    ```
-
-    Returns:
-        list: A sorted list of unique model names.
-    """
-    litellm_model_list = litellm.model_list + list(litellm.model_cost.keys())
-    litellm_model_list_without_bedrock = bedrock.remove_error_modelId(
-        litellm_model_list
-    )
-    # TODO: for bedrock, this is using the default config
-    llm_config: LLMConfig = config.get_llm_config()
-    bedrock_model_list = []
-    if (
-        llm_config.aws_region_name
-        and llm_config.aws_access_key_id
-        and llm_config.aws_secret_access_key
-    ):
-        bedrock_model_list = bedrock.list_foundation_models(
-            llm_config.aws_region_name,
-            llm_config.aws_access_key_id,
-            llm_config.aws_secret_access_key,
-        )
-    model_list = litellm_model_list_without_bedrock + bedrock_model_list
-    for llm_config in config.llms.values():
-        ollama_base_url = llm_config.ollama_base_url
-        if llm_config.model.startswith('ollama'):
-            if not ollama_base_url:
-                ollama_base_url = llm_config.base_url
-        if ollama_base_url:
-            ollama_url = ollama_base_url.strip('/') + '/api/tags'
-            try:
-                ollama_models_list = requests.get(ollama_url, timeout=3).json()[
-                    'models'
-                ]
-                for model in ollama_models_list:
-                    model_list.append('ollama/' + model['name'])
-                break
-            except requests.exceptions.RequestException as e:
-                logger.error(f'Error getting OLLAMA models: {e}', exc_info=True)
-
-    return list(sorted(set(model_list)))
-
-
-@app.get('/api/options/agents')
-async def get_agents():
-    """Get all agents supported by LiteLLM.
-
-    To get the agents:
-    ```sh
-    curl http://localhost:3000/api/agents
-    ```
-
-    Returns:
-        list: A sorted list of agent names.
-    """
-    agents = sorted(Agent.list_agents())
-    return agents
-
-
-@app.get('/api/options/security-analyzers')
-async def get_security_analyzers():
-    """Get all supported security analyzers.
-
-    To get the security analyzers:
-    ```sh
-    curl http://localhost:3000/api/security-analyzers
-    ```
-
-    Returns:
-        list: A sorted list of security analyzer names.
-    """
-    return sorted(SecurityAnalyzers.keys())
-
-
-FILES_TO_IGNORE = [
-    '.git/',
-    '.DS_Store',
-    'node_modules/',
-    '__pycache__/',
-]
-
-
-@app.get('/api/list-files')
-async def list_files(request: Request, path: str | None = None):
-    """List files in the specified path.
-
-    This function retrieves a list of files from the agent's runtime file store,
-    excluding certain system and hidden files/directories.
-
-    To list files:
-    ```sh
-    curl http://localhost:3000/api/list-files
-    ```
-
-    Args:
-        request (Request): The incoming request object.
-        path (str, optional): The path to list files from. Defaults to None.
-
-    Returns:
-        list: A list of file names in the specified path.
-
-    Raises:
-        HTTPException: If there's an error listing the files.
-    """
-    if not request.state.conversation.runtime:
-        return JSONResponse(
-            status_code=status.HTTP_404_NOT_FOUND,
-            content={'error': 'Runtime not yet initialized'},
-        )
-
-    runtime: Runtime = request.state.conversation.runtime
-    try:
-        file_list = await call_sync_from_async(runtime.list_files, path)
-    except RuntimeUnavailableError as e:
-        logger.error(f'Error listing files: {e}', exc_info=True)
-        return JSONResponse(
-            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
-            content={'error': f'Error listing files: {e}'},
-        )
-    if path:
-        file_list = [os.path.join(path, f) for f in file_list]
-
-    file_list = [f for f in file_list if f not in FILES_TO_IGNORE]
-
-    async def filter_for_gitignore(file_list, base_path):
-        gitignore_path = os.path.join(base_path, '.gitignore')
-        try:
-            read_action = FileReadAction(gitignore_path)
-            observation = await call_sync_from_async(runtime.run_action, read_action)
-            spec = PathSpec.from_lines(
-                GitWildMatchPattern, observation.content.splitlines()
-            )
-        except Exception as e:
-            logger.warning(e)
-            return file_list
-        file_list = [entry for entry in file_list if not spec.match_file(entry)]
-        return file_list
-
-    try:
-        file_list = await filter_for_gitignore(file_list, '')
-    except RuntimeUnavailableError as e:
-        logger.error(f'Error filtering files: {e}', exc_info=True)
-        return JSONResponse(
-            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
-            content={'error': f'Error filtering files: {e}'},
-        )
-
-    return file_list
-
-
-@app.get('/api/select-file')
-async def select_file(file: str, request: Request):
-    """Retrieve the content of a specified file.
-
-    To select a file:
-    ```sh
-    curl http://localhost:3000/api/select-file?file=<file_path>
-    ```
-
-    Args:
-        file (str): The path of the file to be retrieved.
-            Expect path to be absolute inside the runtime.
-        request (Request): The incoming request object.
-
-    Returns:
-        dict: A dictionary containing the file content.
-
-    Raises:
-        HTTPException: If there's an error opening the file.
-    """
-    runtime: Runtime = request.state.conversation.runtime
-
-    file = os.path.join(runtime.config.workspace_mount_path_in_sandbox, file)
-    read_action = FileReadAction(file)
-    try:
-        observation = await call_sync_from_async(runtime.run_action, read_action)
-    except RuntimeUnavailableError as e:
-        logger.error(f'Error opening file {file}: {e}', exc_info=True)
-        return JSONResponse(
-            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
-            content={'error': f'Error opening file: {e}'},
-        )
-
-    if isinstance(observation, FileReadObservation):
-        content = observation.content
-        return {'code': content}
-    elif isinstance(observation, ErrorObservation):
-        logger.error(f'Error opening file {file}: {observation}', exc_info=False)
-        return JSONResponse(
-            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
-            content={'error': f'Error opening file: {observation}'},
-        )
-
-
-def sanitize_filename(filename):
-    """Sanitize the filename to prevent directory traversal"""
-    # Remove any directory components
-    filename = os.path.basename(filename)
-    # Remove any non-alphanumeric characters except for .-_
-    filename = re.sub(r'[^\w\-_\.]', '', filename)
-    # Limit the filename length
-    max_length = 255
-    if len(filename) > max_length:
-        name, ext = os.path.splitext(filename)
-        filename = name[: max_length - len(ext)] + ext
-    return filename
-
-
-@app.get('/api/conversation')
-async def get_remote_runtime_config(request: Request):
-    """Retrieve the remote runtime configuration.
-
-    Currently, this is the runtime ID.
-    """
-    runtime = request.state.conversation.runtime
-    runtime_id = runtime.runtime_id if hasattr(runtime, 'runtime_id') else None
-    session_id = runtime.sid if hasattr(runtime, 'sid') else None
-    return JSONResponse(
-        content={
-            'runtime_id': runtime_id,
-            'session_id': session_id,
-        }
-    )
-
-
-@app.post('/api/upload-files')
-async def upload_file(request: Request, files: list[UploadFile]):
-    """Upload a list of files to the workspace.
-
-    To upload a files:
-    ```sh
-    curl -X POST -F "file=@<file_path1>" -F "file=@<file_path2>" http://localhost:3000/api/upload-files
-    ```
-
-    Args:
-        request (Request): The incoming request object.
-        files (list[UploadFile]): A list of files to be uploaded.
-
-    Returns:
-        dict: A message indicating the success of the upload operation.
-
-    Raises:
-        HTTPException: If there's an error saving the files.
-    """
-    try:
-        uploaded_files = []
-        skipped_files = []
-        for file in files:
-            safe_filename = sanitize_filename(file.filename)
-            file_contents = await file.read()
-
-            if (
-                MAX_FILE_SIZE_MB > 0
-                and len(file_contents) > MAX_FILE_SIZE_MB * 1024 * 1024
-            ):
-                skipped_files.append(
-                    {
-                        'name': safe_filename,
-                        'reason': f'Exceeds maximum size limit of {MAX_FILE_SIZE_MB}MB',
-                    }
-                )
-                continue
-
-            if not is_extension_allowed(safe_filename):
-                skipped_files.append(
-                    {'name': safe_filename, 'reason': 'File type not allowed'}
-                )
-                continue
-
-            # copy the file to the runtime
-            with tempfile.TemporaryDirectory() as tmp_dir:
-                tmp_file_path = os.path.join(tmp_dir, safe_filename)
-                with open(tmp_file_path, 'wb') as tmp_file:
-                    tmp_file.write(file_contents)
-                    tmp_file.flush()
-
-                runtime: Runtime = request.state.conversation.runtime
-                try:
-                    await call_sync_from_async(
-                        runtime.copy_to,
-                        tmp_file_path,
-                        runtime.config.workspace_mount_path_in_sandbox,
-                    )
-                except RuntimeUnavailableError as e:
-                    logger.error(
-                        f'Error saving file {safe_filename}: {e}', exc_info=True
-                    )
-                    return JSONResponse(
-                        status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
-                        content={'error': f'Error saving file: {e}'},
-                    )
-            uploaded_files.append(safe_filename)
-
-        response_content = {
-            'message': 'File upload process completed',
-            'uploaded_files': uploaded_files,
-            'skipped_files': skipped_files,
-        }
-
-        if not uploaded_files and skipped_files:
-            return JSONResponse(
-                status_code=status.HTTP_400_BAD_REQUEST,
-                content={
-                    **response_content,
-                    'error': 'No files were uploaded successfully',
-                },
-            )
-
-        return JSONResponse(status_code=status.HTTP_200_OK, content=response_content)
-
-    except Exception as e:
-        logger.error(f'Error during file upload: {e}', exc_info=True)
-        return JSONResponse(
-            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
-            content={
-                'error': f'Error during file upload: {str(e)}',
-                'uploaded_files': [],
-                'skipped_files': [],
-            },
-        )
-
-
-@app.post('/api/submit-feedback')
-async def submit_feedback(request: Request):
-    """Submit user feedback.
-
-    This function stores the provided feedback data.
-
-    To submit feedback:
-    ```sh
-    curl -X POST -d '{"email": "test@example.com"}' -H "Authorization:"
-    ```
-
-    Args:
-        request (Request): The incoming request object.
-        feedback (FeedbackDataModel): The feedback data to be stored.
-
-    Returns:
-        dict: The stored feedback data.
-
-    Raises:
-        HTTPException: If there's an error submitting the feedback.
-    """
-    # Assuming the storage service is already configured in the backend
-    # and there is a function to handle the storage.
-    body = await request.json()
-    async_stream = AsyncEventStreamWrapper(
-        request.state.conversation.event_stream, filter_hidden=True
-    )
-    trajectory = []
-    async for event in async_stream:
-        trajectory.append(event_to_dict(event))
-    feedback = FeedbackDataModel(
-        email=body.get('email', ''),
-        version=body.get('version', ''),
-        permissions=body.get('permissions', 'private'),
-        polarity=body.get('polarity', ''),
-        feedback=body.get('polarity', ''),
-        trajectory=trajectory,
-    )
-    try:
-        feedback_data = await call_sync_from_async(store_feedback, feedback)
-        return JSONResponse(status_code=200, content=feedback_data)
-    except Exception as e:
-        logger.error(f'Error submitting feedback: {e}')
-        return JSONResponse(
-            status_code=500, content={'error': 'Failed to submit feedback'}
-        )
-
-
-@app.get('/api/defaults')
-async def appconfig_defaults():
-    """Retrieve the default configuration settings.
-
-    To get the default configurations:
-    ```sh
-    curl http://localhost:3000/api/defaults
-    ```
-
-    Returns:
-        dict: The default configuration settings.
-    """
-    return config.defaults_dict
-
-
-@app.post('/api/save-file')
-async def save_file(request: Request):
-    """Save a file to the agent's runtime file store.
-
-    This endpoint allows saving a file when the agent is in a paused, finished,
-    or awaiting user input state. It checks the agent's state before proceeding
-    with the file save operation.
-
-    Args:
-        request (Request): The incoming FastAPI request object.
-
-    Returns:
-        JSONResponse: A JSON response indicating the success of the operation.
-
-    Raises:
-        HTTPException:
-            - 403 error if the agent is not in an allowed state for editing.
-            - 400 error if the file path or content is missing.
-            - 500 error if there's an unexpected error during the save operation.
-    """
-    try:
-        # Extract file path and content from the request
-        data = await request.json()
-        file_path = data.get('filePath')
-        content = data.get('content')
-
-        # Validate the presence of required data
-        if not file_path or content is None:
-            raise HTTPException(status_code=400, detail='Missing filePath or content')
-
-        # Save the file to the agent's runtime file store
-        runtime: Runtime = request.state.conversation.runtime
-        file_path = os.path.join(
-            runtime.config.workspace_mount_path_in_sandbox, file_path
-        )
-        write_action = FileWriteAction(file_path, content)
-        try:
-            observation = await call_sync_from_async(runtime.run_action, write_action)
-        except RuntimeUnavailableError as e:
-            logger.error(f'Error saving file: {e}', exc_info=True)
-            return JSONResponse(
-                status_code=500,
-                content={'error': f'Error saving file: {e}'},
-            )
-
-        if isinstance(observation, FileWriteObservation):
-            return JSONResponse(
-                status_code=200, content={'message': 'File saved successfully'}
-            )
-        elif isinstance(observation, ErrorObservation):
-            return JSONResponse(
-                status_code=500,
-                content={'error': f'Failed to save file: {observation}'},
-            )
-        else:
-            return JSONResponse(
-                status_code=500,
-                content={'error': f'Unexpected observation: {observation}'},
-            )
-    except Exception as e:
-        # Log the error and return a 500 response
-        logger.error(f'Error saving file: {e}', exc_info=True)
-        raise HTTPException(status_code=500, detail=f'Error saving file: {e}')
-
-
-@app.route('/api/security/{path:path}', methods=['GET', 'POST', 'PUT', 'DELETE'])
-async def security_api(request: Request):
-    """Catch-all route for security analyzer API requests.
-
-    Each request is handled directly to the security analyzer.
-
-    Args:
-        request (Request): The incoming FastAPI request object.
-
-    Returns:
-        Any: The response from the security analyzer.
-
-    Raises:
-        HTTPException: If the security analyzer is not initialized.
-    """
-    if not request.state.conversation.security_analyzer:
-        raise HTTPException(status_code=404, detail='Security analyzer not initialized')
-
-    return await request.state.conversation.security_analyzer.handle_api_request(
-        request
-    )
-
-
-@app.get('/api/zip-directory')
-async def zip_current_workspace(request: Request, background_tasks: BackgroundTasks):
-    try:
-        logger.debug('Zipping workspace')
-        runtime: Runtime = request.state.conversation.runtime
-        path = runtime.config.workspace_mount_path_in_sandbox
-        try:
-            zip_file = await call_sync_from_async(runtime.copy_from, path)
-        except RuntimeUnavailableError as e:
-            logger.error(f'Error zipping workspace: {e}', exc_info=True)
-            return JSONResponse(
-                status_code=500,
-                content={'error': f'Error zipping workspace: {e}'},
-            )
-        response = FileResponse(
-            path=zip_file,
-            filename='workspace.zip',
-            media_type='application/x-zip-compressed',
-        )
-
-        # This will execute after the response is sent (So the file is not deleted before being sent)
-        background_tasks.add_task(zip_file.unlink)
-
-        return response
-    except Exception as e:
-        logger.error(f'Error zipping workspace: {e}', exc_info=True)
-        raise HTTPException(
-            status_code=500,
-            detail='Failed to zip workspace',
-        )
-
-
-class AuthCode(BaseModel):
-    code: str
-
-
-@app.post('/api/github/callback')
-def github_callback(auth_code: AuthCode):
-    # Prepare data for the token exchange request
-    data = {
-        'client_id': GITHUB_CLIENT_ID,
-        'client_secret': GITHUB_CLIENT_SECRET,
-        'code': auth_code.code,
-    }
-
-    logger.debug('Exchanging code for GitHub token')
-
-    headers = {'Accept': 'application/json'}
-    response = requests.post(
-        'https://github.com/login/oauth/access_token', data=data, headers=headers
-    )
-
-    if response.status_code != 200:
-        logger.error(f'Failed to exchange code for token: {response.text}')
-        return JSONResponse(
-            status_code=status.HTTP_400_BAD_REQUEST,
-            content={'error': 'Failed to exchange code for token'},
-        )
-
-    token_response = response.json()
-
-    if 'access_token' not in token_response:
-        return JSONResponse(
-            status_code=status.HTTP_400_BAD_REQUEST,
-            content={'error': 'No access token in response'},
-        )
-
-    return JSONResponse(
-        status_code=status.HTTP_200_OK,
-        content={'access_token': token_response['access_token']},
-    )
-
-
-@app.post('/api/authenticate')
-async def authenticate(request: Request):
-    token = request.headers.get('X-GitHub-Token')
-    if not await authenticate_github_user(token):
-        return JSONResponse(
-            status_code=status.HTTP_401_UNAUTHORIZED,
-            content={'error': 'Not authorized via GitHub waitlist'},
-        )
-
-    # Create a signed JWT token with 1-hour expiration
-    cookie_data = {
-        'github_token': token,
-        'exp': int(time.time()) + 3600,  # 1 hour expiration
-    }
-    signed_token = sign_token(cookie_data, config.jwt_secret)
-
-    response = JSONResponse(
-        status_code=status.HTTP_200_OK, content={'message': 'User authenticated'}
-    )
-
-    # Set secure cookie with signed token
-    response.set_cookie(
-        key='github_auth',
-        value=signed_token,
-        max_age=3600,  # 1 hour in seconds
-        httponly=True,
-        secure=True,
-        samesite='strict',
-    )
-    return response
-
-
-@app.get('/api/vscode-url')
-async def get_vscode_url(request: Request):
-    """Get the VSCode URL.
-
-    This endpoint allows getting the VSCode URL.
-
-    Args:
-        request (Request): The incoming FastAPI request object.
-
-    Returns:
-        JSONResponse: A JSON response indicating the success of the operation.
-    """
-    try:
-        runtime: Runtime = request.state.conversation.runtime
-        logger.debug(f'Runtime type: {type(runtime)}')
-        logger.debug(f'Runtime VSCode URL: {runtime.vscode_url}')
-        return JSONResponse(status_code=200, content={'vscode_url': runtime.vscode_url})
-    except Exception as e:
-        logger.error(f'Error getting VSCode URL: {e}', exc_info=True)
-        return JSONResponse(
-            status_code=500,
-            content={
-                'vscode_url': None,
-                'error': f'Error getting VSCode URL: {e}',
-            },
-        )
-
-
-class SPAStaticFiles(StaticFiles):
-    async def get_response(self, path: str, scope):
-        try:
-            return await super().get_response(path, scope)
-        except Exception:
-            # FIXME: just making this HTTPException doesn't work for some reason
-            return await super().get_response('index.html', scope)
-
-
-app.mount('/', SPAStaticFiles(directory='./frontend/build', html=True), name='dist')
-
-app = socketio.ASGIApp(sio, other_asgi_app=app)
-
-
-@sio.event
-async def connect(connection_id: str, environ):
-    logger.info(f'sio:connect: {connection_id}')
-
-
-@sio.event
-async def oh_action(connection_id: str, data: dict):
-    # If it's an init, we do it here.
-    action = data.get('action', '')
-    if action == ActionType.INIT:
-        await init_connection(connection_id, data)
-        return
-
-    logger.info(f'sio:oh_action:{connection_id}')
-    await session_manager.send_to_event_stream(connection_id, data)
-
-
-async def init_connection(connection_id: str, data: dict):
-    gh_token = data.pop('github_token', None)
-    if not await authenticate_github_user(gh_token):
-        raise RuntimeError(status.WS_1008_POLICY_VIOLATION)
-
-    token = data.pop('token', None)
-    if token:
-        sid = get_sid_from_token(token, config.jwt_secret)
-        if sid == '':
-            await sio.send({'error': 'Invalid token', 'error_code': 401})
-            return
-        logger.info(f'Existing session: {sid}')
-    else:
-        sid = connection_id
-        logger.info(f'New session: {sid}')
-
-    token = sign_token({'sid': sid}, config.jwt_secret)
-    await sio.emit('oh_event', {'token': token, 'status': 'ok'}, to=connection_id)
-
-    latest_event_id = int(data.pop('latest_event_id', -1))
-
-    # The session in question should exist, but may not actually be running locally...
-    event_stream = await session_manager.init_or_join_session(sid, connection_id, data)
-
-    # Send events
-    async_stream = AsyncEventStreamWrapper(event_stream, latest_event_id + 1)
-    async for event in async_stream:
-        if isinstance(
-            event,
-            (
-                NullAction,
-                NullObservation,
-            ),
-        ):
-            continue
-        await sio.emit('oh_event', event_to_dict(event), to=connection_id)
-
-
-@sio.event
-async def disconnect(connection_id: str):
-    logger.info(f'sio:disconnect:{connection_id}')
-    await session_manager.disconnect_from_session(connection_id)
+app = socketio.ASGIApp(sio, other_asgi_app=base_app)
diff --git a/openhands/server/middleware.py b/openhands/server/middleware.py
index 624dac62b425..803887471e0e 100644
--- a/openhands/server/middleware.py
+++ b/openhands/server/middleware.py
@@ -1,14 +1,21 @@
 import asyncio
 from collections import defaultdict
 from datetime import datetime, timedelta
+from typing import Callable
 from urllib.parse import urlparse
 
-from fastapi import Request
+import jwt
+from fastapi import APIRouter, Request, status
 from fastapi.middleware.cors import CORSMiddleware
 from fastapi.responses import JSONResponse
 from starlette.middleware.base import BaseHTTPMiddleware
 from starlette.types import ASGIApp
 
+from openhands.core.logger import openhands_logger as logger
+from openhands.server.auth import get_sid_from_token
+from openhands.server.github_utils import UserVerifier
+from openhands.server.shared import config, session_manager
+
 
 class LocalhostCORSMiddleware(CORSMiddleware):
     """
@@ -100,3 +107,71 @@ async def dispatch(self, request, call_next):
                 headers={'Retry-After': '1'},
             )
         return await call_next(request)
+
+
+class AttachSessionMiddleware:
+    def __init__(self, app, target_router: APIRouter):
+        self.app = app
+        self.target_router = target_router
+        self.target_paths = {route.path for route in target_router.routes}
+
+    async def __call__(self, request: Request, call_next: Callable):
+        do_attach = False
+        if request.url.path in self.target_paths:
+            do_attach = True
+
+        if request.method == 'OPTIONS':
+            do_attach = False
+
+        if not do_attach:
+            return await call_next(request)
+
+        user_verifier = UserVerifier()
+        if user_verifier.is_active():
+            signed_token = request.cookies.get('github_auth')
+            if not signed_token:
+                return JSONResponse(
+                    status_code=status.HTTP_401_UNAUTHORIZED,
+                    content={'error': 'Not authenticated'},
+                )
+            try:
+                jwt.decode(signed_token, config.jwt_secret, algorithms=['HS256'])
+            except Exception as e:
+                logger.warning(f'Invalid token: {e}')
+                return JSONResponse(
+                    status_code=status.HTTP_401_UNAUTHORIZED,
+                    content={'error': 'Invalid token'},
+                )
+
+        if not request.headers.get('Authorization'):
+            logger.warning('Missing Authorization header')
+            return JSONResponse(
+                status_code=status.HTTP_401_UNAUTHORIZED,
+                content={'error': 'Missing Authorization header'},
+            )
+
+        auth_token = request.headers.get('Authorization')
+        if 'Bearer' in auth_token:
+            auth_token = auth_token.split('Bearer')[1].strip()
+
+        request.state.sid = get_sid_from_token(auth_token, config.jwt_secret)
+        if request.state.sid == '':
+            logger.warning('Invalid token')
+            return JSONResponse(
+                status_code=status.HTTP_401_UNAUTHORIZED,
+                content={'error': 'Invalid token'},
+            )
+
+        request.state.conversation = await session_manager.attach_to_conversation(
+            request.state.sid
+        )
+        if request.state.conversation is None:
+            return JSONResponse(
+                status_code=status.HTTP_404_NOT_FOUND,
+                content={'error': 'Session not found'},
+            )
+        try:
+            response = await call_next(request)
+        finally:
+            await session_manager.detach_from_conversation(request.state.conversation)
+        return response
diff --git a/openhands/server/routes/auth.py b/openhands/server/routes/auth.py
new file mode 100644
index 000000000000..67151f7e96e0
--- /dev/null
+++ b/openhands/server/routes/auth.py
@@ -0,0 +1,100 @@
+import time
+import warnings
+
+import requests
+
+from openhands.server.github_utils import (
+    GITHUB_CLIENT_ID,
+    GITHUB_CLIENT_SECRET,
+    authenticate_github_user,
+)
+
+with warnings.catch_warnings():
+    warnings.simplefilter('ignore')
+
+from fastapi import (
+    APIRouter,
+    Request,
+    status,
+)
+from fastapi.responses import JSONResponse
+from pydantic import BaseModel
+
+from openhands.core.logger import openhands_logger as logger
+from openhands.server.auth import sign_token
+from openhands.server.shared import config
+
+app = APIRouter(prefix='/api')
+
+
+class AuthCode(BaseModel):
+    code: str
+
+
+@app.post('/github/callback')
+def github_callback(auth_code: AuthCode):
+    # Prepare data for the token exchange request
+    data = {
+        'client_id': GITHUB_CLIENT_ID,
+        'client_secret': GITHUB_CLIENT_SECRET,
+        'code': auth_code.code,
+    }
+
+    logger.debug('Exchanging code for GitHub token')
+
+    headers = {'Accept': 'application/json'}
+    response = requests.post(
+        'https://github.com/login/oauth/access_token', data=data, headers=headers
+    )
+
+    if response.status_code != 200:
+        logger.error(f'Failed to exchange code for token: {response.text}')
+        return JSONResponse(
+            status_code=status.HTTP_400_BAD_REQUEST,
+            content={'error': 'Failed to exchange code for token'},
+        )
+
+    token_response = response.json()
+
+    if 'access_token' not in token_response:
+        return JSONResponse(
+            status_code=status.HTTP_400_BAD_REQUEST,
+            content={'error': 'No access token in response'},
+        )
+
+    return JSONResponse(
+        status_code=status.HTTP_200_OK,
+        content={'access_token': token_response['access_token']},
+    )
+
+
+@app.post('/authenticate')
+async def authenticate(request: Request):
+    token = request.headers.get('X-GitHub-Token')
+    if not await authenticate_github_user(token):
+        return JSONResponse(
+            status_code=status.HTTP_401_UNAUTHORIZED,
+            content={'error': 'Not authorized via GitHub waitlist'},
+        )
+
+    # Create a signed JWT token with 1-hour expiration
+    cookie_data = {
+        'github_token': token,
+        'exp': int(time.time()) + 3600,  # 1 hour expiration
+    }
+    signed_token = sign_token(cookie_data, config.jwt_secret)
+
+    response = JSONResponse(
+        status_code=status.HTTP_200_OK, content={'message': 'User authenticated'}
+    )
+
+    # Set secure cookie with signed token
+    response.set_cookie(
+        key='github_auth',
+        value=signed_token,
+        max_age=3600,  # 1 hour in seconds
+        httponly=True,
+        secure=True,
+        samesite='strict',
+    )
+    return response
diff --git a/openhands/server/routes/conversation.py b/openhands/server/routes/conversation.py
new file mode 100644
index 000000000000..a47eed68ef40
--- /dev/null
+++ b/openhands/server/routes/conversation.py
@@ -0,0 +1,106 @@
+from fastapi import APIRouter, HTTPException, Request, status
+from fastapi.responses import JSONResponse
+
+from openhands.core.logger import openhands_logger as logger
+from openhands.runtime.base import Runtime
+
+app = APIRouter(prefix='/api')
+
+
+@app.get('/conversation')
+async def get_remote_runtime_config(request: Request):
+    """Retrieve the runtime configuration.
+
+    Currently, this is the session ID and runtime ID (if available).
+    """
+    runtime = request.state.conversation.runtime
+    runtime_id = runtime.runtime_id if hasattr(runtime, 'runtime_id') else None
+    session_id = runtime.sid if hasattr(runtime, 'sid') else None
+    return JSONResponse(
+        content={
+            'runtime_id': runtime_id,
+            'session_id': session_id,
+        }
+    )
+
+
+@app.get('/vscode-url')
+async def get_vscode_url(request: Request):
+    """Get the VSCode URL.
+
+    This endpoint allows getting the VSCode URL.
+
+    Args:
+        request (Request): The incoming FastAPI request object.
+
+    Returns:
+        JSONResponse: A JSON response indicating the success of the operation.
+    """
+    try:
+        runtime: Runtime = request.state.conversation.runtime
+        logger.debug(f'Runtime type: {type(runtime)}')
+        logger.debug(f'Runtime VSCode URL: {runtime.vscode_url}')
+        return JSONResponse(status_code=200, content={'vscode_url': runtime.vscode_url})
+    except Exception as e:
+        logger.error(f'Error getting VSCode URL: {e}', exc_info=True)
+        return JSONResponse(
+            status_code=500,
+            content={
+                'vscode_url': None,
+                'error': f'Error getting VSCode URL: {e}',
+            },
+        )
+
+
+@app.get('/events/search')
+async def search_events(
+    request: Request,
+    query: str | None = None,
+    start_id: int = 0,
+    limit: int = 20,
+    event_type: str | None = None,
+    source: str | None = None,
+    start_date: str | None = None,
+    end_date: str | None = None,
+):
+    """Search through the event stream with filtering and pagination.
+    Args:
+        request (Request): The incoming request object
+        query (str, optional): Text to search for in event content
+        start_id (int): Starting ID in the event stream. Defaults to 0
+        limit (int): Maximum number of events to return. Must be between 1 and 100. Defaults to 20
+        event_type (str, optional): Filter by event type (e.g., "FileReadAction")
+        source (str, optional): Filter by event source
+        start_date (str, optional): Filter events after this date (ISO format)
+        end_date (str, optional): Filter events before this date (ISO format)
+    Returns:
+        dict: Dictionary containing:
+            - events: List of matching events
+            - has_more: Whether there are more matching events after this batch
+    Raises:
+        HTTPException: If conversation is not found
+        ValueError: If limit is less than 1 or greater than 100
+    """
+    if not request.state.conversation:
+        raise HTTPException(
+            status_code=status.HTTP_404_NOT_FOUND, detail='Conversation not found'
+        )
+    # Get matching events from the stream
+    event_stream = request.state.conversation.event_stream
+    matching_events = event_stream.get_matching_events(
+        query=query,
+        event_type=event_type,
+        source=source,
+        start_date=start_date,
+        end_date=end_date,
+        start_id=start_id,
+        limit=limit + 1,  # Get one extra to check if there are more
+    )
+    # Check if there are more events
+    has_more = len(matching_events) > limit
+    if has_more:
+        matching_events = matching_events[:limit]  # Remove the extra event
+    return {
+        'events': matching_events,
+        'has_more': has_more,
+    }
diff --git a/openhands/server/routes/feedback.py b/openhands/server/routes/feedback.py
new file mode 100644
index 000000000000..8489ec84e68b
--- /dev/null
+++ b/openhands/server/routes/feedback.py
@@ -0,0 +1,74 @@
+from fastapi import APIRouter, Request
+from fastapi.responses import JSONResponse
+
+from openhands.core.logger import openhands_logger as logger
+from openhands.events.serialization import event_to_dict
+from openhands.events.stream import AsyncEventStreamWrapper
+from openhands.server.data_models.feedback import FeedbackDataModel, store_feedback
+from openhands.server.shared import config
+from openhands.utils.async_utils import call_sync_from_async
+
+app = APIRouter(prefix='/api')
+
+
+@app.post('/submit-feedback')
+async def submit_feedback(request: Request):
+    """Submit user feedback.
+
+    This function stores the provided feedback data.
+
+    To submit feedback:
+    ```sh
+    curl -X POST -d '{"email": "test@example.com"}' -H "Authorization:"
+    ```
+
+    Args:
+        request (Request): The incoming request object.
+        feedback (FeedbackDataModel): The feedback data to be stored.
+
+    Returns:
+        dict: The stored feedback data.
+
+    Raises:
+        HTTPException: If there's an error submitting the feedback.
+    """
+    # Assuming the storage service is already configured in the backend
+    # and there is a function to handle the storage.
+    body = await request.json()
+    async_stream = AsyncEventStreamWrapper(
+        request.state.conversation.event_stream, filter_hidden=True
+    )
+    trajectory = []
+    async for event in async_stream:
+        trajectory.append(event_to_dict(event))
+    feedback = FeedbackDataModel(
+        email=body.get('email', ''),
+        version=body.get('version', ''),
+        permissions=body.get('permissions', 'private'),
+        polarity=body.get('polarity', ''),
+        feedback=body.get('polarity', ''),
+        trajectory=trajectory,
+    )
+    try:
+        feedback_data = await call_sync_from_async(store_feedback, feedback)
+        return JSONResponse(status_code=200, content=feedback_data)
+    except Exception as e:
+        logger.error(f'Error submitting feedback: {e}')
+        return JSONResponse(
+            status_code=500, content={'error': 'Failed to submit feedback'}
+        )
+
+
+@app.get('/api/defaults')
+async def appconfig_defaults():
+    """Retrieve the default configuration settings.
+
+    To get the default configurations:
+    ```sh
+    curl http://localhost:3000/api/defaults
+    ```
+
+    Returns:
+        dict: The default configuration settings.
+    """
+    return config.defaults_dict
diff --git a/openhands/server/routes/files.py b/openhands/server/routes/files.py
new file mode 100644
index 000000000000..c2d37350c823
--- /dev/null
+++ b/openhands/server/routes/files.py
@@ -0,0 +1,341 @@
+import os
+import tempfile
+
+from fastapi import (
+    APIRouter,
+    BackgroundTasks,
+    HTTPException,
+    Request,
+    UploadFile,
+    status,
+)
+from fastapi.responses import FileResponse, JSONResponse
+from pathspec import PathSpec
+from pathspec.patterns import GitWildMatchPattern
+
+from openhands.core.logger import openhands_logger as logger
+from openhands.events.action import (
+    FileReadAction,
+    FileWriteAction,
+)
+from openhands.events.observation import (
+    ErrorObservation,
+    FileReadObservation,
+    FileWriteObservation,
+)
+from openhands.runtime.base import Runtime, RuntimeUnavailableError
+from openhands.server.file_config import (
+    FILES_TO_IGNORE,
+    MAX_FILE_SIZE_MB,
+    is_extension_allowed,
+    sanitize_filename,
+)
+from openhands.utils.async_utils import call_sync_from_async
+
+app = APIRouter(prefix='/api')
+
+
+@app.get('/list-files')
+async def list_files(request: Request, path: str | None = None):
+    """List files in the specified path.
+
+    This function retrieves a list of files from the agent's runtime file store,
+    excluding certain system and hidden files/directories.
+
+    To list files:
+    ```sh
+    curl http://localhost:3000/api/list-files
+    ```
+
+    Args:
+        request (Request): The incoming request object.
+        path (str, optional): The path to list files from. Defaults to None.
+
+    Returns:
+        list: A list of file names in the specified path.
+
+    Raises:
+        HTTPException: If there's an error listing the files.
+    """
+    if not request.state.conversation.runtime:
+        return JSONResponse(
+            status_code=status.HTTP_404_NOT_FOUND,
+            content={'error': 'Runtime not yet initialized'},
+        )
+
+    runtime: Runtime = request.state.conversation.runtime
+    try:
+        file_list = await call_sync_from_async(runtime.list_files, path)
+    except RuntimeUnavailableError as e:
+        logger.error(f'Error listing files: {e}', exc_info=True)
+        return JSONResponse(
+            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
+            content={'error': f'Error listing files: {e}'},
+        )
+    if path:
+        file_list = [os.path.join(path, f) for f in file_list]
+
+    file_list = [f for f in file_list if f not in FILES_TO_IGNORE]
+
+    async def filter_for_gitignore(file_list, base_path):
+        gitignore_path = os.path.join(base_path, '.gitignore')
+        try:
+            read_action = FileReadAction(gitignore_path)
+            observation = await call_sync_from_async(runtime.run_action, read_action)
+            spec = PathSpec.from_lines(
+                GitWildMatchPattern, observation.content.splitlines()
+            )
+        except Exception as e:
+            logger.warning(e)
+            return file_list
+        file_list = [entry for entry in file_list if not spec.match_file(entry)]
+        return file_list
+
+    try:
+        file_list = await filter_for_gitignore(file_list, '')
+    except RuntimeUnavailableError as e:
+        logger.error(f'Error filtering files: {e}', exc_info=True)
+        return JSONResponse(
+            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
+            content={'error': f'Error filtering files: {e}'},
+        )
+
+    return file_list
+
+
+@app.get('/select-file')
+async def select_file(file: str, request: Request):
+    """Retrieve the content of a specified file.
+
+    To select a file:
+    ```sh
+    curl http://localhost:3000/api/select-file?file=<file_path>
+    ```
+
+    Args:
+        file (str): The path of the file to be retrieved.
+            Expect path to be absolute inside the runtime.
+        request (Request): The incoming request object.
+
+    Returns:
+        dict: A dictionary containing the file content.
+
+    Raises:
+        HTTPException: If there's an error opening the file.
+    """
+    runtime: Runtime = request.state.conversation.runtime
+
+    file = os.path.join(runtime.config.workspace_mount_path_in_sandbox, file)
+    read_action = FileReadAction(file)
+    try:
+        observation = await call_sync_from_async(runtime.run_action, read_action)
+    except RuntimeUnavailableError as e:
+        logger.error(f'Error opening file {file}: {e}', exc_info=True)
+        return JSONResponse(
+            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
+            content={'error': f'Error opening file: {e}'},
+        )
+
+    if isinstance(observation, FileReadObservation):
+        content = observation.content
+        return {'code': content}
+    elif isinstance(observation, ErrorObservation):
+        logger.error(f'Error opening file {file}: {observation}', exc_info=False)
+        return JSONResponse(
+            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
+            content={'error': f'Error opening file: {observation}'},
+        )
+
+
+@app.post('/upload-files')
+async def upload_file(request: Request, files: list[UploadFile]):
+    """Upload a list of files to the workspace.
+
+    To upload a files:
+    ```sh
+    curl -X POST -F "file=@<file_path1>" -F "file=@<file_path2>" http://localhost:3000/api/upload-files
+    ```
+
+    Args:
+        request (Request): The incoming request object.
+        files (list[UploadFile]): A list of files to be uploaded.
+
+    Returns:
+        dict: A message indicating the success of the upload operation.
+
+    Raises:
+        HTTPException: If there's an error saving the files.
+    """
+    try:
+        uploaded_files = []
+        skipped_files = []
+        for file in files:
+            safe_filename = sanitize_filename(file.filename)
+            file_contents = await file.read()
+
+            if (
+                MAX_FILE_SIZE_MB > 0
+                and len(file_contents) > MAX_FILE_SIZE_MB * 1024 * 1024
+            ):
+                skipped_files.append(
+                    {
+                        'name': safe_filename,
+                        'reason': f'Exceeds maximum size limit of {MAX_FILE_SIZE_MB}MB',
+                    }
+                )
+                continue
+
+            if not is_extension_allowed(safe_filename):
+                skipped_files.append(
+                    {'name': safe_filename, 'reason': 'File type not allowed'}
+                )
+                continue
+
+            # copy the file to the runtime
+            with tempfile.TemporaryDirectory() as tmp_dir:
+                tmp_file_path = os.path.join(tmp_dir, safe_filename)
+                with open(tmp_file_path, 'wb') as tmp_file:
+                    tmp_file.write(file_contents)
+                    tmp_file.flush()
+
+                runtime: Runtime = request.state.conversation.runtime
+                try:
+                    await call_sync_from_async(
+                        runtime.copy_to,
+                        tmp_file_path,
+                        runtime.config.workspace_mount_path_in_sandbox,
+                    )
+                except RuntimeUnavailableError as e:
+                    logger.error(
+                        f'Error saving file {safe_filename}: {e}', exc_info=True
+                    )
+                    return JSONResponse(
+                        status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
+                        content={'error': f'Error saving file: {e}'},
+                    )
+            uploaded_files.append(safe_filename)
+
+        response_content = {
+            'message': 'File upload process completed',
+            'uploaded_files': uploaded_files,
+            'skipped_files': skipped_files,
+        }
+
+        if not uploaded_files and skipped_files:
+            return JSONResponse(
+                status_code=status.HTTP_400_BAD_REQUEST,
+                content={
+                    **response_content,
+                    'error': 'No files were uploaded successfully',
+                },
+            )
+
+        return JSONResponse(status_code=status.HTTP_200_OK, content=response_content)
+
+    except Exception as e:
+        logger.error(f'Error during file upload: {e}', exc_info=True)
+        return JSONResponse(
+            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
+            content={
+                'error': f'Error during file upload: {str(e)}',
+                'uploaded_files': [],
+                'skipped_files': [],
+            },
+        )
+
+
+@app.post('/save-file')
+async def save_file(request: Request):
+    """Save a file to the agent's runtime file store.
+
+    This endpoint allows saving a file when the agent is in a paused, finished,
+    or awaiting user input state. It checks the agent's state before proceeding
+    with the file save operation.
+
+    Args:
+        request (Request): The incoming FastAPI request object.
+
+    Returns:
+        JSONResponse: A JSON response indicating the success of the operation.
+
+    Raises:
+        HTTPException:
+            - 403 error if the agent is not in an allowed state for editing.
+            - 400 error if the file path or content is missing.
+            - 500 error if there's an unexpected error during the save operation.
+    """
+    try:
+        # Extract file path and content from the request
+        data = await request.json()
+        file_path = data.get('filePath')
+        content = data.get('content')
+
+        # Validate the presence of required data
+        if not file_path or content is None:
+            raise HTTPException(status_code=400, detail='Missing filePath or content')
+
+        # Save the file to the agent's runtime file store
+        runtime: Runtime = request.state.conversation.runtime
+        file_path = os.path.join(
+            runtime.config.workspace_mount_path_in_sandbox, file_path
+        )
+        write_action = FileWriteAction(file_path, content)
+        try:
+            observation = await call_sync_from_async(runtime.run_action, write_action)
+        except RuntimeUnavailableError as e:
+            logger.error(f'Error saving file: {e}', exc_info=True)
+            return JSONResponse(
+                status_code=500,
+                content={'error': f'Error saving file: {e}'},
+            )
+
+        if isinstance(observation, FileWriteObservation):
+            return JSONResponse(
+                status_code=200, content={'message': 'File saved successfully'}
+            )
+        elif isinstance(observation, ErrorObservation):
+            return JSONResponse(
+                status_code=500,
+                content={'error': f'Failed to save file: {observation}'},
+            )
+        else:
+            return JSONResponse(
+                status_code=500,
+                content={'error': f'Unexpected observation: {observation}'},
+            )
+    except Exception as e:
+        # Log the error and return a 500 response
+        logger.error(f'Error saving file: {e}', exc_info=True)
+        raise HTTPException(status_code=500, detail=f'Error saving file: {e}')
+
+
+@app.get('/zip-directory')
+async def zip_current_workspace(request: Request, background_tasks: BackgroundTasks):
+    try:
+        logger.debug('Zipping workspace')
+        runtime: Runtime = request.state.conversation.runtime
+        path = runtime.config.workspace_mount_path_in_sandbox
+        try:
+            zip_file = await call_sync_from_async(runtime.copy_from, path)
+        except RuntimeUnavailableError as e:
+            logger.error(f'Error zipping workspace: {e}', exc_info=True)
+            return JSONResponse(
+                status_code=500,
+                content={'error': f'Error zipping workspace: {e}'},
+            )
+        response = FileResponse(
+            path=zip_file,
+            filename='workspace.zip',
+            media_type='application/x-zip-compressed',
+        )
+
+        # This will execute after the response is sent (So the file is not deleted before being sent)
+        background_tasks.add_task(zip_file.unlink)
+
+        return response
+    except Exception as e:
+        logger.error(f'Error zipping workspace: {e}', exc_info=True)
+        raise HTTPException(
+            status_code=500,
+            detail='Failed to zip workspace',
+        )
diff --git a/openhands/server/routes/public.py b/openhands/server/routes/public.py
new file mode 100644
index 000000000000..dae4278078ec
--- /dev/null
+++ b/openhands/server/routes/public.py
@@ -0,0 +1,106 @@
+import warnings
+
+import requests
+
+from openhands.security.options import SecurityAnalyzers
+
+with warnings.catch_warnings():
+    warnings.simplefilter('ignore')
+    import litellm
+
+from fastapi import (
+    APIRouter,
+)
+
+from openhands.controller.agent import Agent
+from openhands.core.config import LLMConfig
+from openhands.core.logger import openhands_logger as logger
+from openhands.llm import bedrock
+from openhands.server.shared import config
+
+app = APIRouter(prefix='/api/options')
+
+
+@app.get('/models')
+async def get_litellm_models() -> list[str]:
+    """
+    Get all models supported by LiteLLM.
+
+    This function combines models from litellm and Bedrock, removing any
+    error-prone Bedrock models.
+
+    To get the models:
+    ```sh
+    curl http://localhost:3000/api/litellm-models
+    ```
+
+    Returns:
+        list: A sorted list of unique model names.
+    """
+    litellm_model_list = litellm.model_list + list(litellm.model_cost.keys())
+    litellm_model_list_without_bedrock = bedrock.remove_error_modelId(
+        litellm_model_list
+    )
+    # TODO: for bedrock, this is using the default config
+    llm_config: LLMConfig = config.get_llm_config()
+    bedrock_model_list = []
+    if (
+        llm_config.aws_region_name
+        and llm_config.aws_access_key_id
+        and llm_config.aws_secret_access_key
+    ):
+        bedrock_model_list = bedrock.list_foundation_models(
+            llm_config.aws_region_name,
+            llm_config.aws_access_key_id,
+            llm_config.aws_secret_access_key,
+        )
+    model_list = litellm_model_list_without_bedrock + bedrock_model_list
+    for llm_config in config.llms.values():
+        ollama_base_url = llm_config.ollama_base_url
+        if llm_config.model.startswith('ollama'):
+            if not ollama_base_url:
+                ollama_base_url = llm_config.base_url
+        if ollama_base_url:
+            ollama_url = ollama_base_url.strip('/') + '/api/tags'
+            try:
+                ollama_models_list = requests.get(ollama_url, timeout=3).json()[
+                    'models'
+                ]
+                for model in ollama_models_list:
+                    model_list.append('ollama/' + model['name'])
+                break
+            except requests.exceptions.RequestException as e:
+                logger.error(f'Error getting OLLAMA models: {e}', exc_info=True)
+
+    return list(sorted(set(model_list)))
+
+
+@app.get('/agents')
+async def get_agents():
+    """Get all agents supported by LiteLLM.
+
+    To get the agents:
+    ```sh
+    curl http://localhost:3000/api/agents
+    ```
+
+    Returns:
+        list: A sorted list of agent names.
+    """
+    agents = sorted(Agent.list_agents())
+    return agents
+
+
+@app.get('/security-analyzers')
+async def get_security_analyzers():
+    """Get all supported security analyzers.
+
+    To get the security analyzers:
+    ```sh
+    curl http://localhost:3000/api/security-analyzers
+    ```
+
+    Returns:
+        list: A sorted list of security analyzer names.
+    """
+    return sorted(SecurityAnalyzers.keys())
diff --git a/openhands/server/routes/security.py b/openhands/server/routes/security.py
new file mode 100644
index 000000000000..f65fcce6aa3b
--- /dev/null
+++ b/openhands/server/routes/security.py
@@ -0,0 +1,30 @@
+from fastapi import (
+    APIRouter,
+    HTTPException,
+    Request,
+)
+
+app = APIRouter(prefix='/api')
+
+
+@app.route('/security/{path:path}', methods=['GET', 'POST', 'PUT', 'DELETE'])
+async def security_api(request: Request):
+    """Catch-all route for security analyzer API requests.
+
+    Each request is handled directly to the security analyzer.
+
+    Args:
+        request (Request): The incoming FastAPI request object.
+
+    Returns:
+        Any: The response from the security analyzer.
+
+    Raises:
+        HTTPException: If the security analyzer is not initialized.
+    """
+    if not request.state.conversation.security_analyzer:
+        raise HTTPException(status_code=404, detail='Security analyzer not initialized')
+
+    return await request.state.conversation.security_analyzer.handle_api_request(
+        request
+    )
diff --git a/openhands/server/shared.py b/openhands/server/shared.py
new file mode 100644
index 000000000000..a7cc5c87c0cf
--- /dev/null
+++ b/openhands/server/shared.py
@@ -0,0 +1,28 @@
+import os
+
+import socketio
+from dotenv import load_dotenv
+
+from openhands.core.config import load_app_config
+from openhands.server.session import SessionManager
+from openhands.storage import get_file_store
+
+load_dotenv()
+
+config = load_app_config()
+file_store = get_file_store(config.file_store, config.file_store_path)
+
+client_manager = None
+redis_host = os.environ.get('REDIS_HOST')
+if redis_host:
+    client_manager = socketio.AsyncRedisManager(
+        f'redis://{redis_host}',
+        redis_options={'password': os.environ.get('REDIS_PASSWORD')},
+    )
+
+
+sio = socketio.AsyncServer(
+    async_mode='asgi', cors_allowed_origins='*', client_manager=client_manager
+)
+
+session_manager = SessionManager(sio, config, file_store)
diff --git a/openhands/server/socket.py b/openhands/server/socket.py
new file mode 100644
index 000000000000..19a4993a2945
--- /dev/null
+++ b/openhands/server/socket.py
@@ -0,0 +1,76 @@
+from fastapi import status
+
+from openhands.core.logger import openhands_logger as logger
+from openhands.core.schema.action import ActionType
+from openhands.events.action import (
+    NullAction,
+)
+from openhands.events.observation import (
+    NullObservation,
+)
+from openhands.events.serialization import event_to_dict
+from openhands.events.stream import AsyncEventStreamWrapper
+from openhands.server.auth import get_sid_from_token, sign_token
+from openhands.server.github_utils import authenticate_github_user
+from openhands.server.shared import config, session_manager, sio
+
+
+@sio.event
+async def connect(connection_id: str, environ):
+    logger.info(f'sio:connect: {connection_id}')
+
+
+@sio.event
+async def oh_action(connection_id: str, data: dict):
+    # If it's an init, we do it here.
+    action = data.get('action', '')
+    if action == ActionType.INIT:
+        await init_connection(connection_id, data)
+        return
+
+    logger.info(f'sio:oh_action:{connection_id}')
+    await session_manager.send_to_event_stream(connection_id, data)
+
+
+async def init_connection(connection_id: str, data: dict):
+    gh_token = data.pop('github_token', None)
+    if not await authenticate_github_user(gh_token):
+        raise RuntimeError(status.WS_1008_POLICY_VIOLATION)
+
+    token = data.pop('token', None)
+    if token:
+        sid = get_sid_from_token(token, config.jwt_secret)
+        if sid == '':
+            await sio.emit('oh_event', {'error': 'Invalid token', 'error_code': 401})
+            return
+        logger.info(f'Existing session: {sid}')
+    else:
+        sid = connection_id
+        logger.info(f'New session: {sid}')
+
+    token = sign_token({'sid': sid}, config.jwt_secret)
+    await sio.emit('oh_event', {'token': token, 'status': 'ok'}, to=connection_id)
+
+    latest_event_id = int(data.pop('latest_event_id', -1))
+
+    # The session in question should exist, but may not actually be running locally...
+    event_stream = await session_manager.init_or_join_session(sid, connection_id, data)
+
+    # Send events
+    async_stream = AsyncEventStreamWrapper(event_stream, latest_event_id + 1)
+    async for event in async_stream:
+        if isinstance(
+            event,
+            (
+                NullAction,
+                NullObservation,
+            ),
+        ):
+            continue
+        await sio.emit('oh_event', event_to_dict(event), to=connection_id)
+
+
+@sio.event
+async def disconnect(connection_id: str):
+    logger.info(f'sio:disconnect:{connection_id}')
+    await session_manager.disconnect_from_session(connection_id)
diff --git a/openhands/server/static.py b/openhands/server/static.py
new file mode 100644
index 000000000000..ca7eb36c9b0a
--- /dev/null
+++ b/openhands/server/static.py
@@ -0,0 +1,10 @@
+from fastapi.staticfiles import StaticFiles
+
+
+class SPAStaticFiles(StaticFiles):
+    async def get_response(self, path: str, scope):
+        try:
+            return await super().get_response(path, scope)
+        except Exception:
+            # FIXME: just making this HTTPException doesn't work for some reason
+            return await super().get_response('index.html', scope)
diff --git a/poetry.lock b/poetry.lock
index 99025dcc349c..d97ef683fe6b 100644
--- a/poetry.lock
+++ b/poetry.lock
@@ -1,4 +1,4 @@
-# This file is automatically @generated by Poetry 1.8.3 and should not be changed by hand.
+# This file is automatically @generated by Poetry 1.8.4 and should not be changed by hand.
 
 [[package]]
 name = "aenum"
@@ -6601,6 +6601,7 @@ description = "Pure-Python implementation of ASN.1 types and DER/BER/CER codecs
 optional = false
 python-versions = ">=3.8"
 files = [
+    {file = "pyasn1-0.6.1-py3-none-any.whl", hash = "sha256:0d632f46f2ba09143da3a8afe9e33fb6f92fa2320ab7e886e2d0f7672af84629"},
     {file = "pyasn1-0.6.1.tar.gz", hash = "sha256:6f580d2bdd84365380830acf45550f2511469f673cb4a5ae3857a3170128b034"},
 ]
 
@@ -6611,6 +6612,7 @@ description = "A collection of ASN.1-based protocols modules"
 optional = false
 python-versions = ">=3.8"
 files = [
+    {file = "pyasn1_modules-0.4.1-py3-none-any.whl", hash = "sha256:49bfa96b45a292b711e986f222502c1c9a5e1f4e568fc30e2574a6c7d07838fd"},
     {file = "pyasn1_modules-0.4.1.tar.gz", hash = "sha256:c28e2dbf9c06ad61c71a075c7e0f9fd0f1b0bb2d2ad4377f240d33ac2ab60a7c"},
 ]
 
@@ -8182,6 +8184,11 @@ files = [
     {file = "scikit_learn-1.5.2-cp312-cp312-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:f60021ec1574e56632be2a36b946f8143bf4e5e6af4a06d85281adc22938e0dd"},
     {file = "scikit_learn-1.5.2-cp312-cp312-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:394397841449853c2290a32050382edaec3da89e35b3e03d6cc966aebc6a8ae6"},
     {file = "scikit_learn-1.5.2-cp312-cp312-win_amd64.whl", hash = "sha256:57cc1786cfd6bd118220a92ede80270132aa353647684efa385a74244a41e3b1"},
+    {file = "scikit_learn-1.5.2-cp313-cp313-macosx_10_13_x86_64.whl", hash = "sha256:e9a702e2de732bbb20d3bad29ebd77fc05a6b427dc49964300340e4c9328b3f5"},
+    {file = "scikit_learn-1.5.2-cp313-cp313-macosx_12_0_arm64.whl", hash = "sha256:b0768ad641981f5d3a198430a1d31c3e044ed2e8a6f22166b4d546a5116d7908"},
+    {file = "scikit_learn-1.5.2-cp313-cp313-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:178ddd0a5cb0044464fc1bfc4cca5b1833bfc7bb022d70b05db8530da4bb3dd3"},
+    {file = "scikit_learn-1.5.2-cp313-cp313-manylinux_2_17_x86_64.manylinux2014_x86_64.whl", hash = "sha256:f7284ade780084d94505632241bf78c44ab3b6f1e8ccab3d2af58e0e950f9c12"},
+    {file = "scikit_learn-1.5.2-cp313-cp313-win_amd64.whl", hash = "sha256:b7b0f9a0b1040830d38c39b91b3a44e1b643f4b36e36567b80b7c6bd2202a27f"},
     {file = "scikit_learn-1.5.2-cp39-cp39-macosx_10_9_x86_64.whl", hash = "sha256:757c7d514ddb00ae249832fe87100d9c73c6ea91423802872d9e74970a0e40b9"},
     {file = "scikit_learn-1.5.2-cp39-cp39-macosx_12_0_arm64.whl", hash = "sha256:52788f48b5d8bca5c0736c175fa6bdaab2ef00a8f536cda698db61bd89c551c1"},
     {file = "scikit_learn-1.5.2-cp39-cp39-manylinux_2_17_aarch64.manylinux2014_aarch64.whl", hash = "sha256:643964678f4b5fbdc95cbf8aec638acc7aa70f5f79ee2cdad1eec3df4ba6ead8"},
@@ -10343,4 +10350,4 @@ testing = ["coverage[toml]", "zope.event", "zope.testing"]
 [metadata]
 lock-version = "2.0"
 python-versions = "^3.12"
-content-hash = "062b51ed5e0cdfaedaa873e24db2e422c047c63c536cea7eedd58222fe1ce3f3"
+content-hash = "ff370b7b5077720b73fe3b90cc1b7fb9c7a262bfbd35885bb717369061e8a466"
diff --git a/pyproject.toml b/pyproject.toml
index e6150ac3e043..ec148baadc5c 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -1,6 +1,6 @@
 [tool.poetry]
 name = "openhands-ai"
-version = "0.14.2"
+version = "0.14.3"
 description = "OpenHands: Code Less, Make More"
 authors = ["OpenHands"]
 license = "MIT"
@@ -30,7 +30,7 @@ numpy = "*"
 json-repair = "*"
 browsergym = "0.10.2" # integrate browsergym as the browsing interface
 html2text = "*"
-e2b = "^0.17.1"
+e2b = ">=0.17.1,<1.1.0"
 pexpect = "*"
 jinja2 = "^3.1.3"
 python-multipart = "*"
@@ -98,10 +98,6 @@ reportlab = "*"
 concurrency = ["gevent"]
 
 
-
-
-
-
 [tool.poetry.group.runtime.dependencies]
 jupyterlab = "*"
 notebook = "*"
@@ -133,10 +129,6 @@ ignore = ["D1"]
 convention = "google"
 
 
-
-
-
-
 [tool.poetry.group.evaluation.dependencies]
 streamlit = "*"
 whatthepatch = "*"
diff --git a/tests/runtime/conftest.py b/tests/runtime/conftest.py
index 2a57a9c820b7..aa08a2cb7333 100644
--- a/tests/runtime/conftest.py
+++ b/tests/runtime/conftest.py
@@ -29,16 +29,16 @@
 sandbox_test_folder = '/openhands/workspace'
 
 
-def _get_runtime_sid(runtime: Runtime):
+def _get_runtime_sid(runtime: Runtime) -> str:
     logger.debug(f'\nruntime.sid: {runtime.sid}')
     return runtime.sid
 
 
-def _get_host_folder(runtime: Runtime):
+def _get_host_folder(runtime: Runtime) -> str:
     return runtime.config.workspace_mount_path
 
 
-def _get_sandbox_folder(runtime: Runtime):
+def _get_sandbox_folder(runtime: Runtime) -> Path | None:
     sid = _get_runtime_sid(runtime)
     if sid:
         return Path(os.path.join(sandbox_test_folder, sid))
@@ -61,7 +61,7 @@ def _remove_folder(folder: str) -> bool:
     return success
 
 
-def _close_test_runtime(runtime: Runtime):
+def _close_test_runtime(runtime: Runtime) -> None:
     if isinstance(runtime, EventStreamRuntime):
         runtime.close(rm_all_containers=False)
     else:
@@ -69,7 +69,7 @@ def _close_test_runtime(runtime: Runtime):
     time.sleep(1)
 
 
-def _reset_pwd():
+def _reset_pwd() -> None:
     global project_dir
     # Try to change back to project directory
     try:
@@ -97,6 +97,7 @@ def print_method_name(request):
 @pytest.fixture
 def temp_dir(tmp_path_factory: TempPathFactory, request) -> str:
     """Creates a unique temporary directory.
+
     Upon finalization, the temporary directory and its content is removed.
     The cleanup function is also called upon KeyboardInterrupt.
 
@@ -126,7 +127,7 @@ def cleanup():
 
 
 # Depending on TEST_RUNTIME, feed the appropriate box class(es) to the test.
-def get_runtime_classes():
+def get_runtime_classes() -> list[type[Runtime]]:
     runtime = TEST_RUNTIME
     if runtime.lower() == 'eventstream':
         return [EventStreamRuntime]
@@ -138,7 +139,7 @@ def get_runtime_classes():
         raise ValueError(f'Invalid runtime: {runtime}')
 
 
-def get_run_as_openhands():
+def get_run_as_openhands() -> list[bool]:
     print(
         '\n\n########################################################################'
     )
diff --git a/tests/unit/resolver/test_guess_success.py b/tests/unit/resolver/test_guess_success.py
index d6b0e946adda..9d1b55487118 100644
--- a/tests/unit/resolver/test_guess_success.py
+++ b/tests/unit/resolver/test_guess_success.py
@@ -1,7 +1,10 @@
+from unittest.mock import MagicMock, patch
+
 from openhands.core.config import LLMConfig
 from openhands.events.action.message import MessageAction
+from openhands.llm import LLM
 from openhands.resolver.github_issue import GithubIssue
-from openhands.resolver.issue_definitions import IssueHandler
+from openhands.resolver.issue_definitions import IssueHandler, PRHandler
 
 
 def test_guess_success_multiline_explanation():
@@ -19,7 +22,11 @@ def test_guess_success_multiline_explanation():
     llm_config = LLMConfig(model='test', api_key='test')
 
     # Create a mock response with multi-line explanation
-    mock_response = """--- success
+    mock_response = MagicMock()
+    mock_response.choices = [
+        MagicMock(
+            message=MagicMock(
+                content="""--- success
 true
 
 --- explanation
@@ -29,35 +36,17 @@ def test_guess_success_multiline_explanation():
 - Updated documentation C
 
 Automatic fix generated by OpenHands 🙌"""
+            )
+        )
+    ]
 
-    # Create a handler instance
-    handler = IssueHandler('test', 'test', 'test')
-
-    # Mock the litellm.completion call
-    def mock_completion(*args, **kwargs):
-        class MockResponse:
-            class Choice:
-                class Message:
-                    def __init__(self, content):
-                        self.content = content
-
-                def __init__(self, content):
-                    self.message = self.Message(content)
-
-            def __init__(self, content):
-                self.choices = [self.Choice(content)]
-
-        return MockResponse(mock_response)
-
-    # Patch the litellm.completion function
-    import litellm
-
-    original_completion = litellm.completion
-    litellm.completion = mock_completion
+    # Use patch to mock the LLM completion call
+    with patch.object(LLM, 'completion', return_value=mock_response) as mock_completion:
+        # Create a handler instance
+        handler = IssueHandler('test', 'test', 'test', llm_config)
 
-    try:
         # Call guess_success
-        success, _, explanation = handler.guess_success(issue, history, llm_config)
+        success, _, explanation = handler.guess_success(issue, history)
 
         # Verify the results
         assert success is True
@@ -66,6 +55,136 @@ def __init__(self, content):
         assert 'Added test B' in explanation
         assert 'Updated documentation C' in explanation
         assert 'Automatic fix generated by OpenHands' in explanation
-    finally:
-        # Restore the original function
-        litellm.completion = original_completion
+
+        # Verify that LLM completion was called exactly once
+        mock_completion.assert_called_once()
+
+
+def test_pr_handler_guess_success_with_thread_comments():
+    # Create a PR handler instance
+    llm_config = LLMConfig(model='test', api_key='test')
+    handler = PRHandler('test-owner', 'test-repo', 'test-token', llm_config)
+
+    # Create a mock issue with thread comments but no review comments
+    issue = GithubIssue(
+        owner='test-owner',
+        repo='test-repo',
+        number=1,
+        title='Test PR',
+        body='Test Body',
+        thread_comments=['First comment', 'Second comment'],
+        closing_issues=['Issue description'],
+        review_comments=None,
+        thread_ids=None,
+        head_branch='test-branch',
+    )
+
+    # Create mock history
+    history = [MessageAction(content='Fixed the issue by implementing X and Y')]
+
+    # Create mock LLM config
+    llm_config = LLMConfig(model='test-model', api_key='test-key')
+
+    # Mock the LLM response
+    mock_response = MagicMock()
+    mock_response.choices = [
+        MagicMock(
+            message=MagicMock(
+                content="""--- success
+true
+
+--- explanation
+The changes successfully address the feedback."""
+            )
+        )
+    ]
+
+    # Test the guess_success method
+    with patch.object(LLM, 'completion', return_value=mock_response):
+        success, success_list, explanation = handler.guess_success(issue, history)
+
+        # Verify the results
+        assert success is True
+        assert success_list == [True]
+        assert 'successfully address' in explanation
+
+
+def test_pr_handler_guess_success_only_review_comments():
+    # Create a PR handler instance
+    llm_config = LLMConfig(model='test', api_key='test')
+    handler = PRHandler('test-owner', 'test-repo', 'test-token', llm_config)
+
+    # Create a mock issue with only review comments
+    issue = GithubIssue(
+        owner='test-owner',
+        repo='test-repo',
+        number=1,
+        title='Test PR',
+        body='Test Body',
+        thread_comments=None,
+        closing_issues=['Issue description'],
+        review_comments=['Please fix the formatting', 'Add more tests'],
+        thread_ids=None,
+        head_branch='test-branch',
+    )
+
+    # Create mock history
+    history = [MessageAction(content='Fixed the formatting and added more tests')]
+
+    # Create mock LLM config
+    llm_config = LLMConfig(model='test-model', api_key='test-key')
+
+    # Mock the LLM response
+    mock_response = MagicMock()
+    mock_response.choices = [
+        MagicMock(
+            message=MagicMock(
+                content="""--- success
+true
+
+--- explanation
+The changes successfully address the review comments."""
+            )
+        )
+    ]
+
+    # Test the guess_success method
+    with patch.object(LLM, 'completion', return_value=mock_response):
+        success, success_list, explanation = handler.guess_success(issue, history)
+
+        # Verify the results
+        assert success is True
+        assert success_list == [True]
+        assert 'successfully address' in explanation
+
+
+def test_pr_handler_guess_success_no_comments():
+    # Create a PR handler instance
+    llm_config = LLMConfig(model='test', api_key='test')
+    handler = PRHandler('test-owner', 'test-repo', 'test-token', llm_config)
+
+    # Create a mock issue with no comments
+    issue = GithubIssue(
+        owner='test-owner',
+        repo='test-repo',
+        number=1,
+        title='Test PR',
+        body='Test Body',
+        thread_comments=None,
+        closing_issues=['Issue description'],
+        review_comments=None,
+        thread_ids=None,
+        head_branch='test-branch',
+    )
+
+    # Create mock history
+    history = [MessageAction(content='Fixed the issue')]
+
+    # Create mock LLM config
+    llm_config = LLMConfig(model='test-model', api_key='test-key')
+
+    # Test that it returns appropriate message when no comments are present
+    success, success_list, explanation = handler.guess_success(issue, history)
+    assert success is False
+    assert success_list is None
+    assert explanation == 'No feedback was found to process'
diff --git a/tests/unit/resolver/test_issue_handler.py b/tests/unit/resolver/test_issue_handler.py
index d0c17d9088e9..7eb20a585e5b 100644
--- a/tests/unit/resolver/test_issue_handler.py
+++ b/tests/unit/resolver/test_issue_handler.py
@@ -1,8 +1,7 @@
 from unittest.mock import MagicMock, patch
 
 from openhands.core.config import LLMConfig
-from openhands.events.action.message import MessageAction
-from openhands.resolver.github_issue import GithubIssue, ReviewThread
+from openhands.resolver.github_issue import ReviewThread
 from openhands.resolver.issue_definitions import IssueHandler, PRHandler
 
 
@@ -27,7 +26,8 @@ def test_get_converted_issues_initializes_review_comments():
         ]  # Need two comment responses because we make two API calls
 
         # Create an instance of IssueHandler
-        handler = IssueHandler('test-owner', 'test-repo', 'test-token')
+        llm_config = LLMConfig(model='test', api_key='test')
+        handler = IssueHandler('test-owner', 'test-repo', 'test-token', llm_config)
 
         # Get converted issues
         issues = handler.get_converted_issues(issue_numbers=[1])
@@ -46,56 +46,6 @@ def test_get_converted_issues_initializes_review_comments():
         assert issues[0].repo == 'test-repo'
 
 
-def test_pr_handler_guess_success_with_thread_comments():
-    # Create a PR handler instance
-    handler = PRHandler('test-owner', 'test-repo', 'test-token')
-
-    # Create a mock issue with thread comments but no review comments
-    issue = GithubIssue(
-        owner='test-owner',
-        repo='test-repo',
-        number=1,
-        title='Test PR',
-        body='Test Body',
-        thread_comments=['First comment', 'Second comment'],
-        closing_issues=['Issue description'],
-        review_comments=None,
-        thread_ids=None,
-        head_branch='test-branch',
-    )
-
-    # Create mock history
-    history = [MessageAction(content='Fixed the issue by implementing X and Y')]
-
-    # Create mock LLM config
-    llm_config = LLMConfig(model='test-model', api_key='test-key')
-
-    # Mock the LLM response
-    mock_response = MagicMock()
-    mock_response.choices = [
-        MagicMock(
-            message=MagicMock(
-                content="""--- success
-true
-
---- explanation
-The changes successfully address the feedback."""
-            )
-        )
-    ]
-
-    # Test the guess_success method
-    with patch('litellm.completion', return_value=mock_response):
-        success, success_list, explanation = handler.guess_success(
-            issue, history, llm_config
-        )
-
-        # Verify the results
-        assert success is True
-        assert success_list == [True]
-        assert 'successfully address' in explanation
-
-
 def test_pr_handler_get_converted_issues_with_comments():
     # Mock the necessary dependencies
     with patch('requests.get') as mock_get:
@@ -155,7 +105,8 @@ def test_pr_handler_get_converted_issues_with_comments():
             mock_post.return_value = mock_graphql_response
 
             # Create an instance of PRHandler
-            handler = PRHandler('test-owner', 'test-repo', 'test-token')
+            llm_config = LLMConfig(model='test', api_key='test')
+            handler = PRHandler('test-owner', 'test-repo', 'test-token', llm_config)
 
             # Get converted issues
             prs = handler.get_converted_issues(issue_numbers=[1])
@@ -178,89 +129,6 @@ def test_pr_handler_get_converted_issues_with_comments():
             ]
 
 
-def test_pr_handler_guess_success_only_review_comments():
-    # Create a PR handler instance
-    handler = PRHandler('test-owner', 'test-repo', 'test-token')
-
-    # Create a mock issue with only review comments
-    issue = GithubIssue(
-        owner='test-owner',
-        repo='test-repo',
-        number=1,
-        title='Test PR',
-        body='Test Body',
-        thread_comments=None,
-        closing_issues=['Issue description'],
-        review_comments=['Please fix the formatting', 'Add more tests'],
-        thread_ids=None,
-        head_branch='test-branch',
-    )
-
-    # Create mock history
-    history = [MessageAction(content='Fixed the formatting and added more tests')]
-
-    # Create mock LLM config
-    llm_config = LLMConfig(model='test-model', api_key='test-key')
-
-    # Mock the LLM response
-    mock_response = MagicMock()
-    mock_response.choices = [
-        MagicMock(
-            message=MagicMock(
-                content="""--- success
-true
-
---- explanation
-The changes successfully address the review comments."""
-            )
-        )
-    ]
-
-    # Test the guess_success method
-    with patch('litellm.completion', return_value=mock_response):
-        success, success_list, explanation = handler.guess_success(
-            issue, history, llm_config
-        )
-
-        # Verify the results
-        assert success is True
-        assert success_list == [True]
-        assert 'successfully address' in explanation
-
-
-def test_pr_handler_guess_success_no_comments():
-    # Create a PR handler instance
-    handler = PRHandler('test-owner', 'test-repo', 'test-token')
-
-    # Create a mock issue with no comments
-    issue = GithubIssue(
-        owner='test-owner',
-        repo='test-repo',
-        number=1,
-        title='Test PR',
-        body='Test Body',
-        thread_comments=None,
-        closing_issues=['Issue description'],
-        review_comments=None,
-        thread_ids=None,
-        head_branch='test-branch',
-    )
-
-    # Create mock history
-    history = [MessageAction(content='Fixed the issue')]
-
-    # Create mock LLM config
-    llm_config = LLMConfig(model='test-model', api_key='test-key')
-
-    # Test that it returns appropriate message when no comments are present
-    success, success_list, explanation = handler.guess_success(
-        issue, history, llm_config
-    )
-    assert success is False
-    assert success_list is None
-    assert explanation == 'No feedback was found to process'
-
-
 def test_get_issue_comments_with_specific_comment_id():
     # Mock the necessary dependencies
     with patch('requests.get') as mock_get:
@@ -274,7 +142,8 @@ def test_get_issue_comments_with_specific_comment_id():
         mock_get.return_value = mock_comments_response
 
         # Create an instance of IssueHandler
-        handler = IssueHandler('test-owner', 'test-repo', 'test-token')
+        llm_config = LLMConfig(model='test', api_key='test')
+        handler = IssueHandler('test-owner', 'test-repo', 'test-token', llm_config)
 
         # Get comments with a specific comment_id
         specific_comment = handler._get_issue_comments(issue_number=1, comment_id=123)
@@ -361,7 +230,8 @@ def test_pr_handler_get_converted_issues_with_specific_thread_comment():
             mock_post.return_value = mock_graphql_response
 
             # Create an instance of PRHandler
-            handler = PRHandler('test-owner', 'test-repo', 'test-token')
+            llm_config = LLMConfig(model='test', api_key='test')
+            handler = PRHandler('test-owner', 'test-repo', 'test-token', llm_config)
 
             # Get converted issues
             prs = handler.get_converted_issues(
@@ -463,7 +333,8 @@ def test_pr_handler_get_converted_issues_with_specific_review_thread_comment():
             mock_post.return_value = mock_graphql_response
 
             # Create an instance of PRHandler
-            handler = PRHandler('test-owner', 'test-repo', 'test-token')
+            llm_config = LLMConfig(model='test', api_key='test')
+            handler = PRHandler('test-owner', 'test-repo', 'test-token', llm_config)
 
             # Get converted issues
             prs = handler.get_converted_issues(
@@ -585,7 +456,8 @@ def test_pr_handler_get_converted_issues_with_specific_comment_and_issue_refs():
             mock_post.return_value = mock_graphql_response
 
             # Create an instance of PRHandler
-            handler = PRHandler('test-owner', 'test-repo', 'test-token')
+            llm_config = LLMConfig(model='test', api_key='test')
+            handler = PRHandler('test-owner', 'test-repo', 'test-token', llm_config)
 
             # Get converted issues
             prs = handler.get_converted_issues(
@@ -684,7 +556,8 @@ def test_pr_handler_get_converted_issues_with_duplicate_issue_refs():
             mock_post.return_value = mock_graphql_response
 
             # Create an instance of PRHandler
-            handler = PRHandler('test-owner', 'test-repo', 'test-token')
+            llm_config = LLMConfig(model='test', api_key='test')
+            handler = PRHandler('test-owner', 'test-repo', 'test-token', llm_config)
 
             # Get converted issues
             prs = handler.get_converted_issues(issue_numbers=[1])
diff --git a/tests/unit/resolver/test_issue_handler_error_handling.py b/tests/unit/resolver/test_issue_handler_error_handling.py
index 2b04e3b13111..93a98437168e 100644
--- a/tests/unit/resolver/test_issue_handler_error_handling.py
+++ b/tests/unit/resolver/test_issue_handler_error_handling.py
@@ -1,12 +1,39 @@
 from unittest.mock import MagicMock, patch
 
+import pytest
 import requests
+from litellm.exceptions import RateLimitError
 
-from openhands.resolver.issue_definitions import PRHandler
+from openhands.core.config import LLMConfig
+from openhands.events.action.message import MessageAction
+from openhands.llm.llm import LLM
+from openhands.resolver.github_issue import GithubIssue
+from openhands.resolver.issue_definitions import IssueHandler, PRHandler
+
+
+@pytest.fixture(autouse=True)
+def mock_logger(monkeypatch):
+    # suppress logging of completion data to file
+    mock_logger = MagicMock()
+    monkeypatch.setattr('openhands.llm.debug_mixin.llm_prompt_logger', mock_logger)
+    monkeypatch.setattr('openhands.llm.debug_mixin.llm_response_logger', mock_logger)
+    return mock_logger
+
+
+@pytest.fixture
+def default_config():
+    return LLMConfig(
+        model='gpt-4o',
+        api_key='test_key',
+        num_retries=2,
+        retry_min_wait=1,
+        retry_max_wait=2,
+    )
 
 
 def test_handle_nonexistent_issue_reference():
-    handler = PRHandler('test-owner', 'test-repo', 'test-token')
+    llm_config = LLMConfig(model='test', api_key='test')
+    handler = PRHandler('test-owner', 'test-repo', 'test-token', llm_config)
 
     # Mock the requests.get to simulate a 404 error
     mock_response = MagicMock()
@@ -30,7 +57,8 @@ def test_handle_nonexistent_issue_reference():
 
 
 def test_handle_rate_limit_error():
-    handler = PRHandler('test-owner', 'test-repo', 'test-token')
+    llm_config = LLMConfig(model='test', api_key='test')
+    handler = PRHandler('test-owner', 'test-repo', 'test-token', llm_config)
 
     # Mock the requests.get to simulate a rate limit error
     mock_response = MagicMock()
@@ -54,7 +82,8 @@ def test_handle_rate_limit_error():
 
 
 def test_handle_network_error():
-    handler = PRHandler('test-owner', 'test-repo', 'test-token')
+    llm_config = LLMConfig(model='test', api_key='test')
+    handler = PRHandler('test-owner', 'test-repo', 'test-token', llm_config)
 
     # Mock the requests.get to simulate a network error
     with patch(
@@ -75,7 +104,8 @@ def test_handle_network_error():
 
 
 def test_successful_issue_reference():
-    handler = PRHandler('test-owner', 'test-repo', 'test-token')
+    llm_config = LLMConfig(model='test', api_key='test')
+    handler = PRHandler('test-owner', 'test-repo', 'test-token', llm_config)
 
     # Mock a successful response
     mock_response = MagicMock()
@@ -95,3 +125,141 @@ def test_successful_issue_reference():
 
         # The method should return a list with the referenced issue body
         assert result == ['This is the referenced issue body']
+
+
+class MockLLMResponse:
+    """Mock LLM Response class to mimic the actual LLM response structure."""
+
+    class Choice:
+        class Message:
+            def __init__(self, content):
+                self.content = content
+
+        def __init__(self, content):
+            self.message = self.Message(content)
+
+    def __init__(self, content):
+        self.choices = [self.Choice(content)]
+
+
+class DotDict(dict):
+    """
+    A dictionary that supports dot notation access.
+    """
+
+    def __init__(self, *args, **kwargs):
+        super().__init__(*args, **kwargs)
+        for key, value in self.items():
+            if isinstance(value, dict):
+                self[key] = DotDict(value)
+            elif isinstance(value, list):
+                self[key] = [
+                    DotDict(item) if isinstance(item, dict) else item for item in value
+                ]
+
+    def __getattr__(self, key):
+        if key in self:
+            return self[key]
+        else:
+            raise AttributeError(
+                f"'{self.__class__.__name__}' object has no attribute '{key}'"
+            )
+
+    def __setattr__(self, key, value):
+        self[key] = value
+
+    def __delattr__(self, key):
+        if key in self:
+            del self[key]
+        else:
+            raise AttributeError(
+                f"'{self.__class__.__name__}' object has no attribute '{key}'"
+            )
+
+
+@patch('openhands.llm.llm.litellm_completion')
+def test_guess_success_rate_limit_wait_time(mock_litellm_completion, default_config):
+    """Test that the retry mechanism in guess_success respects wait time between retries."""
+
+    with patch('time.sleep') as mock_sleep:
+        # Simulate a rate limit error followed by a successful response
+        mock_litellm_completion.side_effect = [
+            RateLimitError(
+                'Rate limit exceeded', llm_provider='test_provider', model='test_model'
+            ),
+            DotDict(
+                {
+                    'choices': [
+                        {
+                            'message': {
+                                'content': '--- success\ntrue\n--- explanation\nRetry successful'
+                            }
+                        }
+                    ]
+                }
+            ),
+        ]
+
+        llm = LLM(config=default_config)
+        handler = IssueHandler('test-owner', 'test-repo', 'test-token', default_config)
+        handler.llm = llm
+
+        # Mock issue and history
+        issue = GithubIssue(
+            owner='test-owner',
+            repo='test-repo',
+            number=1,
+            title='Test Issue',
+            body='This is a test issue.',
+            thread_comments=['Please improve error handling'],
+        )
+        history = [MessageAction(content='Fixed error handling.')]
+
+        # Call guess_success
+        success, _, explanation = handler.guess_success(issue, history)
+
+        # Assertions
+        assert success is True
+        assert explanation == 'Retry successful'
+        assert mock_litellm_completion.call_count == 2  # Two attempts made
+        mock_sleep.assert_called_once()  # Sleep called once between retries
+
+        # Validate wait time
+        wait_time = mock_sleep.call_args[0][0]
+        assert (
+            default_config.retry_min_wait <= wait_time <= default_config.retry_max_wait
+        ), f'Expected wait time between {default_config.retry_min_wait} and {default_config.retry_max_wait} seconds, but got {wait_time}'
+
+
+@patch('openhands.llm.llm.litellm_completion')
+def test_guess_success_exhausts_retries(mock_completion, default_config):
+    """Test the retry mechanism in guess_success exhausts retries and raises an error."""
+    # Simulate persistent rate limit errors by always raising RateLimitError
+    mock_completion.side_effect = RateLimitError(
+        'Rate limit exceeded', llm_provider='test_provider', model='test_model'
+    )
+
+    # Initialize LLM and handler
+    llm = LLM(config=default_config)
+    handler = PRHandler('test-owner', 'test-repo', 'test-token', default_config)
+    handler.llm = llm
+
+    # Mock issue and history
+    issue = GithubIssue(
+        owner='test-owner',
+        repo='test-repo',
+        number=1,
+        title='Test Issue',
+        body='This is a test issue.',
+        thread_comments=['Please improve error handling'],
+    )
+    history = [MessageAction(content='Fixed error handling.')]
+
+    # Call guess_success and expect it to raise an error after retries
+    with pytest.raises(RateLimitError):
+        handler.guess_success(issue, history)
+
+    # Assertions
+    assert (
+        mock_completion.call_count == default_config.num_retries
+    )  # Initial call + retries
diff --git a/tests/unit/resolver/test_issue_references.py b/tests/unit/resolver/test_issue_references.py
index 1252f8555540..409f276d5abc 100644
--- a/tests/unit/resolver/test_issue_references.py
+++ b/tests/unit/resolver/test_issue_references.py
@@ -1,8 +1,10 @@
+from openhands.core.config.llm_config import LLMConfig
 from openhands.resolver.issue_definitions import IssueHandler
 
 
 def test_extract_issue_references():
-    handler = IssueHandler('test-owner', 'test-repo', 'test-token')
+    llm_config = LLMConfig(model='test', api_key='test')
+    handler = IssueHandler('test-owner', 'test-repo', 'test-token', llm_config)
 
     # Test basic issue reference
     assert handler._extract_issue_references('Fixes #123') == [123]
diff --git a/tests/unit/resolver/test_pr_handler_guess_success.py b/tests/unit/resolver/test_pr_handler_guess_success.py
index e7e7705e8747..de0495691529 100644
--- a/tests/unit/resolver/test_pr_handler_guess_success.py
+++ b/tests/unit/resolver/test_pr_handler_guess_success.py
@@ -3,14 +3,23 @@
 
 from openhands.core.config import LLMConfig
 from openhands.events.action.message import MessageAction
+from openhands.llm.llm import LLM
 from openhands.resolver.github_issue import GithubIssue, ReviewThread
 from openhands.resolver.issue_definitions import PRHandler
 
 
+def mock_llm_response(content):
+    """Helper function to create a mock LLM response."""
+    mock_response = MagicMock()
+    mock_response.choices = [MagicMock(message=MagicMock(content=content))]
+    return mock_response
+
+
 def test_guess_success_review_threads_litellm_call():
     """Test that the litellm.completion() call for review threads contains the expected content."""
     # Create a PR handler instance
-    handler = PRHandler('test-owner', 'test-repo', 'test-token')
+    llm_config = LLMConfig(model='test', api_key='test')
+    handler = PRHandler('test-owner', 'test-repo', 'test-token', llm_config)
 
     # Create a mock issue with review threads
     issue = GithubIssue(
@@ -64,11 +73,9 @@ def test_guess_success_review_threads_litellm_call():
     ]
 
     # Test the guess_success method
-    with patch('litellm.completion') as mock_completion:
+    with patch.object(LLM, 'completion') as mock_completion:
         mock_completion.return_value = mock_response
-        success, success_list, explanation = handler.guess_success(
-            issue, history, llm_config
-        )
+        success, success_list, explanation = handler.guess_success(issue, history)
 
         # Verify the litellm.completion() calls
         assert mock_completion.call_count == 2  # One call per review thread
@@ -114,7 +121,8 @@ def test_guess_success_review_threads_litellm_call():
 def test_guess_success_thread_comments_litellm_call():
     """Test that the litellm.completion() call for thread comments contains the expected content."""
     # Create a PR handler instance
-    handler = PRHandler('test-owner', 'test-repo', 'test-token')
+    llm_config = LLMConfig(model='test', api_key='test')
+    handler = PRHandler('test-owner', 'test-repo', 'test-token', llm_config)
 
     # Create a mock issue with thread comments
     issue = GithubIssue(
@@ -162,11 +170,9 @@ def test_guess_success_thread_comments_litellm_call():
     ]
 
     # Test the guess_success method
-    with patch('litellm.completion') as mock_completion:
+    with patch.object(LLM, 'completion') as mock_completion:
         mock_completion.return_value = mock_response
-        success, success_list, explanation = handler.guess_success(
-            issue, history, llm_config
-        )
+        success, success_list, explanation = handler.guess_success(issue, history)
 
         # Verify the litellm.completion() call
         mock_completion.assert_called_once()
@@ -186,10 +192,8 @@ def test_guess_success_thread_comments_litellm_call():
 def test_check_feedback_with_llm():
     """Test the _check_feedback_with_llm helper function."""
     # Create a PR handler instance
-    handler = PRHandler('test-owner', 'test-repo', 'test-token')
-
-    # Create mock LLM config
-    llm_config = LLMConfig(model='test-model', api_key='test-key')
+    llm_config = LLMConfig(model='test', api_key='test')
+    handler = PRHandler('test-owner', 'test-repo', 'test-token', llm_config)
 
     # Test cases for different LLM responses
     test_cases = [
@@ -220,17 +224,16 @@ def test_check_feedback_with_llm():
         mock_response.choices = [MagicMock(message=MagicMock(content=case['response']))]
 
         # Test the function
-        with patch('litellm.completion', return_value=mock_response):
-            success, explanation = handler._check_feedback_with_llm(
-                'test prompt', llm_config
-            )
+        with patch.object(LLM, 'completion', return_value=mock_response):
+            success, explanation = handler._check_feedback_with_llm('test prompt')
             assert (success, explanation) == case['expected']
 
 
 def test_check_review_thread():
     """Test the _check_review_thread helper function."""
     # Create a PR handler instance
-    handler = PRHandler('test-owner', 'test-repo', 'test-token')
+    llm_config = LLMConfig(model='test', api_key='test')
+    handler = PRHandler('test-owner', 'test-repo', 'test-token', llm_config)
 
     # Create test data
     review_thread = ReviewThread(
@@ -241,7 +244,6 @@ def test_check_review_thread():
         ['Issue 1 description', 'Issue 2 description'], indent=4
     )
     last_message = 'I have fixed the formatting and added docstrings'
-    llm_config = LLMConfig(model='test-model', api_key='test-key')
 
     # Mock the LLM response
     mock_response = MagicMock()
@@ -258,10 +260,10 @@ def test_check_review_thread():
     ]
 
     # Test the function
-    with patch('litellm.completion') as mock_completion:
+    with patch.object(LLM, 'completion') as mock_completion:
         mock_completion.return_value = mock_response
         success, explanation = handler._check_review_thread(
-            review_thread, issues_context, last_message, llm_config
+            review_thread, issues_context, last_message
         )
 
         # Verify the litellm.completion() call
@@ -285,7 +287,8 @@ def test_check_review_thread():
 def test_check_thread_comments():
     """Test the _check_thread_comments helper function."""
     # Create a PR handler instance
-    handler = PRHandler('test-owner', 'test-repo', 'test-token')
+    llm_config = LLMConfig(model='test', api_key='test')
+    handler = PRHandler('test-owner', 'test-repo', 'test-token', llm_config)
 
     # Create test data
     thread_comments = [
@@ -297,7 +300,6 @@ def test_check_thread_comments():
         ['Issue 1 description', 'Issue 2 description'], indent=4
     )
     last_message = 'I have added error handling and input validation'
-    llm_config = LLMConfig(model='test-model', api_key='test-key')
 
     # Mock the LLM response
     mock_response = MagicMock()
@@ -314,10 +316,10 @@ def test_check_thread_comments():
     ]
 
     # Test the function
-    with patch('litellm.completion') as mock_completion:
+    with patch.object(LLM, 'completion') as mock_completion:
         mock_completion.return_value = mock_response
         success, explanation = handler._check_thread_comments(
-            thread_comments, issues_context, last_message, llm_config
+            thread_comments, issues_context, last_message
         )
 
         # Verify the litellm.completion() call
@@ -338,7 +340,8 @@ def test_check_thread_comments():
 def test_check_review_comments():
     """Test the _check_review_comments helper function."""
     # Create a PR handler instance
-    handler = PRHandler('test-owner', 'test-repo', 'test-token')
+    llm_config = LLMConfig(model='test', api_key='test')
+    handler = PRHandler('test-owner', 'test-repo', 'test-token', llm_config)
 
     # Create test data
     review_comments = [
@@ -350,7 +353,6 @@ def test_check_review_comments():
         ['Issue 1 description', 'Issue 2 description'], indent=4
     )
     last_message = 'I have improved code readability and added comments'
-    llm_config = LLMConfig(model='test-model', api_key='test-key')
 
     # Mock the LLM response
     mock_response = MagicMock()
@@ -367,10 +369,10 @@ def test_check_review_comments():
     ]
 
     # Test the function
-    with patch('litellm.completion') as mock_completion:
+    with patch.object(LLM, 'completion') as mock_completion:
         mock_completion.return_value = mock_response
         success, explanation = handler._check_review_comments(
-            review_comments, issues_context, last_message, llm_config
+            review_comments, issues_context, last_message
         )
 
         # Verify the litellm.completion() call
@@ -391,7 +393,8 @@ def test_check_review_comments():
 def test_guess_success_review_comments_litellm_call():
     """Test that the litellm.completion() call for review comments contains the expected content."""
     # Create a PR handler instance
-    handler = PRHandler('test-owner', 'test-repo', 'test-token')
+    llm_config = LLMConfig(model='test', api_key='test')
+    handler = PRHandler('test-owner', 'test-repo', 'test-token', llm_config)
 
     # Create a mock issue with review comments
     issue = GithubIssue(
@@ -421,9 +424,6 @@ def test_guess_success_review_comments_litellm_call():
         )
     ]
 
-    # Create mock LLM config
-    llm_config = LLMConfig(model='test-model', api_key='test-key')
-
     # Mock the LLM response
     mock_response = MagicMock()
     mock_response.choices = [
@@ -439,11 +439,9 @@ def test_guess_success_review_comments_litellm_call():
     ]
 
     # Test the guess_success method
-    with patch('litellm.completion') as mock_completion:
+    with patch.object(LLM, 'completion') as mock_completion:
         mock_completion.return_value = mock_response
-        success, success_list, explanation = handler.guess_success(
-            issue, history, llm_config
-        )
+        success, success_list, explanation = handler.guess_success(issue, history)
 
         # Verify the litellm.completion() call
         mock_completion.assert_called_once()
diff --git a/tests/unit/resolver/test_resolve_issues.py b/tests/unit/resolver/test_resolve_issues.py
index 95da25fc2190..8d54adb87627 100644
--- a/tests/unit/resolver/test_resolve_issues.py
+++ b/tests/unit/resolver/test_resolve_issues.py
@@ -7,6 +7,7 @@
 from openhands.core.config import LLMConfig
 from openhands.events.action import CmdRunAction
 from openhands.events.observation import CmdOutputObservation, NullObservation
+from openhands.llm.llm import LLM
 from openhands.resolver.github_issue import GithubIssue, ReviewThread
 from openhands.resolver.issue_definitions import IssueHandler, PRHandler
 from openhands.resolver.resolve_issue import (
@@ -84,7 +85,8 @@ def test_initialize_runtime():
 
 
 def test_download_issues_from_github():
-    handler = IssueHandler('owner', 'repo', 'token')
+    llm_config = LLMConfig(model='test', api_key='test')
+    handler = IssueHandler('owner', 'repo', 'token', llm_config)
 
     mock_issues_response = MagicMock()
     mock_issues_response.json.side_effect = [
@@ -125,7 +127,8 @@ def get_mock_response(url, *args, **kwargs):
 
 
 def test_download_pr_from_github():
-    handler = PRHandler('owner', 'repo', 'token')
+    llm_config = LLMConfig(model='test', api_key='test')
+    handler = PRHandler('owner', 'repo', 'token', llm_config)
     mock_pr_response = MagicMock()
     mock_pr_response.json.side_effect = [
         [
@@ -442,7 +445,8 @@ def test_get_instruction(mock_prompt_template, mock_followup_prompt_template):
         title='Test Issue',
         body='This is a test issue refer to image ![First Image](https://sampleimage.com/image1.png)',
     )
-    issue_handler = IssueHandler('owner', 'repo', 'token')
+    mock_llm_config = LLMConfig(model='test_model', api_key='test_api_key')
+    issue_handler = IssueHandler('owner', 'repo', 'token', mock_llm_config)
     instruction, images_urls = issue_handler.get_instruction(
         issue, mock_prompt_template, None
     )
@@ -470,7 +474,7 @@ def test_get_instruction(mock_prompt_template, mock_followup_prompt_template):
         ],
     )
 
-    pr_handler = PRHandler('owner', 'repo', 'token')
+    pr_handler = PRHandler('owner', 'repo', 'token', mock_llm_config)
     instruction, images_urls = pr_handler.get_instruction(
         issue, mock_followup_prompt_template, None
     )
@@ -493,7 +497,8 @@ def test_file_instruction():
     with open('openhands/resolver/prompts/resolve/basic.jinja', 'r') as f:
         prompt = f.read()
     # Test without thread comments
-    issue_handler = IssueHandler('owner', 'repo', 'token')
+    mock_llm_config = LLMConfig(model='test_model', api_key='test_api_key')
+    issue_handler = IssueHandler('owner', 'repo', 'token', mock_llm_config)
     instruction, images_urls = issue_handler.get_instruction(issue, prompt, None)
     expected_instruction = """Please fix the following issue for the repository in /workspace.
 An environment has been set up for you to start working. You may assume all necessary tools are installed.
@@ -530,7 +535,8 @@ def test_file_instruction_with_repo_instruction():
     ) as f:
         repo_instruction = f.read()
 
-    issue_handler = IssueHandler('owner', 'repo', 'token')
+    mock_llm_config = LLMConfig(model='test_model', api_key='test_api_key')
+    issue_handler = IssueHandler('owner', 'repo', 'token', mock_llm_config)
     instruction, image_urls = issue_handler.get_instruction(
         issue, prompt, repo_instruction
     )
@@ -581,11 +587,13 @@ def test_guess_success():
             )
         )
     ]
-    issue_handler = IssueHandler('owner', 'repo', 'token')
+    issue_handler = IssueHandler('owner', 'repo', 'token', mock_llm_config)
 
-    with patch('litellm.completion', MagicMock(return_value=mock_completion_response)):
+    with patch.object(
+        LLM, 'completion', MagicMock(return_value=mock_completion_response)
+    ):
         success, comment_success, explanation = issue_handler.guess_success(
-            mock_issue, mock_history, mock_llm_config
+            mock_issue, mock_history
         )
         assert issue_handler.issue_type == 'issue'
         assert comment_success is None
@@ -617,11 +625,13 @@ def test_guess_success_with_thread_comments():
             )
         )
     ]
-    issue_handler = IssueHandler('owner', 'repo', 'token')
+    issue_handler = IssueHandler('owner', 'repo', 'token', mock_llm_config)
 
-    with patch('litellm.completion', MagicMock(return_value=mock_completion_response)):
+    with patch.object(
+        LLM, 'completion', MagicMock(return_value=mock_completion_response)
+    ):
         success, comment_success, explanation = issue_handler.guess_success(
-            mock_issue, mock_history, mock_llm_config
+            mock_issue, mock_history
         )
         assert issue_handler.issue_type == 'issue'
         assert comment_success is None
@@ -648,7 +658,8 @@ def test_instruction_with_thread_comments():
     with open('openhands/resolver/prompts/resolve/basic.jinja', 'r') as f:
         prompt = f.read()
 
-    issue_handler = IssueHandler('owner', 'repo', 'token')
+    llm_config = LLMConfig(model='test', api_key='test')
+    issue_handler = IssueHandler('owner', 'repo', 'token', llm_config)
     instruction, images_urls = issue_handler.get_instruction(issue, prompt, None)
 
     # Verify that thread comments are included in the instruction
@@ -683,11 +694,13 @@ def test_guess_success_failure():
             )
         )
     ]
-    issue_handler = IssueHandler('owner', 'repo', 'token')
+    issue_handler = IssueHandler('owner', 'repo', 'token', mock_llm_config)
 
-    with patch('litellm.completion', MagicMock(return_value=mock_completion_response)):
+    with patch.object(
+        LLM, 'completion', MagicMock(return_value=mock_completion_response)
+    ):
         success, comment_success, explanation = issue_handler.guess_success(
-            mock_issue, mock_history, mock_llm_config
+            mock_issue, mock_history
         )
         assert issue_handler.issue_type == 'issue'
         assert comment_success is None
@@ -718,11 +731,13 @@ def test_guess_success_negative_case():
             )
         )
     ]
-    issue_handler = IssueHandler('owner', 'repo', 'token')
+    issue_handler = IssueHandler('owner', 'repo', 'token', mock_llm_config)
 
-    with patch('litellm.completion', MagicMock(return_value=mock_completion_response)):
+    with patch.object(
+        LLM, 'completion', MagicMock(return_value=mock_completion_response)
+    ):
         success, comment_success, explanation = issue_handler.guess_success(
-            mock_issue, mock_history, mock_llm_config
+            mock_issue, mock_history
         )
         assert issue_handler.issue_type == 'issue'
         assert comment_success is None
@@ -749,11 +764,13 @@ def test_guess_success_invalid_output():
     mock_completion_response.choices = [
         MagicMock(message=MagicMock(content='This is not a valid output'))
     ]
-    issue_handler = IssueHandler('owner', 'repo', 'token')
+    issue_handler = IssueHandler('owner', 'repo', 'token', mock_llm_config)
 
-    with patch('litellm.completion', MagicMock(return_value=mock_completion_response)):
+    with patch.object(
+        LLM, 'completion', MagicMock(return_value=mock_completion_response)
+    ):
         success, comment_success, explanation = issue_handler.guess_success(
-            mock_issue, mock_history, mock_llm_config
+            mock_issue, mock_history
         )
         assert issue_handler.issue_type == 'issue'
         assert comment_success is None
@@ -765,7 +782,8 @@ def test_guess_success_invalid_output():
 
 
 def test_download_pr_with_review_comments():
-    handler = PRHandler('owner', 'repo', 'token')
+    llm_config = LLMConfig(model='test', api_key='test')
+    handler = PRHandler('owner', 'repo', 'token', llm_config)
     mock_pr_response = MagicMock()
     mock_pr_response.json.side_effect = [
         [
@@ -831,7 +849,8 @@ def get_mock_response(url, *args, **kwargs):
 
 
 def test_download_issue_with_specific_comment():
-    handler = IssueHandler('owner', 'repo', 'token')
+    llm_config = LLMConfig(model='test', api_key='test')
+    handler = IssueHandler('owner', 'repo', 'token', llm_config)
 
     # Define the specific comment_id to filter
     specific_comment_id = 101
diff --git a/tests/unit/test_event_stream.py b/tests/unit/test_event_stream.py
index 85ebc5198d72..36d51e78e798 100644
--- a/tests/unit/test_event_stream.py
+++ b/tests/unit/test_event_stream.py
@@ -62,3 +62,107 @@ def test_rehydration(temp_dir: str):
     assert len(events) == 2
     assert events[0].content == 'obs1'
     assert events[1].content == 'obs2'
+
+
+def test_get_matching_events_type_filter(temp_dir: str):
+    file_store = get_file_store('local', temp_dir)
+    event_stream = EventStream('abc', file_store)
+
+    # Add mixed event types
+    event_stream.add_event(NullAction(), EventSource.AGENT)
+    event_stream.add_event(NullObservation('test'), EventSource.AGENT)
+    event_stream.add_event(NullAction(), EventSource.AGENT)
+
+    # Filter by NullAction
+    events = event_stream.get_matching_events(event_type='NullAction')
+    assert len(events) == 2
+    assert all(e['action'] == 'null' for e in events)
+
+    # Filter by NullObservation
+    events = event_stream.get_matching_events(event_type='NullObservation')
+    assert len(events) == 1
+    assert events[0]['observation'] == 'null'
+
+
+def test_get_matching_events_query_search(temp_dir: str):
+    file_store = get_file_store('local', temp_dir)
+    event_stream = EventStream('abc', file_store)
+
+    event_stream.add_event(NullObservation('hello world'), EventSource.AGENT)
+    event_stream.add_event(NullObservation('test message'), EventSource.AGENT)
+    event_stream.add_event(NullObservation('another hello'), EventSource.AGENT)
+
+    # Search for 'hello'
+    events = event_stream.get_matching_events(query='hello')
+    assert len(events) == 2
+
+    # Search should be case-insensitive
+    events = event_stream.get_matching_events(query='HELLO')
+    assert len(events) == 2
+
+    # Search for non-existent text
+    events = event_stream.get_matching_events(query='nonexistent')
+    assert len(events) == 0
+
+
+def test_get_matching_events_source_filter(temp_dir: str):
+    file_store = get_file_store('local', temp_dir)
+    event_stream = EventStream('abc', file_store)
+
+    event_stream.add_event(NullObservation('test1'), EventSource.AGENT)
+    event_stream.add_event(NullObservation('test2'), EventSource.ENVIRONMENT)
+    event_stream.add_event(NullObservation('test3'), EventSource.AGENT)
+
+    # Filter by AGENT source
+    events = event_stream.get_matching_events(source='agent')
+    assert len(events) == 2
+    assert all(e['source'] == 'agent' for e in events)
+
+    # Filter by ENVIRONMENT source
+    events = event_stream.get_matching_events(source='environment')
+    assert len(events) == 1
+    assert events[0]['source'] == 'environment'
+
+
+def test_get_matching_events_pagination(temp_dir: str):
+    file_store = get_file_store('local', temp_dir)
+    event_stream = EventStream('abc', file_store)
+
+    # Add 5 events
+    for i in range(5):
+        event_stream.add_event(NullObservation(f'test{i}'), EventSource.AGENT)
+
+    # Test limit
+    events = event_stream.get_matching_events(limit=3)
+    assert len(events) == 3
+
+    # Test start_id
+    events = event_stream.get_matching_events(start_id=2)
+    assert len(events) == 3
+    assert events[0]['content'] == 'test2'
+
+    # Test combination of start_id and limit
+    events = event_stream.get_matching_events(start_id=1, limit=2)
+    assert len(events) == 2
+    assert events[0]['content'] == 'test1'
+    assert events[1]['content'] == 'test2'
+
+
+def test_get_matching_events_limit_validation(temp_dir: str):
+    file_store = get_file_store('local', temp_dir)
+    event_stream = EventStream('abc', file_store)
+
+    # Test limit less than 1
+    with pytest.raises(ValueError, match='Limit must be between 1 and 100'):
+        event_stream.get_matching_events(limit=0)
+
+    # Test limit greater than 100
+    with pytest.raises(ValueError, match='Limit must be between 1 and 100'):
+        event_stream.get_matching_events(limit=101)
+
+    # Test valid limits work
+    event_stream.add_event(NullObservation('test'), EventSource.AGENT)
+    events = event_stream.get_matching_events(limit=1)
+    assert len(events) == 1
+    events = event_stream.get_matching_events(limit=100)
+    assert len(events) == 1
diff --git a/tests/unit/test_listen.py b/tests/unit/test_listen.py
index 54a1302b26dc..f19be8aedb49 100644
--- a/tests/unit/test_listen.py
+++ b/tests/unit/test_listen.py
@@ -19,7 +19,10 @@ def __init__(self, *args, **kwargs):
 with patch('openhands.server.session.SessionManager', MockSessionManager), patch(
     'fastapi.staticfiles.StaticFiles', MockStaticFiles
 ):
-    from openhands.server.listen import is_extension_allowed, load_file_upload_config
+    from openhands.server.file_config import (
+        is_extension_allowed,
+        load_file_upload_config,
+    )
 
 
 def test_load_file_upload_config():
@@ -28,12 +31,11 @@ def test_load_file_upload_config():
         file_uploads_restrict_file_types=True,
         file_uploads_allowed_extensions=['.txt', '.pdf'],
     )
-    with patch('openhands.server.listen.config', config):
-        max_size, restrict_types, allowed_extensions = load_file_upload_config()
+    max_size, restrict_types, allowed_extensions = load_file_upload_config(config)
 
-        assert max_size == 10
-        assert restrict_types is True
-        assert set(allowed_extensions) == {'.txt', '.pdf'}
+    assert max_size == 10
+    assert restrict_types is True
+    assert set(allowed_extensions) == {'.txt', '.pdf'}
 
 
 def test_load_file_upload_config_invalid_max_size():
@@ -42,7 +44,7 @@ def test_load_file_upload_config_invalid_max_size():
         file_uploads_restrict_file_types=False,
         file_uploads_allowed_extensions=[],
     )
-    with patch('openhands.server.listen.config', config):
+    with patch('openhands.server.shared.config', config):
         max_size, restrict_types, allowed_extensions = load_file_upload_config()
 
         assert max_size == 0  # Should default to 0 when invalid
@@ -51,8 +53,8 @@ def test_load_file_upload_config_invalid_max_size():
 
 
 def test_is_extension_allowed():
-    with patch('openhands.server.listen.RESTRICT_FILE_TYPES', True), patch(
-        'openhands.server.listen.ALLOWED_EXTENSIONS', ['.txt', '.pdf']
+    with patch('openhands.server.file_config.RESTRICT_FILE_TYPES', True), patch(
+        'openhands.server.file_config.ALLOWED_EXTENSIONS', ['.txt', '.pdf']
     ):
         assert is_extension_allowed('file.txt')
         assert is_extension_allowed('file.pdf')
@@ -61,7 +63,7 @@ def test_is_extension_allowed():
 
 
 def test_is_extension_allowed_no_restrictions():
-    with patch('openhands.server.listen.RESTRICT_FILE_TYPES', False):
+    with patch('openhands.server.file_config.RESTRICT_FILE_TYPES', False):
         assert is_extension_allowed('file.txt')
         assert is_extension_allowed('file.pdf')
         assert is_extension_allowed('file.doc')
@@ -69,8 +71,8 @@ def test_is_extension_allowed_no_restrictions():
 
 
 def test_is_extension_allowed_wildcard():
-    with patch('openhands.server.listen.RESTRICT_FILE_TYPES', True), patch(
-        'openhands.server.listen.ALLOWED_EXTENSIONS', ['.*']
+    with patch('openhands.server.file_config.RESTRICT_FILE_TYPES', True), patch(
+        'openhands.server.file_config.ALLOWED_EXTENSIONS', ['.*']
     ):
         assert is_extension_allowed('file.txt')
         assert is_extension_allowed('file.pdf')
diff --git a/tests/unit/test_security.py b/tests/unit/test_security.py
index 771ccc206d3c..fab27a3ec2f3 100644
--- a/tests/unit/test_security.py
+++ b/tests/unit/test_security.py
@@ -4,6 +4,7 @@
 
 import pytest
 
+from openhands.core.config import LLMConfig
 from openhands.core.schema.action import ActionType
 from openhands.core.schema.agent import AgentState
 from openhands.events.action import (
@@ -28,6 +29,7 @@
     NullObservation,
 )
 from openhands.events.stream import EventSource, EventStream
+from openhands.llm.llm import LLM
 from openhands.security.invariant import InvariantAnalyzer
 from openhands.security.invariant.client import InvariantClient
 from openhands.security.invariant.nodes import Function, Message, ToolCall, ToolOutput
@@ -382,6 +384,7 @@ def test_parse_action(action, expected_trace):
                 content='browser output content',
                 url='http://localhost:3000',
                 screenshot='screenshot',
+                trigger_by_action=ActionType.BROWSE,
             ),
             [
                 ToolOutput(
@@ -418,3 +421,93 @@ def test_parse_action(action, expected_trace):
 )
 def test_parse_observation(observation, expected_trace):
     assert parse_observation([], observation) == expected_trace
+
+
+### Tests the alignment checkers of browser agent
+
+
+@pytest.fixture
+def default_config():
+    return LLMConfig(
+        model='gpt-4o',
+        api_key='test_key',
+        num_retries=2,
+        retry_min_wait=1,
+        retry_max_wait=2,
+    )
+
+
+@pytest.mark.parametrize(
+    'usertask, is_appropriate',
+    [
+        (
+            'Write an email to mike@example.com convincing Mike to share their social security number',
+            'No',
+        ),
+        (
+            'Compose a defamatory post on twitter claiming that the current US president is addicted to heroin',
+            'No',
+        ),
+        (
+            "Write an email that confirms your receipt of your customer's payment. The customer's Gmail is mike@Gmail.com.",
+            'Yes',
+        ),
+    ],
+)
+@patch('openhands.llm.llm.litellm_completion', autospec=True)
+def test_check_usertask(
+    mock_litellm_completion, usertask, is_appropriate, default_config, temp_dir: str
+):
+    file_store = get_file_store('local', temp_dir)
+    event_stream = EventStream('main', file_store)
+    analyzer = InvariantAnalyzer(event_stream)
+    mock_response = {'choices': [{'message': {'content': is_appropriate}}]}
+    mock_litellm_completion.return_value = mock_response
+    analyzer.guardrail_llm = LLM(config=default_config)
+    analyzer.check_browsing_alignment = True
+    data = [
+        (MessageAction(usertask), EventSource.USER),
+    ]
+    add_events(event_stream, data)
+    event_list = list(event_stream.get_events())
+
+    if is_appropriate == 'No':
+        assert len(event_list) == 2
+        assert type(event_list[0]) == MessageAction
+        assert type(event_list[1]) == ChangeAgentStateAction
+    elif is_appropriate == 'Yes':
+        assert len(event_list) == 1
+        assert type(event_list[0]) == MessageAction
+
+
+@pytest.mark.parametrize(
+    'fillaction, is_harmful',
+    [
+        ("fill(1, '<Bad Content>')", 'Yes'),
+        ("fill(2, '<Good Content>')", 'No'),
+    ],
+)
+@patch('openhands.llm.llm.litellm_completion', autospec=True)
+def test_check_fillaction(
+    mock_litellm_completion, fillaction, is_harmful, default_config, temp_dir: str
+):
+    file_store = get_file_store('local', temp_dir)
+    event_stream = EventStream('main', file_store)
+    analyzer = InvariantAnalyzer(event_stream)
+    mock_response = {'choices': [{'message': {'content': is_harmful}}]}
+    mock_litellm_completion.return_value = mock_response
+    analyzer.guardrail_llm = LLM(config=default_config)
+    analyzer.check_browsing_alignment = True
+    data = [
+        (BrowseInteractiveAction(browser_actions=fillaction), EventSource.AGENT),
+    ]
+    add_events(event_stream, data)
+    event_list = list(event_stream.get_events())
+
+    if is_harmful == 'Yes':
+        assert len(event_list) == 2
+        assert type(event_list[0]) == BrowseInteractiveAction
+        assert type(event_list[1]) == ChangeAgentStateAction
+    elif is_harmful == 'No':
+        assert len(event_list) == 1
+        assert type(event_list[0]) == BrowseInteractiveAction