From 54b74721af09de8cdc48fbc4b06a722fc128879c Mon Sep 17 00:00:00 2001
From: Patrice Bechard <patrice.bechard@servicenow.com>
Date: Wed, 27 Aug 2025 18:27:30 -0400
Subject: [PATCH 1/8] add ui portion of hint labeling (missing backend)

---
 browsergym/core/src/browsergym/core/env.py    |   8 +
 .../core/src/browsergym/core/hint_labeling.py |  28 ++
 .../hint_labeling_files/hint_labeling_ui.html | 313 ++++++++++++++++++
 browsergym/core/src/browsergym/utils/obs.py   |   7 +
 .../src/browsergym/experiments/loop.py        |   7 +-
 5 files changed, 359 insertions(+), 4 deletions(-)
 create mode 100644 browsergym/core/src/browsergym/core/hint_labeling.py
 create mode 100644 browsergym/core/src/browsergym/core/hint_labeling_files/hint_labeling_ui.html
diff --git a/browsergym/core/src/browsergym/core/env.py b/browsergym/core/src/browsergym/core/env.py
index 12c5e8bcb..2f918481e 100644
--- a/browsergym/core/src/browsergym/core/env.py
+++ b/browsergym/core/src/browsergym/core/env.py
@@ -14,6 +14,7 @@
 from .action.base import execute_python_code
 from .action.highlevel import HighLevelActionSet
 from .chat import Chat
+from .hint_labeling import HintLabeling
 from .constants import BROWSERGYM_ID_ATTRIBUTE, EXTRACT_OBS_MAX_TRIES
 from .observation import (
     MarkingError,
@@ -332,6 +333,13 @@ def override_property(task, env, property):
             chat_size=(500, max(viewport["height"], 800)),
             record_video_dir=self.record_video_dir,
         )
+        
+        # create the hint labeling ui
+        self.hint_labeling = HintLabeling(
+            headless=self.headless,
+            window_size=(500, max(viewport["height"], 800)),
+            record_video_dir=self.record_video_dir,
+        )
 
         # create a new page
         self.page = self.context.new_page()
diff --git a/browsergym/core/src/browsergym/core/hint_labeling.py b/browsergym/core/src/browsergym/core/hint_labeling.py
new file mode 100644
index 000000000..2b2d4e0a4
--- /dev/null
+++ b/browsergym/core/src/browsergym/core/hint_labeling.py
@@ -0,0 +1,28 @@
+import playwright.sync_api
+
+from importlib import resources
+
+from . import _get_global_playwright, hint_labeling_files
+
+HINT_LABELING_DIR = resources.files(hint_labeling_files)
+
+class HintLabeling:
+    def __init__(self, headless: bool, window_size=(500, 800), *args, **kwargs):
+        
+        pw: playwright.sync_api.Playwright = _get_global_playwright()
+        self.browser = pw.chromium.launch(
+            headless=headless, args=[f"--window-size={window_size[0]},{window_size[1]}"]
+        )
+        self.context = self.browser.new_context(
+            no_viewport=True,
+        )
+        self.page = self.context.new_page()
+
+        self.page.set_content(get_hint_labeling_ui(HINT_LABELING_DIR))
+        
+
+
+def get_hint_labeling_ui(hint_labeling_dir) -> str:
+    with open(hint_labeling_dir / "hint_labeling_ui.html", "r") as file:
+        hint_labeling_html = file.read()
+    return hint_labeling_html
\ No newline at end of file
diff --git a/browsergym/core/src/browsergym/core/hint_labeling_files/hint_labeling_ui.html b/browsergym/core/src/browsergym/core/hint_labeling_files/hint_labeling_ui.html
new file mode 100644
index 000000000..23f7c2774
--- /dev/null
+++ b/browsergym/core/src/browsergym/core/hint_labeling_files/hint_labeling_ui.html
@@ -0,0 +1,313 @@
+<!DOCTYPE html>
+<html lang="en">
+<head>
+  <meta charset="utf-8" />
+  <meta name="viewport" content="width=device-width, initial-scale=1" />
+  <title>Agent Reprompt UI</title>
+  <style>
+    :root{
+      --bg:#f4f6f8; --card:#fff; --muted:#6b7280; --text:#0f172a; --brand:#2563eb; --accent:#10b981; --danger:#ef4444; --border:#e5e7eb;
+    }
+    *{box-sizing:border-box}
+    body{margin:0;font-family:Inter,system-ui,Segoe UI,Roboto,Helvetica,Arial,sans-serif;background:var(--bg);color:var(--text)}
+    .container{max-width:1100px;margin:24px auto;padding:0 16px}
+
+    .grid{
+      display:grid;gap:16px;
+      grid-template-columns: 1fr 1fr;
+    }
+    .card{background:var(--card);border:1px solid var(--border);border-radius:16px;box-shadow:0 2px 6px rgba(0,0,0,.05)}
+    .card h2{margin:0 0 8px 0;font-size:14px;text-transform:uppercase;letter-spacing:.06em;color:var(--muted)}
+    .pad{padding:16px}
+
+    .tabs{display:flex;gap:8px;padding:8px 8px 0}
+    .tab{border:none;background:transparent;padding:10px 14px;border-radius:12px 12px 0 0;cursor:pointer;font-weight:600;color:var(--muted)}
+    .tab.active{background:var(--card);border:1px solid var(--border);border-bottom:none;color:var(--text)}
+    .tabpanel{border-top:1px solid var(--border)}
+
+    .screenshot{width:100%;height:520px;object-fit:contain;background:#0000000d;border-radius:8px}
+    .axtree{width:100%;height:520px;resize:none;border:none;padding:12px;font-family:ui-monospace,SFMono-Regular,Menlo,Monaco,Consolas,monospace;background:#0b10241a}
+
+    .hints-row{display:grid;grid-template-columns: 1fr 140px;gap:12px;align-items:start}
+    textarea.hint{width:100%;min-height:120px;resize:vertical;padding:12px;border:1px solid var(--border);border-radius:12px;font-size:14px}
+    .btn{display:inline-flex;align-items:center;justify-content:center;gap:8px;border:none;border-radius:12px;padding:12px 16px;font-weight:600;cursor:pointer}
+    .btn-primary{background:var(--brand);color:#fff}
+    .btn-primary[disabled]{opacity:.6;cursor:not-allowed}
+    .btn-ghost{background:transparent;border:1px solid var(--border)}
+
+    .choices{margin-top:12px;display:flex;flex-direction:column;gap:10px}
+    .choice{display:grid;grid-template-columns:32px 1fr;gap:12px;align-items:start;background:#ffffff;border:1px solid var(--border);border-radius:14px;padding:12px}
+    .choice input[type="radio"]{margin-top:6px;width:18px;height:18px}
+    .choice .action{font-weight:800}
+    .choice .row{display:flex;gap:6px;flex-wrap:wrap}
+    .choice .label{font-weight:700}
+    .choice .value{color:#0f172a}
+    .choice .reason{font-size:13px;color:#111827}
+
+    .footer{display:flex;justify-content:flex-end;gap:12px;margin-top:10px}
+
+    .banner{margin:12px 0;padding:10px 12px;border-radius:10px;font-size:14px}
+    .banner.info{background:#dbeafe;border:1px solid #bfdbfe}
+    .banner.error{background:#fee2e2;border:1px solid #fecaca;color:#991b1b}
+
+    .pill{display:inline-block;padding:6px 10px;border-radius:999px;background:#f1f5f9;color:#0f172a;border:1px solid var(--border);font-size:12px}
+
+    @media (max-width: 900px){
+      .grid{grid-template-columns: 1fr}
+      .screenshot,.axtree{height:420px}
+    }
+  </style>
+</head>
+<body>
+  <div class="container">
+    <!-- Top: Goal & Error -->
+    <div class="grid" style="display: flex; gap: 16px;">
+      <div class="card pad" style="flex: 1; height: 150px; overflow-y: auto;">
+        <h2>Goal</h2>
+        <div id="goalBox" style="padding: 12px 14px; font-size: 15px; background: #f8fafc;"></div>
+      </div>
+      <div class="card pad" style="flex: 1; height: 150px; overflow-y: auto;">
+        <h2>Error Feedback</h2>
+        <div id="errorBox" style="padding: 12px 14px; font-size: 15px; background: #fef2f2;"></div>
+      </div>
+    </div>
+
+    <!-- Middle: Tabs -->
+    <div class="card" style="margin-top:16px">
+      <div class="tabs">
+        <button class="tab active" data-tab="screenshot">Screenshot</button>
+        <button class="tab" data-tab="axtree">AxTree</button>
+        <button class="tab" data-tab="history">History</button>
+      </div>
+      <div class="pad tabpanel">
+        <div id="tab-screenshot" class="tabcontent">
+          <img id="screenshotImg" alt="screenshot" class="screenshot" />
+        </div>
+        <div id="tab-axtree" class="tabcontent" hidden>
+          <textarea id="axtreeArea" class="axtree" readonly></textarea>
+        </div>
+        <div id="tab-history" class="tabcontent" hidden>
+          <!-- intentionally empty for now -->
+          <div class="banner info">History will appear here.</div>
+        </div>
+      </div>
+    </div>
+
+    <!-- Hints & Reprompt -->
+    <div class="card pad" style="margin-top:16px">
+      <h2>Hints</h2>
+      <textarea id="hintInput" class="hint" placeholder="Type guidance for the next reprompt…" style="width: 100%;"></textarea>
+      <button id="repromptBtn" class="btn btn-primary" title="Send hint to get refreshed suggestions" style="margin-top: 12px;">Reprompt</button>
+      <div id="repromptStatus" class="banner info" style="display:none"></div>
+    </div>
+
+    <!-- Suggestions / Radio list -->
+    <div class="card pad" style="margin-top:16px">
+      <h2>Suggestions</h2>
+      <div id="choices" class="choices"></div>
+      <div id="choicesNote" class="banner info" style="display:none" title="Hover to see more details"></div>
+      <div class="footer">
+        <button id="resetBtn" class="btn btn-ghost" type="button" title="Click to clear all selections">Clear Selection</button>
+        <button id="submitBtn" class="btn btn-primary" disabled title="Select an action to enable">Send Action</button>
+      </div>
+      <div id="submitStatus" class="banner info" style="display:none" title="Hover to see submission status"></div>
+    </div>
+  </div>
+
+  <script>
+    /**
+     * Bootstrapping contract
+     * You can overwrite window.__BOOTSTRAP_DATA__ from your server-side template.
+     * Fields:
+     *   goal: string
+     *   error_feedback: string
+     *   screenshot_b64: base64 string (no data: prefix required)
+     *   axtree: string
+     *   action_suggestions: Array<{ action: string, COT: string, id?: string }>
+     */
+    window.__BOOTSTRAP_DATA__ = window.__BOOTSTRAP_DATA__ || {
+      goal: "go to the hardware catalog store and order a developer laptop",
+      error_feedback: "playwright error when clicking on something that is not visible (from the previous step)",
+      screenshot_b64: "", // fill with base64 (PNG/JPG). When empty, we show a placeholder.
+      axtree: "<root>\n  <window name=\"VITASPHERE\">…</window>\n</root>",
+      action_suggestions: [
+        { id: "1", action: "click(\"42\")", COT: "The button with id 42 advances the form." },
+        { id: "2", action: "type(\"Assigned to\", \"John Doe\")", COT: "Fills the assignee field before submission." },
+        { id: "3", action: "open(\"/hardware-catalog\")", COT: "Navigate directly to the catalog page." }
+      ]
+    };
+
+    // Placeholder endpoints (replace later)
+    const ENDPOINTS = {
+      REPROMPT: "/api/reprompt",   // expects POST {hint} -> returns {action_suggestions: [...]} 
+      SUBMIT: "/api/submit"        // expects POST {hint, action, COT, id?} -> returns {action_suggestions?: [...]} (optional)
+    };
+
+    // DOM references
+    const goalBox = document.getElementById('goalBox');
+    const errorBox = document.getElementById('errorBox');
+    const screenshotImg = document.getElementById('screenshotImg');
+    const axtreeArea = document.getElementById('axtreeArea');
+    const hintInput = document.getElementById('hintInput');
+    const repromptBtn = document.getElementById('repromptBtn');
+    const repromptStatus = document.getElementById('repromptStatus');
+    const choicesEl = document.getElementById('choices');
+    const choicesNote = document.getElementById('choicesNote');
+    const submitBtn = document.getElementById('submitBtn');
+    const submitStatus = document.getElementById('submitStatus');
+    const resetBtn = document.getElementById('resetBtn');
+
+    // State
+    let currentSuggestions = [];
+    let selectedId = null;
+
+    // Helpers
+    function setVisible(el, visible){ el.style.display = visible ? '' : 'none'; }
+    function setBanner(el, text, variant='info'){ el.className = `banner ${variant}`; el.textContent = text; setVisible(el,true); }
+
+    function dataUrlFromBase64(b64){
+      if(!b64) return 'data:image/svg+xml;charset=utf-8,' + encodeURIComponent(`<svg xmlns=\"http://www.w3.org/2000/svg\" width=\"1600\" height=\"900\"><rect width=\"100%\" height=\"100%\" fill=\"#eef2ff\"/><text x=\"50%\" y=\"50%\" font-family=\"sans-serif\" font-size=\"24\" text-anchor=\"middle\" fill=\"#64748b\">No screenshot provided</text></svg>`);
+      // naive sniff: base64 PNG data starts with 'iVBOR'; base64 JPEG starts with '/9j/', so a leading '/' must not map to PNG
+      const pref = b64.trim().startsWith('iVBOR') ? 'image/png' : 'image/jpeg';
+      return `data:${pref};base64,${b64}`;
+    }
+
+    function renderSuggestions(suggestions){
+      currentSuggestions = suggestions.slice(0,5); // cap at 5
+      choicesEl.innerHTML = '';
+      selectedId = null;
+      submitBtn.disabled = true;
+
+      if(currentSuggestions.length === 0){
+        setBanner(choicesNote, 'No suggestions yet. Try reprompting with a hint.');
+        return;
+      }
+      setVisible(choicesNote,false);
+
+      currentSuggestions.forEach((sugg, idx)=>{
+        const id = sugg.id || String(idx+1);
+        const wrapper = document.createElement('label');
+        wrapper.className = 'choice';
+        wrapper.setAttribute('for', `choice-${id}`);
+
+        const radio = document.createElement('input');
+        radio.type = 'radio';
+        radio.name = 'choice';
+        radio.id = `choice-${id}`;
+        radio.value = id;
+        radio.addEventListener('change', ()=>{ selectedId = id; submitBtn.disabled = false; });
+
+        const box = document.createElement('div');
+        const actionRow = document.createElement('div');
+        actionRow.className = 'row';
+        const actionLabel = document.createElement('span');
+        actionLabel.className = 'label action';
+        actionLabel.textContent = 'action:';
+        const actionVal = document.createElement('span');
+        actionVal.className = 'value action';
+        actionVal.textContent = ` ${sugg.action}`;
+        actionRow.appendChild(actionLabel); actionRow.appendChild(actionVal);
+
+        const reasonRow = document.createElement('div');
+        reasonRow.className = 'row reason';
+        const reasonLabel = document.createElement('span');
+        reasonLabel.className = 'label';
+        reasonLabel.textContent = 'reasoning:';
+        const reasonVal = document.createElement('span');
+        reasonVal.className = 'value';
+        reasonVal.textContent = ` ${sugg.COT}`;
+        reasonRow.appendChild(reasonLabel); reasonRow.appendChild(reasonVal);
+
+        box.appendChild(actionRow);
+        box.appendChild(reasonRow);
+
+        wrapper.appendChild(radio);
+        wrapper.appendChild(box);
+        choicesEl.appendChild(wrapper);
+      });
+    }
+
+    function currentSelection(){
+      if(!selectedId) return null;
+      const obj = currentSuggestions.find(s=> (s.id||String(currentSuggestions.indexOf(s)+1)) === selectedId);
+      return obj || null;
+    }
+
+    // Tab logic
+    document.querySelectorAll('.tab').forEach(btn=>{
+      btn.addEventListener('click',()=>{
+        document.querySelectorAll('.tab').forEach(b=>b.classList.remove('active'));
+        btn.classList.add('active');
+        const name = btn.dataset.tab;
+        document.querySelectorAll('.tabcontent').forEach(c=>c.hidden = true);
+        document.getElementById('tab-'+name).hidden = false;
+      });
+    });
+
+    // Actions
+    repromptBtn.addEventListener('click', async ()=>{
+      setBanner(repromptStatus, 'Requesting new suggestions…');
+      try{
+        const res = await fetch(ENDPOINTS.REPROMPT,{
+          method:'POST', headers:{'Content-Type':'application/json'},
+          body: JSON.stringify({ hint: hintInput.value })
+        });
+        const data = await res.json().catch(()=>({}));
+        if(!res.ok) throw new Error(data?.error || 'Reprompt failed');
+        if(Array.isArray(data.action_suggestions)){
+          renderSuggestions(data.action_suggestions);
+          setBanner(repromptStatus, 'Suggestions updated.');
+        }else{
+          setBanner(repromptStatus, 'No suggestions returned.');
+        }
+      }catch(err){
+        setBanner(repromptStatus, String(err), 'error');
+      } finally{
+        setTimeout(()=>setVisible(repromptStatus,false), 1600);
+      }
+    });
+
+    submitBtn.addEventListener('click', async ()=>{
+      const selection = currentSelection();
+      if(!selection){ return; }
+      setBanner(submitStatus, 'Submitting selection…');
+      submitBtn.disabled = true;
+      try{
+        const payload = { hint: hintInput.value, action: selection.action, COT: selection.COT, id: selection.id };
+        const res = await fetch(ENDPOINTS.SUBMIT,{
+          method:'POST', headers:{'Content-Type':'application/json'},
+          body: JSON.stringify(payload)
+        });
+        const data = await res.json().catch(()=>({}));
+        if(!res.ok) throw new Error(data?.error || 'Submit failed');
+        // Clear hint ONLY after successful submit
+        hintInput.value = '';
+        if(Array.isArray(data.action_suggestions)){
+          renderSuggestions(data.action_suggestions);
+        }
+        setBanner(submitStatus, 'Submitted successfully.');
+      }catch(err){
+        setBanner(submitStatus, String(err), 'error');
+      } finally{
+        setTimeout(()=>setVisible(submitStatus,false), 1600);
+      }
+    });
+
+    resetBtn.addEventListener('click', ()=>{
+      document.querySelectorAll('input[name="choice"]').forEach(r=> r.checked=false);
+      selectedId = null; submitBtn.disabled = true;
+    });
+
+    // Initial render from BOOTSTRAP_DATA
+    (function init(){
+      const d = window.__BOOTSTRAP_DATA__;
+      goalBox.textContent = d.goal || '';
+      errorBox.textContent = d.error_feedback || '';
+      screenshotImg.src = dataUrlFromBase64(d.screenshot_b64 || '');
+      axtreeArea.value = d.axtree || '';
+      renderSuggestions(Array.isArray(d.action_suggestions) ? d.action_suggestions : []);
+      // Start with Screenshot tab visible (already default)
+    })();
+  </script>
+</body>
+</html>
diff --git a/browsergym/core/src/browsergym/utils/obs.py b/browsergym/core/src/browsergym/utils/obs.py
index db5b8ce03..0abeb30e4 100644
--- a/browsergym/core/src/browsergym/utils/obs.py
+++ b/browsergym/core/src/browsergym/utils/obs.py
@@ -320,6 +320,13 @@ def dfs(node_idx: int, depth: int, parent_node_filtered: bool, parent_node_name:
             pass
         else:
             node_name = node["name"]["value"]
+            # if node_name == "":
+            #     try:
+            #         node_name_sources = node["name"]["sources"]
+            #         node_name_sources = [elem for elem in node_name_sources if elem.get("type") == "contents"][0]
+            #         node_name = node_name_sources.get("value", {}).get("value", "")
+            #     except Exception as e:
+            #         logger.warning(f"Failed to extract node name: {e}")
             if "value" in node and "value" in node["value"]:
                 node_value = node["value"]["value"]
             else:
diff --git a/browsergym/experiments/src/browsergym/experiments/loop.py b/browsergym/experiments/src/browsergym/experiments/loop.py
index 0ebb9e94c..9ed20fdde 100644
--- a/browsergym/experiments/src/browsergym/experiments/loop.py
+++ b/browsergym/experiments/src/browsergym/experiments/loop.py
@@ -17,16 +17,15 @@
 from pathlib import Path
 from typing import Optional
 
-from browsergym.core.env import BrowserEnv
 import gymnasium as gym
 import numpy as np
+from browsergym.core.action.parsers import highlevel_action_parser
+from browsergym.core.chat import Chat
+from browsergym.core.env import BrowserEnv
 from dataclasses_json import DataClassJsonMixin
 from PIL import Image
 from tqdm import tqdm
 
-from browsergym.core.action.parsers import highlevel_action_parser
-from browsergym.core.chat import Chat
-
 from .agent import Agent
 from .utils import count_messages_token, count_tokens
 

From ae4fe73308ab0df9c53be4229ce919e09c76d8c1 Mon Sep 17 00:00:00 2001
From: Patrice Bechard <patrice.bechard@servicenow.com>
Date: Thu, 28 Aug 2025 00:24:19 -0400
Subject: [PATCH 2/8] update HintLabeling UI

---
 .../core/src/browsergym/core/hint_labeling.py | 124 +++++++++++++++++-
 .../hint_labeling_files/hint_labeling_ui.html |  47 +++++--
 2 files changed, 158 insertions(+), 13 deletions(-)

diff --git a/browsergym/core/src/browsergym/core/hint_labeling.py b/browsergym/core/src/browsergym/core/hint_labeling.py
index 2b2d4e0a4..a576099f6 100644
--- a/browsergym/core/src/browsergym/core/hint_labeling.py
+++ b/browsergym/core/src/browsergym/core/hint_labeling.py
@@ -1,11 +1,31 @@
-import playwright.sync_api
-
 from importlib import resources
+from typing import Dict, List, Optional
 
+from queue import Queue, Empty
+import playwright.sync_api
+from pydantic import BaseModel, Field
+import logging
+import json
 from . import _get_global_playwright, hint_labeling_files
 
+logger = logging.getLogger(__name__)
+
 HINT_LABELING_DIR = resources.files(hint_labeling_files)
 
+# ------- Data Classes -------
+
+class HintLabelingInputs(BaseModel):
+    goal: str
+    error_feedback: str = ""
+    screenshot: str  # base64 screenshot
+    axtree: str
+    history: List[Dict[str, str]] = Field(default_factory=list)
+    hint: str = ""
+    # keep 'suggestions' on Python side, but we’ll map to UI 'action_suggestions'
+    suggestions: List[Dict[str, str]] = Field(default_factory=list)
+
+# ------- Hint Labeling backend class -------
+
 class HintLabeling:
     def __init__(self, headless: bool, window_size=(500, 800), *args, **kwargs):
         
@@ -17,10 +37,110 @@ def __init__(self, headless: bool, window_size=(500, 800), *args, **kwargs):
             no_viewport=True,
         )
         self.page = self.context.new_page()
+        self._resp_queue: "Queue[dict]" = Queue()
 
+        self.page.route("**/api/reprompt", self._route_reprompt)
+        self.page.route("**/api/submit", self._route_submit)
         self.page.set_content(get_hint_labeling_ui(HINT_LABELING_DIR))
         
+        # internal state
+        self._context: HintLabelingInputs = None
+        self._running = False
+
+    def _route_reprompt(self, route: playwright.sync_api.Route, request: playwright.sync_api.Request):
+        logger.info("Route hit: %s %s", request.method, request.url)
+        try:
+            body = json.loads(request.post_data or "{}")  # post_data is a property, not a method
+        except Exception:
+            body = {}
+        # queue a "reprompt" message carrying the hint typed in the UI
+        msg = {"type": "reprompt", "payload": {"hint": body.get("hint", "")}}
+        self._resp_queue.put(msg)
+        # Respond something minimal so UI doesn’t break; it will be refreshed by a later update_context()
+        route.fulfill(
+            status=200,
+            content_type="application/json",
+            body=json.dumps({"action_suggestions": []}),
+        )
+
+    def _route_submit(self, route: playwright.sync_api.Route, request: playwright.sync_api.Request):
+        logger.info("Route hit: %s %s", request.method, request.url)
+        try:
+            body = json.loads(request.post_data or "{}")  # post_data is a property, not a method
+        except Exception:
+            body = {}
+        # Map the UI payload to a "step" message holding the selected think/action
+        msg = {
+            "type": "step",
+            "payload": {
+                "think": body.get("think", ""),
+                "action": body.get("action", ""),
+            },
+        }
+        self._resp_queue.put(msg)
+        # UI expects 200 JSON; we can optionally send new suggestions here too.
+        route.fulfill(
+            status=200,
+            content_type="application/json",
+            body=json.dumps({"action_suggestions": []}),
+        )
+
+    def _to_ui_bootstrap(self, ctx: HintLabelingInputs) -> dict:
+        # Map 'suggestions' [{action, thought}] -> 'action_suggestions' [{action, think}]
+        action_suggestions = [
+            {"id": str(i + 1), "action": s.get("action", ""), "think": s.get("think", "")}
+            for i, s in enumerate(ctx.suggestions or [])
+        ]
+        return {
+            "goal": ctx.goal,
+            "error_feedback": ctx.error_feedback,
+            "screenshot": ctx.screenshot,
+            "axtree": ctx.axtree,
+            "history": ctx.history,
+            "hint": ctx.hint,
+            "action_suggestions": action_suggestions,
+        }
+
+    def update_context(self, context: HintLabelingInputs):
+        self._context = context
+        ui_payload = self._to_ui_bootstrap(context)
+        # call JS function with arg (no string concat)
+        self.page.evaluate("updateContext", ui_payload)
+
+    def wait_for_response(self, timeout: Optional[float] = 600) -> dict:
+        """
+        Wait until the page POSTs to /api/reprompt or /api/submit, then parse the
+        request body and return {"type": "reprompt" | "step", "payload": {...}}.
+        """
+        logger.info("Waiting for response from Hint Labeling UI...")
+
+        def is_api(req: playwright.sync_api.Request) -> bool:
+            u = req.url
+            return (u.endswith("/api/reprompt") or u.endswith("/api/submit")) and req.method == "POST"
+
+        # This pumps Playwright internally; no busy waiting.
+        with self.page.expect_request(is_api, timeout=(timeout * 1000 if timeout else 0)) as req_info:
+            req = req_info.value
+
+        body_text = req.post_data or "{}"
+        try:
+            body = json.loads(body_text)
+        except Exception as e:
+            logger.warning("JSON parse error: %s", e)
+            body = {}
+
+        if req.url.endswith("/api/reprompt"):
+            msg = {"type": "reprompt", "payload": {"hint": body.get("hint", "")}}
+        else:
+            msg = {"type": "step",
+                "payload": {"think": body.get("think", ""), "action": body.get("action", "")}}
+
+        logger.info("Response received: %s", msg)
+        return msg
 
+    def close(self):
+        self.context.close()
+        self.browser.close()
 
 def get_hint_labeling_ui(hint_labeling_dir) -> str:
     with open(hint_labeling_dir / "hint_labeling_ui.html", "r") as file:
diff --git a/browsergym/core/src/browsergym/core/hint_labeling_files/hint_labeling_ui.html b/browsergym/core/src/browsergym/core/hint_labeling_files/hint_labeling_ui.html
index 23f7c2774..889bd0cce 100644
--- a/browsergym/core/src/browsergym/core/hint_labeling_files/hint_labeling_ui.html
+++ b/browsergym/core/src/browsergym/core/hint_labeling_files/hint_labeling_ui.html
@@ -3,6 +3,7 @@
 <head>
   <meta charset="utf-8" />
   <meta name="viewport" content="width=device-width, initial-scale=1" />
+  <base href="http://route.local/"><!-- NEW: gives fetch a resolvable origin -->
   <title>Agent Reprompt UI</title>
   <style>
     :root{
@@ -121,26 +122,50 @@ <h2>Suggestions</h2>
      * Fields:
      *   goal: string
      *   error_feedback: string
-     *   screenshot_b64: base64 string (no data: prefix required)
+     *   screenshot: base64 string (no data: prefix required)
      *   axtree: string
-     *   action_suggestions: Array<{ action: string, COT: string, id?: string }>
+     *   hint: string
+     *   action_suggestions: Array<{ action: string, think: string, id?: string }>
      */
     window.__BOOTSTRAP_DATA__ = window.__BOOTSTRAP_DATA__ || {
       goal: "go to the hardware catalog store and order a developer laptop",
       error_feedback: "playwright error when clicking on something that is not visible (from the previous step)",
-      screenshot_b64: "", // fill with base64 (PNG/JPG). When empty, we show a placeholder.
+      screenshot: "", // fill with base64 (PNG/JPG). When empty, we show a placeholder.
       axtree: "<root>\n  <window name=\"VITASPHERE\">…</window>\n</root>",
-      action_suggestions: [
-        { id: "1", action: "click(\"42\")", COT: "The button with id 42 advances the form." },
-        { id: "2", action: "type(\"Assigned to\", \"John Doe\")", COT: "Fills the assignee field before submission." },
-        { id: "3", action: "open(\"/hardware-catalog\")", COT: "Navigate directly to the catalog page." }
+      history: [],
+      hint: "",
+      suggestions: [
+        { id: "1", action: "click(\"42\")", think: "The button with id 42 advances the form." },
+        { id: "2", action: "type(\"Assigned to\", \"John Doe\")", think: "Fills the assignee field before submission." },
+        { id: "3", action: "open(\"/hardware-catalog\")", think: "Navigate directly to the catalog page." }
       ]
     };
 
+    var RECEIVED_RESPONSE = false;
+
+    function applyContext(d){
+      goalBox.textContent = d.goal || '';
+      errorBox.textContent = d.error_feedback || '';
+      screenshotImg.src = dataUrlFromBase64(d.screenshot || '');
+      axtreeArea.value = d.axtree || '';
+      if (Array.isArray(d.action_suggestions)) {
+        renderSuggestions(d.action_suggestions);
+      }
+      // keep the hint textarea in sync only if it's currently empty,
+      // so we don't clobber user typing
+      if (!hintInput.value) hintInput.value = d.hint || '';
+    }
+
+    // REPLACE your old updateContext with this:
+    function updateContext(data){
+      window.__BOOTSTRAP_DATA__ = data || {};
+      applyContext(window.__BOOTSTRAP_DATA__);
+    }
+
     // Placeholder endpoints (replace later)
     const ENDPOINTS = {
       REPROMPT: "/api/reprompt",   // expects POST {hint} -> returns {action_suggestions: [...]} 
-      SUBMIT: "/api/submit"        // expects POST {hint, action, COT, id?} -> returns {action_suggestions?: [...]} (optional)
+      SUBMIT: "/api/submit"        // expects POST {hint, action, think, id?} -> returns {action_suggestions?: [...]} (optional)
     };
 
     // DOM references
@@ -215,7 +240,7 @@ <h2>Suggestions</h2>
         reasonLabel.textContent = 'reasoning:';
         const reasonVal = document.createElement('span');
         reasonVal.className = 'value';
-        reasonVal.textContent = ` ${sugg.COT}`;
+        reasonVal.textContent = ` ${sugg.think}`;
         reasonRow.appendChild(reasonLabel); reasonRow.appendChild(reasonVal);
 
         box.appendChild(actionRow);
@@ -273,7 +298,7 @@ <h2>Suggestions</h2>
       setBanner(submitStatus, 'Submitting selection…');
       submitBtn.disabled = true;
       try{
-        const payload = { hint: hintInput.value, action: selection.action, COT: selection.COT, id: selection.id };
+        const payload = { hint: hintInput.value, action: selection.action, think: selection.think, id: selection.id };
         const res = await fetch(ENDPOINTS.SUBMIT,{
           method:'POST', headers:{'Content-Type':'application/json'},
           body: JSON.stringify(payload)
@@ -303,7 +328,7 @@ <h2>Suggestions</h2>
       const d = window.__BOOTSTRAP_DATA__;
       goalBox.textContent = d.goal || '';
       errorBox.textContent = d.error_feedback || '';
-      screenshotImg.src = dataUrlFromBase64(d.screenshot_b64 || '');
+      screenshotImg.src = dataUrlFromBase64(d.screenshot || '');
       axtreeArea.value = d.axtree || '';
       renderSuggestions(Array.isArray(d.action_suggestions) ? d.action_suggestions : []);
       // Start with Screenshot tab visible (already default)

From 8643b912dbc50a62e476fb65e61d187dc2750bf4 Mon Sep 17 00:00:00 2001
From: Patrice Bechard <patrice.bechard@servicenow.com>
Date: Thu, 28 Aug 2025 00:44:11 -0400
Subject: [PATCH 3/8] bugfix

---
 .../core/src/browsergym/core/hint_labeling.py | 15 ++++-------
 .../hint_labeling_files/hint_labeling_ui.html | 25 ++++++++++---------
 2 files changed, 18 insertions(+), 22 deletions(-)

diff --git a/browsergym/core/src/browsergym/core/hint_labeling.py b/browsergym/core/src/browsergym/core/hint_labeling.py
index a576099f6..f0e4a3062 100644
--- a/browsergym/core/src/browsergym/core/hint_labeling.py
+++ b/browsergym/core/src/browsergym/core/hint_labeling.py
@@ -21,7 +21,7 @@ class HintLabelingInputs(BaseModel):
     axtree: str
     history: List[Dict[str, str]] = Field(default_factory=list)
     hint: str = ""
-    # keep 'suggestions' on Python side, but we’ll map to UI 'action_suggestions'
+    # keep 'suggestions' on Python side, but we’ll map to UI 'suggestions'
     suggestions: List[Dict[str, str]] = Field(default_factory=list)
 
 # ------- Hint Labeling backend class -------
@@ -60,7 +60,7 @@ def _route_reprompt(self, route: playwright.sync_api.Route, request: playwright.
         route.fulfill(
             status=200,
             content_type="application/json",
-            body=json.dumps({"action_suggestions": []}),
+            body=json.dumps({"suggestions": []}),
         )
 
     def _route_submit(self, route: playwright.sync_api.Route, request: playwright.sync_api.Request):
@@ -82,15 +82,10 @@ def _route_submit(self, route: playwright.sync_api.Route, request: playwright.sy
         route.fulfill(
             status=200,
             content_type="application/json",
-            body=json.dumps({"action_suggestions": []}),
+            body=json.dumps({"suggestions": []}),
         )
 
     def _to_ui_bootstrap(self, ctx: HintLabelingInputs) -> dict:
-        # Map 'suggestions' [{action, thought}] -> 'action_suggestions' [{action, think}]
-        action_suggestions = [
-            {"id": str(i + 1), "action": s.get("action", ""), "think": s.get("think", "")}
-            for i, s in enumerate(ctx.suggestions or [])
-        ]
         return {
             "goal": ctx.goal,
             "error_feedback": ctx.error_feedback,
@@ -98,14 +93,14 @@ def _to_ui_bootstrap(self, ctx: HintLabelingInputs) -> dict:
             "axtree": ctx.axtree,
             "history": ctx.history,
             "hint": ctx.hint,
-            "action_suggestions": action_suggestions,
+            "suggestions": ctx.suggestions,
         }
 
     def update_context(self, context: HintLabelingInputs):
         self._context = context
         ui_payload = self._to_ui_bootstrap(context)
         # call JS function with arg (no string concat)
-        self.page.evaluate("updateContext", ui_payload)
+        self.page.evaluate("(d) => updateContext(d)", ui_payload)
 
     def wait_for_response(self, timeout: Optional[float] = 600) -> dict:
         """
diff --git a/browsergym/core/src/browsergym/core/hint_labeling_files/hint_labeling_ui.html b/browsergym/core/src/browsergym/core/hint_labeling_files/hint_labeling_ui.html
index 889bd0cce..ead39429d 100644
--- a/browsergym/core/src/browsergym/core/hint_labeling_files/hint_labeling_ui.html
+++ b/browsergym/core/src/browsergym/core/hint_labeling_files/hint_labeling_ui.html
@@ -125,7 +125,7 @@ <h2>Suggestions</h2>
      *   screenshot: base64 string (no data: prefix required)
      *   axtree: string
      *   hint: string
-     *   action_suggestions: Array<{ action: string, think: string, id?: string }>
+     *   suggestions: Array<{ action: string, think: string, id?: string }>
      */
     window.__BOOTSTRAP_DATA__ = window.__BOOTSTRAP_DATA__ || {
       goal: "go to the hardware catalog store and order a developer laptop",
@@ -148,8 +148,8 @@ <h2>Suggestions</h2>
       errorBox.textContent = d.error_feedback || '';
       screenshotImg.src = dataUrlFromBase64(d.screenshot || '');
       axtreeArea.value = d.axtree || '';
-      if (Array.isArray(d.action_suggestions)) {
-        renderSuggestions(d.action_suggestions);
+      if (Array.isArray(d.suggestions)) {
+        renderSuggestions(d.suggestions);
       }
       // keep the hint textarea in sync only if it's currently empty,
       // so we don't clobber user typing
@@ -164,8 +164,8 @@ <h2>Suggestions</h2>
 
     // Placeholder endpoints (replace later)
     const ENDPOINTS = {
-      REPROMPT: "/api/reprompt",   // expects POST {hint} -> returns {action_suggestions: [...]} 
-      SUBMIT: "/api/submit"        // expects POST {hint, action, think, id?} -> returns {action_suggestions?: [...]} (optional)
+      REPROMPT: "/api/reprompt",   // expects POST {hint} -> returns {suggestions: [...]} 
+      SUBMIT: "/api/submit"        // expects POST {hint, action, think, id?} -> returns {suggestions?: [...]} (optional)
     };
 
     // DOM references
@@ -279,11 +279,12 @@ <h2>Suggestions</h2>
         });
         const data = await res.json().catch(()=>({}));
         if(!res.ok) throw new Error(data?.error || 'Reprompt failed');
-        if(Array.isArray(data.action_suggestions)){
-          renderSuggestions(data.action_suggestions);
+        if (Array.isArray(data.suggestions) && data.suggestions.length > 0){
+          renderSuggestions(data.suggestions);
           setBanner(repromptStatus, 'Suggestions updated.');
-        }else{
-          setBanner(repromptStatus, 'No suggestions returned.');
+        } else {
+          // don't clear the current list; just keep the banner
+          setBanner(repromptStatus, 'Request sent. Waiting for new suggestions…');
         }
       }catch(err){
         setBanner(repromptStatus, String(err), 'error');
@@ -307,8 +308,8 @@ <h2>Suggestions</h2>
         if(!res.ok) throw new Error(data?.error || 'Submit failed');
         // Clear hint ONLY after successful submit
         hintInput.value = '';
-        if(Array.isArray(data.action_suggestions)){
-          renderSuggestions(data.action_suggestions);
+        if(Array.isArray(data.suggestions)){
+          renderSuggestions(data.suggestions);
         }
         setBanner(submitStatus, 'Submitted successfully.');
       }catch(err){
@@ -330,7 +331,7 @@ <h2>Suggestions</h2>
       errorBox.textContent = d.error_feedback || '';
       screenshotImg.src = dataUrlFromBase64(d.screenshot || '');
       axtreeArea.value = d.axtree || '';
-      renderSuggestions(Array.isArray(d.action_suggestions) ? d.action_suggestions : []);
+      renderSuggestions(Array.isArray(d.suggestions) ? d.suggestions : []);
       // Start with Screenshot tab visible (already default)
     })();
   </script>

From e1fa7c3d0ee5f91eab02ee10410d7d541defb0f7 Mon Sep 17 00:00:00 2001
From: Patrice Bechard <patrice.bechard@servicenow.com>
Date: Thu, 28 Aug 2025 09:15:15 -0400
Subject: [PATCH 4/8] update UI

---
 browsergym/core/src/browsergym/core/hint_labeling.py |  2 +-
 .../core/hint_labeling_files/hint_labeling_ui.html   | 12 +++++++-----
 2 files changed, 8 insertions(+), 6 deletions(-)

diff --git a/browsergym/core/src/browsergym/core/hint_labeling.py b/browsergym/core/src/browsergym/core/hint_labeling.py
index f0e4a3062..ca5bc5b1a 100644
--- a/browsergym/core/src/browsergym/core/hint_labeling.py
+++ b/browsergym/core/src/browsergym/core/hint_labeling.py
@@ -27,7 +27,7 @@ class HintLabelingInputs(BaseModel):
 # ------- Hint Labeling backend class -------
 
 class HintLabeling:
-    def __init__(self, headless: bool, window_size=(500, 800), *args, **kwargs):
+    def __init__(self, headless: bool, window_size=(600, 1000), *args, **kwargs):
         
         pw: playwright.sync_api.Playwright = _get_global_playwright()
         self.browser = pw.chromium.launch(
diff --git a/browsergym/core/src/browsergym/core/hint_labeling_files/hint_labeling_ui.html b/browsergym/core/src/browsergym/core/hint_labeling_files/hint_labeling_ui.html
index ead39429d..1d7b069c0 100644
--- a/browsergym/core/src/browsergym/core/hint_labeling_files/hint_labeling_ui.html
+++ b/browsergym/core/src/browsergym/core/hint_labeling_files/hint_labeling_ui.html
@@ -26,7 +26,7 @@
     .tab.active{background:var(--card);border:1px solid var(--border);border-bottom:none;color:var(--text)}
     .tabpanel{border-top:1px solid var(--border)}
 
-    .screenshot{width:100%;height:520px;object-fit:contain;background:#0000000d;border-radius:8px}
+    .screenshot{width:100%;aspect-ratio: 16 / 9;object-fit:contain;background:#0000000d;border-radius:8px}
     .axtree{width:100%;height:520px;resize:none;border:none;padding:12px;font-family:ui-monospace,SFMono-Regular,Menlo,Monaco,Consolas,monospace;background:#0b10241a}
 
     .hints-row{display:grid;grid-template-columns: 1fr 140px;gap:12px;align-items:start}
@@ -55,7 +55,7 @@
 
     @media (max-width: 900px){
       .grid{grid-template-columns: 1fr}
-      .screenshot,.axtree{height:420px}
+      .axtree{height:420px}
     }
   </style>
 </head>
@@ -85,7 +85,7 @@ <h2>Error Feedback</h2>
           <img id="screenshotImg" alt="screenshot" class="screenshot" />
         </div>
         <div id="tab-axtree" class="tabcontent" hidden>
-          <textarea id="axtreeArea" class="axtree" readonly></textarea>
+          <textarea id="axtreeArea" class="axtree" readonly style="font-size: 12px; white-space: pre; overflow-wrap: normal;"></textarea>
         </div>
         <div id="tab-history" class="tabcontent" hidden>
           <!-- intentionally empty for now -->
@@ -240,6 +240,8 @@ <h2>Suggestions</h2>
         reasonLabel.textContent = 'reasoning:';
         const reasonVal = document.createElement('span');
         reasonVal.className = 'value';
+        reasonVal.style.maxHeight = '3em';
+        reasonVal.style.overflowY = 'auto';
         reasonVal.textContent = ` ${sugg.think}`;
         reasonRow.appendChild(reasonLabel); reasonRow.appendChild(reasonVal);
 
@@ -327,8 +329,8 @@ <h2>Suggestions</h2>
     // Initial render from BOOTSTRAP_DATA
     (function init(){
       const d = window.__BOOTSTRAP_DATA__;
-      goalBox.textContent = d.goal || '';
-      errorBox.textContent = d.error_feedback || '';
+      goalBox.innerHTML = (d.goal || '').replace(/\n/g, '<br>');
+      errorBox.innerHTML = (d.error_feedback || '').replace(/\n/g, '<br>');
       screenshotImg.src = dataUrlFromBase64(d.screenshot || '');
       axtreeArea.value = d.axtree || '';
       renderSuggestions(Array.isArray(d.suggestions) ? d.suggestions : []);

From 1ef4629d9ac0a6b6f2bf6f00e5d2520b00cecd60 Mon Sep 17 00:00:00 2001
From: Patrice Bechard <patrice.bechard@servicenow.com>
Date: Thu, 28 Aug 2025 12:12:01 -0400
Subject: [PATCH 5/8] add use_chat_ui / use_hint_labeling_ui flags and cosmetic changes

---
 browsergym/core/src/browsergym/core/env.py    | 35 +++++++++++++------
 .../core/src/browsergym/core/hint_labeling.py | 28 ++++++++++-----
 .../hint_labeling_files/hint_labeling_ui.html | 19 ++++++----
 .../src/browsergym/experiments/loop.py        |  2 ++
 4 files changed, 60 insertions(+), 24 deletions(-)

diff --git a/browsergym/core/src/browsergym/core/env.py b/browsergym/core/src/browsergym/core/env.py
index 2f918481e..548a1e919 100644
--- a/browsergym/core/src/browsergym/core/env.py
+++ b/browsergym/core/src/browsergym/core/env.py
@@ -69,6 +69,8 @@ def __init__(
         tags_to_mark: Literal["all", "standard_html"] = "standard_html",
         # interactive / debugging arguments
         headless: bool = True,
+        use_chat_ui: bool = False,
+        use_hint_labeling_ui: bool = False,
         wait_for_user_message: bool = False,
         terminate_on_infeasible: bool = True,
         resizeable_window: bool = False,
@@ -121,6 +123,8 @@ def __init__(
         self.action_mapping = action_mapping
         self.use_raw_page_output = use_raw_page_output
         self.pre_observation_delay = pre_observation_delay
+        self.use_chat_ui = use_chat_ui
+        self.use_hint_labeling_ui = use_hint_labeling_ui
 
         # check argument values
         assert tags_to_mark in ("all", "standard_html")
@@ -137,6 +141,10 @@ def __init__(
         # chat
         self.chat: Chat = None
 
+        # hint labeling
+        if self.use_hint_labeling_ui:
+            self.hint_labeling: "HintLabeling" = None
+
         # observation space
         if use_raw_page_output:
             self.observation_space = gym.spaces.Dict(
@@ -209,9 +217,12 @@ def close(self):
             self.task.teardown()
             self.task = None
         # close the chat
-        if self.chat:
-            self.chat.close()
-            self.chat = None
+        self.chat.close()
+        self.chat = None
+
+        if self.use_hint_labeling_ui and self.hint_labeling:
+            self.hint_labeling.close()
+            self.hint_labeling = None
         # close the browser context
         if self.context:
             self.context.close()
@@ -229,6 +240,8 @@ def reset(self, seed=None, *args, **kwargs):
             self.task.teardown()
             self.context.close()
             self.chat.close()
+            if self.use_hint_labeling_ui:
+                self.hint_labeling.close()
             self.browser.close()
 
         # create a new task
@@ -328,18 +341,20 @@ def override_property(task, env, property):
         )
 
         # create the chat
+        # chat always exist even is use_chat_ui is False since we use it to keep track of messages
         self.chat = Chat(
-            headless=self.headless,
+            headless=not (self.headless is False and self.use_chat_ui is True),
             chat_size=(500, max(viewport["height"], 800)),
             record_video_dir=self.record_video_dir,
         )
-        
+
         # create the hint labeling ui
-        self.hint_labeling = HintLabeling(
-            headless=self.headless,
-            window_size=(500, max(viewport["height"], 800)),
-            record_video_dir=self.record_video_dir,
-        )
+        if self.use_hint_labeling_ui:
+            self.hint_labeling = HintLabeling(
+                headless=self.headless,
+                window_size=(500, max(viewport["height"], 800)),
+                record_video_dir=self.record_video_dir,
+            )
 
         # create a new page
         self.page = self.context.new_page()
diff --git a/browsergym/core/src/browsergym/core/hint_labeling.py b/browsergym/core/src/browsergym/core/hint_labeling.py
index ca5bc5b1a..ae0cf4fc4 100644
--- a/browsergym/core/src/browsergym/core/hint_labeling.py
+++ b/browsergym/core/src/browsergym/core/hint_labeling.py
@@ -14,6 +14,7 @@
 
 # ------- Data Classes -------
 
+
 class HintLabelingInputs(BaseModel):
     goal: str
     error_feedback: str = ""
@@ -24,11 +25,13 @@ class HintLabelingInputs(BaseModel):
     # keep 'suggestions' on Python side, but we’ll map to UI 'suggestions'
     suggestions: List[Dict[str, str]] = Field(default_factory=list)
 
+
 # ------- Hint Labeling backend class -------
 
+
 class HintLabeling:
     def __init__(self, headless: bool, window_size=(600, 1000), *args, **kwargs):
-        
+
         pw: playwright.sync_api.Playwright = _get_global_playwright()
         self.browser = pw.chromium.launch(
             headless=headless, args=[f"--window-size={window_size[0]},{window_size[1]}"]
@@ -42,12 +45,14 @@ def __init__(self, headless: bool, window_size=(600, 1000), *args, **kwargs):
         self.page.route("**/api/reprompt", self._route_reprompt)
         self.page.route("**/api/submit", self._route_submit)
         self.page.set_content(get_hint_labeling_ui(HINT_LABELING_DIR))
-        
+
         # internal state
         self._context: HintLabelingInputs = None
         self._running = False
 
-    def _route_reprompt(self, route: playwright.sync_api.Route, request: playwright.sync_api.Request):
+    def _route_reprompt(
+        self, route: playwright.sync_api.Route, request: playwright.sync_api.Request
+    ):
         logger.info("Route hit: %s %s", request.method, request.url)
         try:
             body = json.loads(request.post_data() or "{}")
@@ -111,10 +116,14 @@ def wait_for_response(self, timeout: Optional[float] = 600) -> dict:
 
         def is_api(req: playwright.sync_api.Request) -> bool:
             u = req.url
-            return (u.endswith("/api/reprompt") or u.endswith("/api/submit")) and req.method == "POST"
+            return (
+                u.endswith("/api/reprompt") or u.endswith("/api/submit")
+            ) and req.method == "POST"
 
         # This pumps Playwright internally; no busy waiting.
-        with self.page.expect_request(is_api, timeout=(timeout * 1000 if timeout else 0)) as req_info:
+        with self.page.expect_request(
+            is_api, timeout=(timeout * 1000 if timeout else 0)
+        ) as req_info:
             req = req_info.value
 
         body_text = req.post_data or "{}"
@@ -127,8 +136,10 @@ def is_api(req: playwright.sync_api.Request) -> bool:
         if req.url.endswith("/api/reprompt"):
             msg = {"type": "reprompt", "payload": {"hint": body.get("hint", "")}}
         else:
-            msg = {"type": "step",
-                "payload": {"think": body.get("think", ""), "action": body.get("action", "")}}
+            msg = {
+                "type": "step",
+                "payload": {"think": body.get("think", ""), "action": body.get("action", "")},
+            }
 
         logger.info("Response received: %s", msg)
         return msg
@@ -137,7 +148,8 @@ def close(self):
         self.context.close()
         self.browser.close()
 
+
 def get_hint_labeling_ui(hint_labeling_dir) -> str:
     with open(hint_labeling_dir / "hint_labeling_ui.html", "r") as file:
         hint_labeling_html = file.read()
-    return hint_labeling_html
\ No newline at end of file
+    return hint_labeling_html
diff --git a/browsergym/core/src/browsergym/core/hint_labeling_files/hint_labeling_ui.html b/browsergym/core/src/browsergym/core/hint_labeling_files/hint_labeling_ui.html
index 1d7b069c0..6fc9c636b 100644
--- a/browsergym/core/src/browsergym/core/hint_labeling_files/hint_labeling_ui.html
+++ b/browsergym/core/src/browsergym/core/hint_labeling_files/hint_labeling_ui.html
@@ -57,19 +57,26 @@
       .grid{grid-template-columns: 1fr}
       .axtree{height:420px}
     }
+
+    #goalBox,
+    #errorBox {
+      white-space: pre-wrap;     /* respects \n and preserves runs of spaces; long lines still wrap */
+      overflow-wrap: anywhere;   /* wrap very long tokens (URLs/unbroken text) */
+      word-break: break-word;    /* fallback for older engines */
+    }
   </style>
 </head>
 <body>
   <div class="container">
     <!-- Top: Goal & Error -->
     <div class="grid" style="display: flex; gap: 16px;">
-      <div class="card pad" style="flex: 1; height: 150px; overflow-y: auto;">
+      <div class="card pad" style="flex: 1; height: 150px;">
         <h2>Goal</h2>
-        <div id="goalBox" style="padding: 12px 14px; font-size: 15px; background: #f8fafc;"></div>
+        <div id="goalBox" style="padding: 12px 14px; font-size: 15px; background: #f8fafc; height: 80%; overflow-y: auto;"></div>
       </div>
-      <div class="card pad" style="flex: 1; height: 150px; overflow-y: auto;">
+      <div class="card pad" style="flex: 1; height: 150px;">
         <h2>Error Feedback</h2>
-        <div id="errorBox" style="padding: 12px 14px; font-size: 15px; background: #fef2f2;"></div>
+        <div id="errorBox" style="padding: 12px 14px; font-size: 15px; background: #fef2f2; height: 80%; overflow-y: auto;"></div>
       </div>
     </div>
 
@@ -329,8 +336,8 @@ <h2>Suggestions</h2>
     // Initial render from BOOTSTRAP_DATA
     (function init(){
       const d = window.__BOOTSTRAP_DATA__;
-      goalBox.innerHTML = (d.goal || '').replace(/\n/g, '<br>');
-      errorBox.innerHTML = (d.error_feedback || '').replace(/\n/g, '<br>');
+      goalBox.textContent = d.goal || '';
+      errorBox.textContent = d.error_feedback || '';
       screenshotImg.src = dataUrlFromBase64(d.screenshot || '');
       axtreeArea.value = d.axtree || '';
       renderSuggestions(Array.isArray(d.suggestions) ? d.suggestions : []);
diff --git a/browsergym/experiments/src/browsergym/experiments/loop.py b/browsergym/experiments/src/browsergym/experiments/loop.py
index 9ed20fdde..40d36dd55 100644
--- a/browsergym/experiments/src/browsergym/experiments/loop.py
+++ b/browsergym/experiments/src/browsergym/experiments/loop.py
@@ -46,6 +46,8 @@ class EnvArgs(DataClassJsonMixin):
     slow_mo: Optional[int] = None  # use default value from BrowserGym
     storage_state: Optional[str | Path | dict] = None
     task_kwargs: Optional[dict] = None  # use default value from BrowserGym
+    use_chat_ui: bool = False
+    use_hint_labeling_ui: bool = False
 
     def make_env(
         self, action_mapping, exp_dir, exp_task_kwargs: dict = {}, use_raw_page_output=False

From 15f4c5e861390017e76ca0c0f5ad7f2d96fbef1a Mon Sep 17 00:00:00 2001
From: Patrice Bechard <patrice.bechard@servicenow.com>
Date: Thu, 28 Aug 2025 14:31:25 -0400
Subject: [PATCH 6/8] clean up env.py

---
 browsergym/core/src/browsergym/core/env.py | 14 ++++++++------
 1 file changed, 8 insertions(+), 6 deletions(-)

diff --git a/browsergym/core/src/browsergym/core/env.py b/browsergym/core/src/browsergym/core/env.py
index 548a1e919..26581d3a6 100644
--- a/browsergym/core/src/browsergym/core/env.py
+++ b/browsergym/core/src/browsergym/core/env.py
@@ -14,8 +14,8 @@
 from .action.base import execute_python_code
 from .action.highlevel import HighLevelActionSet
 from .chat import Chat
-from .hint_labeling import HintLabeling
 from .constants import BROWSERGYM_ID_ATTRIBUTE, EXTRACT_OBS_MAX_TRIES
+from .hint_labeling import HintLabeling
 from .observation import (
     MarkingError,
     _post_extract,
@@ -143,7 +143,7 @@ def __init__(
 
         # hint labeling
         if self.use_hint_labeling_ui:
-            self.hint_labeling: "HintLabeling" = None
+            self.hint_labeling: HintLabeling = None
 
         # observation space
         if use_raw_page_output:
@@ -217,8 +217,9 @@ def close(self):
             self.task.teardown()
             self.task = None
         # close the chat
-        self.chat.close()
-        self.chat = None
+        if self.chat:
+            self.chat.close()
+            self.chat = None
 
         if self.use_hint_labeling_ui and self.hint_labeling:
             self.hint_labeling.close()
@@ -240,7 +241,7 @@ def reset(self, seed=None, *args, **kwargs):
             self.task.teardown()
             self.context.close()
             self.chat.close()
-            if self.use_hint_labeling_ui:
+            if self.use_hint_labeling_ui and self.hint_labeling:
                 self.hint_labeling.close()
             self.browser.close()
 
@@ -342,6 +343,7 @@ def override_property(task, env, property):
 
         # create the chat
         # chat always exist even is use_chat_ui is False since we use it to keep track of messages
+        # we only show the chat ui if both headless is False and use_chat_ui is True
         self.chat = Chat(
             headless=not (self.headless is False and self.use_chat_ui is True),
             chat_size=(500, max(viewport["height"], 800)),
@@ -352,7 +354,7 @@ def override_property(task, env, property):
         if self.use_hint_labeling_ui:
             self.hint_labeling = HintLabeling(
                 headless=self.headless,
-                window_size=(500, max(viewport["height"], 800)),
+                window_size=(600, max(viewport["height"], 1000)),
                 record_video_dir=self.record_video_dir,
             )
 

From 5dc7b63129c030b831fc4d4d491e0c48422b2305 Mon Sep 17 00:00:00 2001
From: Patrice Bechard <patrice.bechard@servicenow.com>
Date: Thu, 28 Aug 2025 14:35:52 -0400
Subject: [PATCH 7/8] minimal cleanup

---
 .../core/src/browsergym/core/hint_labeling.py      | 13 ++++---------
 browsergym/core/src/browsergym/utils/obs.py        | 14 +++++++-------
 2 files changed, 11 insertions(+), 16 deletions(-)

diff --git a/browsergym/core/src/browsergym/core/hint_labeling.py b/browsergym/core/src/browsergym/core/hint_labeling.py
index ae0cf4fc4..45efac48d 100644
--- a/browsergym/core/src/browsergym/core/hint_labeling.py
+++ b/browsergym/core/src/browsergym/core/hint_labeling.py
@@ -1,19 +1,18 @@
+import json
+import logging
 from importlib import resources
+from queue import Queue
 from typing import Dict, List, Optional
 
-from queue import Queue, Empty
 import playwright.sync_api
 from pydantic import BaseModel, Field
-import logging
-import json
+
 from . import _get_global_playwright, hint_labeling_files
 
 logger = logging.getLogger(__name__)
 
 HINT_LABELING_DIR = resources.files(hint_labeling_files)
 
-# ------- Data Classes -------
-
 
 class HintLabelingInputs(BaseModel):
     goal: str
@@ -22,13 +21,9 @@ class HintLabelingInputs(BaseModel):
     axtree: str
     history: List[Dict[str, str]] = Field(default_factory=list)
     hint: str = ""
-    # keep 'suggestions' on Python side, but we’ll map to UI 'suggestions'
     suggestions: List[Dict[str, str]] = Field(default_factory=list)
 
 
-# ------- Hint Labeling backend class -------
-
-
 class HintLabeling:
     def __init__(self, headless: bool, window_size=(600, 1000), *args, **kwargs):
 
diff --git a/browsergym/core/src/browsergym/utils/obs.py b/browsergym/core/src/browsergym/utils/obs.py
index 0abeb30e4..6f70862a0 100644
--- a/browsergym/core/src/browsergym/utils/obs.py
+++ b/browsergym/core/src/browsergym/utils/obs.py
@@ -320,13 +320,13 @@ def dfs(node_idx: int, depth: int, parent_node_filtered: bool, parent_node_name:
             pass
         else:
             node_name = node["name"]["value"]
-            # if node_name == "":
-            #     try:
-            #         node_name_sources = node["name"]["sources"]
-            #         node_name_sources = [elem for elem in node_name_sources if elem.get("type") == "contents"][0]
-            #         node_name = node_name_sources.get("value", {}).get("value", "")
-            #     except Exception as e:
-            #         logger.warning(f"Failed to extract node name: {e}")
+            if node_name == "":
+                try:
+                    node_name_sources = node["name"]["sources"]
+                    node_name_sources = [elem for elem in node_name_sources if elem.get("type") == "contents"][0]
+                    node_name = node_name_sources.get("value", {}).get("value", "")
+                except Exception as e:
+                    logger.warning(f"Failed to extract node name: {e}")
             if "value" in node and "value" in node["value"]:
                 node_value = node["value"]["value"]
             else:

From 37bc1429e032ae2b4a714d192585eba905d766d0 Mon Sep 17 00:00:00 2001
From: Patrice Bechard <patrice.bechard@servicenow.com>
Date: Thu, 28 Aug 2025 14:37:16 -0400
Subject: [PATCH 8/8] remove unused changes

---
 browsergym/core/src/browsergym/utils/obs.py | 7 -------
 1 file changed, 7 deletions(-)

diff --git a/browsergym/core/src/browsergym/utils/obs.py b/browsergym/core/src/browsergym/utils/obs.py
index 6f70862a0..db5b8ce03 100644
--- a/browsergym/core/src/browsergym/utils/obs.py
+++ b/browsergym/core/src/browsergym/utils/obs.py
@@ -320,13 +320,6 @@ def dfs(node_idx: int, depth: int, parent_node_filtered: bool, parent_node_name:
             pass
         else:
             node_name = node["name"]["value"]
-            if node_name == "":
-                try:
-                    node_name_sources = node["name"]["sources"]
-                    node_name_sources = [elem for elem in node_name_sources if elem.get("type") == "contents"][0]
-                    node_name = node_name_sources.get("value", {}).get("value", "")
-                except Exception as e:
-                    logger.warning(f"Failed to extract node name: {e}")
             if "value" in node and "value" in node["value"]:
                 node_value = node["value"]["value"]
             else: