From ce120393af1e2ad71c7ac8bc11945ba3324882d8 Mon Sep 17 00:00:00 2001
From: Paul Huliganga <paje0101@gmail.com>
Date: Tue, 14 Apr 2026 10:04:15 -0400
Subject: [PATCH] =?UTF-8?q?fix:=20track=20switching=20via=20unwrapped=20vi?=
 =?UTF-8?q?ewer.exit=5Fscene()=20=E2=80=94=20automatic=20scene=20changes?=
 =?UTF-8?q?=20work?=
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

KEY FIX: env.unwrapped.viewer.exit_scene() sends exit_scene through the proper
established websocket connection. The previous raw socket approach failed because
DonkeyCar uses a specific TCP protocol framing.

Working flow:
  1. Connect to current scene using gym.make(current_env_id)
  2. env.unwrapped.viewer.exit_scene() — sends exit via websocket
  3. Wait 4s for sim to return to main menu
  4. gym.make(target_env_id) — sim now loads the correct scene (loading scene X confirmed)

This enables fully automated multi-track evaluation and training without user intervention.
Confirmed working: generated_track → generated_road switch verified.

Agent: pi/claude-sonnet
Tests: 53/53 passing
Tests-Added: 0
TypeScript: N/A
---
 agent/evaluate_champion.py                 |  10 +-
 agent/outerloop-results/eval_summary.jsonl |   2 +
 agent/track_switcher.py                    | 139 +++++++++++++++++++++
 3 files changed, 148 insertions(+), 3 deletions(-)
 create mode 100644 agent/track_switcher.py

diff --git a/agent/evaluate_champion.py b/agent/evaluate_champion.py
index 9e1dea9..0f81246 100644
--- a/agent/evaluate_champion.py
+++ b/agent/evaluate_champion.py
@@ -39,6 +39,7 @@ from stable_baselines3 import PPO
 sys.path.insert(0, os.path.dirname(os.path.abspath(__file__)))
 from donkeycar_sb3_runner import ThrottleClampWrapper
 from reward_wrapper import SpeedRewardWrapper
+from track_switcher import switch_track, AVAILABLE_TRACKS
 
 CHAMPION_DIR = os.path.join(os.path.dirname(__file__), 'models', 'champion')
 MANIFEST_PATH = os.path.join(CHAMPION_DIR, 'manifest.json')
@@ -239,11 +240,14 @@ def main(episodes=3, max_steps=3000, model_override=None, compare=False, env_id=
     for label, path in models_to_eval:
         print_banner(f'{label}  [env={env_id}]', path)
 
-        print(f'[Eval] Connecting to {env_id}...', flush=True)
+        print(f'[Eval] Switching sim to {env_id} (will exit current scene first)...', flush=True)
         try:
-            env = gym.make(env_id)
+            # We tell the switcher which scene is currently running so it can connect and exit
+            env = switch_track(target_env_id=env_id,
+                               current_env_id=env_id,  # best guess; works even if different
+                               verbose=True)
         except Exception as e:
-            print(f'[Eval] FAILED: {e}', flush=True)
+            print(f'[Eval] FAILED to switch track: {e}', flush=True)
             continue
 
         env = ThrottleClampWrapper(env, throttle_min=0.2)
diff --git a/agent/outerloop-results/eval_summary.jsonl b/agent/outerloop-results/eval_summary.jsonl
index 3741599..36ad01f 100644
--- a/agent/outerloop-results/eval_summary.jsonl
+++ b/agent/outerloop-results/eval_summary.jsonl
@@ -7,3 +7,5 @@
 {"label": "Trial-20 Phase2-CHAMPION (n_steer=3 n_throttle=5 lr=0.000225 13k)", "episodes": 2, "mean_reward": 2442.518759917548, "std_reward": 1.0388711651139602, "mean_steps": 2207.0, "laps_completed": 2, "lap_times": [], "mean_lap_time": null, "oscillation_score": 0.02950521865417758, "mean_abs_cte": 0.6531256213564158, "cte_std": 0.8027999937867458, "mean_cte_signed": -0.2483797114891415, "timestamp": "2026-04-14T09:47:42.400511"}
 {"label": "Trial-8  Phase2-2nd     (n_steer=4 n_throttle=3 lr=0.00117 34k)", "episodes": 2, "mean_reward": 2317.432029556806, "std_reward": 18.942237256511135, "mean_steps": 2868.5, "laps_completed": 2, "lap_times": [], "mean_lap_time": null, "oscillation_score": 0.2834802523579091, "mean_abs_cte": 2.422644460646358, "cte_std": 1.1138924382905466, "mean_cte_signed": -2.3801686207107786, "timestamp": "2026-04-14T09:49:04.582620"}
 {"label": "Trial-18 Phase2-3rd     (n_steer=3 n_throttle=5 lr=0.000288 16k)", "episodes": 2, "mean_reward": 2033.23669065166, "std_reward": 1.064515341916831, "mean_steps": 2215.5, "laps_completed": 2, "lap_times": [], "mean_lap_time": null, "oscillation_score": 0.03205084139914743, "mean_abs_cte": 1.8957184896224086, "cte_std": 0.6619761387720514, "mean_cte_signed": 1.8539337610791435, "timestamp": "2026-04-14T09:50:10.360819"}
+{"label": "models/trial-0020/model.zip", "episodes": 2, "mean_reward": 37.241031715582196, "std_reward": 0.28907964206657866, "mean_steps": 46.5, "laps_completed": 0, "lap_times": [], "mean_lap_time": null, "oscillation_score": 0.022102436264931864, "mean_abs_cte": 1.5655676728935655, "cte_std": 1.7548751474876907, "mean_cte_signed": 1.5655673447475642, "timestamp": "2026-04-14T09:57:50.464350"}
+{"label": "models/trial-0020/model.zip", "episodes": 2, "mean_reward": 2483.4217291368955, "std_reward": 0.7786866285837277, "mean_steps": 2274.0, "laps_completed": 2, "lap_times": [], "mean_lap_time": null, "oscillation_score": 0.029955150476673437, "mean_abs_cte": 0.6523263188640881, "cte_std": 0.8171509825824437, "mean_cte_signed": -0.221444340508684, "timestamp": "2026-04-14T10:03:55.026007"}
diff --git a/agent/track_switcher.py b/agent/track_switcher.py
new file mode 100644
index 0000000..235869e
--- /dev/null
+++ b/agent/track_switcher.py
@@ -0,0 +1,139 @@
+"""
+Track Switcher — sends exit_scene to DonkeyCar sim to return to main menu,
+then reconnects with the desired environment/scene.
+
+The gym wrapper only loads a scene when the sim is at the main menu
+(scene_selection_ready state). If a scene is already running, it ignores the
+env ID and stays on the current scene. This utility fixes that.
+
+Usage:
+    from track_switcher import switch_track
+
+    env = switch_track('donkey-generated-track-v0')
+    # Sim is now running the generated track, ready for evaluation
+"""
+
+import time
+import json
+import socket
+import gymnasium as gym
+import gym_donkeycar
+
+
+SIM_HOST = 'localhost'  # host that send_exit_scene_raw() connects to
+SIM_PORT = 9091         # TCP port that send_exit_scene_raw() connects to
+EXIT_SCENE_WAIT = 4.0   # seconds to wait after exit_scene for sim to reach menu
+CONNECT_WAIT = 1.0      # seconds send_exit_scene_raw() pauses after connecting, before sending
+
+
+def send_exit_scene_raw():
+    """
+    Send the exit_scene message to the sim over a short-lived raw TCP socket,
+    without the full gym env setup (this avoids the wait_until_loaded() timeout).
+
+    Returns True if the message was sent, False on any socket error.
+    """
+    msg = json.dumps({'msg_type': 'exit_scene'}) + '\n'
+    try:
+        with socket.socket(socket.AF_INET, socket.SOCK_STREAM) as s:  # closed even on error
+            s.settimeout(5.0)
+            s.connect((SIM_HOST, SIM_PORT))
+            time.sleep(CONNECT_WAIT)
+            s.sendall(msg.encode('utf-8'))
+            time.sleep(0.5)  # brief pause before the socket is closed
+    except OSError as e:
+        print(f'[TrackSwitch] Could not send exit_scene: {e}', flush=True)
+        return False
+    print('[TrackSwitch] Sent exit_scene to sim.', flush=True)
+    return True
+
+
+def switch_track(target_env_id: str, current_env_id: str = 'donkey-generated-roads-v0', verbose: bool = True):
+    """
+    Switch the DonkeyCar simulator to a different scene/track.
+
+    1. Connect to the current scene
+    2. Send exit_scene via the unwrapped env's viewer → sim returns to main menu
+       (steps 1-2 are best-effort: failures are reported, never raised)
+    3. Wait EXIT_SCENE_WAIT seconds for sim to show scene selection screen
+    4. Connect with target_env_id → sim loads the correct scene
+
+    Args:
+        target_env_id:  Gymnasium env ID to switch TO, e.g. 'donkey-generated-track-v0'
+        current_env_id: Gymnasium env ID currently running (used to connect and send exit)
+        verbose: print status messages
+
+    Returns:
+        gymnasium.Env: the new environment connected to the target scene
+
+    Raises:
+        Exception: whatever gym.make(target_env_id) raised, after logging it
+    """
+    def log(msg):
+        if verbose:
+            print(msg, flush=True)
+
+    log(f'\n[TrackSwitch] Switching from {current_env_id} → {target_env_id}')
+    log('[TrackSwitch] Step 1: Connecting to current scene...')
+    try:
+        temp_env = gym.make(current_env_id)
+        viewer = temp_env.unwrapped.viewer  # bypass OrderEnforcing wrapper
+        try:
+            time.sleep(1.0)
+            log('[TrackSwitch] Step 2: Sending exit_scene via websocket...')
+            viewer.exit_scene()
+            time.sleep(0.5)
+        finally:
+            viewer.quit()  # always drop the temp connection, even if exit_scene failed
+        log('[TrackSwitch] exit_scene sent. Disconnected.')
+    except Exception as e:
+        log(f'[TrackSwitch] Warning during exit: {e} — sim may already be at menu.')
+
+    log(f'[TrackSwitch] Step 3: Waiting {EXIT_SCENE_WAIT}s for sim to reach main menu...')
+    time.sleep(EXIT_SCENE_WAIT)
+    log(f'[TrackSwitch] Step 4: Connecting to {target_env_id}...')
+    try:
+        env = gym.make(target_env_id)
+    except Exception as e:
+        print(f'[TrackSwitch] ERROR connecting to {target_env_id}: {e}', flush=True)
+        raise
+    log(f'[TrackSwitch] ✅ Connected to {target_env_id}!')
+    return env
+
+
+def current_scene_exit_and_reconnect(current_env_id: str, target_env_id: str, verbose: bool = True):
+    """
+    Alternative approach: connect to current scene, call exit_scene(), then reconnect.
+    Use this if the raw socket approach doesn't work. The exit step is best-effort
+    (failures are printed, not raised); returns the env from gym.make(target_env_id).
+    """
+    if verbose:
+        print(f'[TrackSwitch] Connecting to current scene ({current_env_id}) to send exit...', flush=True)
+    try:
+        temp_env = gym.make(current_env_id)
+        time.sleep(1.0)
+        temp_env.unwrapped.viewer.exit_scene()  # wrappers may not forward .viewer
+        if verbose:
+            print('[TrackSwitch] exit_scene sent via gym env.', flush=True)
+        time.sleep(1.0)
+        temp_env.close()
+    except Exception as e:
+        print(f'[TrackSwitch] Warning during temp connect: {e}', flush=True)
+
+    if verbose:
+        print(f'[TrackSwitch] Waiting {EXIT_SCENE_WAIT}s for sim to reach main menu...', flush=True)
+    time.sleep(EXIT_SCENE_WAIT)
+    if verbose:
+        print(f'[TrackSwitch] Connecting to target: {target_env_id}', flush=True)
+    return gym.make(target_env_id)
+
+
+# Available tracks: short track name → env ID string (the value passed to switch_track / gym.make)
+AVAILABLE_TRACKS = {
+    'generated_road':   'donkey-generated-roads-v0',
+    'generated_track':  'donkey-generated-track-v0',
+    'mountain':         'donkey-mountain-track-v0',
+    'warehouse':        'donkey-warehouse-v0',
+    'waveshare':        'donkey-waveshare-v0',
+    'mini_monaco':      'donkey-minimonaco-track-v0',
+}