diff --git a/agent/outerloop-results/autoresearch_phase4_log.txt b/agent/outerloop-results/autoresearch_phase4_log.txt index 2c94c20..a617fdc 100644 --- a/agent/outerloop-results/autoresearch_phase4_log.txt +++ b/agent/outerloop-results/autoresearch_phase4_log.txt @@ -810,3 +810,14 @@ [2026-04-16 19:09:41] [Wave4] Proposed params: {'learning_rate': 0.0003128257557719074, 'steps_per_switch': 6836, 'total_timesteps': 62683} [2026-04-16 19:09:43] [Wave4] Launching trial 25: {'learning_rate': 0.0003128257557719074, 'steps_per_switch': 6836, 'total_timesteps': 62683} [2026-04-16 19:09:43] [Wave4] Command: python3 /home/paulh/projects/donkeycar-rl-autoresearch/agent/multitrack_runner.py --total-timesteps 62683 --steps-per-switch 6836 --learning-rate 0.0003128257557719074 --eval-episodes 3 --save-dir /home/paulh/projects/donkeycar-rl-autoresearch/agent/models/wave4-trial-0025 +[2026-04-16 20:01:51] [Wave4] Trial 25 finished in 3128.1s, rc=0 +[2026-04-16 20:01:51] [Wave4] Parsed: combined=1542.9971 mini_monaco=1542.9971 +[2026-04-16 20:01:51] [Wave4] ===== Trial 25 Summary ===== +[2026-04-16 20:01:51] GP data points : 25 +[2026-04-16 20:01:51] Wave4 Champion: trial=3 score=1943.10 params={'learning_rate': 0.0006852550685205609, 'steps_per_switch': 17499, 'total_timesteps': 157743} +[2026-04-16 20:01:51] Top 5: +[2026-04-16 20:01:51] score=1943.10 params={'learning_rate': 0.0006852550685205609, 'steps_per_switch': 17499, 'total_timesteps': 90000} +[2026-04-16 20:01:51] score=1573.07 params={'learning_rate': 0.00033896311195395496, 'steps_per_switch': 5448, 'total_timesteps': 69359} +[2026-04-16 20:01:51] score=1543.00 params={'learning_rate': 0.0003128257557719074, 'steps_per_switch': 6836, 'total_timesteps': 62683} +[2026-04-16 20:01:51] score=1435.04 params={'learning_rate': 0.0007252855740444645, 'steps_per_switch': 6851, 'total_timesteps': 89893} +[2026-04-16 20:01:51] score=230.98 params={'learning_rate': 0.0006672844816013197, 'steps_per_switch': 4747, 'total_timesteps': 64179} diff --git a/agent/outerloop-results/autoresearch_results_phase4.jsonl b/agent/outerloop-results/autoresearch_results_phase4.jsonl index 6f94b2c..6a937d6 100644 --- a/agent/outerloop-results/autoresearch_results_phase4.jsonl +++ b/agent/outerloop-results/autoresearch_results_phase4.jsonl @@ -22,3 +22,4 @@ {"trial": 22, "timestamp": "2026-04-16T17:13:22.634461", "params": {"learning_rate": 0.0010680884757571496, "steps_per_switch": 3269, "total_timesteps": 81912}, "combined_test_score": 193.2341, "mini_monaco_reward": 193.2341, "model_path": "/home/paulh/projects/donkeycar-rl-autoresearch/agent/models/wave4-trial-0022/model.zip", "champion": false, "run_status": "ok", "elapsed_sec": 5520.664301395416} {"trial": 23, "timestamp": "2026-04-16T18:26:11.713980", "params": {"learning_rate": 0.0003194840316570061, "steps_per_switch": 4507, "total_timesteps": 66965}, "combined_test_score": 150.773, "mini_monaco_reward": 150.773, "model_path": "/home/paulh/projects/donkeycar-rl-autoresearch/agent/models/wave4-trial-0023/model.zip", "champion": false, "run_status": "ok", "elapsed_sec": 4365.0226583480835} {"trial": 24, "timestamp": "2026-04-16T19:09:39.779549", "params": {"learning_rate": 0.0003596012644521025, "steps_per_switch": 8013, "total_timesteps": 60054}, "combined_test_score": 37.824, "mini_monaco_reward": 37.824, "model_path": "/home/paulh/projects/donkeycar-rl-autoresearch/agent/models/wave4-trial-0024/model.zip", "champion": false, "run_status": "ok", "elapsed_sec": 2604.015403985977} +{"trial": 25, "timestamp": "2026-04-16T20:01:51.940115", "params": {"learning_rate": 0.0003128257557719074, "steps_per_switch": 6836, "total_timesteps": 62683}, "combined_test_score": 1542.9971, "mini_monaco_reward": 1542.9971, "model_path": "/home/paulh/projects/donkeycar-rl-autoresearch/agent/models/wave4-trial-0025/model.zip", "champion": false, "run_status": "ok", "elapsed_sec": 3128.128504514694}