donkeycar-rl-autoresearch/agent/outerloop-results/autoresearch_results_phase1...

11 lines
4.6 KiB
JSON

{"trial": 1, "timestamp": "2026-04-13T12:31:19.488414", "params": {"n_steer": 9, "n_throttle": 3, "learning_rate": 0.00014623033103219074, "timesteps": 3139, "agent": "ppo", "eval_episodes": 3, "reward_shaping": true}, "mean_reward": 270.5642, "std_reward": 0.1427, "model_path": "/home/paulh/projects/donkeycar-rl-autoresearch/agent/models/trial-0001/model.zip", "champion": true, "run_status": "ok", "elapsed_sec": 200.94285488128662, "reward_hacking_suspected": false}
{"trial": 2, "timestamp": "2026-04-13T12:33:09.872158", "params": {"n_steer": 6, "n_throttle": 4, "learning_rate": 0.0021131130619403186, "timesteps": 1622, "agent": "ppo", "eval_episodes": 3, "reward_shaping": true}, "mean_reward": 15.537, "std_reward": 0.0257, "model_path": "/home/paulh/projects/donkeycar-rl-autoresearch/agent/models/trial-0002/model.zip", "champion": false, "run_status": "ok", "elapsed_sec": 106.36946535110474, "reward_hacking_suspected": false}
{"trial": 3, "timestamp": "2026-04-13T12:34:55.161415", "params": {"n_steer": 7, "n_throttle": 3, "learning_rate": 0.002684399373384131, "timesteps": 1755, "agent": "ppo", "eval_episodes": 3, "reward_shaping": true}, "mean_reward": 15.0687, "std_reward": 0.0219, "model_path": "/home/paulh/projects/donkeycar-rl-autoresearch/agent/models/trial-0003/model.zip", "champion": false, "run_status": "ok", "elapsed_sec": 101.27748799324036, "reward_hacking_suspected": false}
{"trial": 4, "timestamp": "2026-04-13T12:39:56.555101", "params": {"n_steer": 9, "n_throttle": 3, "learning_rate": 0.0009549126527603771, "timesteps": 4279, "agent": "ppo", "eval_episodes": 3, "reward_shaping": true}, "mean_reward": 627.6915, "std_reward": 2.3536, "model_path": "/home/paulh/projects/donkeycar-rl-autoresearch/agent/models/trial-0004/model.zip", "champion": true, "run_status": "ok", "elapsed_sec": 297.3021275997162, "reward_hacking_suspected": false}
{"trial": 5, "timestamp": "2026-04-13T12:45:43.094106", "params": {"n_steer": 7, "n_throttle": 3, "learning_rate": 0.0006801262090358742, "timesteps": 4787, "agent": "ppo", "eval_episodes": 3, "reward_shaping": true}, "mean_reward": 4582.7984, "std_reward": 0.4849, "model_path": "/home/paulh/projects/donkeycar-rl-autoresearch/agent/models/trial-0005/model.zip", "champion": true, "run_status": "ok", "elapsed_sec": 342.3742210865021, "reward_hacking_suspected": false}
{"trial": 6, "timestamp": "2026-04-13T12:51:14.032008", "params": {"n_steer": 6, "n_throttle": 3, "learning_rate": 0.0005165618383365869, "timesteps": 4929, "agent": "ppo", "eval_episodes": 3, "reward_shaping": true}, "mean_reward": 454.064, "std_reward": 2.7272, "model_path": "/home/paulh/projects/donkeycar-rl-autoresearch/agent/models/trial-0006/model.zip", "champion": false, "run_status": "ok", "elapsed_sec": 326.92552065849304, "reward_hacking_suspected": false}
{"trial": 7, "timestamp": "2026-04-13T12:56:20.922347", "params": {"n_steer": 7, "n_throttle": 4, "learning_rate": 0.002103379184926248, "timesteps": 4607, "agent": "ppo", "eval_episodes": 3, "reward_shaping": true}, "mean_reward": 199.5367, "std_reward": 2.4906, "model_path": "/home/paulh/projects/donkeycar-rl-autoresearch/agent/models/trial-0007/model.zip", "champion": false, "run_status": "ok", "elapsed_sec": 302.873496055603, "reward_hacking_suspected": false}
{"trial": 8, "timestamp": "2026-04-13T13:01:28.616838", "params": {"n_steer": 8, "n_throttle": 3, "learning_rate": 0.0003097316245852375, "timesteps": 4938, "agent": "ppo", "eval_episodes": 3, "reward_shaping": true}, "mean_reward": 306.1739, "std_reward": 13.6044, "model_path": "/home/paulh/projects/donkeycar-rl-autoresearch/agent/models/trial-0008/model.zip", "champion": false, "run_status": "ok", "elapsed_sec": 303.6810266971588, "reward_hacking_suspected": false}
{"trial": 9, "timestamp": "2026-04-13T13:05:16.112705", "params": {"n_steer": 7, "n_throttle": 3, "learning_rate": 0.0014813539623020004, "timesteps": 4054, "agent": "ppo", "eval_episodes": 3, "reward_shaping": true}, "mean_reward": 15.5625, "std_reward": 0.0011, "model_path": "/home/paulh/projects/donkeycar-rl-autoresearch/agent/models/trial-0009/model.zip", "champion": false, "run_status": "ok", "elapsed_sec": 223.47979998588562, "reward_hacking_suspected": false}
{"trial": 10, "timestamp": "2026-04-13T13:11:06.106880", "params": {"n_steer": 7, "n_throttle": 2, "learning_rate": 0.0010464507674264373, "timesteps": 4450, "agent": "ppo", "eval_episodes": 3, "reward_shaping": true}, "mean_reward": 682.7352, "std_reward": 420.9113, "model_path": "/home/paulh/projects/donkeycar-rl-autoresearch/agent/models/trial-0010/model.zip", "champion": false, "run_status": "ok", "elapsed_sec": 345.9794178009033, "reward_hacking_suspected": false}