Improve PPO diagnostics and recharge behavior

This commit is contained in:
2026-04-26 20:24:26 +08:00
parent 5b6133db13
commit 69b8a692db
6 changed files with 463 additions and 31 deletions

View File

@@ -21,9 +21,9 @@ if __name__ == "__main__":
 algorithm_name=algorithm_name,
 algorithm_name_list=algorithm_name_list,
 env_vars={
-"replay_buffer_capacity": "10",
-"preload_ratio": "0.2",
+"replay_buffer_capacity": "8",
+"preload_ratio": "0.1",
 "train_batch_size": "2",
-"dump_model_freq": "1",
+"dump_model_freq": "100",
 },
 )