Improve PPO diagnostics and recharge behavior
This commit is contained in:
@@ -21,9 +21,9 @@ if __name__ == "__main__":
|
||||
algorithm_name=algorithm_name,
|
||||
algorithm_name_list=algorithm_name_list,
|
||||
env_vars={
|
||||
"replay_buffer_capacity": "10",
|
||||
"preload_ratio": "0.2",
|
||||
"replay_buffer_capacity": "8",
|
||||
"preload_ratio": "0.1",
|
||||
"train_batch_size": "2",
|
||||
"dump_model_freq": "1",
|
||||
"dump_model_freq": "100",
|
||||
},
|
||||
)
|
||||
|
||||
Reference in New Issue
Block a user