更新算法模版
This commit is contained in:
@@ -0,0 +1,25 @@
|
||||
{
|
||||
"algo_name": "PPO",
|
||||
"env_name": "CartPole-v0",
|
||||
"continuous": false,
|
||||
"train_eps": 200,
|
||||
"test_eps": 20,
|
||||
"gamma": 0.99,
|
||||
"batch_size": 5,
|
||||
"n_epochs": 4,
|
||||
"actor_lr": 0.0003,
|
||||
"critic_lr": 0.0003,
|
||||
"gae_lambda": 0.95,
|
||||
"policy_clip": 0.2,
|
||||
"update_fre": 20,
|
||||
"actor_hidden_dim": 256,
|
||||
"critic_hidden_dim": 256,
|
||||
"device": "cpu",
|
||||
"seed": 10,
|
||||
"show_fig": false,
|
||||
"save_fig": true,
|
||||
"result_path": "c:\\Users\\24438\\Desktop\\rl-tutorials\\codes\\PPO/outputs/CartPole-v0/20220920-213310/results/",
|
||||
"model_path": "c:\\Users\\24438\\Desktop\\rl-tutorials\\codes\\PPO/outputs/CartPole-v0/20220920-213310/models/",
|
||||
"n_states": 4,
|
||||
"n_actions": 2
|
||||
}
|
||||
Reference in New Issue
Block a user