更新算法模版
This commit is contained in:
@@ -0,0 +1,25 @@
|
||||
{
|
||||
"algo_name": "DDPG",
|
||||
"env_name": "Pendulum-v1",
|
||||
"train_eps": 300,
|
||||
"test_eps": 20,
|
||||
"max_steps": 100000,
|
||||
"gamma": 0.99,
|
||||
"critic_lr": 0.001,
|
||||
"actor_lr": 0.0001,
|
||||
"memory_capacity": 8000,
|
||||
"batch_size": 128,
|
||||
"target_update": 2,
|
||||
"tau": 0.01,
|
||||
"critic_hidden_dim": 256,
|
||||
"actor_hidden_dim": 256,
|
||||
"device": "cpu",
|
||||
"seed": 1,
|
||||
"show_fig": false,
|
||||
"save_fig": true,
|
||||
"result_path": "/Users/jj/Desktop/rl-tutorials/codes/DDPG/outputs/Pendulum-v1/20220927-155053/results/",
|
||||
"model_path": "/Users/jj/Desktop/rl-tutorials/codes/DDPG/outputs/Pendulum-v1/20220927-155053/models/",
|
||||
"n_states": 3,
|
||||
"n_actions": 1,
|
||||
"training_time": 358.8142900466919
|
||||
}
|
||||
Reference in New Issue
Block a user