更新算法模版
This commit is contained in:
@@ -0,0 +1,19 @@
|
||||
general_cfg:
|
||||
algo_name: QLearning
|
||||
device: cpu
|
||||
env_name: FrozenLakeNoSlippery-v1
|
||||
load_checkpoint: true
|
||||
load_path: Train_FrozenLakeNoSlippery-v1_QLearning_20221030-014504
|
||||
max_steps: 200
|
||||
mode: test
|
||||
save_fig: true
|
||||
seed: 10
|
||||
show_fig: false
|
||||
test_eps: 20
|
||||
train_eps: 800
|
||||
algo_cfg:
|
||||
epsilon_decay: 2000
|
||||
epsilon_end: 0.1
|
||||
epsilon_start: 0.7
|
||||
gamma: 0.95
|
||||
lr: 0.9
|
||||
@@ -0,0 +1,24 @@
|
||||
2022-10-30 01:45:52 - r - INFO: - n_states: 16, n_actions: 4
|
||||
2022-10-30 01:45:52 - r - INFO: - Start testing!
|
||||
2022-10-30 01:45:52 - r - INFO: - Env: FrozenLakeNoSlippery-v1, Algorithm: QLearning, Device: cpu
|
||||
2022-10-30 01:45:52 - r - INFO: - Episode: 1/20, Steps:6 Reward: 1.00
|
||||
2022-10-30 01:45:52 - r - INFO: - Episode: 2/20, Steps:6 Reward: 1.00
|
||||
2022-10-30 01:45:52 - r - INFO: - Episode: 3/20, Steps:6 Reward: 1.00
|
||||
2022-10-30 01:45:52 - r - INFO: - Episode: 4/20, Steps:6 Reward: 1.00
|
||||
2022-10-30 01:45:52 - r - INFO: - Episode: 5/20, Steps:6 Reward: 1.00
|
||||
2022-10-30 01:45:52 - r - INFO: - Episode: 6/20, Steps:6 Reward: 1.00
|
||||
2022-10-30 01:45:52 - r - INFO: - Episode: 7/20, Steps:6 Reward: 1.00
|
||||
2022-10-30 01:45:52 - r - INFO: - Episode: 8/20, Steps:6 Reward: 1.00
|
||||
2022-10-30 01:45:52 - r - INFO: - Episode: 9/20, Steps:6 Reward: 1.00
|
||||
2022-10-30 01:45:52 - r - INFO: - Episode: 10/20, Steps:6 Reward: 1.00
|
||||
2022-10-30 01:45:52 - r - INFO: - Episode: 11/20, Steps:6 Reward: 1.00
|
||||
2022-10-30 01:45:52 - r - INFO: - Episode: 12/20, Steps:6 Reward: 1.00
|
||||
2022-10-30 01:45:52 - r - INFO: - Episode: 13/20, Steps:6 Reward: 1.00
|
||||
2022-10-30 01:45:52 - r - INFO: - Episode: 14/20, Steps:6 Reward: 1.00
|
||||
2022-10-30 01:45:52 - r - INFO: - Episode: 15/20, Steps:6 Reward: 1.00
|
||||
2022-10-30 01:45:52 - r - INFO: - Episode: 16/20, Steps:6 Reward: 1.00
|
||||
2022-10-30 01:45:52 - r - INFO: - Episode: 17/20, Steps:6 Reward: 1.00
|
||||
2022-10-30 01:45:52 - r - INFO: - Episode: 18/20, Steps:6 Reward: 1.00
|
||||
2022-10-30 01:45:52 - r - INFO: - Episode: 19/20, Steps:6 Reward: 1.00
|
||||
2022-10-30 01:45:52 - r - INFO: - Episode: 20/20, Steps:6 Reward: 1.00
|
||||
2022-10-30 01:45:52 - r - INFO: - Finish testing!
|
||||
Binary file not shown.
Binary file not shown.
|
After Width: | Height: | Size: 24 KiB |
@@ -0,0 +1,21 @@
|
||||
episodes,rewards,steps
|
||||
0,1.0,6
|
||||
1,1.0,6
|
||||
2,1.0,6
|
||||
3,1.0,6
|
||||
4,1.0,6
|
||||
5,1.0,6
|
||||
6,1.0,6
|
||||
7,1.0,6
|
||||
8,1.0,6
|
||||
9,1.0,6
|
||||
10,1.0,6
|
||||
11,1.0,6
|
||||
12,1.0,6
|
||||
13,1.0,6
|
||||
14,1.0,6
|
||||
15,1.0,6
|
||||
16,1.0,6
|
||||
17,1.0,6
|
||||
18,1.0,6
|
||||
19,1.0,6
|
||||
|
Reference in New Issue
Block a user