更新算法模版
This commit is contained in:
@@ -0,0 +1,21 @@
|
||||
general_cfg:
|
||||
algo_name: QLearning
|
||||
device: cpu
|
||||
env_name: CliffWalking-v0
|
||||
load_checkpoint: true
|
||||
load_path: Train_CliffWalking-v0_QLearning_20221030-013856
|
||||
max_steps: 200
|
||||
mode: test
|
||||
save_fig: true
|
||||
seed: 1
|
||||
show_fig: false
|
||||
test_eps: 20
|
||||
train_eps: 400
|
||||
algo_cfg:
|
||||
batch_size: 64
|
||||
buffer_size: 100000
|
||||
epsilon_decay: 300
|
||||
epsilon_end: 0.01
|
||||
epsilon_start: 0.95
|
||||
gamma: 0.95
|
||||
lr: 0.1
|
||||
@@ -0,0 +1,24 @@
|
||||
2022-10-30 01:41:51 - r - INFO: - n_states: 48, n_actions: 4
|
||||
2022-10-30 01:41:51 - r - INFO: - Start testing!
|
||||
2022-10-30 01:41:51 - r - INFO: - Env: CliffWalking-v0, Algorithm: QLearning, Device: cpu
|
||||
2022-10-30 01:41:51 - r - INFO: - Episode: 1/20, Steps:13 Reward: -13.00
|
||||
2022-10-30 01:41:51 - r - INFO: - Episode: 2/20, Steps:13 Reward: -13.00
|
||||
2022-10-30 01:41:51 - r - INFO: - Episode: 3/20, Steps:13 Reward: -13.00
|
||||
2022-10-30 01:41:51 - r - INFO: - Episode: 4/20, Steps:13 Reward: -13.00
|
||||
2022-10-30 01:41:51 - r - INFO: - Episode: 5/20, Steps:13 Reward: -13.00
|
||||
2022-10-30 01:41:51 - r - INFO: - Episode: 6/20, Steps:13 Reward: -13.00
|
||||
2022-10-30 01:41:51 - r - INFO: - Episode: 7/20, Steps:13 Reward: -13.00
|
||||
2022-10-30 01:41:51 - r - INFO: - Episode: 8/20, Steps:13 Reward: -13.00
|
||||
2022-10-30 01:41:51 - r - INFO: - Episode: 9/20, Steps:13 Reward: -13.00
|
||||
2022-10-30 01:41:51 - r - INFO: - Episode: 10/20, Steps:13 Reward: -13.00
|
||||
2022-10-30 01:41:51 - r - INFO: - Episode: 11/20, Steps:13 Reward: -13.00
|
||||
2022-10-30 01:41:51 - r - INFO: - Episode: 12/20, Steps:13 Reward: -13.00
|
||||
2022-10-30 01:41:51 - r - INFO: - Episode: 13/20, Steps:13 Reward: -13.00
|
||||
2022-10-30 01:41:51 - r - INFO: - Episode: 14/20, Steps:13 Reward: -13.00
|
||||
2022-10-30 01:41:51 - r - INFO: - Episode: 15/20, Steps:13 Reward: -13.00
|
||||
2022-10-30 01:41:51 - r - INFO: - Episode: 16/20, Steps:13 Reward: -13.00
|
||||
2022-10-30 01:41:51 - r - INFO: - Episode: 17/20, Steps:13 Reward: -13.00
|
||||
2022-10-30 01:41:51 - r - INFO: - Episode: 18/20, Steps:13 Reward: -13.00
|
||||
2022-10-30 01:41:51 - r - INFO: - Episode: 19/20, Steps:13 Reward: -13.00
|
||||
2022-10-30 01:41:51 - r - INFO: - Episode: 20/20, Steps:13 Reward: -13.00
|
||||
2022-10-30 01:41:51 - r - INFO: - Finish testing!
|
||||
Binary file not shown.
Binary file not shown.
|
After Width: | Height: | Size: 24 KiB |
@@ -0,0 +1,21 @@
|
||||
episodes,rewards,steps
|
||||
0,-13,13
|
||||
1,-13,13
|
||||
2,-13,13
|
||||
3,-13,13
|
||||
4,-13,13
|
||||
5,-13,13
|
||||
6,-13,13
|
||||
7,-13,13
|
||||
8,-13,13
|
||||
9,-13,13
|
||||
10,-13,13
|
||||
11,-13,13
|
||||
12,-13,13
|
||||
13,-13,13
|
||||
14,-13,13
|
||||
15,-13,13
|
||||
16,-13,13
|
||||
17,-13,13
|
||||
18,-13,13
|
||||
19,-13,13
|
||||
|
Reference in New Issue
Block a user