更新算法模版
This commit is contained in:
@@ -0,0 +1,19 @@
|
||||
general_cfg:
|
||||
algo_name: QLearning
|
||||
device: cpu
|
||||
env_name: Racetrack-v0
|
||||
load_checkpoint: true
|
||||
load_path: Train_Racetrack-v0_QLearning_20221030-014833
|
||||
max_steps: 200
|
||||
mode: test
|
||||
save_fig: true
|
||||
seed: 10
|
||||
show_fig: false
|
||||
test_eps: 20
|
||||
train_eps: 400
|
||||
algo_cfg:
|
||||
epsilon_decay: 300
|
||||
epsilon_end: 0.01
|
||||
epsilon_start: 0.95
|
||||
gamma: 0.9
|
||||
lr: 0.1
|
||||
@@ -0,0 +1,24 @@
|
||||
2022-10-30 01:49:58 - r - INFO: - n_states: 4, n_actions: 9
|
||||
2022-10-30 01:49:58 - r - INFO: - Start testing!
|
||||
2022-10-30 01:49:58 - r - INFO: - Env: Racetrack-v0, Algorithm: QLearning, Device: cpu
|
||||
2022-10-30 01:49:58 - r - INFO: - Episode: 1/20, Steps:14 Reward: -4.00
|
||||
2022-10-30 01:49:58 - r - INFO: - Episode: 2/20, Steps:8 Reward: 2.00
|
||||
2022-10-30 01:49:58 - r - INFO: - Episode: 3/20, Steps:6 Reward: 4.00
|
||||
2022-10-30 01:49:58 - r - INFO: - Episode: 4/20, Steps:22 Reward: -12.00
|
||||
2022-10-30 01:49:58 - r - INFO: - Episode: 5/20, Steps:15 Reward: -15.00
|
||||
2022-10-30 01:49:58 - r - INFO: - Episode: 6/20, Steps:6 Reward: 4.00
|
||||
2022-10-30 01:49:58 - r - INFO: - Episode: 7/20, Steps:5 Reward: 5.00
|
||||
2022-10-30 01:49:58 - r - INFO: - Episode: 8/20, Steps:8 Reward: 2.00
|
||||
2022-10-30 01:49:58 - r - INFO: - Episode: 9/20, Steps:15 Reward: -5.00
|
||||
2022-10-30 01:49:58 - r - INFO: - Episode: 10/20, Steps:8 Reward: 2.00
|
||||
2022-10-30 01:49:58 - r - INFO: - Episode: 11/20, Steps:5 Reward: 5.00
|
||||
2022-10-30 01:49:58 - r - INFO: - Episode: 12/20, Steps:15 Reward: -5.00
|
||||
2022-10-30 01:49:58 - r - INFO: - Episode: 13/20, Steps:6 Reward: 4.00
|
||||
2022-10-30 01:49:58 - r - INFO: - Episode: 14/20, Steps:31 Reward: -51.00
|
||||
2022-10-30 01:49:58 - r - INFO: - Episode: 15/20, Steps:13 Reward: -13.00
|
||||
2022-10-30 01:49:58 - r - INFO: - Episode: 16/20, Steps:7 Reward: 3.00
|
||||
2022-10-30 01:49:58 - r - INFO: - Episode: 17/20, Steps:6 Reward: 4.00
|
||||
2022-10-30 01:49:58 - r - INFO: - Episode: 18/20, Steps:5 Reward: 5.00
|
||||
2022-10-30 01:49:58 - r - INFO: - Episode: 19/20, Steps:17 Reward: -17.00
|
||||
2022-10-30 01:49:58 - r - INFO: - Episode: 20/20, Steps:15 Reward: -5.00
|
||||
2022-10-30 01:49:58 - r - INFO: - Finish testing!
|
||||
Binary file not shown.
Binary file not shown.
|
After Width: | Height: | Size: 41 KiB |
@@ -0,0 +1,21 @@
|
||||
episodes,rewards,steps
|
||||
0,-4,14
|
||||
1,2,8
|
||||
2,4,6
|
||||
3,-12,22
|
||||
4,-15,15
|
||||
5,4,6
|
||||
6,5,5
|
||||
7,2,8
|
||||
8,-5,15
|
||||
9,2,8
|
||||
10,5,5
|
||||
11,-5,15
|
||||
12,4,6
|
||||
13,-51,31
|
||||
14,-13,13
|
||||
15,3,7
|
||||
16,4,6
|
||||
17,5,5
|
||||
18,-17,17
|
||||
19,-5,15
|
||||
|
Reference in New Issue
Block a user