update Q-learning

This commit is contained in:
JohnJim0816
2021-01-05 09:43:28 +08:00
parent e594e3b378
commit 198fc4d17b
8 changed files with 4 additions and 4 deletions

View File

@@ -5,7 +5,7 @@ Author: John
Email: johnjim0816@gmail.com Email: johnjim0816@gmail.com
Date: 2020-09-11 23:03:00 Date: 2020-09-11 23:03:00
LastEditor: John LastEditor: John
LastEditTime: 2020-11-24 19:56:23 LastEditTime: 2021-01-05 09:41:34
Description: Description:
Environment: Environment:
''' '''
@@ -92,7 +92,7 @@ def train(cfg):
plot(rewards) plot(rewards)
plot(MA_rewards,ylabel='moving_average_rewards_train') plot(MA_rewards,ylabel='moving_average_rewards_train')
def test(cfg): def eval(cfg, saved_model_path = SAVED_MODEL_PATH):
env = gym.make("CliffWalking-v0") # 0 up, 1 right, 2 down, 3 left env = gym.make("CliffWalking-v0") # 0 up, 1 right, 2 down, 3 left
env = CliffWalkingWapper(env) env = CliffWalkingWapper(env)
@@ -102,7 +102,7 @@ def test(cfg):
learning_rate=cfg.policy_lr, learning_rate=cfg.policy_lr,
gamma=cfg.gamma, gamma=cfg.gamma,
epsilon_start=cfg.epsilon_start,epsilon_end=cfg.epsilon_end,epsilon_decay=cfg.epsilon_decay) epsilon_start=cfg.epsilon_start,epsilon_end=cfg.epsilon_end,epsilon_decay=cfg.epsilon_decay)
agent.load() # 导入保存的模型 agent.load_model(saved_model_path+'checkpoint.npy') # 导入保存的模型
rewards = [] # 记录所有episode的reward rewards = [] # 记录所有episode的reward
MA_rewards = [] # 记录滑动平均的reward MA_rewards = [] # 记录滑动平均的reward
steps = []# 记录所有episode的steps steps = []# 记录所有episode的steps

Binary file not shown.

Before

Width:  |  Height:  |  Size: 32 KiB

After

Width:  |  Height:  |  Size: 24 KiB

Binary file not shown.

Before

Width:  |  Height:  |  Size: 31 KiB

After

Width:  |  Height:  |  Size: 16 KiB

Binary file not shown.

View File

@@ -5,7 +5,7 @@
@Email: johnjim0816@gmail.com @Email: johnjim0816@gmail.com
@Date: 2020-06-12 00:48:57 @Date: 2020-06-12 00:48:57
@LastEditor: John @LastEditor: John
LastEditTime: 2020-11-23 11:58:17 LastEditTime: 2021-01-05 09:41:02
@Description: @Description:
@Environment: python 3.7.7 @Environment: python 3.7.7
''' '''