update Q-learning
This commit is contained in:
@@ -5,7 +5,7 @@ Author: John
|
|||||||
Email: johnjim0816@gmail.com
|
Email: johnjim0816@gmail.com
|
||||||
Date: 2020-09-11 23:03:00
|
Date: 2020-09-11 23:03:00
|
||||||
LastEditor: John
|
LastEditor: John
|
||||||
LastEditTime: 2020-11-24 19:56:23
|
LastEditTime: 2021-01-05 09:41:34
|
||||||
Discription:
|
Discription:
|
||||||
Environment:
|
Environment:
|
||||||
'''
|
'''
|
||||||
@@ -92,7 +92,7 @@ def train(cfg):
|
|||||||
plot(rewards)
|
plot(rewards)
|
||||||
plot(MA_rewards,ylabel='moving_average_rewards_train')
|
plot(MA_rewards,ylabel='moving_average_rewards_train')
|
||||||
|
|
||||||
def test(cfg):
|
def eval(cfg, saved_model_path = SAVED_MODEL_PATH):
|
||||||
|
|
||||||
env = gym.make("CliffWalking-v0") # 0 up, 1 right, 2 down, 3 left
|
env = gym.make("CliffWalking-v0") # 0 up, 1 right, 2 down, 3 left
|
||||||
env = CliffWalkingWapper(env)
|
env = CliffWalkingWapper(env)
|
||||||
@@ -102,7 +102,7 @@ def test(cfg):
|
|||||||
learning_rate=cfg.policy_lr,
|
learning_rate=cfg.policy_lr,
|
||||||
gamma=cfg.gamma,
|
gamma=cfg.gamma,
|
||||||
epsilon_start=cfg.epsilon_start,epsilon_end=cfg.epsilon_end,epsilon_decay=cfg.epsilon_decay)
|
epsilon_start=cfg.epsilon_start,epsilon_end=cfg.epsilon_end,epsilon_decay=cfg.epsilon_decay)
|
||||||
agent.load() # 导入保存的模型
|
agent.load_model(saved_model_path+'checkpoint.npy') # 导入保存的模型
|
||||||
rewards = [] # 记录所有episode的reward
|
rewards = [] # 记录所有episode的reward
|
||||||
MA_rewards = [] # 记录滑动平均的reward
|
MA_rewards = [] # 记录滑动平均的reward
|
||||||
steps = []# 记录所有episode的steps
|
steps = []# 记录所有episode的steps
|
||||||
|
|||||||
Binary file not shown.
BIN
codes/Q-learning/result/20210105-094149/rewards_train.npy
Normal file
BIN
codes/Q-learning/result/20210105-094149/rewards_train.npy
Normal file
Binary file not shown.
Binary file not shown.
|
Before Width: | Height: | Size: 32 KiB After Width: | Height: | Size: 24 KiB |
Binary file not shown.
|
Before Width: | Height: | Size: 31 KiB After Width: | Height: | Size: 16 KiB |
BIN
codes/Q-learning/saved_model/20210105-094149/checkpoint.npy
Normal file
BIN
codes/Q-learning/saved_model/20210105-094149/checkpoint.npy
Normal file
Binary file not shown.
BIN
codes/Q-learning/saved_model/checkpoint.npy
Normal file
BIN
codes/Q-learning/saved_model/checkpoint.npy
Normal file
Binary file not shown.
@@ -5,7 +5,7 @@
|
|||||||
@Email: johnjim0816@gmail.com
|
@Email: johnjim0816@gmail.com
|
||||||
@Date: 2020-06-12 00:48:57
|
@Date: 2020-06-12 00:48:57
|
||||||
@LastEditor: John
|
@LastEditor: John
|
||||||
LastEditTime: 2020-11-23 11:58:17
|
LastEditTime: 2021-01-05 09:41:02
|
||||||
@Discription:
|
@Discription:
|
||||||
@Environment: python 3.7.7
|
@Environment: python 3.7.7
|
||||||
'''
|
'''
|
||||||
|
|||||||
Reference in New Issue
Block a user