update PolicyGradient

This commit is contained in:
JohnJim0816
2020-11-23 12:13:34 +08:00
parent 4f192c7aac
commit 4cc12bf97f
5 changed files with 185 additions and 0 deletions

View File

@@ -0,0 +1,27 @@
#!/usr/bin/env python
# coding=utf-8
'''
Author: John
Email: johnjim0816@gmail.com
Date: 2020-11-22 23:18:46
LastEditor: John
LastEditTime: 2020-11-23 01:58:22
Description: Fully connected network (FCN) with a single sigmoid output.
Environment:
'''
import torch
import torch.nn as nn
import torch.nn.functional as F
class FCN(nn.Module):
    """Fully connected network mapping a state vector to one probability.

    Architecture::

        Linear(n_states, hidden1) -> ReLU
        -> Linear(hidden1, hidden2) -> ReLU
        -> Linear(hidden2, 1) -> Sigmoid

    The layer attributes keep the names ``fc1``/``fc2``/``fc3`` so that
    ``state_dict`` keys stay compatible with previously saved checkpoints.

    Args:
        n_states: Size of the last dimension of the input tensor.
        hidden1: Number of units in the first hidden layer.
        hidden2: Number of units in the second hidden layer.
    """

    def __init__(self, n_states: int, *, hidden1: int = 24, hidden2: int = 36):
        super().__init__()
        # The hidden widths are unit counts (not a number of layers); tune
        # them to the size of the state space of the task at hand.
        self.fc1 = nn.Linear(n_states, hidden1)
        self.fc2 = nn.Linear(hidden1, hidden2)
        # Single output unit; the original author labels it "Prob of Left".
        self.fc3 = nn.Linear(hidden2, 1)

    def forward(self, x: "torch.Tensor") -> "torch.Tensor":
        """Return sigmoid-squashed outputs in ``[0, 1]``.

        Args:
            x: Tensor whose last dimension has size ``n_states``.

        Returns:
            Tensor shaped like ``x`` with the last dimension replaced by 1.
        """
        x = F.relu(self.fc1(x))
        x = F.relu(self.fc2(x))
        # torch.sigmoid replaces F.sigmoid, which is deprecated and warns on
        # the PyTorch 1.x releases.
        return torch.sigmoid(self.fc3(x))