There was an error while loading. Please reload this page.
2 parents 2bc4454 + 3dc0077 commit 4dece01Copy full SHA for 4dece01
actor_critic/main.py
@@ -34,17 +34,15 @@
34
class Policy(nn.Module):
    """Two-headed network with a shared hidden layer.

    A single fully connected layer maps a 4-feature input to 128 hidden
    units. Two linear heads read that hidden representation: an action head
    producing 2 scores and a value head producing 1 scalar.

    Attributes:
        saved_actions: List that starts empty; presumably filled by the
            training loop with per-step action records (not visible here).
        rewards: List that starts empty; presumably filled by the training
            loop with per-step rewards (not visible here).
    """

    def __init__(self):
        """Create the shared layer, both heads, and the empty buffers."""
        super(Policy, self).__init__()
        self.affine1 = nn.Linear(4, 128)
        self.action_head = nn.Linear(128, 2)
        self.value_head = nn.Linear(128, 1)

        self.saved_actions = []
        self.rewards = []

    def forward(self, x):
        """Return action probabilities and a state value for ``x``.

        Args:
            x: Tensor whose last dimension has size 4. Any number of leading
                dimensions is accepted.

        Returns:
            A tuple ``(action_probs, state_values)``. ``action_probs`` has a
            last dimension of size 2 that sums to 1; ``state_values`` has a
            last dimension of size 1.
        """
        x = F.relu(self.affine1(x))
        action_scores = self.action_head(x)
        state_values = self.value_head(x)
        # Normalise over the action axis explicitly. Omitting ``dim`` relies
        # on a deprecated implicit choice that picks axis 0 for 3-D input,
        # which would normalise across the batch instead of across actions.
        return F.softmax(action_scores, dim=-1), state_values
0 commit comments