Skip to content

Commit 4dece01

Browse files
authored
Merge pull request #34 from ebetica/fix1
Bigger network converges in 160 steps
2 parents: 2bc4454 + 3dc0077; commit: 4dece01

File tree

1 file changed

+3 -5 lines changed

1 file changed

+3 -5 lines changed

actor_critic/main.py

Lines changed: 3 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -34,17 +34,15 @@
3434
class Policy(nn.Module):
3535
def __init__(self):
3636
super(Policy, self).__init__()
37-
self.affine1 = nn.Linear(4, 16)
38-
self.affine2 = nn.Linear(16, 32)
39-
self.action_head = nn.Linear(32, 2)
40-
self.value_head = nn.Linear(32, 1)
37+
self.affine1 = nn.Linear(4, 128)
38+
self.action_head = nn.Linear(128, 2)
39+
self.value_head = nn.Linear(128, 1)
4140

4241
self.saved_actions = []
4342
self.rewards = []
4443

4544
def forward(self, x):
4645
x = F.relu(self.affine1(x))
47-
x = F.relu(self.affine2(x))
4846
action_scores = self.action_head(x)
4947
state_values = self.value_head(x)
5048
return F.softmax(action_scores), state_values

0 commit comments

Comments (0)