Skip to content

Commit 66e03ba

Browse files
committed
update readme and cleanup
1 parent 5dcb244 commit 66e03ba

File tree

4 files changed

+7
-7
lines changed

4 files changed

+7
-7
lines changed

README.md

+6
Original file line numberDiff line numberDiff line change
@@ -22,6 +22,12 @@ Install most recent nightly build (version '0.1.10+2fd4d08' or later) of PyTorch
2222
pip install git+https://github.com/pytorch/pytorch
2323
`
2424

25+
## Dependencies
26+
* pytorch
27+
* torchvision
28+
* universe (for now)
29+
* [tensorboard logger](https://github.com/TeamHG-Memex/tensorboard_logger)
30+
2531
## Results
2632

2733
With 16 processes it converges for PongDeterministic-v3 in 15 minutes.

main.py

+1-1
Original file line numberDiff line numberDiff line change
@@ -65,8 +65,8 @@ def setup_loggings(args):
6565
if __name__ == '__main__':
6666
args = parser.parse_args()
6767
setup_loggings(args)
68-
6968
torch.manual_seed(args.seed)
69+
7070
env = create_atari_env(args.env_name)
7171
shared_model = ActorCritic(
7272
env.observation_space.shape[0], env.action_space)

model.py

-4
Original file line numberDiff line numberDiff line change
@@ -44,12 +44,8 @@ def __init__(self, num_inputs, action_space):
4444
self.lstm = nn.LSTMCell(32 * 3 * 3, 256)
4545

4646
num_outputs = action_space.n
47-
4847
self.critic_linear = nn.Linear(256, 1)
4948
self.actor_linear = nn.Linear(256, num_outputs)
50-
#self.critic_linear = nn.Linear(288, 1)
51-
#self.actor_linear = nn.Linear(288, num_outputs)
52-
5349
self.apply(weights_init)
5450
self.actor_linear.weight.data = normalized_columns_initializer(
5551
self.actor_linear.weight.data, 0.01)

train.py

-2
Original file line numberDiff line numberDiff line change
@@ -1,8 +1,6 @@
11
import math
22
import os
33
import sys
4-
import resource
5-
import gc
64

75
import torch
86
import torch.nn.functional as F

0 commit comments

Comments
 (0)