
Commit

fixes for cleanliness
tpbarron committed Jun 18, 2017
1 parent 4facbbc commit ca62ad4
Showing 4 changed files with 8 additions and 2 deletions.
2 changes: 2 additions & 0 deletions README.md
```diff
@@ -1,5 +1,7 @@
 # pytorch-a3c
 
+xvfb-run -s "-screen 0 1400x900x24" python main.py
+
 This is a PyTorch implementation of Asynchronous Advantage Actor Critic (A3C) from ["Asynchronous Methods for Deep Reinforcement Learning"](https://arxiv.org/pdf/1602.01783v1.pdf).
 
 This implementation is inspired by [Universe Starter Agent](https://github.com/openai/universe-starter-agent).
```
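The xvfb-run line added to the README exists because CarRacing's `env.render()` needs an X display, which headless servers lack; Xvfb provides a virtual one. A sketch of what the flags mean, assuming Xvfb is installed (package names vary by distribution):

```shell
# -s passes server arguments through to Xvfb:
#   "-screen 0 1400x900x24" = screen number 0, 1400x900 pixels, 24-bit color.
# xvfb-run sets DISPLAY to the virtual screen before launching the command.
xvfb-run -s "-screen 0 1400x900x24" python main.py
```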
4 changes: 4 additions & 0 deletions main.py
```diff
@@ -45,6 +45,10 @@
 env = create_car_racing_env()
 model = ActorCritic(env.observation_space.shape[0], env.action_space)
 
+itr = 0
 while True:
+    if itr % 10 == 0:
+        print ("Itr: ", itr)
     train(args, model, env)
     test(args, model, env)
+    itr += 1
```
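The main.py change adds a modulo-gated progress print around the train/test loop. A minimal self-contained sketch of the same pattern; `run`, `num_iters`, and `log_every` are hypothetical stand-ins for the commit's unbounded loop:

```python
def run(num_iters=25, log_every=10):
    # Mirror the commit's loop: count iterations and emit a progress line
    # only every `log_every` passes, so long runs don't flood stdout.
    logged = []
    for itr in range(num_iters):
        if itr % log_every == 0:
            logged.append("Itr: %d" % itr)  # the commit uses print(...)
        # train(args, model, env) and test(args, model, env) would run here
    return logged

print(run())  # logs at iterations 0, 10, 20
```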
2 changes: 1 addition & 1 deletion test.py
```diff
@@ -35,7 +35,7 @@ def test(args, model, env):
     actions = deque(maxlen=100)
     episode_length = 0
     while True:
-        env.render()
+        #env.render()
         episode_length += 1
         # Sync with the shared model
         if done:
```
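The commit silences `env.render()` in test.py by commenting it out. An alternative sketch, not what this commit does: guard rendering on the `DISPLAY` variable so the same script runs locally and headlessly. `maybe_render` and `DummyEnv` are hypothetical helpers for illustration:

```python
import os

def maybe_render(env):
    # Render only when an X display is available; report whether we did.
    if os.environ.get("DISPLAY"):
        env.render()
        return True
    return False

class DummyEnv:
    # Stand-in for a gym environment, recording whether render() was called.
    def __init__(self):
        self.rendered = False
    def render(self):
        self.rendered = True

maybe_render(DummyEnv())  # renders only if DISPLAY is set
```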
2 changes: 1 addition & 1 deletion train.py
```diff
@@ -33,7 +33,7 @@ def train(args, model, env, optimizer=None):
     episode_length = 0
     u = 0
     while u < args.num_updates:
-        print ("update: ", u)
+        #print ("update: ", u)
         episode_length += 1
         # Sync with the shared model
         # model.load_state_dict(shared_model.state_dict())
```
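train.py's per-update print is likewise commented out. A sketch of a common alternative, not used in this commit: route the message through the standard `logging` module so it can be silenced by level instead of by editing code; `train_updates` is a hypothetical stand-in for the training loop:

```python
import logging

logging.basicConfig(level=logging.INFO)
log = logging.getLogger("train")

def train_updates(num_updates):
    # The per-update message stays in the code but is suppressed unless the
    # logger level is lowered to DEBUG (e.g. log.setLevel(logging.DEBUG)).
    for u in range(num_updates):
        log.debug("update: %d", u)
    return num_updates

train_updates(3)  # silent at INFO level
```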
