xeviknal · ziritrion · Apr 6, 2021 · Apr 6, 2021 · Apr 8, 2021
diff --git a/main.py b/main.py
@@ -11,7 +11,7 @@
 device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
 
 #for concurrent runs and logging
-experiment='ppo-nm'
+experiment='ppo-nm-exp2'
 if __name__ == "__main__":
     hyperparams = {
         'num_epochs': 25000,  # Number of training episodes
@@ -23,12 +23,12 @@
         'c2': 0.01,  # Entropy coeff
         'lr': 1e-3,  # Learning rate
         'gamma': 0.99,  # Discount rate
-        'log_interval': 10,  # controls how often we log progress
+        'log_interval': 5,  # controls how often we log progress
         'stack_frames': 4,
         'device': device,
         'experiment':experiment,
         'params_path': f'./params/policy-params-{experiment}.dl',
-        'action_set_num': 0,
+        'action_set_num': 1,
         'train': True
     }
 

diff --git a/params/policy-params-ppo-nm-exp2.dl b/params/policy-params-ppo-nm-exp2.dl
diff --git a/runs/Apr06_18-50-38_kenya/download.md b/runs/Apr06_18-50-38_kenya/download.md
@@ -0,0 +1 @@
+Download the TensorBoard event file for this run from [this Dropbox URL](https://www.dropbox.com/s/m1g0r1p4tkhea4h/events.out.tfevents.1617727838.kenya.108129.0?dl=0).
Original file line number	Diff line number	Diff line change
		@@ -0,0 +1 @@
		Download the TensorBoard run from [this Dropbox URL](https://www.dropbox.com/s/m1g0r1p4tkhea4h/events.out.tfevents.1617727838.kenya.108129.0?dl=0)