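Changed logs: convert logged Q-values to plain lists (so json.dumps can write them) and simplify Logger.dump()/reset()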

Jason-CKY · Jason-CKY · commit 39ab731ad3a3 · 2020-10-25T14:19:24.000+08:00
diff --git a/Algorithms/ddpg/ddpg.py b/Algorithms/ddpg/ddpg.py
@@ -151,7 +151,7 @@ def update(self, experiences):
         
         # MSE loss
         loss_q = ((Q_values-Qprime)**2).mean()
-        loss_info = dict(Qvals=Q_values.detach().cpu().numpy())
+        loss_info = dict(Qvals=Q_values.detach().cpu().numpy().tolist())
 
         loss_q.backward()
         self.q_optimizer.step()
diff --git a/Algorithms/td3/td3.py b/Algorithms/td3/td3.py
@@ -171,8 +171,8 @@ def update(self, experiences, update_policy=False):
         
         # MSE loss
         loss_q = ((q1-Qprime)**2).mean() + ((q2-Qprime)**2).mean()
-        loss_info = dict(Q1vals=q1.detach().cpu().numpy(),
-                        Q2Vals=q2.detach().cpu().numpy())
+        loss_info = dict(Q1vals=q1.detach().cpu().numpy().tolist(),
+                        Q2Vals=q2.detach().cpu().numpy().tolist())
 
         loss_q.backward()
         self.q_optimizer.step()
diff --git a/Logger/logger.py b/Logger/logger.py
@@ -50,27 +50,18 @@ def dump(self):
         Write all of the diagnostics from the current iteration.
         Writes to the output file.
         """
-        # print(self.logger_dict)
-        # with open(self.output_filepath, 'wb') as f:
-        #     pickle.dump(self.logger_dict, f)
-
-        if self.init:
-            assert len(self.logger_dict) > 0, "no variables stored inside dictionary to dump!"
-            self.logger_list.append(self.logger_dict)
-            self.init = False
-        else:
-            self.logger_list[-1] = self.logger_dict
-
+        assert len(self.logger_dict) > 0, "no variables stored inside dictionary to dump!"
+        
         with open(self.output_filepath, 'w') as f:
-            f.write(json.dumps(self.logger_list, indent=4))
+            f.write(json.dumps(self.logger_list + [self.logger_dict], indent=4))
     
     def reset(self):
         '''
         Reset the log dict for a new experiment. Used for training the same algorithm multiple times
         '''
-        self.logger_dict = {}
         self.logger_list.append(self.logger_dict)
-
+        self.logger_dict = {}
+        
         with open(self.output_filepath, 'w') as f:
             f.write(json.dumps(self.logger_list, indent=4))