update tsp_distribution

RoyalSkye · Nov 2, 2022 · fdb346e
1 parent 1f4821c
commit fdb346e
Show file tree

Hide file tree

Showing 6 changed files with 196 additions and 118 deletions.
diff --git a/.gitignore b/.gitignore
@@ -13,6 +13,7 @@ __pycache__/
 
 # data & pretrain-model
 backup/
+AM/
 data/
 pretrained/
 

diff --git a/POMO/TSP/TSPTester.py b/POMO/TSP/TSPTester.py
@@ -219,11 +219,11 @@ def _fine_tune_one_batch(self, fine_tune_data):
             prob_list = torch.cat((prob_list, prob[:, :, None]), dim=2)
 
         # Loss
-        aug_reward = reward.reshape(aug_factor, batch_size, self.env.pomo_size).permute(1, 0, 2).view(batch_size, -1)
+        aug_reward = reward.reshape(aug_factor, batch_size, self.env.pomo_size).permute(1, 0, 2).reshape(batch_size, -1)
         # shape: (batch, augmentation * pomo)
         advantage = aug_reward - aug_reward.float().mean(dim=1, keepdims=True)
         # shape: (batch, augmentation * pomo)
-        log_prob = prob_list.log().sum(dim=2).reshape(aug_factor, batch_size, self.env.pomo_size).permute(1, 0, 2).view(batch_size, -1)
+        log_prob = prob_list.log().sum(dim=2).reshape(aug_factor, batch_size, self.env.pomo_size).permute(1, 0, 2).reshape(batch_size, -1)
         # size = (batch, augmentation * pomo)
         loss = -advantage * log_prob  # Minus Sign: To Increase REWARD
         # shape: (batch, augmentation * pomo)
diff --git a/.gitignore b/.gitignore
@@ -13,6 +13,7 @@ __pycache__/
     # data & pretrain-model
     backup/
+    AM/
     data/
     pretrained/
@@ Expand Down @@