Update ml-agents/mlagents/trainers/torch/distributions.py

cmard · maryamhonari · web-flow · commit 98da4b1717f5 · 2021-11-03T14:09:45.000-04:00
Co-authored-by: Maryam Honari <honari.m94@gmail.com>
diff --git a/ml-agents/mlagents/trainers/torch/distributions.py b/ml-agents/mlagents/trainers/torch/distributions.py
@@ -124,7 +124,7 @@ def sample(self):
         return torch.multinomial(self.probs, 1)
 
     def deterministic_sample(self):
-        return torch.argmax(self.probs).reshape((1, 1))
+        return torch.argmax(self.probs, dim=1, keepdim=True)
 
     def pdf(self, value):
         # This function is equivalent to torch.diag(self.probs.T[value.flatten().long()]),