We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
2 parents d5847e8 + c2da672 commit 346e64b Copy full SHA for 346e64b
agents/actor_critic_agents/SAC_Discrete.py
@@ -52,7 +52,7 @@ def produce_action_and_action_info(self, state):
52
"""Given the state, produces an action, the probability of the action, the log probability of the action, and
53
the argmax action"""
54
action_probabilities = self.actor_local(state)
55
- max_probability_action = torch.argmax(action_probabilities, dim=1)
+ max_probability_action = torch.argmax(action_probabilities, dim=-1)
56
action_distribution = create_actor_distribution(self.action_types, action_probabilities, self.action_size)
57
action = action_distribution.sample().cpu()
58
# Have to deal with situation of 0.0 probabilities because we can't do log 0
0 commit comments