diff --git a/ReinforcementLearning/PolicyGradient/actor_critic/tensorflow2/actor_critic.py b/ReinforcementLearning/PolicyGradient/actor_critic/tensorflow2/actor_critic.py index 4e90340..5048964 100644 --- a/ReinforcementLearning/PolicyGradient/actor_critic/tensorflow2/actor_critic.py +++ b/ReinforcementLearning/PolicyGradient/actor_critic/tensorflow2/actor_critic.py @@ -21,7 +21,6 @@ def choose_action(self, observation): action_probabilities = tfp.distributions.Categorical(probs=probs) action = action_probabilities.sample() - log_prob = action_probabilities.log_prob(action) self.action = action return action.numpy()[0]