diff --git a/ReinforcementLearning/PolicyGradient/SAC/sac_torch.py b/ReinforcementLearning/PolicyGradient/SAC/sac_torch.py index 5117b57..01e2412 100644 --- a/ReinforcementLearning/PolicyGradient/SAC/sac_torch.py +++ b/ReinforcementLearning/PolicyGradient/SAC/sac_torch.py @@ -8,7 +8,7 @@ class Agent(): def __init__(self, alpha=0.0003, beta=0.0003, input_dims=[8], env=None, gamma=0.99, n_actions=2, max_size=1000000, tau=0.005, - layer1_size=256, layer2_size=256, batch_size=256, reward_scale=2): + batch_size=256, reward_scale=2): self.gamma = gamma self.tau = tau self.memory = ReplayBuffer(max_size, input_dims, n_actions)