diff --git a/main.py b/main.py index e1bb8b1a285bf6823914fd9fcfe00a4f64c6e588..bff7053b0503cf97a53d91b7263ff9ad1593d1f8 100644 --- a/main.py +++ b/main.py @@ -163,7 +163,7 @@ def run_single_exploration(args, env, agent:CSCCQLSAC, buffer:ReplayBuffer, stat # During training, add experiences to buffer if train: buffer.add( - state, action, reward, cost, next_state, not terminated + state, action, reward, cost, next_state, terminated ) # End episode if the cost exceeded the limit