timurgepard
/

symphony

Model card Files Files and versions

timurgepard committed 3 days ago

Commit

cffa147

·

verified ·

1 Parent(s): 6820093

Update symphony_S2/train.py

Files changed (1) hide show

symphony_S2/train.py +3 -3

symphony_S2/train.py CHANGED Viewed

@@ -193,9 +193,9 @@ def sim_loop(env, episodes, testing, Q_learning, algo, total_rewards, total_step
                 save(algo, total_rewards, total_steps)
                 print("start testing")
                 log_file.write(str(total_steps) + ",")
-                Return = sim_loop(env_test, 25, True, Q_learning, algo, [], total_steps=0)
                 print("end of testing")
-                log_file.write(str(round(Return, 2)) + "\n")
             # if steps is close to episode limit (e.g. 950) we shut down actions and leave noise to get Terminal Transition:
@@ -230,4 +230,4 @@ Q_learning, total_rewards, total_steps = load(algo, Q_learning)
 if not Q_learning: log_file.clean()
 # Training
-sim_loop(env, num_episodes, False, Q_learning, algo, total_rewards, total_steps)

                 save(algo, total_rewards, total_steps)
                 print("start testing")
                 log_file.write(str(total_steps) + ",")
+                test_return = sim_loop(env_test, 25, True, Q_learning, algo, [], total_steps=0)
                 print("end of testing")
+                log_file.write(str(round(test_return, 2)) + "\n")
             # if steps is close to episode limit (e.g. 950) we shut down actions and leave noise to get Terminal Transition:
 if not Q_learning: log_file.clean()
 # Training
+sim_loop(env, num_episodes, False, Q_learning, algo, total_rewards, total_steps)