Changed early-stopping criterion in tuner: `episode_reward_mean` stop threshold 94 -> 1

2 years ago · c7c2296c71
1 changed file with 1 addition and 1 deletion
--- a/examples/shields/rl/15_train_eval_tune.py
+++ b/examples/shields/rl/15_train_eval_tune.py
@@ -74,7 +74,7 @@ def ppo(args):

                       ),
                        run_config=air.RunConfig(
-                                stop = {"episode_reward_mean": 94,
+                                stop = {"episode_reward_mean": 1,
                                        "timesteps_total": args.steps,},
                                checkpoint_config=air.CheckpointConfig(checkpoint_at_end=True,
                                                                       num_to_keep=1,