From c7c2296c711ec2bfd31d8ab774957560704d71fc Mon Sep 17 00:00:00 2001 From: sp Date: Wed, 3 Jan 2024 19:39:57 +0100 Subject: [PATCH] changed early stopping criterion in tuner --- examples/shields/rl/15_train_eval_tune.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/examples/shields/rl/15_train_eval_tune.py b/examples/shields/rl/15_train_eval_tune.py index ad9d5c1..3bf53e9 100644 --- a/examples/shields/rl/15_train_eval_tune.py +++ b/examples/shields/rl/15_train_eval_tune.py @@ -74,7 +74,7 @@ def ppo(args): ), run_config=air.RunConfig( - stop = {"episode_reward_mean": 94, + stop = {"episode_reward_mean": 1, "timesteps_total": args.steps,}, checkpoint_config=air.CheckpointConfig(checkpoint_at_end=True, num_to_keep=1,