From efc6e67a457f28f74127a5d4311d11be073aa1a6 Mon Sep 17 00:00:00 2001 From: itaicaspi-intel Date: Mon, 19 Mar 2018 17:48:57 +0200 Subject: [PATCH] update evaluation periods --- presets.py | 6 ++++-- 1 file changed, 4 insertions(+), 2 deletions(-) diff --git a/presets.py b/presets.py index a5b2ceb..3f4fb1d 100644 --- a/presets.py +++ b/presets.py @@ -538,8 +538,10 @@ class Humanoid_ClippedPPO(Preset): self.env.level = 'Humanoid-v1' self.learning_rate = 0.0001 self.num_heatup_steps = 0 - self.agent.num_consecutive_training_steps = 1 - self.agent.num_consecutive_playing_steps = 2048 + self.agent.num_consecutive_training_steps = 0 + self.agent.num_consecutive_playing_steps = 200 + self.evaluate_every_x_episodes = 1 + self.evaluation_episodes = 10000 self.agent.discount = 0.99 self.batch_size = 64 self.agent.policy_gradient_rescaler = 'GAE'