1
0
mirror of https://github.com/gryf/coach.git synced 2025-12-17 19:20:19 +01:00

adding pickling of running_stats and updating the beta entropy for ClippedPPO

This commit is contained in:
itaicaspi-intel
2018-03-19 14:37:05 +02:00
parent f7979b05e4
commit 24a0f24279
2 changed files with 10 additions and 3 deletions

View File

@@ -442,7 +442,7 @@ class ClippedPPO(AgentParameters):
     batch_size = 64
     use_separate_networks_per_head = True
     step_until_collecting_full_episodes = True
-    beta_entropy = 0.01
+    beta_entropy = 0.001
 
 class DFP(AgentParameters):
     type = 'DFPAgent'