mirror of
https://github.com/gryf/coach.git
synced 2025-12-17 19:20:19 +01:00
adding pickling of running_stats and updating the beta entropy for ClippedPPO
This commit is contained in:
@@ -442,7 +442,7 @@ class ClippedPPO(AgentParameters):
|
||||
batch_size = 64
|
||||
use_separate_networks_per_head = True
|
||||
step_until_collecting_full_episodes = True
|
||||
- beta_entropy = 0.01
|
||||
+ beta_entropy = 0.001
|
||||
|
||||
class DFP(AgentParameters):
|
||||
type = 'DFPAgent'
|
||||
|
||||
Reference in New Issue
Block a user