mirror of
https://github.com/gryf/coach.git
synced 2025-12-18 03:30:19 +01:00
Add is_on_policy property to agents (#480)
This commit is contained in:
@@ -111,8 +111,11 @@ class ACERAgent(PolicyOptimizationAgent):
|
||||
self.V_Values = self.register_signal('Values')
|
||||
self.kl_divergence = self.register_signal('KL Divergence')
|
||||
|
||||
def _learn_from_batch(self, batch):
|
||||
@property
|
||||
def is_on_policy(self) -> bool:
|
||||
return False
|
||||
|
||||
def _learn_from_batch(self, batch):
|
||||
fetches = [self.networks['main'].online_network.output_heads[1].probability_loss,
|
||||
self.networks['main'].online_network.output_heads[1].bias_correction_loss,
|
||||
self.networks['main'].online_network.output_heads[1].kl_divergence]
|
||||
|
||||
Reference in New Issue
Block a user