mirror of
https://github.com/gryf/coach.git
synced 2025-12-17 19:20:19 +01:00
Add is_on_policy property to agents (#480)
This commit is contained in:
@@ -92,6 +92,10 @@ class NStepQAgent(ValueOptimizationAgent, PolicyOptimizationAgent):
        self.q_values = self.register_signal('Q Values')
        self.value_loss = self.register_signal('Value Loss')

    @property
    def is_on_policy(self) -> bool:
        return False

    def learn_from_batch(self, batch):
        # batch contains a list of episodes to learn from
        network_keys = self.ap.network_wrappers['main'].input_embedders_parameters.keys()

Reference in New Issue
Block a user