mirror of
https://github.com/gryf/coach.git
synced 2025-12-18 03:30:19 +01:00
Add is_on_policy property to agents (#480)
This commit is contained in:
@@ -141,6 +141,12 @@ class DFPAgent(Agent):
|
||||
self.current_goal = self.ap.algorithm.goal_vector
|
||||
self.target_measurements_scale_factors = None
|
||||
|
||||
@property
|
||||
def is_on_policy(self) -> bool:
|
||||
# This is only approximately correct: the algorithm uses a very small (20k) experience replay (ER) buffer that keeps only the most recently seen samples.
|
||||
# So, it is approximately on-policy (although, to be completely strict, it is off-policy).
|
||||
return True
|
||||
|
||||
def learn_from_batch(self, batch):
|
||||
network_keys = self.ap.network_wrappers['main'].input_embedders_parameters.keys()
|
||||
|
||||
|
||||
Reference in New Issue
Block a user