mirror of
https://github.com/gryf/coach.git
synced 2025-12-18 03:30:19 +01:00
OPE: Weighted Importance Sampling (#299)
This commit is contained in:
@@ -522,6 +522,7 @@ class Agent(AgentInterface):
|
||||
self.agent_logger.create_signal_value('Inverse Propensity Score', np.nan, overwrite=False)
|
||||
self.agent_logger.create_signal_value('Direct Method Reward', np.nan, overwrite=False)
|
||||
self.agent_logger.create_signal_value('Doubly Robust', np.nan, overwrite=False)
|
||||
self.agent_logger.create_signal_value('Weighted Importance Sampling', np.nan, overwrite=False)
|
||||
self.agent_logger.create_signal_value('Sequential Doubly Robust', np.nan, overwrite=False)
|
||||
|
||||
for signal in self.episode_signals:
|
||||
|
||||
Reference in New Issue
Block a user