mirror of
https://github.com/gryf/coach.git
synced 2025-12-17 19:20:19 +01:00
Bug fix: correct the exploration control parameter that is logged during evaluation
This commit is contained in:
@@ -67,4 +67,4 @@ class EGreedy(ExplorationPolicy):
         return np.squeeze(action_values + (np.random.rand() < epsilon) * noise)
 
     def get_control_param(self):
-        return self.epsilon
+        return self.evaluation_epsilon if self.phase == RunPhase.TEST else self.epsilon
Reference in New Issue
Block a user