mirror of
https://github.com/gryf/coach.git
synced 2025-12-18 03:30:19 +01:00
Distiller's AMC induced changes (#359)
* Override episode rewards with the last transition reward * Add an EWMA normalization filter * Allow control over when the pre_network filter runs
This commit is contained in:
@@ -213,6 +213,14 @@ class AlgorithmParameters(Parameters):
|
||||
# Support for parameter noise
|
||||
self.supports_parameter_noise = False
|
||||
|
||||
# Retroactively override all the episode rewards with the last reward in the episode
|
||||
# (sometimes useful for problems with sparse, end-of-episode rewards)
|
||||
self.override_episode_rewards_with_the_last_transition_reward = False
|
||||
|
||||
# Filters - TODO: consider creating a FilterParameters class and initializing the filters with it
|
||||
self.update_pre_network_filters_state_on_train = False
|
||||
self.update_pre_network_filters_state_on_inference = True
|
||||
|
||||
|
||||
class PresetValidationParameters(Parameters):
|
||||
def __init__(self,
|
||||
|
||||
Reference in New Issue
Block a user