Distiller's AMC induced changes (#359)

* override episode rewards with the last transition reward
* EWMA normalization filter
* allow control over when the pre_network filter runs
2026-02-15 05:25:55 +01:00 · 2019-08-05 10:24:58 +03:00
parent 7df67dafa3
commit c1d1fae342
10 changed files with 137 additions and 30 deletions
--- a/rl_coach/base_parameters.py
+++ b/rl_coach/base_parameters.py
@@ -213,6 +213,14 @@ class AlgorithmParameters(Parameters):
        # Support for parameter noise
        self.supports_parameter_noise = False

+        # Retroactively override all of the episode's rewards with the last reward in the episode
+        # (sometimes useful for problems with sparse, end-of-episode rewards)
+        self.override_episode_rewards_with_the_last_transition_reward = False
+
+        # Filters - TODO: consider creating a FilterParameters class and initializing the filters with it
+        self.update_pre_network_filters_state_on_train = False
+        self.update_pre_network_filters_state_on_inference = True
+        

 class PresetValidationParameters(Parameters):
    def __init__(self,