RL in Large Discrete Action Spaces - Wolpertinger Agent (#394)

* Currently this is specific to the case of discretizing a continuous action space. Can easily be adapted to other case by feeding the kNN otherwise, and removing the usage of a discretizing output action filter
2026-02-25 11:45:46 +01:00 · 2019-09-08 12:53:49 +03:00
parent fc50398544
commit 138ced23ba
46 changed files with 1193 additions and 51 deletions
--- a/rl_coach/filters/action/partial_discrete_action_space_map.py
+++ b/rl_coach/filters/action/partial_discrete_action_space_map.py
@@ -48,7 +48,8 @@ class PartialDiscreteActionSpaceMap(ActionFilter):

    def get_unfiltered_action_space(self, output_action_space: ActionSpace) -> DiscreteActionSpace:
        self.output_action_space = output_action_space
-        self.input_action_space = DiscreteActionSpace(len(self.target_actions), self.descriptions)
+        self.input_action_space = DiscreteActionSpace(len(self.target_actions), self.descriptions,
+                                                      filtered_action_space=output_action_space)
        return self.input_action_space

    def filter(self, action: ActionType) -> ActionType: