imitation related bug fixes

2026-02-15 05:25:55 +01:00 · 2018-09-12 14:54:33 +03:00
parent a9bd1047c4
commit 171fe97a3a
7 changed files with 21 additions and 22 deletions
--- a/rl_coach/graph_managers/graph_manager.py
+++ b/rl_coach/graph_managers/graph_manager.py
@@ -340,9 +340,11 @@ class GraphManager(object):
                break

            # add the diff between the total steps before and after stepping, such that environment initialization steps
-            # (like in Atari) will not be counted
+            # (like in Atari) will not be counted.
+            # We add at least one step so that even if no steps were made (in case no actions are taken in the training
+            # phase), the loop will end eventually.
            self.total_steps_counters[self.phase][EnvironmentSteps] += \
-                self.environments[0].total_steps_counter - current_steps
+                max(1, self.environments[0].total_steps_counter - current_steps)

            if result.game_over:
                hold_until_a_full_episode = False