1
0
mirror of https://github.com/gryf/coach.git synced 2025-12-17 19:20:19 +01:00

imitation related bug fixes

This commit is contained in:
itaicaspi-intel
2018-09-12 14:54:33 +03:00
parent a9bd1047c4
commit 171fe97a3a
7 changed files with 21 additions and 22 deletions

View File

@@ -340,9 +340,11 @@ class GraphManager(object):
 break
 # add the diff between the total steps before and after stepping, such that environment initialization steps
-# (like in Atari) will not be counted
+# (like in Atari) will not be counted.
+# We add at least one step so that even if no steps were made (in case no actions are taken in the training
+# phase), the loop will end eventually.
 self.total_steps_counters[self.phase][EnvironmentSteps] += \
-self.environments[0].total_steps_counter - current_steps
+max(1, self.environments[0].total_steps_counter - current_steps)
 if result.game_over:
 hold_until_a_full_episode = False