1
0
mirror of https://github.com/gryf/coach.git synced 2025-12-17 19:20:19 +01:00

integration test changes to reach the train part (#254)

* integration test changes to override heatup to 1000 steps + run each preset for 30 sec (to make sure we reach the train part)

* fixes to failing presets uncovered with this change + changes in the golden testing to properly test BatchRL

* fix for rainbow dqn

* fix to gym_environment (due to a change in Gym 0.12.1) + fix for rainbow DQN + a bug fix in utils.squeeze_list

* fix for NEC agent
This commit is contained in:
Gal Leibovich
2019-03-27 21:14:19 +02:00
committed by GitHub
parent 6e08c55ad5
commit 310d31c227
8 changed files with 28 additions and 17 deletions

View File

@@ -85,7 +85,7 @@ class CategoricalDQNAgent(ValueOptimizationAgent):
     def get_all_q_values_for_states(self, states: StateType):
         if self.exploration_policy.requires_action_values():
             q_values = self.get_prediction(states,
-                                           outputs=self.networks['main'].online_network.output_heads[0].q_values)
+                                           outputs=[self.networks['main'].online_network.output_heads[0].q_values])
         else:
             q_values = None
         return q_values