mirror of
https://github.com/gryf/coach.git
synced 2025-12-17 11:10:20 +01:00
fix qr_dqn_agent
This commit is contained in:
@@ -101,9 +101,7 @@ class ActorCriticAgent(PolicyOptimizationAgent):
|
||||
actions = np.expand_dims(actions, -1)
|
||||
|
||||
# train
|
||||
inputs = copy.copy(current_states)
|
||||
inputs['output_1_0'] = actions
|
||||
result = self.main_network.online_network.accumulate_gradients(inputs,
|
||||
result = self.main_network.online_network.accumulate_gradients({**current_states, 'output_1_0': actions},
|
||||
[state_value_head_targets, action_advantages])
|
||||
|
||||
# logging
|
||||
|
||||
Reference in New Issue
Block a user