1
0
mirror of https://github.com/gryf/coach.git synced 2026-04-02 10:03:33 +02:00

bug fixes for OPE (#311)

This commit is contained in:
Gal Leibovich
2019-05-21 16:39:11 +03:00
committed by GitHub
parent 85d70dd7d5
commit acceb03ac0
8 changed files with 38 additions and 21 deletions

View File

@@ -155,7 +155,7 @@ class DDQNBCQAgent(DQNAgent):
reward_model_loss = 0
imitation_model_loss = 0
total_transitions_processed = 0
-for i, batch in enumerate(self.call_memory('get_shuffled_data_generator', batch_size)):
+for i, batch in enumerate(self.call_memory('get_shuffled_training_data_generator', batch_size)):
batch = Batch(batch)
# reward model