fix n_step_q_agent

2026-02-11 11:15:49 +01:00 · 2018-02-16 20:25:33 -05:00
parent 5cf10e5f52
commit e1ad86417f
3 changed files with 20 additions and 19 deletions
--- a/utils.py
+++ b/utils.py
@@ -351,3 +351,14 @@ def stack_observation(curr_stack, observation, stack_size):
        curr_stack = np.delete(curr_stack, 0, -1)

    return curr_stack
+
+
+def last_sample(state):
+    """
+    Given a batch of states (a mapping of key -> batched array), return only
+    the last sample of each entry, keeping a leading batch axis of length 1.
+    """
+    return {
+        k: np.expand_dims(v[-1], 0)
+        for k, v in state.items()
+    }