mirror of
https://github.com/gryf/coach.git
synced 2026-05-06 08:03:00 +02:00
N-step returns for rainbow (#67)
* n_step returns for rainbow
* Rename CartPole_PPO -> CartPole_ClippedPPO
This commit is contained in:
@@ -139,7 +139,7 @@ class EpisodicHindsightExperienceReplay(EpisodicExperienceReplay):
|
||||
hindsight_transition.reward, hindsight_transition.game_over = \
|
||||
self.goals_space.get_reward_for_goal_and_state(goal, hindsight_transition.next_state)
|
||||
|
||||
hindsight_transition.total_return = None
|
||||
hindsight_transition.n_step_discounted_rewards = None
|
||||
episode.insert(hindsight_transition)
|
||||
|
||||
super().store_episode(episode)
|
||||
|
||||
Reference in New Issue
Block a user