mirror of
https://github.com/gryf/coach.git
synced 2025-12-17 19:20:19 +01:00
Adding target reward and target success (#58)
* Adding target reward * Adding target success * Addressing comments * Using custom_reward_threshold and target_success_rate * Adding exit message * Moving success rate to environment * Making target_success_rate optional
This commit is contained in:
committed by
Balaji Subramaniam
parent
0fe583186e
commit
875d6ef017
@@ -40,8 +40,9 @@ def training_worker(graph_manager, checkpoint_dir):
|
||||
graph_manager.phase = core_types.RunPhase.UNDEFINED
|
||||
|
||||
if steps * graph_manager.agent_params.algorithm.num_consecutive_playing_steps.num_steps > graph_manager.steps_between_evaluation_periods.num_steps * eval_offset:
|
||||
graph_manager.evaluate(graph_manager.evaluation_steps)
|
||||
eval_offset += 1
|
||||
if graph_manager.evaluate(graph_manager.evaluation_steps):
|
||||
break
|
||||
|
||||
if graph_manager.agent_params.algorithm.distributed_coach_synchronization_type == DistributedCoachSynchronizationType.SYNC:
|
||||
graph_manager.save_checkpoint()
|
||||
|
||||
Reference in New Issue
Block a user