mirror of
https://github.com/gryf/coach.git
synced 2025-12-17 19:20:19 +01:00
benchmark update (#250)
This commit is contained in:
Binary file not shown.
|
Before Width: | Height: | Size: 66 KiB After Width: | Height: | Size: 65 KiB |
Binary file not shown.
|
Before Width: | Height: | Size: 65 KiB After Width: | Height: | Size: 60 KiB |
@@ -68,7 +68,7 @@ class ACERAlgorithmParameters(AlgorithmParameters):
|
|||||||
self.num_steps_between_gradient_updates = 5000
|
self.num_steps_between_gradient_updates = 5000
|
||||||
self.ratio_of_replay = 4
|
self.ratio_of_replay = 4
|
||||||
self.num_transitions_to_start_replay = 10000
|
self.num_transitions_to_start_replay = 10000
|
||||||
self.rate_for_copying_weights_to_target = 0.99
|
self.rate_for_copying_weights_to_target = 0.01
|
||||||
self.importance_weight_truncation = 10.0
|
self.importance_weight_truncation = 10.0
|
||||||
self.use_trust_region_optimization = True
|
self.use_trust_region_optimization = True
|
||||||
self.max_KL_divergence = 1.0
|
self.max_KL_divergence = 1.0
|
||||||
|
|||||||
@@ -11,7 +11,7 @@ from rl_coach.memories.memory import MemoryGranularity
|
|||||||
# Graph Scheduling #
|
# Graph Scheduling #
|
||||||
####################
|
####################
|
||||||
schedule_params = ScheduleParameters()
|
schedule_params = ScheduleParameters()
|
||||||
schedule_params.improve_steps = TrainingSteps(10000000000)
|
schedule_params.improve_steps = TrainingSteps(10000000)
|
||||||
schedule_params.steps_between_evaluation_periods = EnvironmentEpisodes(100)
|
schedule_params.steps_between_evaluation_periods = EnvironmentEpisodes(100)
|
||||||
schedule_params.evaluation_steps = EnvironmentEpisodes(3)
|
schedule_params.evaluation_steps = EnvironmentEpisodes(3)
|
||||||
schedule_params.heatup_steps = EnvironmentSteps(0)
|
schedule_params.heatup_steps = EnvironmentSteps(0)
|
||||||
|
|||||||
Reference in New Issue
Block a user