1
0
mirror of https://github.com/gryf/coach.git synced 2025-12-17 19:20:19 +01:00

Parallel agents fixes (#95)

* Bug fixes related to parallel agents: checkpoint restore and TensorBoard integration.
Added support for narrow networks.
Added reference code for an unlimited number of checkpoints.
This commit is contained in:
Itai Caspi
2018-05-24 14:24:19 +03:00
committed by GitHub
parent 6c0b59b4de
commit d302168c8c
10 changed files with 75 additions and 41 deletions

View File

@@ -32,11 +32,6 @@ class InputTypes(object):
TimedObservation = 5
class EmbedderComplexity(object):
    """Integer constants naming the available embedder complexity levels.

    Used as a plain namespace: members are class attributes compared by
    value (``EmbedderComplexity.Shallow == 1``).
    """
    # NOTE(review): this listing also contains an ``EmbedderDepth`` class with
    # the same members; this one looks like the pre-rename version - confirm
    # which of the two callers should use.
    Shallow = 1
    Deep = 2
class OutputTypes(object):
Q = 1
DuelingQ = 2
@@ -51,6 +46,17 @@ class OutputTypes(object):
QuantileRegressionQ = 11
class EmbedderDepth(object):
    """Integer constants naming the available embedder depth options.

    Used as a plain namespace: members are class attributes compared by
    value (``EmbedderDepth.Shallow == 1``).
    """
    # Presumably selects fewer vs. more embedder layers - verify against the
    # embedder implementation, which is not visible here.
    Shallow = 1
    Deep = 2
class EmbedderWidth(object):
    """Integer constants naming the available embedder width options.

    Used as a plain namespace: members are class attributes compared by
    value (``EmbedderWidth.Narrow == 1``).
    """
    # Presumably selects smaller vs. larger layer sizes in the embedder -
    # verify against the embedder implementation, which is not visible here.
    Narrow = 1
    Wide = 2
class MiddlewareTypes(object):
LSTM = 1
FC = 2
@@ -82,7 +88,8 @@ class AgentParameters(Parameters):
middleware_type = MiddlewareTypes.FC
loss_weights = [1.0]
stop_gradients_from_head = [False]
embedder_complexity = EmbedderComplexity.Shallow
embedder_depth = EmbedderDepth.Shallow
embedder_width = EmbedderWidth.Wide
num_output_head_copies = 1
use_measurements = False
use_accumulated_reward_as_measurement = False