1
0
mirror of https://github.com/gryf/coach.git synced 2025-12-17 19:20:19 +01:00

New feature: implementation of Quantile Regression DQN, following "Distributional Reinforcement Learning with Quantile Regression" (https://arxiv.org/pdf/1710.10044v1.pdf).

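API change: Distributional DQN is renamed to Categorical DQN. The `DistributionalDQN` parameters class becomes `CategoricalDQN`, its agent type string changes from 'DistributionalDQNAgent' to 'CategoricalDQNAgent', and `OutputTypes.DistributionalQ` becomes `OutputTypes.CategoricalQ` (the value stays 10).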
This commit is contained in:
Itai Caspi
2017-11-01 15:09:07 +02:00
parent 1ad6262307
commit a8bce9828c
10 changed files with 157 additions and 17 deletions

View File

@@ -42,7 +42,8 @@ class OutputTypes(object):
NAF = 7
PPO = 8
PPO_V = 9
DistributionalQ = 10
CategoricalQ = 10
QuantileRegressionQ = 11
class MiddlewareTypes(object):
@@ -307,14 +308,20 @@ class BootstrappedDQN(DQN):
num_output_head_copies = 10
class DistributionalDQN(DQN):
type = 'DistributionalDQNAgent'
output_types = [OutputTypes.DistributionalQ]
class CategoricalDQN(DQN):
type = 'CategoricalDQNAgent'
output_types = [OutputTypes.CategoricalQ]
v_min = -10.0
v_max = 10.0
atoms = 51
class QuantileRegressionDQN(DQN):
type = 'QuantileRegressionDQNAgent'
output_types = [OutputTypes.QuantileRegressionQ]
atoms = 51
class NEC(AgentParameters):
type = 'NECAgent'
optimizer_type = 'RMSProp'