mirror of
https://github.com/gryf/coach.git
synced 2025-12-17 19:20:19 +01:00
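New feature: implementation of Quantile Regression DQN (https://arxiv.org/pdf/1710.10044v1.pdf), added as the `QuantileRegressionDQN` class with the new output type `OutputTypes.QuantileRegressionQ`.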
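API change: Distributional DQN renamed to Categorical DQN (`DistributionalDQN` → `CategoricalDQN`, `OutputTypes.DistributionalQ` → `OutputTypes.CategoricalQ`, agent type `'DistributionalDQNAgent'` → `'CategoricalDQNAgent'`).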
This commit is contained in:
@@ -42,7 +42,8 @@ class OutputTypes(object):
|
||||
NAF = 7
|
||||
PPO = 8
|
||||
PPO_V = 9
|
||||
DistributionalQ = 10
|
||||
CategoricalQ = 10
|
||||
QuantileRegressionQ = 11
|
||||
|
||||
|
||||
class MiddlewareTypes(object):
|
||||
@@ -307,14 +308,20 @@ class BootstrappedDQN(DQN):
|
||||
num_output_head_copies = 10
|
||||
|
||||
|
||||
class DistributionalDQN(DQN):
|
||||
type = 'DistributionalDQNAgent'
|
||||
output_types = [OutputTypes.DistributionalQ]
|
||||
class CategoricalDQN(DQN):
|
||||
type = 'CategoricalDQNAgent'
|
||||
output_types = [OutputTypes.CategoricalQ]
|
||||
v_min = -10.0
|
||||
v_max = 10.0
|
||||
atoms = 51
|
||||
|
||||
|
||||
class QuantileRegressionDQN(DQN):
|
||||
type = 'QuantileRegressionDQNAgent'
|
||||
output_types = [OutputTypes.QuantileRegressionQ]
|
||||
atoms = 51
|
||||
|
||||
|
||||
class NEC(AgentParameters):
|
||||
type = 'NECAgent'
|
||||
optimizer_type = 'RMSProp'
|
||||
|
||||
Reference in New Issue
Block a user