From 3fd433ffabdaf18581ec16a3d9fae5985b740872 Mon Sep 17 00:00:00 2001 From: Itai Caspi <30383381+itaicaspi-intel@users.noreply.github.com> Date: Fri, 9 Nov 2018 18:17:04 +0200 Subject: [PATCH] fix ddpg head (#78) --- .../tensorflow_components/heads/ddpg_actor_head.py | 9 ++++++--- 1 file changed, 6 insertions(+), 3 deletions(-) diff --git a/rl_coach/architectures/tensorflow_components/heads/ddpg_actor_head.py b/rl_coach/architectures/tensorflow_components/heads/ddpg_actor_head.py index 6b3112a..45545b4 100644 --- a/rl_coach/architectures/tensorflow_components/heads/ddpg_actor_head.py +++ b/rl_coach/architectures/tensorflow_components/heads/ddpg_actor_head.py @@ -46,9 +46,12 @@ class DDPGActor(Head): def _build_module(self, input_layer): # mean pre_activation_policy_values_mean = self.dense_layer(self.num_actions)(input_layer, name='fc_mean') - policy_values_mean = batchnorm_activation_dropout(pre_activation_policy_values_mean, self.batchnorm, - self.activation_function, - False, 0, is_training=False, name="BatchnormActivationDropout_0")[-1] + policy_values_mean = batchnorm_activation_dropout(input_layer=pre_activation_policy_values_mean, + batchnorm=self.batchnorm, + activation_function=self.activation_function, + dropout_rate=0, + is_training=False, + name="BatchnormActivationDropout_0")[-1] self.policy_mean = tf.multiply(policy_values_mean, self.output_scale, name='output_mean') if self.is_local: