mirror of
https://github.com/gryf/coach.git
synced 2026-03-06 09:15:50 +01:00
Corrected MXNet's PPO Head for Continuous Action Spaces (#84)
* Changes required for the continuous PPO head with MXNet (used in MountainCarContinuous_ClippedPPO).
* Simplified the changes for continuous PPO.
* Cleaned up to avoid duplicate code, and simplified covariance creation.
This commit is contained in:
committed by
Scott Leishman
parent
fde73ced13
commit
3358e04a6a
@@ -412,7 +412,10 @@ class SingleModel(HybridBlock):
|
||||
# Head
|
||||
outputs = tuple()
|
||||
for head in self._output_heads:
|
||||
outputs += (head(state_embedding),)
|
||||
out = head(state_embedding)
|
||||
if not isinstance(out, tuple):
|
||||
out = (out,)
|
||||
outputs += out
|
||||
|
||||
return outputs
|
||||
|
||||
|
||||
Reference in New Issue
Block a user