Add tensor input type for arbitrary dimensional observation (#125)

* Allow arbitrary dimensional observation (non vector or image) * Added creating PlanarMapsObservationSpace to GymEnvironment when number of channels is not 1 or 3
2026-03-05 00:15:50 +01:00 · 2018-11-19 06:41:12 -08:00
parent 7ba1a4393f
commit 67a90ee87e
10 changed files with 194 additions and 24 deletions
--- a/rl_coach/architectures/mxnet_components/embedders/tensor_embedder.py
+++ b/rl_coach/architectures/mxnet_components/embedders/tensor_embedder.py
@@ -0,0 +1,53 @@
+from typing import Union
+from types import ModuleType
+
+import mxnet as mx
+from rl_coach.architectures.embedder_parameters import InputEmbedderParameters
+from rl_coach.architectures.mxnet_components.embedders.embedder import InputEmbedder
+
+nd_sym_type = Union[mx.nd.NDArray, mx.sym.Symbol]
+
+
+class TensorEmbedder(InputEmbedder):
+    def __init__(self, params: InputEmbedderParameters):
+        """
+        A tensor embedder is an input embedder that takes a tensor with arbitrary dimension and produces a vector
+        embedding by passing it through a neural network. An example is video data or 3D image data (i.e. 4D tensors)
+    or other type of data that is more than 1 dimension (i.e. not vector) but is not an image.
+
+        NOTE: There are no pre-defined schemes for tensor embedder. User must define a custom scheme by passing
+        a callable object as InputEmbedderParameters.scheme when defining the respective preset. This callable
+        object must return a Gluon HybridBlock. The hybrid_forward() of this block must accept a single input,
+        normalized observation, and return an embedding vector for each sample in the batch.
+        Keep in mind that the scheme is a list of blocks, which are stacked by optional batchnorm,
+        activation, and dropout in between as specified in InputEmbedderParameters.
+
+        :param params: parameters object containing input_clipping, input_rescaling, batchnorm, activation_function
+            and dropout properties.
+        """
+        super(TensorEmbedder, self).__init__(params)
+        self.input_rescaling = params.input_rescaling['tensor']
+        self.input_offset = params.input_offset['tensor']
+
+    @property
+    def schemes(self) -> dict:
+        """
+        Schemes are the pre-defined network architectures of various depths and complexities that can be used. Are used
+        to create Block when InputEmbedder is initialised.
+
+        Note: Tensor embedder doesn't define any pre-defined scheme. User must provide custom scheme in preset.
+
+        :return: dictionary of schemes, with key of type EmbedderScheme enum and value being list of mxnet.gluon.Block.
+            For tensor embedder, this is an empty dictionary.
+        """
+        return {}
+
+    def hybrid_forward(self, F: ModuleType, x: nd_sym_type, *args, **kwargs) -> nd_sym_type:
+        """
+        Used for forward pass through embedder network.
+
+        :param F: backend api, either `mxnet.nd` or `mxnet.sym` (if block has been hybridized).
+        :param x: image representing environment state, of shape (batch_size, in_channels, height, width).
+        :return: embedding of environment state, of shape (batch_size, channels).
+        """
+        return super(TensorEmbedder, self).hybrid_forward(F, x, *args, **kwargs)