mirror of
https://github.com/gryf/coach.git
synced 2025-12-19 04:00:18 +01:00
Add tensor input type for arbitrary dimensional observation (#125)
* Allow arbitrary dimensional observation (non vector or image) * Added creating PlanarMapsObservationSpace to GymEnvironment when number of channels is not 1 or 3
This commit is contained in:
committed by
Gal Leibovich
parent
7ba1a4393f
commit
67a90ee87e
@@ -0,0 +1,53 @@
|
||||
from typing import Union
|
||||
from types import ModuleType
|
||||
|
||||
import mxnet as mx
|
||||
from rl_coach.architectures.embedder_parameters import InputEmbedderParameters
|
||||
from rl_coach.architectures.mxnet_components.embedders.embedder import InputEmbedder
|
||||
|
||||
nd_sym_type = Union[mx.nd.NDArray, mx.sym.Symbol]
|
||||
|
||||
|
||||
class TensorEmbedder(InputEmbedder):
|
||||
def __init__(self, params: InputEmbedderParameters):
|
||||
"""
|
||||
A tensor embedder is an input embedder that takes a tensor with arbitrary dimension and produces a vector
|
||||
embedding by passing it through a neural network. An example is video data or 3D image data (i.e. 4D tensors)
|
||||
or other type of data that is more than 1 dimension (i.e. not vector) but is not an image.
|
||||
|
||||
NOTE: There are no pre-defined schemes for tensor embedder. User must define a custom scheme by passing
|
||||
a callable object as InputEmbedderParameters.scheme when defining the respective preset. This callable
|
||||
object must return a Gluon HybridBlock. The hybrid_forward() of this block must accept a single input,
|
||||
normalized observation, and return an embedding vector for each sample in the batch.
|
||||
Keep in mind that the scheme is a list of blocks, which are stacked by optional batchnorm,
|
||||
activation, and dropout in between as specified in InputEmbedderParameters.
|
||||
|
||||
:param params: parameters object containing input_clipping, input_rescaling, batchnorm, activation_function
|
||||
and dropout properties.
|
||||
"""
|
||||
super(TensorEmbedder, self).__init__(params)
|
||||
self.input_rescaling = params.input_rescaling['tensor']
|
||||
self.input_offset = params.input_offset['tensor']
|
||||
|
||||
@property
|
||||
def schemes(self) -> dict:
|
||||
"""
|
||||
Schemes are the pre-defined network architectures of various depths and complexities that can be used. Are used
|
||||
to create Block when InputEmbedder is initialised.
|
||||
|
||||
Note: Tensor embedder doesn't define any pre-defined scheme. User must provide custom scheme in preset.
|
||||
|
||||
:return: dictionary of schemes, with key of type EmbedderScheme enum and value being list of mxnet.gluon.Block.
|
||||
For tensor embedder, this is an empty dictionary.
|
||||
"""
|
||||
return {}
|
||||
|
||||
def hybrid_forward(self, F: ModuleType, x: nd_sym_type, *args, **kwargs) -> nd_sym_type:
|
||||
"""
|
||||
Used for forward pass through embedder network.
|
||||
|
||||
:param F: backend api, either `mxnet.nd` or `mxnet.sym` (if block has been hybridized).
|
||||
:param x: image representing environment state, of shape (batch_size, in_channels, height, width).
|
||||
:return: embedding of environment state, of shape (batch_size, channels).
|
||||
"""
|
||||
return super(TensorEmbedder, self).hybrid_forward(F, x, *args, **kwargs)
|
||||
Reference in New Issue
Block a user