package emote.nn
Functions
def ortho_init_(m, gain) -> None
Classes
class ActionValueMlp(nn.Module):
Methods
def __init__(self, observation_dim, action_dim, hidden_dims) -> None
def forward(self, action, obs) -> Tensor
class GaussianMlpPolicy(nn.Module):
Methods
def __init__(self, observation_dim, action_dim, hidden_dims) -> None
def forward(self, obs, epsilon) -> Tensor | Tuple[Tensor]
class GaussianPolicyHead(nn.Module):
Methods
def __init__(self, hidden_dim, action_dim) -> None
def forward(self, x, epsilon) -> Tensor | Tuple[Tensor]
Sample pre-actions and associated log-probabilities.
Arguments:
x(Tensor)
epsilon(Tensor | None)
Returns:
- Direct samples (pre-actions) from the policy log- probabilities associated to those samples