Updating value model to be stochastic
This commit is contained in:
parent
e6e11f90b7
commit
7c9e75030b
@@ -149,7 +149,8 @@ class ValueModel(nn.Module):
|
|||||||
|
|
||||||
def forward(self, state):
|
def forward(self, state):
|
||||||
value = self.value_model(state)
|
value = self.value_model(state)
|
||||||
return value
|
value_dist = torch.distributions.independent.Independent(torch.distributions.Normal(value, 1), 1)
|
||||||
|
return value_dist
|
||||||
|
|
||||||
|
|
||||||
class TransitionModel(nn.Module):
|
class TransitionModel(nn.Module):
|
||||||
|
Loading…
Reference in New Issue
Block a user