Updating value model to be stochastic
This commit is contained in:
parent
e6e11f90b7
commit
7c9e75030b
@@ -149,7 +149,8 @@ class ValueModel(nn.Module):
|
||||
|
||||
def forward(self, state):
|
||||
value = self.value_model(state)
|
||||
- return value
|
||||
+ value_dist = torch.distributions.independent.Independent(torch.distributions.Normal(value, 1), 1)
|
||||
+ return value_dist
|
||||
|
||||
|
||||
class TransitionModel(nn.Module):
|
||||
|
Loading…
Reference in New Issue
Block a user