@@ -4710,7 +4710,7 @@ def _create_mock_actor(
4710
4710
):
4711
4711
# Actor
4712
4712
action_spec = OneHot(action_dim)
4713
- net = nn.Sequential(nn. Linear(obs_dim, 2 * action_dim), NormalParamExtractor() )
4713
+ net = nn.Linear(obs_dim, action_dim)
4714
4714
module = TensorDictModule(net, in_keys=[observation_key], out_keys=["logits"])
4715
4715
actor = ProbabilisticActor(
4716
4716
spec=action_spec,
@@ -11388,7 +11388,7 @@ def _create_mock_actor(self, batch=2, obs_dim=3, action_dim=4, device="cpu"):
11388
11388
action_spec = Bounded(
11389
11389
-torch.ones(action_dim), torch.ones(action_dim), (action_dim,)
11390
11390
)
11391
- net = nn.Sequential(nn. Linear(obs_dim, 2 * action_dim), NormalParamExtractor() )
11391
+ net = nn.Linear(obs_dim, action_dim)
11392
11392
module = TensorDictModule(net, in_keys=["observation"], out_keys=["param"])
11393
11393
actor = ProbabilisticActor(
11394
11394
module=module,
@@ -12632,7 +12632,7 @@ def _create_mock_actor(
12632
12632
):
12633
12633
# Actor
12634
12634
action_spec = OneHot(action_dim)
12635
- net = nn.Sequential(nn. Linear(obs_dim, 2 * action_dim), NormalParamExtractor() )
12635
+ net = nn.Linear(obs_dim, action_dim)
12636
12636
module = TensorDictModule(net, in_keys=[observation_key], out_keys=["logits"])
12637
12637
actor = ProbabilisticActor(
12638
12638
spec=action_spec,
@@ -12729,8 +12729,7 @@ def _create_mock_common_layer_setup(
12729
12729
common = Mod(common_net, in_keys=["obs"], out_keys=["hidden"])
12730
12730
actor = ProbSeq(
12731
12731
common,
12732
- Mod(actor_net, in_keys=["hidden"], out_keys=["param"]),
12733
- Mod(NormalParamExtractor(), in_keys=["param"], out_keys=["logits"]),
12732
+ Mod(actor_net, in_keys=["hidden"], out_keys=["logits"]),
12734
12733
ProbMod(
12735
12734
in_keys=["logits"],
12736
12735
out_keys=["action"],
0 commit comments