We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 6d7df9d, commit 393be07 (Copy full SHA for 393be07)
examples/trpo_gym_cartpole.py
@@ -16,7 +16,7 @@ def run_task(*_):
16
policy = CategoricalMLPPolicy(
17
env_spec=env.spec,
18
# The neural network policy should have two hidden layers, each with 32 hidden units.
19
- hidden_sizes=(8, 8)
+ hidden_sizes=(32, 32)
20
)
21
22
baseline = LinearFeatureBaseline(env_spec=env.spec)
examples/trpo_gym_pendulum.py
@@ -15,7 +15,7 @@ def run_task(*_):
15
policy = GaussianMLPPolicy(
0 commit comments