diff --git a/examples/locomotion/go2_env.py b/examples/locomotion/go2_env.py index 4368b8a..f3d8f17 100644 --- a/examples/locomotion/go2_env.py +++ b/examples/locomotion/go2_env.py @@ -154,7 +154,7 @@ def step(self, actions): time_out_idx = (self.episode_length_buf > self.max_episode_length).nonzero(as_tuple=False).flatten() self.extras["time_outs"] = torch.zeros_like(self.reset_buf, device=self.device, dtype=gs.tc_float) self.extras["time_outs"][time_out_idx] = 1.0 - + self.reset_idx(self.reset_buf.nonzero(as_tuple=False).flatten()) # compute reward