revert adding observation in ret

This commit is contained in:
Wael Karkoub 2024-06-10 17:13:10 +01:00
parent cbbdbc0f08
commit 9c0c82f1e9
1 changed file with 1 addition and 2 deletions

View File

@@ -99,7 +99,7 @@ def rollout(
"reward": A (batch, sequence) tensor of rewards received for applying the actions.
"success": A (batch, sequence) tensor of success conditions (the only time this can be True is upon
environment termination/truncation).
-"don": A (batch, sequence) tensor of **cumulative** done conditions. For any given batch element,
+"done": A (batch, sequence) tensor of **cumulative** done conditions. For any given batch element,
the first True is followed by True's all the way till the end. This can be used for masking
extraneous elements from the sequences above.
@@ -195,7 +195,6 @@ def rollout(
"reward": torch.stack(all_rewards, dim=1),
"success": torch.stack(all_successes, dim=1),
"done": torch.stack(all_dones, dim=1),
-"observation": None,
}
if return_observations:
stacked_observations = {}