Fix loss unpadding bug
Use original_action_dim (taken from self.config.action_feature.shape[0]) instead of self.config.max_action_dim when slicing the losses, so that the padded action dimensions are excluded. Including the padded dimensions in the loss computation would impair the model's action reconstruction capability.
This commit is contained in:
parent
5322417c03
commit
294948eff5
|
@ -325,7 +325,8 @@ class PI0Policy(PreTrainedPolicy):
|
||||||
loss_dict["losses_after_in_ep_bound"] = losses.clone()
|
loss_dict["losses_after_in_ep_bound"] = losses.clone()
|
||||||
|
|
||||||
# Remove padding
|
# Remove padding
|
||||||
losses = losses[:, :, : self.config.max_action_dim]
|
original_action_dim = self.config.action_feature.shape[0]
|
||||||
|
losses = losses[:, :, :original_action_dim]
|
||||||
loss_dict["losses_after_rm_padding"] = losses.clone()
|
loss_dict["losses_after_rm_padding"] = losses.clone()
|
||||||
|
|
||||||
# For backward pass
|
# For backward pass
|
||||||
|
|
Loading…
Reference in New Issue