[Port HIL-SERL] Add resnet-10 as default encoder for HIL-SERL (#696)

Co-authored-by: Khalil Meftah <kmeftah.khalil@gmail.com>
Co-authored-by: Adil Zouitine <adilzouitinegm@gmail.com>
Co-authored-by: Michel Aractingi <michel.aractingi@huggingface.co>
Co-authored-by: Ke Wang <superwk1017@gmail.com>
This commit is contained in:
Eugene Mironov 2025-02-11 17:37:00 +07:00 committed by GitHub
parent a7db3959f5
commit a1d16fb400
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
3 changed files with 3 additions and 3 deletions

View File

@@ -10,7 +10,7 @@ class ClassifierConfig:
num_classes: int = 2
hidden_dim: int = 256
dropout_rate: float = 0.1
-model_name: str = "microsoft/resnet-50"
+model_name: str = "helper2424/resnet10"
device: str = "cpu"
model_type: str = "cnn" # "transformer" or "cnn"
num_cameras: int = 2

View File

@@ -61,7 +61,7 @@ class SACConfig:
)
camera_number: int = 1
# Add type annotations for these fields:
-vision_encoder_name: str | None = field(default="microsoft/resnet-18")
+vision_encoder_name: str | None = field(default="helper2424/resnet10")
freeze_vision_encoder: bool = True
image_encoder_hidden_dim: int = 32
shared_encoder: bool = True

View File

@@ -36,7 +36,7 @@ eval:
policy:
name: "hilserl/classifier/push_green_cube_hf_cropped_resized" #"hilserl/classifier/pick_place_lego_cube_1"
-model_name: "facebook/convnext-base-224"
+model_name: "helper2424/resnet10"
model_type: "cnn"
num_cameras: 2 # Has to be len(training.image_keys)