Added an `s` keyboard command to force success in case the reward classifier fails. Co-authored-by: Adil Zouitine <adilzouitinegm@gmail.com>
54 lines
1.3 KiB
YAML
54 lines
1.3 KiB
YAML
# @package _global_

# Defaults list: the only entry is this file itself (`_self_`).
defaults:
  - _self_

# Seed value for the run.
seed: 13

# Dataset repo id and the local directory it is read from.
# Alternative repo id kept for reference:
#   aractingi/push_cube_square_reward_1_cropped_resized
dataset_repo_id: "aractingi/push_cube_square_light_reward_cropped_resized"
dataset_root: "data/aractingi/push_cube_square_light_reward_cropped_resized"
local_files_only: true

# Proportion of the dataset assigned to the training split
# (presumably the remainder is used for validation -- confirm in the trainer).
train_split_proportion: 0.8
|
|
|
|
# Required by logger
env:
  name: "classifier"
  task: "binary_classification"
|
|
|
|
|
|
# Settings for the classifier training run.
training:
  num_epochs: 6
  batch_size: 16
  # Written with an explicit mantissa dot: YAML 1.1 loaders such as PyYAML
  # resolve a bare `1e-4` as the string "1e-4" instead of a float.
  learning_rate: 1.0e-4
  num_workers: 4
  grad_clip_norm: 10
  use_amp: true
  log_freq: 1
  eval_freq: 1  # How often to run validation (in epochs)
  save_freq: 1  # How often to save checkpoints (in epochs)
  save_checkpoint: true
  # policy.num_cameras has to equal the number of entries in this list.
  image_keys:
    - "observation.images.front"
    - "observation.images.side"
  label_key: "next.reward"
  profile_inference_time: false
  profile_inference_time_iters: 20
|
|
|
|
# Validation settings.
eval:
  batch_size: 16
  # Number of validation samples to log in the table
  num_samples_to_log: 30
|
|
|
|
# Classifier model selection.
policy:
  name: "hilserl/classifier"
  # Alternative model name kept for reference: "facebook/convnext-base-224"
  model_name: "helper2424/resnet10"
  model_type: "cnn"
  # Has to be len(training.image_keys)
  num_cameras: 2
|
|
|
|
# Experiment-tracking settings; tracking is switched off here (`enable: false`).
wandb:
  enable: false
  project: "classifier-training"
  job_name: "classifier_training_0"
  disable_artifact: false
|
|
|
|
# Top-level run settings: compute device, resume flag, and output directory.
device: "mps"
resume: false
output_dir: "outputs/classifier/old_trainer_resnet10_frozen"
|