Remove latency, tdmpc policy passes tests (TODO: make it work with online RL)

2024-04-07 16:01:22 +00:00
parent 44656d2706
commit 4371a5570d
8 changed files with 123 additions and 133 deletions
--- a/lerobot/configs/policy/diffusion.yaml
+++ b/lerobot/configs/policy/diffusion.yaml
@@ -16,7 +16,6 @@ seed: 100000
 horizon: 16
 n_obs_steps: 2
 n_action_steps: 8
-n_latency_steps: 0
 dataset_obs_steps: ${n_obs_steps}
 past_action_visible: False
 keypoint_visible_rate: 1.0
@@ -38,7 +37,6 @@ policy:
  shape_meta: ${shape_meta}

  horizon: ${horizon}
-  # n_action_steps: ${eval:'${n_action_steps}+${n_latency_steps}'}
  n_obs_steps: ${n_obs_steps}
  num_inference_steps: 100
  obs_as_global_cond: ${obs_as_global_cond}
@@ -64,6 +62,11 @@ policy:
  lr_warmup_steps: 500
  grad_clip_norm: 10

+  delta_timestamps:  # keep the leading zero: PyYAML-based loaders read "-.1" as a string, not a float
+    observation.image: [-0.1, 0]  # 2 offsets, matching n_obs_steps
+    observation.state: [-0.1, 0]  # 2 offsets, matching n_obs_steps
+    action: [-0.1, 0, 0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9, 1.0, 1.1, 1.2, 1.3, 1.4]  # 16 = horizon
+
 noise_scheduler:
  _target_: diffusers.schedulers.scheduling_ddpm.DDPMScheduler
  num_train_timesteps: 100