{
    "dataset": {
        "repo_id": "kelvinzhaozg/digit3a_hardware_box_pickup_dataset_depth",
        "root": null,
        "episodes": null,
        "image_transforms": {
            "enable": false,
            "max_num_transforms": 3,
            "random_order": false,
            "tfs": {
                "brightness": {
                    "weight": 1.0,
                    "type": "ColorJitter",
                    "kwargs": {
                        "brightness": [
                            0.8,
                            1.2
                        ]
                    }
                },
                "contrast": {
                    "weight": 1.0,
                    "type": "ColorJitter",
                    "kwargs": {
                        "contrast": [
                            0.8,
                            1.2
                        ]
                    }
                },
                "saturation": {
                    "weight": 1.0,
                    "type": "ColorJitter",
                    "kwargs": {
                        "saturation": [
                            0.5,
                            1.5
                        ]
                    }
                },
                "hue": {
                    "weight": 1.0,
                    "type": "ColorJitter",
                    "kwargs": {
                        "hue": [
                            -0.05,
                            0.05
                        ]
                    }
                },
                "sharpness": {
                    "weight": 1.0,
                    "type": "SharpnessJitter",
                    "kwargs": {
                        "sharpness": [
                            0.5,
                            1.5
                        ]
                    }
                }
            }
        },
        "revision": null,
        "use_imagenet_stats": false,
        "video_backend": "torchcodec"
    },
    "env": null,
    "policy": {
        "type": "diffusion",
        "n_obs_steps": 1,
        "normalization_mapping": {
            "VISUAL": "IDENTITY",
            "STATE": "MIN_MAX",
            "ACTION": "MIN_MAX"
        },
        "input_features": {
            "observation.images.depth": {
                "type": "VISUAL",
                "shape": [
                    1,
                    240,
                    424
                ]
            },
            "observation.state": {
                "type": "STATE",
                "shape": [
                    24
                ]
            }
        },
        "output_features": {
            "action": {
                "type": "ACTION",
                "shape": [
                    21
                ]
            }
        },
        "device": "cuda",
        "use_amp": false,
        "push_to_hub": true,
        "repo_id": "kelvinzhaozg/diffusion_digit3a_hardware_box_pickup_depth",
        "private": null,
        "tags": null,
        "license": null,
        "horizon": 64,
        "n_action_steps": 32,
        "per_feature_normalization_overrides": {
            "observation.images.depth": "MEAN_STD"
        },
        "drop_n_last_frames": 7,
        "vision_backbone": "resnet18",
        "crop_shape": null,
        "crop_is_random": true,
        "pretrained_backbone_weights": null,
        "use_group_norm": true,
        "spatial_softmax_num_keypoints": 32,
        "use_separate_rgb_encoder_per_camera": false,
        "use_depth_as_channel": true,
        "use_depth_only": true,
        "rgbd_pretrained_backbone_weights": null,
        "norm_rgb": false,
        "norm_depth": false,
        "down_dims": [
            512,
            1024,
            2048
        ],
        "kernel_size": 5,
        "n_groups": 8,
        "diffusion_step_embed_dim": 128,
        "use_film_scale_modulation": true,
        "noise_scheduler_type": "DDIM",
        "num_train_timesteps": 100,
        "beta_schedule": "squaredcos_cap_v2",
        "beta_start": 0.0001,
        "beta_end": 0.02,
        "prediction_type": "sample",
        "clip_sample": true,
        "clip_sample_range": 1.0,
        "num_inference_steps": null,
        "do_mask_loss_for_padding": false,
        "optimizer_lr": 0.0001,
        "optimizer_betas": [
            0.95,
            0.999
        ],
        "optimizer_eps": 1e-08,
        "optimizer_weight_decay": 1e-06,
        "scheduler_name": "cosine",
        "scheduler_warmup_steps": 500
    },
    "output_dir": "outputs/train/2025-10-16/16-49-40_diffusion",
    "job_name": "diffusion",
    "resume": false,
    "seed": 1000,
    "num_workers": 4,
    "batch_size": 8,
    "steps": 200000,
    "eval_freq": 20000,
    "log_freq": 200,
    "save_checkpoint": true,
    "save_freq": 20000,
    "use_policy_training_preset": true,
    "optimizer": {
        "type": "adam",
        "lr": 0.0001,
        "weight_decay": 1e-06,
        "grad_clip_norm": 10.0,
        "betas": [
            0.95,
            0.999
        ],
        "eps": 1e-08
    },
    "scheduler": {
        "type": "diffuser",
        "num_warmup_steps": 500,
        "name": "cosine"
    },
    "eval": {
        "n_episodes": 50,
        "batch_size": 50,
        "use_async_envs": false
    },
    "wandb": {
        "enable": true,
        "disable_artifact": true,
        "project": "digit3a_rgbd",
        "entity": null,
        "notes": null,
        "run_id": "egik8o1l",
        "mode": null
    }
}