diff --git a/.gitattributes b/.gitattributes index 9dda2938357861f19e73f967818aa5ab96baa5b8..4198f4cdce2144cd0fe4ffa02b7501c484b84cc6 100644 --- a/.gitattributes +++ b/.gitattributes @@ -36,3 +36,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text checkpoints/diffusion_unet_dino/joints/wandb/run-20260515_204227-cgfzze2z/run-cgfzze2z.wandb filter=lfs diff=lfs merge=lfs -text checkpoints/diffusion_unet_dino_data_augmentation/wandb/run-20260516_204526-1c59314z/run-1c59314z.wandb filter=lfs diff=lfs merge=lfs -text checkpoints/diffusion_dagger_iter1_20260517_225259/wandb/run-20260517_225306-kmyshjri/run-kmyshjri.wandb filter=lfs diff=lfs merge=lfs -text +checkpoints/diffusion_specialized_new_dataset_580/wandb/run-20260519_011148-d8akc176/run-d8akc176.wandb filter=lfs diff=lfs merge=lfs -text diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/pretrained_model/config.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/pretrained_model/config.json new file mode 100644 index 0000000000000000000000000000000000000000..eb6d9e0e843e5fa2dbe7d14fccf5efa4dee2ddb9 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/pretrained_model/config.json @@ -0,0 +1,92 @@ +{ + "type": "diffusion", + "n_obs_steps": 2, + "input_features": { + "observation.state": { + "type": "STATE", + "shape": [ + 6 + ] + }, + "observation.images.front": { + "type": "VISUAL", + "shape": [ + 3, + 480, + 640 + ] + } + }, + "output_features": { + "action": { + "type": "ACTION", + "shape": [ + 6 + ] + } + }, + "device": "cuda", + "use_amp": false, + "use_peft": false, + "push_to_hub": false, + "repo_id": null, + "private": null, + "tags": null, + "license": null, + "pretrained_path": "/home/shadeform/Desktop/robot_learning/models/checkpoints/diffusion_580_new_dataset_dino/200000/pretrained_model", + "horizon": 16, + "n_action_steps": 8, + "normalization_mapping": { + "VISUAL": "MEAN_STD", + "STATE": "MIN_MAX", + "ACTION": "MIN_MAX" + }, + "drop_n_last_frames": 7, + "vision_backbone_type": "dinov2", + "vision_encoder_name": "facebook/dinov2-small", + "freeze_vision_encoder": true, + "vision_backbone": "resnet18", + "resize_shape": [ + 224, + 224 + ], + "crop_ratio": 1.0, + "crop_shape": null, + "crop_is_random": true, + "pretrained_backbone_weights": "ResNet18_Weights.IMAGENET1K_V1", + "use_group_norm": false, + "spatial_softmax_num_keypoints": 32, + "vit_pool_type": "spatial_softmax", + "vit_feature_dim": 512, + "use_separate_rgb_encoder_per_camera": true, + "down_dims": [ + 512, + 1024, + 2048 + ], + "kernel_size": 5, + "n_groups": 8, + "diffusion_step_embed_dim": 128, + "use_film_scale_modulation": true, + "noise_scheduler_type": "DDPM", + "num_train_timesteps": 100, + "beta_schedule": "squaredcos_cap_v2", + "beta_start": 0.0001, + "beta_end": 0.02, + "prediction_type": "epsilon", + "clip_sample": true, + "clip_sample_range": 1.0, + "num_inference_steps": 100, + "compile_model": false, + "compile_mode": "reduce-overhead", + "do_mask_loss_for_padding": false, + "optimizer_lr": 1e-05, + "optimizer_betas": [ + 0.95, + 0.999 + ], + "optimizer_eps": 1e-08, + "optimizer_weight_decay": 1e-06, + "scheduler_name": "cosine", + "scheduler_warmup_steps": 100 +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/pretrained_model/model.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/pretrained_model/model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f70dc01f24f5ae7d573c73c421f9609473d4168c --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/pretrained_model/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29b628f8a3b16768596fc3e4a30a1b369358aff0cc4b38d061b53cac5086f013 +size 1095367712 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/pretrained_model/policy_postprocessor.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/pretrained_model/policy_postprocessor.json new file mode 100644 index 0000000000000000000000000000000000000000..f2c5e6cea7850bb999ab193f96021fa0129ce4db --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/pretrained_model/policy_postprocessor.json @@ -0,0 +1,32 @@ +{ + "name": "policy_postprocessor", + "steps": [ + { + "registry_name": "unnormalizer_processor", + "config": { + "eps": 1e-08, + "features": { + "action": { + "type": "ACTION", + "shape": [ + 6 + ] + } + }, + "norm_map": { + "VISUAL": "MEAN_STD", + "STATE": "MIN_MAX", + "ACTION": "MIN_MAX" + } + }, + "state_file": "policy_postprocessor_step_0_unnormalizer_processor.safetensors" + }, + { + "registry_name": "device_processor", + "config": { + "device": "cpu", + "float_dtype": null + } + } + ] +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/pretrained_model/policy_postprocessor_step_0_unnormalizer_processor.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/pretrained_model/policy_postprocessor_step_0_unnormalizer_processor.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b5a2a63fb8806fa7c342c79e166f0a8b0e6a46d6 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/pretrained_model/policy_postprocessor_step_0_unnormalizer_processor.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:246776baee98e80415490a71d2dcc585a887291ef94b140cf637dcff081d3a18 +size 6560 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/pretrained_model/policy_preprocessor.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/pretrained_model/policy_preprocessor.json new file mode 100644 index 0000000000000000000000000000000000000000..a6f57e6242af17f882bc107c602ca76393c57d55 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/pretrained_model/policy_preprocessor.json @@ -0,0 +1,56 @@ +{ + "name": "policy_preprocessor", + "steps": [ + { + "registry_name": "rename_observations_processor", + "config": { + "rename_map": {} + } + }, + { + "registry_name": "to_batch_processor", + "config": {} + }, + { + "registry_name": "device_processor", + "config": { + "device": "cuda", + "float_dtype": null + } + }, + { + "registry_name": "normalizer_processor", + "config": { + "eps": 1e-08, + "features": { + "observation.state": { + "type": "STATE", + "shape": [ + 6 + ] + }, + "observation.images.front": { + "type": "VISUAL", + "shape": [ + 3, + 480, + 640 + ] + }, + "action": { + "type": "ACTION", + "shape": [ + 6 + ] + } + }, + "norm_map": { + "VISUAL": "MEAN_STD", + "STATE": "MIN_MAX", + "ACTION": "MIN_MAX" + } + }, + "state_file": "policy_preprocessor_step_3_normalizer_processor.safetensors" + } + ] +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/pretrained_model/policy_preprocessor_step_3_normalizer_processor.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/pretrained_model/policy_preprocessor_step_3_normalizer_processor.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b5a2a63fb8806fa7c342c79e166f0a8b0e6a46d6 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/pretrained_model/policy_preprocessor_step_3_normalizer_processor.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:246776baee98e80415490a71d2dcc585a887291ef94b140cf637dcff081d3a18 +size 6560 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/pretrained_model/train_config.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/pretrained_model/train_config.json new file mode 100644 index 0000000000000000000000000000000000000000..638986814c22c471c7596c080c170c7c4c4dd86b --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/pretrained_model/train_config.json @@ -0,0 +1,302 @@ +{ + "dataset": { + "repo_id": "local/act_collected_episodes", + "root": "/home/shadeform/Desktop/robot_learning/base_new_dataset_134", + "episodes": null, + "image_transforms": { + "enable": false, + "max_num_transforms": 3, + "random_order": false, + "same_cloth_color": false, + "tfs": { + "color_jitter": { + "weight": 1.5, + "type": "ColorJitter", + "kwargs": { + "brightness": [ + 0.7, + 1.3 + ], + "contrast": [ + 0.7, + 1.3 + ], + "saturation": [ + 0.4, + 1.6 + ], + "hue": [ + -0.5, + 0.5 + ] + } + }, + "grayscale": { + "weight": 0.5, + "type": "RandomGrayscale", + "kwargs": { + "p": 1.0 + } + }, + "shadow": { + "weight": 0.8, + "type": "RandomShadow", + "kwargs": { + "num_shadows": [ + 1, + 2 + ], + "intensity": [ + 0.4, + 0.7 + ], + "blur_sigma": [ + 4.0, + 20.0 + ] + } + }, + "highlight": { + "weight": 0.5, + "type": "RandomHighlight", + "kwargs": { + "num_highlights": [ + 0, + 1 + ], + "intensity": [ + 0.2, + 0.5 + ], + "sigma": [ + 20.0, + 60.0 + ] + } + }, + "gamma": { + "weight": 0.7, + "type": "RandomGamma", + "kwargs": { + "gamma": [ + 0.6, + 1.4 + ] + } + }, + "blur": { + "weight": 0.0, + "type": "GaussianBlur", + "kwargs": { + "kernel_size": [ + 3, + 3 + ], + "sigma": [ + 0.1, + 1.5 + ] + } + }, + "jpeg": { + "weight": 0.0, + "type": "RandomJPEG", + "kwargs": { + "quality": [ + 60, + 95 + ] + } + }, + "crop": { + "weight": 0.5, + "type": "RandomCropPreserveSize", + "kwargs": { + "scale": [ + 0.97, + 1.0 + ], + "ratio": [ + 0.99, + 1.01 + ] + } + }, + "affine": { + "weight": 0.0, + "type": "RandomAffine", + "kwargs": { + "degrees": [ + -5.0, + 5.0 + ], + "translate": [ + 0.05, + 0.05 + ] + } + }, + "sharpness": { + "weight": 1.0, + "type": "SharpnessJitter", + "kwargs": { + "sharpness": [ + 0.5, + 1.5 + ] + } + } + } + }, + "revision": null, + "use_imagenet_stats": true, + "video_backend": "pyav", + "return_uint8": false, + "streaming": false + }, + "env": null, + "policy": { + "type": "diffusion", + "n_obs_steps": 2, + "input_features": { + "observation.state": { + "type": "STATE", + "shape": [ + 6 + ] + }, + "observation.images.front": { + "type": "VISUAL", + "shape": [ + 3, + 480, + 640 + ] + } + }, + "output_features": { + "action": { + "type": "ACTION", + "shape": [ + 6 + ] + } + }, + "device": "cuda", + "use_amp": false, + "use_peft": false, + "push_to_hub": false, + "repo_id": null, + "private": null, + "tags": null, + "license": null, + "pretrained_path": "/home/shadeform/Desktop/robot_learning/models/checkpoints/diffusion_580_new_dataset_dino/200000/pretrained_model", + "horizon": 16, + "n_action_steps": 8, + "normalization_mapping": { + "VISUAL": "MEAN_STD", + "STATE": "MIN_MAX", + "ACTION": "MIN_MAX" + }, + "drop_n_last_frames": 7, + "vision_backbone_type": "dinov2", + "vision_encoder_name": "facebook/dinov2-small", + "freeze_vision_encoder": true, + "vision_backbone": "resnet18", + "resize_shape": [ + 224, + 224 + ], + "crop_ratio": 1.0, + "crop_shape": null, + "crop_is_random": true, + "pretrained_backbone_weights": "ResNet18_Weights.IMAGENET1K_V1", + "use_group_norm": false, + "spatial_softmax_num_keypoints": 32, + "vit_pool_type": "spatial_softmax", + "vit_feature_dim": 512, + "use_separate_rgb_encoder_per_camera": true, + "down_dims": [ + 512, + 1024, + 2048 + ], + "kernel_size": 5, + "n_groups": 8, + "diffusion_step_embed_dim": 128, + "use_film_scale_modulation": true, + "noise_scheduler_type": "DDPM", + "num_train_timesteps": 100, + "beta_schedule": "squaredcos_cap_v2", + "beta_start": 0.0001, + "beta_end": 0.02, + "prediction_type": "epsilon", + "clip_sample": true, + "clip_sample_range": 1.0, + "num_inference_steps": 100, + "compile_model": false, + "compile_mode": "reduce-overhead", + "do_mask_loss_for_padding": false, + "optimizer_lr": 1e-05, + "optimizer_betas": [ + 0.95, + 0.999 + ], + "optimizer_eps": 1e-08, + "optimizer_weight_decay": 1e-06, + "scheduler_name": "cosine", + "scheduler_warmup_steps": 100 + }, + "reward_model": null, + "output_dir": "/home/shadeform/Desktop/robot_learning/outputs/train/diffusion_specialized_eval1", + "job_name": "diffusion_specialized_eval1", + "resume": false, + "seed": 1000, + "cudnn_deterministic": false, + "num_workers": 4, + "batch_size": 32, + "prefetch_factor": 4, + "persistent_workers": true, + "steps": 30000, + "eval_freq": 0, + "log_freq": 20, + "tolerance_s": 0.0001, + "save_checkpoint": true, + "save_freq": 5000, + "use_policy_training_preset": true, + "optimizer": { + "type": "adam", + "lr": 1e-05, + "weight_decay": 1e-06, + "grad_clip_norm": 10.0, + "betas": [ + 0.95, + 0.999 + ], + "eps": 1e-08 + }, + "scheduler": { + "type": "diffuser", + "num_warmup_steps": 100, + "name": "cosine" + }, + "eval": { + "n_episodes": 50, + "batch_size": 11, + "use_async_envs": true + }, + "wandb": { + "enable": true, + "disable_artifact": false, + "project": "lerobot", + "entity": null, + "notes": null, + "run_id": "d8akc176", + "mode": null, + "add_tags": true + }, + "peft": null, + "sample_weighting": null, + "rename_map": {}, + "checkpoint_path": null +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/training_state/optimizer_param_groups.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/training_state/optimizer_param_groups.json new file mode 100644 index 0000000000000000000000000000000000000000..cd17a194e2d4661070418132c77aa2fc31293a4b --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/training_state/optimizer_param_groups.json @@ -0,0 +1,396 @@ +[ + { + "lr": 9.351850337481774e-06, + "betas": [ + 0.95, + 0.999 + ], + "eps": 1e-08, + "weight_decay": 1e-06, + "amsgrad": false, + "maximize": false, + "foreach": null, + "capturable": false, + "differentiable": false, + "fused": null, + "decoupled_weight_decay": false, + "initial_lr": 1e-05, + "params": [ + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7, + 8, + 9, + 10, + 11, + 12, + 13, + 14, + 15, + 16, + 17, + 18, + 19, + 20, + 21, + 22, + 23, + 24, + 25, + 26, + 27, + 28, + 29, + 30, + 31, + 32, + 33, + 34, + 35, + 36, + 37, + 38, + 39, + 40, + 41, + 42, + 43, + 44, + 45, + 46, + 47, + 48, + 49, + 50, + 51, + 52, + 53, + 54, + 55, + 56, + 57, + 58, + 59, + 60, + 61, + 62, + 63, + 64, + 65, + 66, + 67, + 68, + 69, + 70, + 71, + 72, + 73, + 74, + 75, + 76, + 77, + 78, + 79, + 80, + 81, + 82, + 83, + 84, + 85, + 86, + 87, + 88, + 89, + 90, + 91, + 92, + 93, + 94, + 95, + 96, + 97, + 98, + 99, + 100, + 101, + 102, + 103, + 104, + 105, + 106, + 107, + 108, + 109, + 110, + 111, + 112, + 113, + 114, + 115, + 116, + 117, + 118, + 119, + 120, + 121, + 122, + 123, + 124, + 125, + 126, + 127, + 128, + 129, + 130, + 131, + 132, + 133, + 134, + 135, + 136, + 137, + 138, + 139, + 140, + 141, + 142, + 143, + 144, + 145, + 146, + 147, + 148, + 149, + 150, + 151, + 152, + 153, + 154, + 155, + 156, + 157, + 158, + 159, + 160, + 161, + 162, + 163, + 164, + 165, + 166, + 167, + 168, + 169, + 170, + 171, + 172, + 173, + 174, + 175, + 176, + 177, + 178, + 179, + 180, + 181, + 182, + 183, + 184, + 185, + 186, + 187, + 188, + 189, + 190, + 191, + 192, + 193, + 194, + 195, + 196, + 197, + 198, + 199, + 200, + 201, + 202, + 203, + 204, + 205, + 206, + 207, + 208, + 209, + 210, + 211, + 212, + 213, + 214, + 215, + 216, + 217, + 218, + 219, + 220, + 221, + 222, + 223, + 224, + 225, + 226, + 227, + 228, + 229, + 230, + 231, + 232, + 233, + 234, + 235, + 236, + 237, + 238, + 239, + 240, + 241, + 242, + 243, + 244, + 245, + 246, + 247, + 248, + 249, + 250, + 251, + 252, + 253, + 254, + 255, + 256, + 257, + 258, + 259, + 260, + 261, + 262, + 263, + 264, + 265, + 266, + 267, + 268, + 269, + 270, + 271, + 272, + 273, + 274, + 275, + 276, + 277, + 278, + 279, + 280, + 281, + 282, + 283, + 284, + 285, + 286, + 287, + 288, + 289, + 290, + 291, + 292, + 293, + 294, + 295, + 296, + 297, + 298, + 299, + 300, + 301, + 302, + 303, + 304, + 305, + 306, + 307, + 308, + 309, + 310, + 311, + 312, + 313, + 314, + 315, + 316, + 317, + 318, + 319, + 320, + 321, + 322, + 323, + 324, + 325, + 326, + 327, + 328, + 329, + 330, + 331, + 332, + 333, + 334, + 335, + 336, + 337, + 338, + 339, + 340, + 341, + 342, + 343, + 344, + 345, + 346, + 347, + 348, + 349, + 350, + 351, + 352, + 353, + 354, + 355, + 356, + 357, + 358, + 359, + 360, + 361, + 362, + 363, + 364, + 365, + 366, + 367, + 368, + 369, + 370, + 371, + 372, + 373, + 374 + ] + } +] \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/training_state/optimizer_state.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/training_state/optimizer_state.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..53bcb3a095da3e6167842772b6752fb0c2cbad6d --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/training_state/optimizer_state.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d14a3dacd0c411d138135d8d2c5c14b6662c6d82707928637de1e055d26b1c4a +size 2014217744 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/training_state/rng_state.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/training_state/rng_state.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5185469b3dc835bada57c0a885c1559451e2d0ae --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/training_state/rng_state.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99d3021418cfacc2c6869043f18a73b6fafe33c8de9e31cc751a9c9b30e5a065 +size 15708 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/training_state/scheduler_state.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/training_state/scheduler_state.json new file mode 100644 index 0000000000000000000000000000000000000000..8e5c0277996feb7c944f117fde98fed15285e0ce --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/training_state/scheduler_state.json @@ -0,0 +1,15 @@ +{ + "base_lrs": [ + 1e-05 + ], + "last_epoch": 5000, + "_step_count": 5001, + "_is_initial": false, + "_get_lr_called_within_step": false, + "_last_lr": [ + 9.351850337481774e-06 + ], + "lr_lambdas": [ + null + ] +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/training_state/training_step.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/training_state/training_step.json new file mode 100644 index 0000000000000000000000000000000000000000..592449d3fc8b35c30c604eb1dabe60537e8224a0 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/005000/training_state/training_step.json @@ -0,0 +1,3 @@ +{ + "step": 5000 +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/pretrained_model/config.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/pretrained_model/config.json new file mode 100644 index 0000000000000000000000000000000000000000..eb6d9e0e843e5fa2dbe7d14fccf5efa4dee2ddb9 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/pretrained_model/config.json @@ -0,0 +1,92 @@ +{ + "type": "diffusion", + "n_obs_steps": 2, + "input_features": { + "observation.state": { + "type": "STATE", + "shape": [ + 6 + ] + }, + "observation.images.front": { + "type": "VISUAL", + "shape": [ + 3, + 480, + 640 + ] + } + }, + "output_features": { + "action": { + "type": "ACTION", + "shape": [ + 6 + ] + } + }, + "device": "cuda", + "use_amp": false, + "use_peft": false, + "push_to_hub": false, + "repo_id": null, + "private": null, + "tags": null, + "license": null, + "pretrained_path": "/home/shadeform/Desktop/robot_learning/models/checkpoints/diffusion_580_new_dataset_dino/200000/pretrained_model", + "horizon": 16, + "n_action_steps": 8, + "normalization_mapping": { + "VISUAL": "MEAN_STD", + "STATE": "MIN_MAX", + "ACTION": "MIN_MAX" + }, + "drop_n_last_frames": 7, + "vision_backbone_type": "dinov2", + "vision_encoder_name": "facebook/dinov2-small", + "freeze_vision_encoder": true, + "vision_backbone": "resnet18", + "resize_shape": [ + 224, + 224 + ], + "crop_ratio": 1.0, + "crop_shape": null, + "crop_is_random": true, + "pretrained_backbone_weights": "ResNet18_Weights.IMAGENET1K_V1", + "use_group_norm": false, + "spatial_softmax_num_keypoints": 32, + "vit_pool_type": "spatial_softmax", + "vit_feature_dim": 512, + "use_separate_rgb_encoder_per_camera": true, + "down_dims": [ + 512, + 1024, + 2048 + ], + "kernel_size": 5, + "n_groups": 8, + "diffusion_step_embed_dim": 128, + "use_film_scale_modulation": true, + "noise_scheduler_type": "DDPM", + "num_train_timesteps": 100, + "beta_schedule": "squaredcos_cap_v2", + "beta_start": 0.0001, + "beta_end": 0.02, + "prediction_type": "epsilon", + "clip_sample": true, + "clip_sample_range": 1.0, + "num_inference_steps": 100, + "compile_model": false, + "compile_mode": "reduce-overhead", + "do_mask_loss_for_padding": false, + "optimizer_lr": 1e-05, + "optimizer_betas": [ + 0.95, + 0.999 + ], + "optimizer_eps": 1e-08, + "optimizer_weight_decay": 1e-06, + "scheduler_name": "cosine", + "scheduler_warmup_steps": 100 +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/pretrained_model/model.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/pretrained_model/model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..404c46291bfdbbe1541cb8b51dd58e2de6b45850 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/pretrained_model/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7342f68236a419e34aa8cbfdaf1990630d2ac069e038859ec95faca2f50b5963 +size 1095367712 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/pretrained_model/policy_postprocessor.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/pretrained_model/policy_postprocessor.json new file mode 100644 index 0000000000000000000000000000000000000000..f2c5e6cea7850bb999ab193f96021fa0129ce4db --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/pretrained_model/policy_postprocessor.json @@ -0,0 +1,32 @@ +{ + "name": "policy_postprocessor", + "steps": [ + { + "registry_name": "unnormalizer_processor", + "config": { + "eps": 1e-08, + "features": { + "action": { + "type": "ACTION", + "shape": [ + 6 + ] + } + }, + "norm_map": { + "VISUAL": "MEAN_STD", + "STATE": "MIN_MAX", + "ACTION": "MIN_MAX" + } + }, + "state_file": "policy_postprocessor_step_0_unnormalizer_processor.safetensors" + }, + { + "registry_name": "device_processor", + "config": { + "device": "cpu", + "float_dtype": null + } + } + ] +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/pretrained_model/policy_postprocessor_step_0_unnormalizer_processor.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/pretrained_model/policy_postprocessor_step_0_unnormalizer_processor.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b5a2a63fb8806fa7c342c79e166f0a8b0e6a46d6 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/pretrained_model/policy_postprocessor_step_0_unnormalizer_processor.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:246776baee98e80415490a71d2dcc585a887291ef94b140cf637dcff081d3a18 +size 6560 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/pretrained_model/policy_preprocessor.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/pretrained_model/policy_preprocessor.json new file mode 100644 index 0000000000000000000000000000000000000000..a6f57e6242af17f882bc107c602ca76393c57d55 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/pretrained_model/policy_preprocessor.json @@ -0,0 +1,56 @@ +{ + "name": "policy_preprocessor", + "steps": [ + { + "registry_name": "rename_observations_processor", + "config": { + "rename_map": {} + } + }, + { + "registry_name": "to_batch_processor", + "config": {} + }, + { + "registry_name": "device_processor", + "config": { + "device": "cuda", + "float_dtype": null + } + }, + { + "registry_name": "normalizer_processor", + "config": { + "eps": 1e-08, + "features": { + "observation.state": { + "type": "STATE", + "shape": [ + 6 + ] + }, + "observation.images.front": { + "type": "VISUAL", + "shape": [ + 3, + 480, + 640 + ] + }, + "action": { + "type": "ACTION", + "shape": [ + 6 + ] + } + }, + "norm_map": { + "VISUAL": "MEAN_STD", + "STATE": "MIN_MAX", + "ACTION": "MIN_MAX" + } + }, + "state_file": "policy_preprocessor_step_3_normalizer_processor.safetensors" + } + ] +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/pretrained_model/policy_preprocessor_step_3_normalizer_processor.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/pretrained_model/policy_preprocessor_step_3_normalizer_processor.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b5a2a63fb8806fa7c342c79e166f0a8b0e6a46d6 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/pretrained_model/policy_preprocessor_step_3_normalizer_processor.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:246776baee98e80415490a71d2dcc585a887291ef94b140cf637dcff081d3a18 +size 6560 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/pretrained_model/train_config.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/pretrained_model/train_config.json new file mode 100644 index 0000000000000000000000000000000000000000..638986814c22c471c7596c080c170c7c4c4dd86b --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/pretrained_model/train_config.json @@ -0,0 +1,302 @@ +{ + "dataset": { + "repo_id": "local/act_collected_episodes", + "root": "/home/shadeform/Desktop/robot_learning/base_new_dataset_134", + "episodes": null, + "image_transforms": { + "enable": false, + "max_num_transforms": 3, + "random_order": false, + "same_cloth_color": false, + "tfs": { + "color_jitter": { + "weight": 1.5, + "type": "ColorJitter", + "kwargs": { + "brightness": [ + 0.7, + 1.3 + ], + "contrast": [ + 0.7, + 1.3 + ], + "saturation": [ + 0.4, + 1.6 + ], + "hue": [ + -0.5, + 0.5 + ] + } + }, + "grayscale": { + "weight": 0.5, + "type": "RandomGrayscale", + "kwargs": { + "p": 1.0 + } + }, + "shadow": { + "weight": 0.8, + "type": "RandomShadow", + "kwargs": { + "num_shadows": [ + 1, + 2 + ], + "intensity": [ + 0.4, + 0.7 + ], + "blur_sigma": [ + 4.0, + 20.0 + ] + } + }, + "highlight": { + "weight": 0.5, + "type": "RandomHighlight", + "kwargs": { + "num_highlights": [ + 0, + 1 + ], + "intensity": [ + 0.2, + 0.5 + ], + "sigma": [ + 20.0, + 60.0 + ] + } + }, + "gamma": { + "weight": 0.7, + "type": "RandomGamma", + "kwargs": { + "gamma": [ + 0.6, + 1.4 + ] + } + }, + "blur": { + "weight": 0.0, + "type": "GaussianBlur", + "kwargs": { + "kernel_size": [ + 3, + 3 + ], + "sigma": [ + 0.1, + 1.5 + ] + } + }, + "jpeg": { + "weight": 0.0, + "type": "RandomJPEG", + "kwargs": { + "quality": [ + 60, + 95 + ] + } + }, + "crop": { + "weight": 0.5, + "type": "RandomCropPreserveSize", + "kwargs": { + "scale": [ + 0.97, + 1.0 + ], + "ratio": [ + 0.99, + 1.01 + ] + } + }, + "affine": { + "weight": 0.0, + "type": "RandomAffine", + "kwargs": { + "degrees": [ + -5.0, + 5.0 + ], + "translate": [ + 0.05, + 0.05 + ] + } + }, + "sharpness": { + "weight": 1.0, + "type": "SharpnessJitter", + "kwargs": { + "sharpness": [ + 0.5, + 1.5 + ] + } + } + } + }, + "revision": null, + "use_imagenet_stats": true, + "video_backend": "pyav", + "return_uint8": false, + "streaming": false + }, + "env": null, + "policy": { + "type": "diffusion", + "n_obs_steps": 2, + "input_features": { + "observation.state": { + "type": "STATE", + "shape": [ + 6 + ] + }, + "observation.images.front": { + "type": "VISUAL", + "shape": [ + 3, + 480, + 640 + ] + } + }, + "output_features": { + "action": { + "type": "ACTION", + "shape": [ + 6 + ] + } + }, + "device": "cuda", + "use_amp": false, + "use_peft": false, + "push_to_hub": false, + "repo_id": null, + "private": null, + "tags": null, + "license": null, + "pretrained_path": "/home/shadeform/Desktop/robot_learning/models/checkpoints/diffusion_580_new_dataset_dino/200000/pretrained_model", + "horizon": 16, + "n_action_steps": 8, + "normalization_mapping": { + "VISUAL": "MEAN_STD", + "STATE": "MIN_MAX", + "ACTION": "MIN_MAX" + }, + "drop_n_last_frames": 7, + "vision_backbone_type": "dinov2", + "vision_encoder_name": "facebook/dinov2-small", + "freeze_vision_encoder": true, + "vision_backbone": "resnet18", + "resize_shape": [ + 224, + 224 + ], + "crop_ratio": 1.0, + "crop_shape": null, + "crop_is_random": true, + "pretrained_backbone_weights": "ResNet18_Weights.IMAGENET1K_V1", + "use_group_norm": false, + "spatial_softmax_num_keypoints": 32, + "vit_pool_type": "spatial_softmax", + "vit_feature_dim": 512, + "use_separate_rgb_encoder_per_camera": true, + "down_dims": [ + 512, + 1024, + 2048 + ], + "kernel_size": 5, + "n_groups": 8, + "diffusion_step_embed_dim": 128, + "use_film_scale_modulation": true, + "noise_scheduler_type": "DDPM", + "num_train_timesteps": 100, + "beta_schedule": "squaredcos_cap_v2", + "beta_start": 0.0001, + "beta_end": 0.02, + "prediction_type": "epsilon", + "clip_sample": true, + "clip_sample_range": 1.0, + "num_inference_steps": 100, + "compile_model": false, + "compile_mode": "reduce-overhead", + "do_mask_loss_for_padding": false, + "optimizer_lr": 1e-05, + "optimizer_betas": [ + 0.95, + 0.999 + ], + "optimizer_eps": 1e-08, + "optimizer_weight_decay": 1e-06, + "scheduler_name": "cosine", + "scheduler_warmup_steps": 100 + }, + "reward_model": null, + "output_dir": "/home/shadeform/Desktop/robot_learning/outputs/train/diffusion_specialized_eval1", + "job_name": "diffusion_specialized_eval1", + "resume": false, + "seed": 1000, + "cudnn_deterministic": false, + "num_workers": 4, + "batch_size": 32, + "prefetch_factor": 4, + "persistent_workers": true, + "steps": 30000, + "eval_freq": 0, + "log_freq": 20, + "tolerance_s": 0.0001, + "save_checkpoint": true, + "save_freq": 5000, + "use_policy_training_preset": true, + "optimizer": { + "type": "adam", + "lr": 1e-05, + "weight_decay": 1e-06, + "grad_clip_norm": 10.0, + "betas": [ + 0.95, + 0.999 + ], + "eps": 1e-08 + }, + "scheduler": { + "type": "diffuser", + "num_warmup_steps": 100, + "name": "cosine" + }, + "eval": { + "n_episodes": 50, + "batch_size": 11, + "use_async_envs": true + }, + "wandb": { + "enable": true, + "disable_artifact": false, + "project": "lerobot", + "entity": null, + "notes": null, + "run_id": "d8akc176", + "mode": null, + "add_tags": true + }, + "peft": null, + "sample_weighting": null, + "rename_map": {}, + "checkpoint_path": null +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/training_state/optimizer_param_groups.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/training_state/optimizer_param_groups.json new file mode 100644 index 0000000000000000000000000000000000000000..deeeb990e48be7cb70235b7373ab642b55d0d84c --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/training_state/optimizer_param_groups.json @@ -0,0 +1,396 @@ +[ + { + "lr": 7.530269513584158e-06, + "betas": [ + 0.95, + 0.999 + ], + "eps": 1e-08, + "weight_decay": 1e-06, + "amsgrad": false, + "maximize": false, + "foreach": null, + "capturable": false, + "differentiable": false, + "fused": null, + "decoupled_weight_decay": false, + "initial_lr": 1e-05, + "params": [ + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7, + 8, + 9, + 10, + 11, + 12, + 13, + 14, + 15, + 16, + 17, + 18, + 19, + 20, + 21, + 22, + 23, + 24, + 25, + 26, + 27, + 28, + 29, + 30, + 31, + 32, + 33, + 34, + 35, + 36, + 37, + 38, + 39, + 40, + 41, + 42, + 43, + 44, + 45, + 46, + 47, + 48, + 49, + 50, + 51, + 52, + 53, + 54, + 55, + 56, + 57, + 58, + 59, + 60, + 61, + 62, + 63, + 64, + 65, + 66, + 67, + 68, + 69, + 70, + 71, + 72, + 73, + 74, + 75, + 76, + 77, + 78, + 79, + 80, + 81, + 82, + 83, + 84, + 85, + 86, + 87, + 88, + 89, + 90, + 91, + 92, + 93, + 94, + 95, + 96, + 97, + 98, + 99, + 100, + 101, + 102, + 103, + 104, + 105, + 106, + 107, + 108, + 109, + 110, + 111, + 112, + 113, + 114, + 115, + 116, + 117, + 118, + 119, + 120, + 121, + 122, + 123, + 124, + 125, + 126, + 127, + 128, + 129, + 130, + 131, + 132, + 133, + 134, + 135, + 136, + 137, + 138, + 139, + 140, + 141, + 142, + 143, + 144, + 145, + 146, + 147, + 148, + 149, + 150, + 151, + 152, + 153, + 154, + 155, + 156, + 157, + 158, + 159, + 160, + 161, + 162, + 163, + 164, + 165, + 166, + 167, + 168, + 169, + 170, + 171, + 172, + 173, + 174, + 175, + 176, + 177, + 178, + 179, + 180, + 181, + 182, + 183, + 184, + 185, + 186, + 187, + 188, + 189, + 190, + 191, + 192, + 193, + 194, + 195, + 196, + 197, + 198, + 199, + 200, + 201, + 202, + 203, + 204, + 205, + 206, + 207, + 208, + 209, + 210, + 211, + 212, + 213, + 214, + 215, + 216, + 217, + 218, + 219, + 220, + 221, + 222, + 223, + 224, + 225, + 226, + 227, + 228, + 229, + 230, + 231, + 232, + 233, + 234, + 235, + 236, + 237, + 238, + 239, + 240, + 241, + 242, + 243, + 244, + 245, + 246, + 247, + 248, + 249, + 250, + 251, + 252, + 253, + 254, + 255, + 256, + 257, + 258, + 259, + 260, + 261, + 262, + 263, + 264, + 265, + 266, + 267, + 268, + 269, + 270, + 271, + 272, + 273, + 274, + 275, + 276, + 277, + 278, + 279, + 280, + 281, + 282, + 283, + 284, + 285, + 286, + 287, + 288, + 289, + 290, + 291, + 292, + 293, + 294, + 295, + 296, + 297, + 298, + 299, + 300, + 301, + 302, + 303, + 304, + 305, + 306, + 307, + 308, + 309, + 310, + 311, + 312, + 313, + 314, + 315, + 316, + 317, + 318, + 319, + 320, + 321, + 322, + 323, + 324, + 325, + 326, + 327, + 328, + 329, + 330, + 331, + 332, + 333, + 334, + 335, + 336, + 337, + 338, + 339, + 340, + 341, + 342, + 343, + 344, + 345, + 346, + 347, + 348, + 349, + 350, + 351, + 352, + 353, + 354, + 355, + 356, + 357, + 358, + 359, + 360, + 361, + 362, + 363, + 364, + 365, + 366, + 367, + 368, + 369, + 370, + 371, + 372, + 373, + 374 + ] + } +] \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/training_state/optimizer_state.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/training_state/optimizer_state.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b0b598d0023e8ef8cfc2ff658ad77f46010ec22d --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/training_state/optimizer_state.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:572c1ccc9b9c5d93af00ff92b38cc2b0593796ce2c919d8a8f79389df78532af +size 2014217744 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/training_state/rng_state.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/training_state/rng_state.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ecdb403e791fb91d5c7b144b49276653b55686f3 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/training_state/rng_state.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:071ff168cd01b2ab5e737f7504cedf4cbc3c161683a8a0e19fb25b222e441da5 +size 15708 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/training_state/scheduler_state.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/training_state/scheduler_state.json new file mode 100644 index 0000000000000000000000000000000000000000..4e1876b4baa7a78e0e98e1b8a5c854de8fcf27bd --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/training_state/scheduler_state.json @@ -0,0 +1,15 @@ +{ + "base_lrs": [ + 1e-05 + ], + "last_epoch": 10000, + "_step_count": 10001, + "_is_initial": false, + "_get_lr_called_within_step": false, + "_last_lr": [ + 7.530269513584158e-06 + ], + "lr_lambdas": [ + null + ] +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/training_state/training_step.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/training_state/training_step.json new file mode 100644 index 0000000000000000000000000000000000000000..7cb7c0986e9e7461ca851ce71e95d235ae3d2732 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/010000/training_state/training_step.json @@ -0,0 +1,3 @@ +{ + "step": 10000 +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/pretrained_model/config.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/pretrained_model/config.json new file mode 100644 index 0000000000000000000000000000000000000000..eb6d9e0e843e5fa2dbe7d14fccf5efa4dee2ddb9 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/pretrained_model/config.json @@ -0,0 +1,92 @@ +{ + "type": "diffusion", + "n_obs_steps": 2, + "input_features": { + "observation.state": { + "type": "STATE", + "shape": [ + 6 + ] + }, + "observation.images.front": { + "type": "VISUAL", + "shape": [ + 3, + 480, + 640 + ] + } + }, + "output_features": { + "action": { + "type": "ACTION", + "shape": [ + 6 + ] + } + }, + "device": "cuda", + "use_amp": false, + "use_peft": false, + "push_to_hub": false, + "repo_id": null, + "private": null, + "tags": null, + "license": null, + "pretrained_path": "/home/shadeform/Desktop/robot_learning/models/checkpoints/diffusion_580_new_dataset_dino/200000/pretrained_model", + "horizon": 16, + "n_action_steps": 8, + "normalization_mapping": { + "VISUAL": "MEAN_STD", + "STATE": "MIN_MAX", + "ACTION": "MIN_MAX" + }, + "drop_n_last_frames": 7, + "vision_backbone_type": "dinov2", + "vision_encoder_name": "facebook/dinov2-small", + "freeze_vision_encoder": true, + "vision_backbone": "resnet18", + "resize_shape": [ + 224, + 224 + ], + "crop_ratio": 1.0, + "crop_shape": null, + "crop_is_random": true, + "pretrained_backbone_weights": "ResNet18_Weights.IMAGENET1K_V1", + "use_group_norm": false, + "spatial_softmax_num_keypoints": 32, + "vit_pool_type": "spatial_softmax", + "vit_feature_dim": 512, + "use_separate_rgb_encoder_per_camera": true, + "down_dims": [ + 512, + 1024, + 2048 + ], + "kernel_size": 5, + "n_groups": 8, + "diffusion_step_embed_dim": 128, + "use_film_scale_modulation": true, + "noise_scheduler_type": "DDPM", + "num_train_timesteps": 100, + "beta_schedule": "squaredcos_cap_v2", + "beta_start": 0.0001, + "beta_end": 0.02, + "prediction_type": "epsilon", + "clip_sample": true, + "clip_sample_range": 1.0, + "num_inference_steps": 100, + "compile_model": false, + "compile_mode": "reduce-overhead", + "do_mask_loss_for_padding": false, + "optimizer_lr": 1e-05, + "optimizer_betas": [ + 0.95, + 0.999 + ], + "optimizer_eps": 1e-08, + "optimizer_weight_decay": 1e-06, + "scheduler_name": "cosine", + "scheduler_warmup_steps": 100 +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/pretrained_model/model.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/pretrained_model/model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..d85377c7039199268bb5ec04f42848cffd0df2df --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/pretrained_model/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ab1d19cc8966902e720cbbffbc1fadfd94d497028cecae751794fe4b6e3f5e5 +size 1095367712 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/pretrained_model/policy_postprocessor.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/pretrained_model/policy_postprocessor.json new file mode 100644 index 0000000000000000000000000000000000000000..f2c5e6cea7850bb999ab193f96021fa0129ce4db --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/pretrained_model/policy_postprocessor.json @@ -0,0 +1,32 @@ +{ + "name": "policy_postprocessor", + "steps": [ + { + "registry_name": "unnormalizer_processor", + "config": { + "eps": 1e-08, + "features": { + "action": { + "type": "ACTION", + "shape": [ + 6 + ] + } + }, + "norm_map": { + "VISUAL": "MEAN_STD", + "STATE": "MIN_MAX", + "ACTION": "MIN_MAX" + } + }, + "state_file": "policy_postprocessor_step_0_unnormalizer_processor.safetensors" + }, + { + "registry_name": "device_processor", + "config": { + "device": "cpu", + "float_dtype": null + } + } + ] +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/pretrained_model/policy_postprocessor_step_0_unnormalizer_processor.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/pretrained_model/policy_postprocessor_step_0_unnormalizer_processor.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b5a2a63fb8806fa7c342c79e166f0a8b0e6a46d6 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/pretrained_model/policy_postprocessor_step_0_unnormalizer_processor.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:246776baee98e80415490a71d2dcc585a887291ef94b140cf637dcff081d3a18 +size 6560 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/pretrained_model/policy_preprocessor.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/pretrained_model/policy_preprocessor.json new file mode 100644 index 0000000000000000000000000000000000000000..a6f57e6242af17f882bc107c602ca76393c57d55 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/pretrained_model/policy_preprocessor.json @@ -0,0 +1,56 @@ +{ + "name": "policy_preprocessor", + "steps": [ + { + "registry_name": "rename_observations_processor", + "config": { + "rename_map": {} + } + }, + { + "registry_name": "to_batch_processor", + "config": {} + }, + { + "registry_name": "device_processor", + "config": { + "device": "cuda", + "float_dtype": null + } + }, + { + "registry_name": "normalizer_processor", + "config": { + "eps": 1e-08, + "features": { + "observation.state": { + "type": "STATE", + "shape": [ + 6 + ] + }, + "observation.images.front": { + "type": "VISUAL", + "shape": [ + 3, + 480, + 640 + ] + }, + "action": { + "type": "ACTION", + "shape": [ + 6 + ] + } + }, + "norm_map": { + "VISUAL": "MEAN_STD", + "STATE": "MIN_MAX", + "ACTION": "MIN_MAX" + } + }, + "state_file": "policy_preprocessor_step_3_normalizer_processor.safetensors" + } + ] +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/pretrained_model/policy_preprocessor_step_3_normalizer_processor.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/pretrained_model/policy_preprocessor_step_3_normalizer_processor.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b5a2a63fb8806fa7c342c79e166f0a8b0e6a46d6 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/pretrained_model/policy_preprocessor_step_3_normalizer_processor.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:246776baee98e80415490a71d2dcc585a887291ef94b140cf637dcff081d3a18 +size 6560 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/pretrained_model/train_config.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/pretrained_model/train_config.json new file mode 100644 index 0000000000000000000000000000000000000000..638986814c22c471c7596c080c170c7c4c4dd86b --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/pretrained_model/train_config.json @@ -0,0 +1,302 @@ +{ + "dataset": { + "repo_id": "local/act_collected_episodes", + "root": "/home/shadeform/Desktop/robot_learning/base_new_dataset_134", + "episodes": null, + "image_transforms": { + "enable": false, + "max_num_transforms": 3, + "random_order": false, + "same_cloth_color": false, + "tfs": { + "color_jitter": { + "weight": 1.5, + "type": "ColorJitter", + "kwargs": { + "brightness": [ + 0.7, + 1.3 + ], + "contrast": [ + 0.7, + 1.3 + ], + "saturation": [ + 0.4, + 1.6 + ], + "hue": [ + -0.5, + 0.5 + ] + } + }, + "grayscale": { + "weight": 0.5, + "type": "RandomGrayscale", + "kwargs": { + "p": 1.0 + } + }, + "shadow": { + "weight": 0.8, + "type": "RandomShadow", + "kwargs": { + "num_shadows": [ + 1, + 2 + ], + "intensity": [ + 0.4, + 0.7 + ], + "blur_sigma": [ + 4.0, + 20.0 + ] + } + }, + "highlight": { + "weight": 0.5, + "type": "RandomHighlight", + "kwargs": { + "num_highlights": [ + 0, + 1 + ], + "intensity": [ + 0.2, + 0.5 + ], + "sigma": [ + 20.0, + 60.0 + ] + } + }, + "gamma": { + "weight": 0.7, + "type": "RandomGamma", + "kwargs": { + "gamma": [ + 0.6, + 1.4 + ] + } + }, + "blur": { + "weight": 0.0, + "type": "GaussianBlur", + "kwargs": { + "kernel_size": [ + 3, + 3 + ], + "sigma": [ + 0.1, + 1.5 + ] + } + }, + "jpeg": { + "weight": 0.0, + "type": "RandomJPEG", + "kwargs": { + "quality": [ + 60, + 95 + ] + } + }, + "crop": { + "weight": 0.5, + "type": "RandomCropPreserveSize", + "kwargs": { + "scale": [ + 0.97, + 1.0 + ], + "ratio": [ + 0.99, + 1.01 + ] + } + }, + "affine": { + "weight": 0.0, + "type": "RandomAffine", + "kwargs": { + "degrees": [ + -5.0, + 5.0 + ], + "translate": [ + 0.05, + 0.05 + ] + } + }, + "sharpness": { + "weight": 1.0, + "type": "SharpnessJitter", + "kwargs": { + "sharpness": [ + 0.5, + 1.5 + ] + } + } + } + }, + "revision": null, + "use_imagenet_stats": true, + "video_backend": "pyav", + "return_uint8": false, + "streaming": false + }, + "env": null, + "policy": { + "type": "diffusion", + "n_obs_steps": 2, + "input_features": { + "observation.state": { + "type": "STATE", + "shape": [ + 6 + ] + }, + "observation.images.front": { + "type": "VISUAL", + "shape": [ + 3, + 480, + 640 + ] + } + }, + "output_features": { + "action": { + "type": "ACTION", + "shape": [ + 6 + ] + } + }, + "device": "cuda", + "use_amp": false, + "use_peft": false, + "push_to_hub": false, + "repo_id": null, + "private": null, + "tags": null, + "license": null, + "pretrained_path": "/home/shadeform/Desktop/robot_learning/models/checkpoints/diffusion_580_new_dataset_dino/200000/pretrained_model", + "horizon": 16, + "n_action_steps": 8, + "normalization_mapping": { + "VISUAL": "MEAN_STD", + "STATE": "MIN_MAX", + "ACTION": "MIN_MAX" + }, + "drop_n_last_frames": 7, + "vision_backbone_type": "dinov2", + "vision_encoder_name": "facebook/dinov2-small", + "freeze_vision_encoder": true, + "vision_backbone": "resnet18", + "resize_shape": [ + 224, + 224 + ], + "crop_ratio": 1.0, + "crop_shape": null, + "crop_is_random": true, + "pretrained_backbone_weights": "ResNet18_Weights.IMAGENET1K_V1", + "use_group_norm": false, + "spatial_softmax_num_keypoints": 32, + "vit_pool_type": "spatial_softmax", + "vit_feature_dim": 512, + "use_separate_rgb_encoder_per_camera": true, + "down_dims": [ + 512, + 1024, + 2048 + ], + "kernel_size": 5, + "n_groups": 8, + "diffusion_step_embed_dim": 128, + "use_film_scale_modulation": true, + "noise_scheduler_type": "DDPM", + "num_train_timesteps": 100, + "beta_schedule": "squaredcos_cap_v2", + "beta_start": 0.0001, + "beta_end": 0.02, + "prediction_type": "epsilon", + "clip_sample": true, + "clip_sample_range": 1.0, + "num_inference_steps": 100, + "compile_model": false, + "compile_mode": "reduce-overhead", + "do_mask_loss_for_padding": false, + "optimizer_lr": 1e-05, + "optimizer_betas": [ + 0.95, + 0.999 + ], + "optimizer_eps": 1e-08, + "optimizer_weight_decay": 1e-06, + "scheduler_name": "cosine", + "scheduler_warmup_steps": 100 + }, + "reward_model": null, + "output_dir": "/home/shadeform/Desktop/robot_learning/outputs/train/diffusion_specialized_eval1", + "job_name": "diffusion_specialized_eval1", + "resume": false, + "seed": 1000, + "cudnn_deterministic": false, + "num_workers": 4, + "batch_size": 32, + "prefetch_factor": 4, + "persistent_workers": true, + "steps": 30000, + "eval_freq": 0, + "log_freq": 20, + "tolerance_s": 0.0001, + "save_checkpoint": true, + "save_freq": 5000, + "use_policy_training_preset": true, + "optimizer": { + "type": "adam", + "lr": 1e-05, + "weight_decay": 1e-06, + "grad_clip_norm": 10.0, + "betas": [ + 0.95, + 0.999 + ], + "eps": 1e-08 + }, + "scheduler": { + "type": "diffuser", + "num_warmup_steps": 100, + "name": "cosine" + }, + "eval": { + "n_episodes": 50, + "batch_size": 11, + "use_async_envs": true + }, + "wandb": { + "enable": true, + "disable_artifact": false, + "project": "lerobot", + "entity": null, + "notes": null, + "run_id": "d8akc176", + "mode": null, + "add_tags": true + }, + "peft": null, + "sample_weighting": null, + "rename_map": {}, + "checkpoint_path": null +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/training_state/optimizer_param_groups.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/training_state/optimizer_param_groups.json new file mode 100644 index 0000000000000000000000000000000000000000..7b4a900903303c52fcc3110be95b4a093573f46c --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/training_state/optimizer_param_groups.json @@ -0,0 +1,396 @@ +[ + { + "lr": 5.0262673762765316e-06, + "betas": [ + 0.95, + 0.999 + ], + "eps": 1e-08, + "weight_decay": 1e-06, + "amsgrad": false, + "maximize": false, + "foreach": null, + "capturable": false, + "differentiable": false, + "fused": null, + "decoupled_weight_decay": false, + "initial_lr": 1e-05, + "params": [ + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7, + 8, + 9, + 10, + 11, + 12, + 13, + 14, + 15, + 16, + 17, + 18, + 19, + 20, + 21, + 22, + 23, + 24, + 25, + 26, + 27, + 28, + 29, + 30, + 31, + 32, + 33, + 34, + 35, + 36, + 37, + 38, + 39, + 40, + 41, + 42, + 43, + 44, + 45, + 46, + 47, + 48, + 49, + 50, + 51, + 52, + 53, + 54, + 55, + 56, + 57, + 58, + 59, + 60, + 61, + 62, + 63, + 64, + 65, + 66, + 67, + 68, + 69, + 70, + 71, + 72, + 73, + 74, + 75, + 76, + 77, + 78, + 79, + 80, + 81, + 82, + 83, + 84, + 85, + 86, + 87, + 88, + 89, + 90, + 91, + 92, + 93, + 94, + 95, + 96, + 97, + 98, + 99, + 100, + 101, + 102, + 103, + 104, + 105, + 106, + 107, + 108, + 109, + 110, + 111, + 112, + 113, + 114, + 115, + 116, + 117, + 118, + 119, + 120, + 121, + 122, + 123, + 124, + 125, + 126, + 127, + 128, + 129, + 130, + 131, + 132, + 133, + 134, + 135, + 136, + 137, + 138, + 139, + 140, + 141, + 142, + 143, + 144, + 145, + 146, + 147, + 148, + 149, + 150, + 151, + 152, + 153, + 154, + 155, + 156, + 157, + 158, + 159, + 160, + 161, + 162, + 163, + 164, + 165, + 166, + 167, + 168, + 169, + 170, + 171, + 172, + 173, + 174, + 175, + 176, + 177, + 178, + 179, + 180, + 181, + 182, + 183, + 184, + 185, + 186, + 187, + 188, + 189, + 190, + 191, + 192, + 193, + 194, + 195, + 196, + 197, + 198, + 199, + 200, + 201, + 202, + 203, + 204, + 205, + 206, + 207, + 208, + 209, + 210, + 211, + 212, + 213, + 214, + 215, + 216, + 217, + 218, + 219, + 220, + 221, + 222, + 223, + 224, + 225, + 226, + 227, + 228, + 229, + 230, + 231, + 232, + 233, + 234, + 235, + 236, + 237, + 238, + 239, + 240, + 241, + 242, + 243, + 244, + 245, + 246, + 247, + 248, + 249, + 250, + 251, + 252, + 253, + 254, + 255, + 256, + 257, + 258, + 259, + 260, + 261, + 262, + 263, + 264, + 265, + 266, + 267, + 268, + 269, + 270, + 271, + 272, + 273, + 274, + 275, + 276, + 277, + 278, + 279, + 280, + 281, + 282, + 283, + 284, + 285, + 286, + 287, + 288, + 289, + 290, + 291, + 292, + 293, + 294, + 295, + 296, + 297, + 298, + 299, + 300, + 301, + 302, + 303, + 304, + 305, + 306, + 307, + 308, + 309, + 310, + 311, + 312, + 313, + 314, + 315, + 316, + 317, + 318, + 319, + 320, + 321, + 322, + 323, + 324, + 325, + 326, + 327, + 328, + 329, + 330, + 331, + 332, + 333, + 334, + 335, + 336, + 337, + 338, + 339, + 340, + 341, + 342, + 343, + 344, + 345, + 346, + 347, + 348, + 349, + 350, + 351, + 352, + 353, + 354, + 355, + 356, + 357, + 358, + 359, + 360, + 361, + 362, + 363, + 364, + 365, + 366, + 367, + 368, + 369, + 370, + 371, + 372, + 373, + 374 + ] + } +] \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/training_state/optimizer_state.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/training_state/optimizer_state.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..dcfd04153199ec42fc447dfd016837b72918105f --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/training_state/optimizer_state.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3aa17b020b219072748f81334b702862e9494aacfdaa2eb9d102e8d6682b1d0 +size 2014217744 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/training_state/rng_state.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/training_state/rng_state.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..3f05063053d93f824eb0171e6c48d5a691c426c5 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/training_state/rng_state.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:133e203cd0ce608c81b90b9798c13530eed9548b4cc3b5a9a1f6c8361c3efac5 +size 15708 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/training_state/scheduler_state.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/training_state/scheduler_state.json new file mode 100644 index 0000000000000000000000000000000000000000..cfc1fde89e35ba363bfcb8899c211f23ca23d41a --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/training_state/scheduler_state.json @@ -0,0 +1,15 @@ +{ + "base_lrs": [ + 1e-05 + ], + "last_epoch": 15000, + "_step_count": 15001, + "_is_initial": false, + "_get_lr_called_within_step": false, + "_last_lr": [ + 5.0262673762765316e-06 + ], + "lr_lambdas": [ + null + ] +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/training_state/training_step.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/training_state/training_step.json new file mode 100644 index 0000000000000000000000000000000000000000..5cec056c8ba7f3c2e865a0f73ae59975a0503067 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/015000/training_state/training_step.json @@ -0,0 +1,3 @@ +{ + "step": 15000 +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/pretrained_model/config.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/pretrained_model/config.json new file mode 100644 index 0000000000000000000000000000000000000000..eb6d9e0e843e5fa2dbe7d14fccf5efa4dee2ddb9 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/pretrained_model/config.json @@ -0,0 +1,92 @@ +{ + "type": "diffusion", + "n_obs_steps": 2, + "input_features": { + "observation.state": { + "type": "STATE", + "shape": [ + 6 + ] + }, + "observation.images.front": { + "type": "VISUAL", + "shape": [ + 3, + 480, + 640 + ] + } + }, + "output_features": { + "action": { + "type": "ACTION", + "shape": [ + 6 + ] + } + }, + "device": "cuda", + "use_amp": false, + "use_peft": false, + "push_to_hub": false, + "repo_id": null, + "private": null, + "tags": null, + "license": null, + "pretrained_path": "/home/shadeform/Desktop/robot_learning/models/checkpoints/diffusion_580_new_dataset_dino/200000/pretrained_model", + "horizon": 16, + "n_action_steps": 8, + "normalization_mapping": { + "VISUAL": "MEAN_STD", + "STATE": "MIN_MAX", + "ACTION": "MIN_MAX" + }, + "drop_n_last_frames": 7, + "vision_backbone_type": "dinov2", + "vision_encoder_name": "facebook/dinov2-small", + "freeze_vision_encoder": true, + "vision_backbone": "resnet18", + "resize_shape": [ + 224, + 224 + ], + "crop_ratio": 1.0, + "crop_shape": null, + "crop_is_random": true, + "pretrained_backbone_weights": "ResNet18_Weights.IMAGENET1K_V1", + "use_group_norm": false, + "spatial_softmax_num_keypoints": 32, + "vit_pool_type": "spatial_softmax", + "vit_feature_dim": 512, + "use_separate_rgb_encoder_per_camera": true, + "down_dims": [ + 512, + 1024, + 2048 + ], + "kernel_size": 5, + "n_groups": 8, + "diffusion_step_embed_dim": 128, + "use_film_scale_modulation": true, + "noise_scheduler_type": "DDPM", + "num_train_timesteps": 100, + "beta_schedule": "squaredcos_cap_v2", + "beta_start": 0.0001, + "beta_end": 0.02, + "prediction_type": "epsilon", + "clip_sample": true, + "clip_sample_range": 1.0, + "num_inference_steps": 100, + "compile_model": false, + "compile_mode": "reduce-overhead", + "do_mask_loss_for_padding": false, + "optimizer_lr": 1e-05, + "optimizer_betas": [ + 0.95, + 0.999 + ], + "optimizer_eps": 1e-08, + "optimizer_weight_decay": 1e-06, + "scheduler_name": "cosine", + "scheduler_warmup_steps": 100 +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/pretrained_model/model.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/pretrained_model/model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..57fa373da06abb1d4c5f879183d78c5a07b1fc80 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/pretrained_model/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b25c2f0b1cc75bb1d3c28dba3fc912b523ed0dbd78a94a7fac6ad56472a4ecb3 +size 1095367712 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/pretrained_model/policy_postprocessor.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/pretrained_model/policy_postprocessor.json new file mode 100644 index 0000000000000000000000000000000000000000..f2c5e6cea7850bb999ab193f96021fa0129ce4db --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/pretrained_model/policy_postprocessor.json @@ -0,0 +1,32 @@ +{ + "name": "policy_postprocessor", + "steps": [ + { + "registry_name": "unnormalizer_processor", + "config": { + "eps": 1e-08, + "features": { + "action": { + "type": "ACTION", + "shape": [ + 6 + ] + } + }, + "norm_map": { + "VISUAL": "MEAN_STD", + "STATE": "MIN_MAX", + "ACTION": "MIN_MAX" + } + }, + "state_file": "policy_postprocessor_step_0_unnormalizer_processor.safetensors" + }, + { + "registry_name": "device_processor", + "config": { + "device": "cpu", + "float_dtype": null + } + } + ] +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/pretrained_model/policy_postprocessor_step_0_unnormalizer_processor.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/pretrained_model/policy_postprocessor_step_0_unnormalizer_processor.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b5a2a63fb8806fa7c342c79e166f0a8b0e6a46d6 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/pretrained_model/policy_postprocessor_step_0_unnormalizer_processor.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:246776baee98e80415490a71d2dcc585a887291ef94b140cf637dcff081d3a18 +size 6560 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/pretrained_model/policy_preprocessor.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/pretrained_model/policy_preprocessor.json new file mode 100644 index 0000000000000000000000000000000000000000..a6f57e6242af17f882bc107c602ca76393c57d55 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/pretrained_model/policy_preprocessor.json @@ -0,0 +1,56 @@ +{ + "name": "policy_preprocessor", + "steps": [ + { + "registry_name": "rename_observations_processor", + "config": { + "rename_map": {} + } + }, + { + "registry_name": "to_batch_processor", + "config": {} + }, + { + "registry_name": "device_processor", + "config": { + "device": "cuda", + "float_dtype": null + } + }, + { + "registry_name": "normalizer_processor", + "config": { + "eps": 1e-08, + "features": { + "observation.state": { + "type": "STATE", + "shape": [ + 6 + ] + }, + "observation.images.front": { + "type": "VISUAL", + "shape": [ + 3, + 480, + 640 + ] + }, + "action": { + "type": "ACTION", + "shape": [ + 6 + ] + } + }, + "norm_map": { + "VISUAL": "MEAN_STD", + "STATE": "MIN_MAX", + "ACTION": "MIN_MAX" + } + }, + "state_file": "policy_preprocessor_step_3_normalizer_processor.safetensors" + } + ] +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/pretrained_model/policy_preprocessor_step_3_normalizer_processor.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/pretrained_model/policy_preprocessor_step_3_normalizer_processor.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b5a2a63fb8806fa7c342c79e166f0a8b0e6a46d6 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/pretrained_model/policy_preprocessor_step_3_normalizer_processor.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:246776baee98e80415490a71d2dcc585a887291ef94b140cf637dcff081d3a18 +size 6560 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/pretrained_model/train_config.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/pretrained_model/train_config.json new file mode 100644 index 0000000000000000000000000000000000000000..638986814c22c471c7596c080c170c7c4c4dd86b --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/pretrained_model/train_config.json @@ -0,0 +1,302 @@ +{ + "dataset": { + "repo_id": "local/act_collected_episodes", + "root": "/home/shadeform/Desktop/robot_learning/base_new_dataset_134", + "episodes": null, + "image_transforms": { + "enable": false, + "max_num_transforms": 3, + "random_order": false, + "same_cloth_color": false, + "tfs": { + "color_jitter": { + "weight": 1.5, + "type": "ColorJitter", + "kwargs": { + "brightness": [ + 0.7, + 1.3 + ], + "contrast": [ + 0.7, + 1.3 + ], + "saturation": [ + 0.4, + 1.6 + ], + "hue": [ + -0.5, + 0.5 + ] + } + }, + "grayscale": { + "weight": 0.5, + "type": "RandomGrayscale", + "kwargs": { + "p": 1.0 + } + }, + "shadow": { + "weight": 0.8, + "type": "RandomShadow", + "kwargs": { + "num_shadows": [ + 1, + 2 + ], + "intensity": [ + 0.4, + 0.7 + ], + "blur_sigma": [ + 4.0, + 20.0 + ] + } + }, + "highlight": { + "weight": 0.5, + "type": "RandomHighlight", + "kwargs": { + "num_highlights": [ + 0, + 1 + ], + "intensity": [ + 0.2, + 0.5 + ], + "sigma": [ + 20.0, + 60.0 + ] + } + }, + "gamma": { + "weight": 0.7, + "type": "RandomGamma", + "kwargs": { + "gamma": [ + 0.6, + 1.4 + ] + } + }, + "blur": { + "weight": 0.0, + "type": "GaussianBlur", + "kwargs": { + "kernel_size": [ + 3, + 3 + ], + "sigma": [ + 0.1, + 1.5 + ] + } + }, + "jpeg": { + "weight": 0.0, + "type": "RandomJPEG", + "kwargs": { + "quality": [ + 60, + 95 + ] + } + }, + "crop": { + "weight": 0.5, + "type": "RandomCropPreserveSize", + "kwargs": { + "scale": [ + 0.97, + 1.0 + ], + "ratio": [ + 0.99, + 1.01 + ] + } + }, + "affine": { + "weight": 0.0, + "type": "RandomAffine", + "kwargs": { + "degrees": [ + -5.0, + 5.0 + ], + "translate": [ + 0.05, + 0.05 + ] + } + }, + "sharpness": { + "weight": 1.0, + "type": "SharpnessJitter", + "kwargs": { + "sharpness": [ + 0.5, + 1.5 + ] + } + } + } + }, + "revision": null, + "use_imagenet_stats": true, + "video_backend": "pyav", + "return_uint8": false, + "streaming": false + }, + "env": null, + "policy": { + "type": "diffusion", + "n_obs_steps": 2, + "input_features": { + "observation.state": { + "type": "STATE", + "shape": [ + 6 + ] + }, + "observation.images.front": { + "type": "VISUAL", + "shape": [ + 3, + 480, + 640 + ] + } + }, + "output_features": { + "action": { + "type": "ACTION", + "shape": [ + 6 + ] + } + }, + "device": "cuda", + "use_amp": false, + "use_peft": false, + "push_to_hub": false, + "repo_id": null, + "private": null, + "tags": null, + "license": null, + "pretrained_path": "/home/shadeform/Desktop/robot_learning/models/checkpoints/diffusion_580_new_dataset_dino/200000/pretrained_model", + "horizon": 16, + "n_action_steps": 8, + "normalization_mapping": { + "VISUAL": "MEAN_STD", + "STATE": "MIN_MAX", + "ACTION": "MIN_MAX" + }, + "drop_n_last_frames": 7, + "vision_backbone_type": "dinov2", + "vision_encoder_name": "facebook/dinov2-small", + "freeze_vision_encoder": true, + "vision_backbone": "resnet18", + "resize_shape": [ + 224, + 224 + ], + "crop_ratio": 1.0, + "crop_shape": null, + "crop_is_random": true, + "pretrained_backbone_weights": "ResNet18_Weights.IMAGENET1K_V1", + "use_group_norm": false, + "spatial_softmax_num_keypoints": 32, + "vit_pool_type": "spatial_softmax", + "vit_feature_dim": 512, + "use_separate_rgb_encoder_per_camera": true, + "down_dims": [ + 512, + 1024, + 2048 + ], + "kernel_size": 5, + "n_groups": 8, + "diffusion_step_embed_dim": 128, + "use_film_scale_modulation": true, + "noise_scheduler_type": "DDPM", + "num_train_timesteps": 100, + "beta_schedule": "squaredcos_cap_v2", + "beta_start": 0.0001, + "beta_end": 0.02, + "prediction_type": "epsilon", + "clip_sample": true, + "clip_sample_range": 1.0, + "num_inference_steps": 100, + "compile_model": false, + "compile_mode": "reduce-overhead", + "do_mask_loss_for_padding": false, + "optimizer_lr": 1e-05, + "optimizer_betas": [ + 0.95, + 0.999 + ], + "optimizer_eps": 1e-08, + "optimizer_weight_decay": 1e-06, + "scheduler_name": "cosine", + "scheduler_warmup_steps": 100 + }, + "reward_model": null, + "output_dir": "/home/shadeform/Desktop/robot_learning/outputs/train/diffusion_specialized_eval1", + "job_name": "diffusion_specialized_eval1", + "resume": false, + "seed": 1000, + "cudnn_deterministic": false, + "num_workers": 4, + "batch_size": 32, + "prefetch_factor": 4, + "persistent_workers": true, + "steps": 30000, + "eval_freq": 0, + "log_freq": 20, + "tolerance_s": 0.0001, + "save_checkpoint": true, + "save_freq": 5000, + "use_policy_training_preset": true, + "optimizer": { + "type": "adam", + "lr": 1e-05, + "weight_decay": 1e-06, + "grad_clip_norm": 10.0, + "betas": [ + 0.95, + 0.999 + ], + "eps": 1e-08 + }, + "scheduler": { + "type": "diffuser", + "num_warmup_steps": 100, + "name": "cosine" + }, + "eval": { + "n_episodes": 50, + "batch_size": 11, + "use_async_envs": true + }, + "wandb": { + "enable": true, + "disable_artifact": false, + "project": "lerobot", + "entity": null, + "notes": null, + "run_id": "d8akc176", + "mode": null, + "add_tags": true + }, + "peft": null, + "sample_weighting": null, + "rename_map": {}, + "checkpoint_path": null +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/training_state/optimizer_param_groups.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/training_state/optimizer_param_groups.json new file mode 100644 index 0000000000000000000000000000000000000000..8535188e4fb7d118385a76f7381c5904cde9dfa2 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/training_state/optimizer_param_groups.json @@ -0,0 +1,396 @@ +[ + { + "lr": 2.515180848423853e-06, + "betas": [ + 0.95, + 0.999 + ], + "eps": 1e-08, + "weight_decay": 1e-06, + "amsgrad": false, + "maximize": false, + "foreach": null, + "capturable": false, + "differentiable": false, + "fused": null, + "decoupled_weight_decay": false, + "initial_lr": 1e-05, + "params": [ + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7, + 8, + 9, + 10, + 11, + 12, + 13, + 14, + 15, + 16, + 17, + 18, + 19, + 20, + 21, + 22, + 23, + 24, + 25, + 26, + 27, + 28, + 29, + 30, + 31, + 32, + 33, + 34, + 35, + 36, + 37, + 38, + 39, + 40, + 41, + 42, + 43, + 44, + 45, + 46, + 47, + 48, + 49, + 50, + 51, + 52, + 53, + 54, + 55, + 56, + 57, + 58, + 59, + 60, + 61, + 62, + 63, + 64, + 65, + 66, + 67, + 68, + 69, + 70, + 71, + 72, + 73, + 74, + 75, + 76, + 77, + 78, + 79, + 80, + 81, + 82, + 83, + 84, + 85, + 86, + 87, + 88, + 89, + 90, + 91, + 92, + 93, + 94, + 95, + 96, + 97, + 98, + 99, + 100, + 101, + 102, + 103, + 104, + 105, + 106, + 107, + 108, + 109, + 110, + 111, + 112, + 113, + 114, + 115, + 116, + 117, + 118, + 119, + 120, + 121, + 122, + 123, + 124, + 125, + 126, + 127, + 128, + 129, + 130, + 131, + 132, + 133, + 134, + 135, + 136, + 137, + 138, + 139, + 140, + 141, + 142, + 143, + 144, + 145, + 146, + 147, + 148, + 149, + 150, + 151, + 152, + 153, + 154, + 155, + 156, + 157, + 158, + 159, + 160, + 161, + 162, + 163, + 164, + 165, + 166, + 167, + 168, + 169, + 170, + 171, + 172, + 173, + 174, + 175, + 176, + 177, + 178, + 179, + 180, + 181, + 182, + 183, + 184, + 185, + 186, + 187, + 188, + 189, + 190, + 191, + 192, + 193, + 194, + 195, + 196, + 197, + 198, + 199, + 200, + 201, + 202, + 203, + 204, + 205, + 206, + 207, + 208, + 209, + 210, + 211, + 212, + 213, + 214, + 215, + 216, + 217, + 218, + 219, + 220, + 221, + 222, + 223, + 224, + 225, + 226, + 227, + 228, + 229, + 230, + 231, + 232, + 233, + 234, + 235, + 236, + 237, + 238, + 239, + 240, + 241, + 242, + 243, + 244, + 245, + 246, + 247, + 248, + 249, + 250, + 251, + 252, + 253, + 254, + 255, + 256, + 257, + 258, + 259, + 260, + 261, + 262, + 263, + 264, + 265, + 266, + 267, + 268, + 269, + 270, + 271, + 272, + 273, + 274, + 275, + 276, + 277, + 278, + 279, + 280, + 281, + 282, + 283, + 284, + 285, + 286, + 287, + 288, + 289, + 290, + 291, + 292, + 293, + 294, + 295, + 296, + 297, + 298, + 299, + 300, + 301, + 302, + 303, + 304, + 305, + 306, + 307, + 308, + 309, + 310, + 311, + 312, + 313, + 314, + 315, + 316, + 317, + 318, + 319, + 320, + 321, + 322, + 323, + 324, + 325, + 326, + 327, + 328, + 329, + 330, + 331, + 332, + 333, + 334, + 335, + 336, + 337, + 338, + 339, + 340, + 341, + 342, + 343, + 344, + 345, + 346, + 347, + 348, + 349, + 350, + 351, + 352, + 353, + 354, + 355, + 356, + 357, + 358, + 359, + 360, + 361, + 362, + 363, + 364, + 365, + 366, + 367, + 368, + 369, + 370, + 371, + 372, + 373, + 374 + ] + } +] \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/training_state/optimizer_state.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/training_state/optimizer_state.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..ee2b4bab6dd01a58b6d6208f4187653d4a12802a --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/training_state/optimizer_state.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd8aac0abdb0f998c9defd8d720a68ea3f9a5fa5556a11b97b93f5432c1e16f9 +size 2014217744 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/training_state/rng_state.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/training_state/rng_state.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..0dc0f9a46386016c4683eb6f615bb5b989bda6ff --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/training_state/rng_state.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:068d6b2a7d85978142d462a3aa49650a414fb0605771f5df124520c79460f22d +size 15708 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/training_state/scheduler_state.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/training_state/scheduler_state.json new file mode 100644 index 0000000000000000000000000000000000000000..142102f3c4aaa13622efce2e6c698fad6dd9b6cd --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/training_state/scheduler_state.json @@ -0,0 +1,15 @@ +{ + "base_lrs": [ + 1e-05 + ], + "last_epoch": 20000, + "_step_count": 20001, + "_is_initial": false, + "_get_lr_called_within_step": false, + "_last_lr": [ + 2.515180848423853e-06 + ], + "lr_lambdas": [ + null + ] +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/training_state/training_step.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/training_state/training_step.json new file mode 100644 index 0000000000000000000000000000000000000000..dc9bb47026c5d5237ca6fc5dbff6020dd122ea05 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/020000/training_state/training_step.json @@ -0,0 +1,3 @@ +{ + "step": 20000 +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/pretrained_model/config.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/pretrained_model/config.json new file mode 100644 index 0000000000000000000000000000000000000000..eb6d9e0e843e5fa2dbe7d14fccf5efa4dee2ddb9 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/pretrained_model/config.json @@ -0,0 +1,92 @@ +{ + "type": "diffusion", + "n_obs_steps": 2, + "input_features": { + "observation.state": { + "type": "STATE", + "shape": [ + 6 + ] + }, + "observation.images.front": { + "type": "VISUAL", + "shape": [ + 3, + 480, + 640 + ] + } + }, + "output_features": { + "action": { + "type": "ACTION", + "shape": [ + 6 + ] + } + }, + "device": "cuda", + "use_amp": false, + "use_peft": false, + "push_to_hub": false, + "repo_id": null, + "private": null, + "tags": null, + "license": null, + "pretrained_path": "/home/shadeform/Desktop/robot_learning/models/checkpoints/diffusion_580_new_dataset_dino/200000/pretrained_model", + "horizon": 16, + "n_action_steps": 8, + "normalization_mapping": { + "VISUAL": "MEAN_STD", + "STATE": "MIN_MAX", + "ACTION": "MIN_MAX" + }, + "drop_n_last_frames": 7, + "vision_backbone_type": "dinov2", + "vision_encoder_name": "facebook/dinov2-small", + "freeze_vision_encoder": true, + "vision_backbone": "resnet18", + "resize_shape": [ + 224, + 224 + ], + "crop_ratio": 1.0, + "crop_shape": null, + "crop_is_random": true, + "pretrained_backbone_weights": "ResNet18_Weights.IMAGENET1K_V1", + "use_group_norm": false, + "spatial_softmax_num_keypoints": 32, + "vit_pool_type": "spatial_softmax", + "vit_feature_dim": 512, + "use_separate_rgb_encoder_per_camera": true, + "down_dims": [ + 512, + 1024, + 2048 + ], + "kernel_size": 5, + "n_groups": 8, + "diffusion_step_embed_dim": 128, + "use_film_scale_modulation": true, + "noise_scheduler_type": "DDPM", + "num_train_timesteps": 100, + "beta_schedule": "squaredcos_cap_v2", + "beta_start": 0.0001, + "beta_end": 0.02, + "prediction_type": "epsilon", + "clip_sample": true, + "clip_sample_range": 1.0, + "num_inference_steps": 100, + "compile_model": false, + "compile_mode": "reduce-overhead", + "do_mask_loss_for_padding": false, + "optimizer_lr": 1e-05, + "optimizer_betas": [ + 0.95, + 0.999 + ], + "optimizer_eps": 1e-08, + "optimizer_weight_decay": 1e-06, + "scheduler_name": "cosine", + "scheduler_warmup_steps": 100 +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/pretrained_model/model.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/pretrained_model/model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e912b79ab4e47e264db6037f7de6170436e7eb90 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/pretrained_model/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1463dc3b873fbc72759f493db28f82b3a747b84d44c56dda8c25f1e05f6ba745 +size 1095367712 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/pretrained_model/policy_postprocessor.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/pretrained_model/policy_postprocessor.json new file mode 100644 index 0000000000000000000000000000000000000000..f2c5e6cea7850bb999ab193f96021fa0129ce4db --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/pretrained_model/policy_postprocessor.json @@ -0,0 +1,32 @@ +{ + "name": "policy_postprocessor", + "steps": [ + { + "registry_name": "unnormalizer_processor", + "config": { + "eps": 1e-08, + "features": { + "action": { + "type": "ACTION", + "shape": [ + 6 + ] + } + }, + "norm_map": { + "VISUAL": "MEAN_STD", + "STATE": "MIN_MAX", + "ACTION": "MIN_MAX" + } + }, + "state_file": "policy_postprocessor_step_0_unnormalizer_processor.safetensors" + }, + { + "registry_name": "device_processor", + "config": { + "device": "cpu", + "float_dtype": null + } + } + ] +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/pretrained_model/policy_postprocessor_step_0_unnormalizer_processor.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/pretrained_model/policy_postprocessor_step_0_unnormalizer_processor.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b5a2a63fb8806fa7c342c79e166f0a8b0e6a46d6 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/pretrained_model/policy_postprocessor_step_0_unnormalizer_processor.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:246776baee98e80415490a71d2dcc585a887291ef94b140cf637dcff081d3a18 +size 6560 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/pretrained_model/policy_preprocessor.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/pretrained_model/policy_preprocessor.json new file mode 100644 index 0000000000000000000000000000000000000000..a6f57e6242af17f882bc107c602ca76393c57d55 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/pretrained_model/policy_preprocessor.json @@ -0,0 +1,56 @@ +{ + "name": "policy_preprocessor", + "steps": [ + { + "registry_name": "rename_observations_processor", + "config": { + "rename_map": {} + } + }, + { + "registry_name": "to_batch_processor", + "config": {} + }, + { + "registry_name": "device_processor", + "config": { + "device": "cuda", + "float_dtype": null + } + }, + { + "registry_name": "normalizer_processor", + "config": { + "eps": 1e-08, + "features": { + "observation.state": { + "type": "STATE", + "shape": [ + 6 + ] + }, + "observation.images.front": { + "type": "VISUAL", + "shape": [ + 3, + 480, + 640 + ] + }, + "action": { + "type": "ACTION", + "shape": [ + 6 + ] + } + }, + "norm_map": { + "VISUAL": "MEAN_STD", + "STATE": "MIN_MAX", + "ACTION": "MIN_MAX" + } + }, + "state_file": "policy_preprocessor_step_3_normalizer_processor.safetensors" + } + ] +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/pretrained_model/policy_preprocessor_step_3_normalizer_processor.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/pretrained_model/policy_preprocessor_step_3_normalizer_processor.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b5a2a63fb8806fa7c342c79e166f0a8b0e6a46d6 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/pretrained_model/policy_preprocessor_step_3_normalizer_processor.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:246776baee98e80415490a71d2dcc585a887291ef94b140cf637dcff081d3a18 +size 6560 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/pretrained_model/train_config.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/pretrained_model/train_config.json new file mode 100644 index 0000000000000000000000000000000000000000..638986814c22c471c7596c080c170c7c4c4dd86b --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/pretrained_model/train_config.json @@ -0,0 +1,302 @@ +{ + "dataset": { + "repo_id": "local/act_collected_episodes", + "root": "/home/shadeform/Desktop/robot_learning/base_new_dataset_134", + "episodes": null, + "image_transforms": { + "enable": false, + "max_num_transforms": 3, + "random_order": false, + "same_cloth_color": false, + "tfs": { + "color_jitter": { + "weight": 1.5, + "type": "ColorJitter", + "kwargs": { + "brightness": [ + 0.7, + 1.3 + ], + "contrast": [ + 0.7, + 1.3 + ], + "saturation": [ + 0.4, + 1.6 + ], + "hue": [ + -0.5, + 0.5 + ] + } + }, + "grayscale": { + "weight": 0.5, + "type": "RandomGrayscale", + "kwargs": { + "p": 1.0 + } + }, + "shadow": { + "weight": 0.8, + "type": "RandomShadow", + "kwargs": { + "num_shadows": [ + 1, + 2 + ], + "intensity": [ + 0.4, + 0.7 + ], + "blur_sigma": [ + 4.0, + 20.0 + ] + } + }, + "highlight": { + "weight": 0.5, + "type": "RandomHighlight", + "kwargs": { + "num_highlights": [ + 0, + 1 + ], + "intensity": [ + 0.2, + 0.5 + ], + "sigma": [ + 20.0, + 60.0 + ] + } + }, + "gamma": { + "weight": 0.7, + "type": "RandomGamma", + "kwargs": { + "gamma": [ + 0.6, + 1.4 + ] + } + }, + "blur": { + "weight": 0.0, + "type": "GaussianBlur", + "kwargs": { + "kernel_size": [ + 3, + 3 + ], + "sigma": [ + 0.1, + 1.5 + ] + } + }, + "jpeg": { + "weight": 0.0, + "type": "RandomJPEG", + "kwargs": { + "quality": [ + 60, + 95 + ] + } + }, + "crop": { + "weight": 0.5, + "type": "RandomCropPreserveSize", + "kwargs": { + "scale": [ + 0.97, + 1.0 + ], + "ratio": [ + 0.99, + 1.01 + ] + } + }, + "affine": { + "weight": 0.0, + "type": "RandomAffine", + "kwargs": { + "degrees": [ + -5.0, + 5.0 + ], + "translate": [ + 0.05, + 0.05 + ] + } + }, + "sharpness": { + "weight": 1.0, + "type": "SharpnessJitter", + "kwargs": { + "sharpness": [ + 0.5, + 1.5 + ] + } + } + } + }, + "revision": null, + "use_imagenet_stats": true, + "video_backend": "pyav", + "return_uint8": false, + "streaming": false + }, + "env": null, + "policy": { + "type": "diffusion", + "n_obs_steps": 2, + "input_features": { + "observation.state": { + "type": "STATE", + "shape": [ + 6 + ] + }, + "observation.images.front": { + "type": "VISUAL", + "shape": [ + 3, + 480, + 640 + ] + } + }, + "output_features": { + "action": { + "type": "ACTION", + "shape": [ + 6 + ] + } + }, + "device": "cuda", + "use_amp": false, + "use_peft": false, + "push_to_hub": false, + "repo_id": null, + "private": null, + "tags": null, + "license": null, + "pretrained_path": "/home/shadeform/Desktop/robot_learning/models/checkpoints/diffusion_580_new_dataset_dino/200000/pretrained_model", + "horizon": 16, + "n_action_steps": 8, + "normalization_mapping": { + "VISUAL": "MEAN_STD", + "STATE": "MIN_MAX", + "ACTION": "MIN_MAX" + }, + "drop_n_last_frames": 7, + "vision_backbone_type": "dinov2", + "vision_encoder_name": "facebook/dinov2-small", + "freeze_vision_encoder": true, + "vision_backbone": "resnet18", + "resize_shape": [ + 224, + 224 + ], + "crop_ratio": 1.0, + "crop_shape": null, + "crop_is_random": true, + "pretrained_backbone_weights": "ResNet18_Weights.IMAGENET1K_V1", + "use_group_norm": false, + "spatial_softmax_num_keypoints": 32, + "vit_pool_type": "spatial_softmax", + "vit_feature_dim": 512, + "use_separate_rgb_encoder_per_camera": true, + "down_dims": [ + 512, + 1024, + 2048 + ], + "kernel_size": 5, + "n_groups": 8, + "diffusion_step_embed_dim": 128, + "use_film_scale_modulation": true, + "noise_scheduler_type": "DDPM", + "num_train_timesteps": 100, + "beta_schedule": "squaredcos_cap_v2", + "beta_start": 0.0001, + "beta_end": 0.02, + "prediction_type": "epsilon", + "clip_sample": true, + "clip_sample_range": 1.0, + "num_inference_steps": 100, + "compile_model": false, + "compile_mode": "reduce-overhead", + "do_mask_loss_for_padding": false, + "optimizer_lr": 1e-05, + "optimizer_betas": [ + 0.95, + 0.999 + ], + "optimizer_eps": 1e-08, + "optimizer_weight_decay": 1e-06, + "scheduler_name": "cosine", + "scheduler_warmup_steps": 100 + }, + "reward_model": null, + "output_dir": "/home/shadeform/Desktop/robot_learning/outputs/train/diffusion_specialized_eval1", + "job_name": "diffusion_specialized_eval1", + "resume": false, + "seed": 1000, + "cudnn_deterministic": false, + "num_workers": 4, + "batch_size": 32, + "prefetch_factor": 4, + "persistent_workers": true, + "steps": 30000, + "eval_freq": 0, + "log_freq": 20, + "tolerance_s": 0.0001, + "save_checkpoint": true, + "save_freq": 5000, + "use_policy_training_preset": true, + "optimizer": { + "type": "adam", + "lr": 1e-05, + "weight_decay": 1e-06, + "grad_clip_norm": 10.0, + "betas": [ + 0.95, + 0.999 + ], + "eps": 1e-08 + }, + "scheduler": { + "type": "diffuser", + "num_warmup_steps": 100, + "name": "cosine" + }, + "eval": { + "n_episodes": 50, + "batch_size": 11, + "use_async_envs": true + }, + "wandb": { + "enable": true, + "disable_artifact": false, + "project": "lerobot", + "entity": null, + "notes": null, + "run_id": "d8akc176", + "mode": null, + "add_tags": true + }, + "peft": null, + "sample_weighting": null, + "rename_map": {}, + "checkpoint_path": null +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/training_state/optimizer_param_groups.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/training_state/optimizer_param_groups.json new file mode 100644 index 0000000000000000000000000000000000000000..0a87b5b84611df8f5f1c5a3bd9f24dbc5e584ffd --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/training_state/optimizer_param_groups.json @@ -0,0 +1,396 @@ +[ + { + "lr": 6.742575343716584e-07, + "betas": [ + 0.95, + 0.999 + ], + "eps": 1e-08, + "weight_decay": 1e-06, + "amsgrad": false, + "maximize": false, + "foreach": null, + "capturable": false, + "differentiable": false, + "fused": null, + "decoupled_weight_decay": false, + "initial_lr": 1e-05, + "params": [ + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7, + 8, + 9, + 10, + 11, + 12, + 13, + 14, + 15, + 16, + 17, + 18, + 19, + 20, + 21, + 22, + 23, + 24, + 25, + 26, + 27, + 28, + 29, + 30, + 31, + 32, + 33, + 34, + 35, + 36, + 37, + 38, + 39, + 40, + 41, + 42, + 43, + 44, + 45, + 46, + 47, + 48, + 49, + 50, + 51, + 52, + 53, + 54, + 55, + 56, + 57, + 58, + 59, + 60, + 61, + 62, + 63, + 64, + 65, + 66, + 67, + 68, + 69, + 70, + 71, + 72, + 73, + 74, + 75, + 76, + 77, + 78, + 79, + 80, + 81, + 82, + 83, + 84, + 85, + 86, + 87, + 88, + 89, + 90, + 91, + 92, + 93, + 94, + 95, + 96, + 97, + 98, + 99, + 100, + 101, + 102, + 103, + 104, + 105, + 106, + 107, + 108, + 109, + 110, + 111, + 112, + 113, + 114, + 115, + 116, + 117, + 118, + 119, + 120, + 121, + 122, + 123, + 124, + 125, + 126, + 127, + 128, + 129, + 130, + 131, + 132, + 133, + 134, + 135, + 136, + 137, + 138, + 139, + 140, + 141, + 142, + 143, + 144, + 145, + 146, + 147, + 148, + 149, + 150, + 151, + 152, + 153, + 154, + 155, + 156, + 157, + 158, + 159, + 160, + 161, + 162, + 163, + 164, + 165, + 166, + 167, + 168, + 169, + 170, + 171, + 172, + 173, + 174, + 175, + 176, + 177, + 178, + 179, + 180, + 181, + 182, + 183, + 184, + 185, + 186, + 187, + 188, + 189, + 190, + 191, + 192, + 193, + 194, + 195, + 196, + 197, + 198, + 199, + 200, + 201, + 202, + 203, + 204, + 205, + 206, + 207, + 208, + 209, + 210, + 211, + 212, + 213, + 214, + 215, + 216, + 217, + 218, + 219, + 220, + 221, + 222, + 223, + 224, + 225, + 226, + 227, + 228, + 229, + 230, + 231, + 232, + 233, + 234, + 235, + 236, + 237, + 238, + 239, + 240, + 241, + 242, + 243, + 244, + 245, + 246, + 247, + 248, + 249, + 250, + 251, + 252, + 253, + 254, + 255, + 256, + 257, + 258, + 259, + 260, + 261, + 262, + 263, + 264, + 265, + 266, + 267, + 268, + 269, + 270, + 271, + 272, + 273, + 274, + 275, + 276, + 277, + 278, + 279, + 280, + 281, + 282, + 283, + 284, + 285, + 286, + 287, + 288, + 289, + 290, + 291, + 292, + 293, + 294, + 295, + 296, + 297, + 298, + 299, + 300, + 301, + 302, + 303, + 304, + 305, + 306, + 307, + 308, + 309, + 310, + 311, + 312, + 313, + 314, + 315, + 316, + 317, + 318, + 319, + 320, + 321, + 322, + 323, + 324, + 325, + 326, + 327, + 328, + 329, + 330, + 331, + 332, + 333, + 334, + 335, + 336, + 337, + 338, + 339, + 340, + 341, + 342, + 343, + 344, + 345, + 346, + 347, + 348, + 349, + 350, + 351, + 352, + 353, + 354, + 355, + 356, + 357, + 358, + 359, + 360, + 361, + 362, + 363, + 364, + 365, + 366, + 367, + 368, + 369, + 370, + 371, + 372, + 373, + 374 + ] + } +] \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/training_state/optimizer_state.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/training_state/optimizer_state.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..bbfc65d9f789e6cb79c3bb491172b703d37d0ac4 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/training_state/optimizer_state.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3fbf0f83c05dd68d42a29bf54641aae6dcc6f6fb68e1b1c8d73a765985faa4c +size 2014217744 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/training_state/rng_state.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/training_state/rng_state.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..e1509346819f9180f589845d72fbad3f2b0e19a1 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/training_state/rng_state.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e250b105e6074f8715f61aa8a879c696197113cc35957e4c87f8e23caaa65407 +size 15708 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/training_state/scheduler_state.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/training_state/scheduler_state.json new file mode 100644 index 0000000000000000000000000000000000000000..71f061e81afa37529460e137c2d2b853455c9ffb --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/training_state/scheduler_state.json @@ -0,0 +1,15 @@ +{ + "base_lrs": [ + 1e-05 + ], + "last_epoch": 25000, + "_step_count": 25001, + "_is_initial": false, + "_get_lr_called_within_step": false, + "_last_lr": [ + 6.742575343716584e-07 + ], + "lr_lambdas": [ + null + ] +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/training_state/training_step.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/training_state/training_step.json new file mode 100644 index 0000000000000000000000000000000000000000..ac6903ae05e7bbaec1e2da710fdbe91d8dc3f37d --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/025000/training_state/training_step.json @@ -0,0 +1,3 @@ +{ + "step": 25000 +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/pretrained_model/config.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/pretrained_model/config.json new file mode 100644 index 0000000000000000000000000000000000000000..eb6d9e0e843e5fa2dbe7d14fccf5efa4dee2ddb9 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/pretrained_model/config.json @@ -0,0 +1,92 @@ +{ + "type": "diffusion", + "n_obs_steps": 2, + "input_features": { + "observation.state": { + "type": "STATE", + "shape": [ + 6 + ] + }, + "observation.images.front": { + "type": "VISUAL", + "shape": [ + 3, + 480, + 640 + ] + } + }, + "output_features": { + "action": { + "type": "ACTION", + "shape": [ + 6 + ] + } + }, + "device": "cuda", + "use_amp": false, + "use_peft": false, + "push_to_hub": false, + "repo_id": null, + "private": null, + "tags": null, + "license": null, + "pretrained_path": "/home/shadeform/Desktop/robot_learning/models/checkpoints/diffusion_580_new_dataset_dino/200000/pretrained_model", + "horizon": 16, + "n_action_steps": 8, + "normalization_mapping": { + "VISUAL": "MEAN_STD", + "STATE": "MIN_MAX", + "ACTION": "MIN_MAX" + }, + "drop_n_last_frames": 7, + "vision_backbone_type": "dinov2", + "vision_encoder_name": "facebook/dinov2-small", + "freeze_vision_encoder": true, + "vision_backbone": "resnet18", + "resize_shape": [ + 224, + 224 + ], + "crop_ratio": 1.0, + "crop_shape": null, + "crop_is_random": true, + "pretrained_backbone_weights": "ResNet18_Weights.IMAGENET1K_V1", + "use_group_norm": false, + "spatial_softmax_num_keypoints": 32, + "vit_pool_type": "spatial_softmax", + "vit_feature_dim": 512, + "use_separate_rgb_encoder_per_camera": true, + "down_dims": [ + 512, + 1024, + 2048 + ], + "kernel_size": 5, + "n_groups": 8, + "diffusion_step_embed_dim": 128, + "use_film_scale_modulation": true, + "noise_scheduler_type": "DDPM", + "num_train_timesteps": 100, + "beta_schedule": "squaredcos_cap_v2", + "beta_start": 0.0001, + "beta_end": 0.02, + "prediction_type": "epsilon", + "clip_sample": true, + "clip_sample_range": 1.0, + "num_inference_steps": 100, + "compile_model": false, + "compile_mode": "reduce-overhead", + "do_mask_loss_for_padding": false, + "optimizer_lr": 1e-05, + "optimizer_betas": [ + 0.95, + 0.999 + ], + "optimizer_eps": 1e-08, + "optimizer_weight_decay": 1e-06, + "scheduler_name": "cosine", + "scheduler_warmup_steps": 100 +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/pretrained_model/model.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/pretrained_model/model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..72492f95e678c47afbc92295a677295480e27407 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/pretrained_model/model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78b61e1927f9c65bcfc925177164db3f3b68feaa3cbd76e77ea18612bb6d97b9 +size 1095367712 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/pretrained_model/policy_postprocessor.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/pretrained_model/policy_postprocessor.json new file mode 100644 index 0000000000000000000000000000000000000000..f2c5e6cea7850bb999ab193f96021fa0129ce4db --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/pretrained_model/policy_postprocessor.json @@ -0,0 +1,32 @@ +{ + "name": "policy_postprocessor", + "steps": [ + { + "registry_name": "unnormalizer_processor", + "config": { + "eps": 1e-08, + "features": { + "action": { + "type": "ACTION", + "shape": [ + 6 + ] + } + }, + "norm_map": { + "VISUAL": "MEAN_STD", + "STATE": "MIN_MAX", + "ACTION": "MIN_MAX" + } + }, + "state_file": "policy_postprocessor_step_0_unnormalizer_processor.safetensors" + }, + { + "registry_name": "device_processor", + "config": { + "device": "cpu", + "float_dtype": null + } + } + ] +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/pretrained_model/policy_postprocessor_step_0_unnormalizer_processor.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/pretrained_model/policy_postprocessor_step_0_unnormalizer_processor.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b5a2a63fb8806fa7c342c79e166f0a8b0e6a46d6 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/pretrained_model/policy_postprocessor_step_0_unnormalizer_processor.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:246776baee98e80415490a71d2dcc585a887291ef94b140cf637dcff081d3a18 +size 6560 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/pretrained_model/policy_preprocessor.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/pretrained_model/policy_preprocessor.json new file mode 100644 index 0000000000000000000000000000000000000000..a6f57e6242af17f882bc107c602ca76393c57d55 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/pretrained_model/policy_preprocessor.json @@ -0,0 +1,56 @@ +{ + "name": "policy_preprocessor", + "steps": [ + { + "registry_name": "rename_observations_processor", + "config": { + "rename_map": {} + } + }, + { + "registry_name": "to_batch_processor", + "config": {} + }, + { + "registry_name": "device_processor", + "config": { + "device": "cuda", + "float_dtype": null + } + }, + { + "registry_name": "normalizer_processor", + "config": { + "eps": 1e-08, + "features": { + "observation.state": { + "type": "STATE", + "shape": [ + 6 + ] + }, + "observation.images.front": { + "type": "VISUAL", + "shape": [ + 3, + 480, + 640 + ] + }, + "action": { + "type": "ACTION", + "shape": [ + 6 + ] + } + }, + "norm_map": { + "VISUAL": "MEAN_STD", + "STATE": "MIN_MAX", + "ACTION": "MIN_MAX" + } + }, + "state_file": "policy_preprocessor_step_3_normalizer_processor.safetensors" + } + ] +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/pretrained_model/policy_preprocessor_step_3_normalizer_processor.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/pretrained_model/policy_preprocessor_step_3_normalizer_processor.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..b5a2a63fb8806fa7c342c79e166f0a8b0e6a46d6 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/pretrained_model/policy_preprocessor_step_3_normalizer_processor.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:246776baee98e80415490a71d2dcc585a887291ef94b140cf637dcff081d3a18 +size 6560 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/pretrained_model/train_config.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/pretrained_model/train_config.json new file mode 100644 index 0000000000000000000000000000000000000000..638986814c22c471c7596c080c170c7c4c4dd86b --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/pretrained_model/train_config.json @@ -0,0 +1,302 @@ +{ + "dataset": { + "repo_id": "local/act_collected_episodes", + "root": "/home/shadeform/Desktop/robot_learning/base_new_dataset_134", + "episodes": null, + "image_transforms": { + "enable": false, + "max_num_transforms": 3, + "random_order": false, + "same_cloth_color": false, + "tfs": { + "color_jitter": { + "weight": 1.5, + "type": "ColorJitter", + "kwargs": { + "brightness": [ + 0.7, + 1.3 + ], + "contrast": [ + 0.7, + 1.3 + ], + "saturation": [ + 0.4, + 1.6 + ], + "hue": [ + -0.5, + 0.5 + ] + } + }, + "grayscale": { + "weight": 0.5, + "type": "RandomGrayscale", + "kwargs": { + "p": 1.0 + } + }, + "shadow": { + "weight": 0.8, + "type": "RandomShadow", + "kwargs": { + "num_shadows": [ + 1, + 2 + ], + "intensity": [ + 0.4, + 0.7 + ], + "blur_sigma": [ + 4.0, + 20.0 + ] + } + }, + "highlight": { + "weight": 0.5, + "type": "RandomHighlight", + "kwargs": { + "num_highlights": [ + 0, + 1 + ], + "intensity": [ + 0.2, + 0.5 + ], + "sigma": [ + 20.0, + 60.0 + ] + } + }, + "gamma": { + "weight": 0.7, + "type": "RandomGamma", + "kwargs": { + "gamma": [ + 0.6, + 1.4 + ] + } + }, + "blur": { + "weight": 0.0, + "type": "GaussianBlur", + "kwargs": { + "kernel_size": [ + 3, + 3 + ], + "sigma": [ + 0.1, + 1.5 + ] + } + }, + "jpeg": { + "weight": 0.0, + "type": "RandomJPEG", + "kwargs": { + "quality": [ + 60, + 95 + ] + } + }, + "crop": { + "weight": 0.5, + "type": "RandomCropPreserveSize", + "kwargs": { + "scale": [ + 0.97, + 1.0 + ], + "ratio": [ + 0.99, + 1.01 + ] + } + }, + "affine": { + "weight": 0.0, + "type": "RandomAffine", + "kwargs": { + "degrees": [ + -5.0, + 5.0 + ], + "translate": [ + 0.05, + 0.05 + ] + } + }, + "sharpness": { + "weight": 1.0, + "type": "SharpnessJitter", + "kwargs": { + "sharpness": [ + 0.5, + 1.5 + ] + } + } + } + }, + "revision": null, + "use_imagenet_stats": true, + "video_backend": "pyav", + "return_uint8": false, + "streaming": false + }, + "env": null, + "policy": { + "type": "diffusion", + "n_obs_steps": 2, + "input_features": { + "observation.state": { + "type": "STATE", + "shape": [ + 6 + ] + }, + "observation.images.front": { + "type": "VISUAL", + "shape": [ + 3, + 480, + 640 + ] + } + }, + "output_features": { + "action": { + "type": "ACTION", + "shape": [ + 6 + ] + } + }, + "device": "cuda", + "use_amp": false, + "use_peft": false, + "push_to_hub": false, + "repo_id": null, + "private": null, + "tags": null, + "license": null, + "pretrained_path": "/home/shadeform/Desktop/robot_learning/models/checkpoints/diffusion_580_new_dataset_dino/200000/pretrained_model", + "horizon": 16, + "n_action_steps": 8, + "normalization_mapping": { + "VISUAL": "MEAN_STD", + "STATE": "MIN_MAX", + "ACTION": "MIN_MAX" + }, + "drop_n_last_frames": 7, + "vision_backbone_type": "dinov2", + "vision_encoder_name": "facebook/dinov2-small", + "freeze_vision_encoder": true, + "vision_backbone": "resnet18", + "resize_shape": [ + 224, + 224 + ], + "crop_ratio": 1.0, + "crop_shape": null, + "crop_is_random": true, + "pretrained_backbone_weights": "ResNet18_Weights.IMAGENET1K_V1", + "use_group_norm": false, + "spatial_softmax_num_keypoints": 32, + "vit_pool_type": "spatial_softmax", + "vit_feature_dim": 512, + "use_separate_rgb_encoder_per_camera": true, + "down_dims": [ + 512, + 1024, + 2048 + ], + "kernel_size": 5, + "n_groups": 8, + "diffusion_step_embed_dim": 128, + "use_film_scale_modulation": true, + "noise_scheduler_type": "DDPM", + "num_train_timesteps": 100, + "beta_schedule": "squaredcos_cap_v2", + "beta_start": 0.0001, + "beta_end": 0.02, + "prediction_type": "epsilon", + "clip_sample": true, + "clip_sample_range": 1.0, + "num_inference_steps": 100, + "compile_model": false, + "compile_mode": "reduce-overhead", + "do_mask_loss_for_padding": false, + "optimizer_lr": 1e-05, + "optimizer_betas": [ + 0.95, + 0.999 + ], + "optimizer_eps": 1e-08, + "optimizer_weight_decay": 1e-06, + "scheduler_name": "cosine", + "scheduler_warmup_steps": 100 + }, + "reward_model": null, + "output_dir": "/home/shadeform/Desktop/robot_learning/outputs/train/diffusion_specialized_eval1", + "job_name": "diffusion_specialized_eval1", + "resume": false, + "seed": 1000, + "cudnn_deterministic": false, + "num_workers": 4, + "batch_size": 32, + "prefetch_factor": 4, + "persistent_workers": true, + "steps": 30000, + "eval_freq": 0, + "log_freq": 20, + "tolerance_s": 0.0001, + "save_checkpoint": true, + "save_freq": 5000, + "use_policy_training_preset": true, + "optimizer": { + "type": "adam", + "lr": 1e-05, + "weight_decay": 1e-06, + "grad_clip_norm": 10.0, + "betas": [ + 0.95, + 0.999 + ], + "eps": 1e-08 + }, + "scheduler": { + "type": "diffuser", + "num_warmup_steps": 100, + "name": "cosine" + }, + "eval": { + "n_episodes": 50, + "batch_size": 11, + "use_async_envs": true + }, + "wandb": { + "enable": true, + "disable_artifact": false, + "project": "lerobot", + "entity": null, + "notes": null, + "run_id": "d8akc176", + "mode": null, + "add_tags": true + }, + "peft": null, + "sample_weighting": null, + "rename_map": {}, + "checkpoint_path": null +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/training_state/optimizer_param_groups.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/training_state/optimizer_param_groups.json new file mode 100644 index 0000000000000000000000000000000000000000..341d6d699647d763bd830f2010ef65bb0ced2d98 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/training_state/optimizer_param_groups.json @@ -0,0 +1,396 @@ +[ + { + "lr": 0.0, + "betas": [ + 0.95, + 0.999 + ], + "eps": 1e-08, + "weight_decay": 1e-06, + "amsgrad": false, + "maximize": false, + "foreach": null, + "capturable": false, + "differentiable": false, + "fused": null, + "decoupled_weight_decay": false, + "initial_lr": 1e-05, + "params": [ + 0, + 1, + 2, + 3, + 4, + 5, + 6, + 7, + 8, + 9, + 10, + 11, + 12, + 13, + 14, + 15, + 16, + 17, + 18, + 19, + 20, + 21, + 22, + 23, + 24, + 25, + 26, + 27, + 28, + 29, + 30, + 31, + 32, + 33, + 34, + 35, + 36, + 37, + 38, + 39, + 40, + 41, + 42, + 43, + 44, + 45, + 46, + 47, + 48, + 49, + 50, + 51, + 52, + 53, + 54, + 55, + 56, + 57, + 58, + 59, + 60, + 61, + 62, + 63, + 64, + 65, + 66, + 67, + 68, + 69, + 70, + 71, + 72, + 73, + 74, + 75, + 76, + 77, + 78, + 79, + 80, + 81, + 82, + 83, + 84, + 85, + 86, + 87, + 88, + 89, + 90, + 91, + 92, + 93, + 94, + 95, + 96, + 97, + 98, + 99, + 100, + 101, + 102, + 103, + 104, + 105, + 106, + 107, + 108, + 109, + 110, + 111, + 112, + 113, + 114, + 115, + 116, + 117, + 118, + 119, + 120, + 121, + 122, + 123, + 124, + 125, + 126, + 127, + 128, + 129, + 130, + 131, + 132, + 133, + 134, + 135, + 136, + 137, + 138, + 139, + 140, + 141, + 142, + 143, + 144, + 145, + 146, + 147, + 148, + 149, + 150, + 151, + 152, + 153, + 154, + 155, + 156, + 157, + 158, + 159, + 160, + 161, + 162, + 163, + 164, + 165, + 166, + 167, + 168, + 169, + 170, + 171, + 172, + 173, + 174, + 175, + 176, + 177, + 178, + 179, + 180, + 181, + 182, + 183, + 184, + 185, + 186, + 187, + 188, + 189, + 190, + 191, + 192, + 193, + 194, + 195, + 196, + 197, + 198, + 199, + 200, + 201, + 202, + 203, + 204, + 205, + 206, + 207, + 208, + 209, + 210, + 211, + 212, + 213, + 214, + 215, + 216, + 217, + 218, + 219, + 220, + 221, + 222, + 223, + 224, + 225, + 226, + 227, + 228, + 229, + 230, + 231, + 232, + 233, + 234, + 235, + 236, + 237, + 238, + 239, + 240, + 241, + 242, + 243, + 244, + 245, + 246, + 247, + 248, + 249, + 250, + 251, + 252, + 253, + 254, + 255, + 256, + 257, + 258, + 259, + 260, + 261, + 262, + 263, + 264, + 265, + 266, + 267, + 268, + 269, + 270, + 271, + 272, + 273, + 274, + 275, + 276, + 277, + 278, + 279, + 280, + 281, + 282, + 283, + 284, + 285, + 286, + 287, + 288, + 289, + 290, + 291, + 292, + 293, + 294, + 295, + 296, + 297, + 298, + 299, + 300, + 301, + 302, + 303, + 304, + 305, + 306, + 307, + 308, + 309, + 310, + 311, + 312, + 313, + 314, + 315, + 316, + 317, + 318, + 319, + 320, + 321, + 322, + 323, + 324, + 325, + 326, + 327, + 328, + 329, + 330, + 331, + 332, + 333, + 334, + 335, + 336, + 337, + 338, + 339, + 340, + 341, + 342, + 343, + 344, + 345, + 346, + 347, + 348, + 349, + 350, + 351, + 352, + 353, + 354, + 355, + 356, + 357, + 358, + 359, + 360, + 361, + 362, + 363, + 364, + 365, + 366, + 367, + 368, + 369, + 370, + 371, + 372, + 373, + 374 + ] + } +] \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/training_state/optimizer_state.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/training_state/optimizer_state.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..98bb16d9c881fc8a0cadf27931e71ec0ce35cbf6 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/training_state/optimizer_state.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2601e45fd772cb1676d282fb1e168655c23f00030a0715ae5c78be4c2c34376 +size 2014217744 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/training_state/rng_state.safetensors b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/training_state/rng_state.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..f0671c330d5e5d0724e6ee3dd3601138de5e03c4 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/training_state/rng_state.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5922b99a5486610cb94b7ce1e49d13a6d67dc1cd05b6855b3aa1cb10999fd89 +size 15708 diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/training_state/scheduler_state.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/training_state/scheduler_state.json new file mode 100644 index 0000000000000000000000000000000000000000..ae5e55feb993da35fc57c9f624104e30985c3f02 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/training_state/scheduler_state.json @@ -0,0 +1,15 @@ +{ + "base_lrs": [ + 1e-05 + ], + "last_epoch": 30000, + "_step_count": 30001, + "_is_initial": false, + "_get_lr_called_within_step": false, + "_last_lr": [ + 0.0 + ], + "lr_lambdas": [ + null + ] +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/training_state/training_step.json b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/training_state/training_step.json new file mode 100644 index 0000000000000000000000000000000000000000..f4945f660f45b332883dccfccf18d8b8815d916a --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/checkpoints/030000/training_state/training_step.json @@ -0,0 +1,3 @@ +{ + "step": 30000 +} \ No newline at end of file diff --git a/checkpoints/diffusion_specialized_new_dataset_580/wandb/debug-internal.log b/checkpoints/diffusion_specialized_new_dataset_580/wandb/debug-internal.log new file mode 100644 index 0000000000000000000000000000000000000000..af748f54846f59ce5637a2d4c1dffb5228f28570 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/wandb/debug-internal.log @@ -0,0 +1,11 @@ +{"time":"2026-05-19T01:11:48.564061586Z","level":"INFO","msg":"stream: starting","core version":"0.24.2"} +{"time":"2026-05-19T01:11:48.736699273Z","level":"INFO","msg":"stream: created new stream","id":"d8akc176"} +{"time":"2026-05-19T01:11:48.736865196Z","level":"INFO","msg":"handler: started","stream_id":"d8akc176"} +{"time":"2026-05-19T01:11:48.736955636Z","level":"INFO","msg":"stream: started","id":"d8akc176"} +{"time":"2026-05-19T01:11:48.736985033Z","level":"INFO","msg":"writer: started","stream_id":"d8akc176"} +{"time":"2026-05-19T01:11:48.73705247Z","level":"INFO","msg":"sender: started","stream_id":"d8akc176"} +{"time":"2026-05-19T02:12:45.882199691Z","level":"INFO","msg":"stream: closing","id":"d8akc176"} +{"time":"2026-05-19T02:13:14.660395438Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"} +{"time":"2026-05-19T02:13:15.039868032Z","level":"INFO","msg":"handler: closed","stream_id":"d8akc176"} +{"time":"2026-05-19T02:13:15.039996616Z","level":"INFO","msg":"sender: closed","stream_id":"d8akc176"} +{"time":"2026-05-19T02:13:15.040009169Z","level":"INFO","msg":"stream: closed","id":"d8akc176"} diff --git a/checkpoints/diffusion_specialized_new_dataset_580/wandb/debug.log b/checkpoints/diffusion_specialized_new_dataset_580/wandb/debug.log new file mode 100644 index 0000000000000000000000000000000000000000..5a3b2d2cf9eef6bb783b15a0083aa34b32464a47 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/wandb/debug.log @@ -0,0 +1,21 @@ +2026-05-19 01:11:48,342 INFO MainThread:32539 [wandb_setup.py:_flush():81] Current SDK version is 0.24.2 +2026-05-19 01:11:48,342 INFO MainThread:32539 [wandb_setup.py:_flush():81] Configure stats pid to 32539 +2026-05-19 01:11:48,342 INFO MainThread:32539 [wandb_setup.py:_flush():81] Loading settings from environment variables +2026-05-19 01:11:48,342 INFO MainThread:32539 [wandb_init.py:setup_run_log_directory():717] Logging user logs to /home/shadeform/Desktop/robot_learning/outputs/train/diffusion_specialized_eval1/wandb/run-20260519_011148-d8akc176/logs/debug.log +2026-05-19 01:11:48,342 INFO MainThread:32539 [wandb_init.py:setup_run_log_directory():718] Logging internal logs to /home/shadeform/Desktop/robot_learning/outputs/train/diffusion_specialized_eval1/wandb/run-20260519_011148-d8akc176/logs/debug-internal.log +2026-05-19 01:11:48,342 INFO MainThread:32539 [wandb_init.py:init():844] calling init triggers +2026-05-19 01:11:48,343 INFO MainThread:32539 [wandb_init.py:init():849] wandb.init called with sweep_config: {} +config: {'dataset': {'repo_id': 'local/act_collected_episodes', 'root': '/home/shadeform/Desktop/robot_learning/base_new_dataset_134', 'episodes': None, 'image_transforms': {'enable': False, 'max_num_transforms': 3, 'random_order': False, 'same_cloth_color': False, 'tfs': {'color_jitter': {'weight': 1.5, 'type': 'ColorJitter', 'kwargs': {'brightness': [0.7, 1.3], 'contrast': [0.7, 1.3], 'saturation': [0.4, 1.6], 'hue': [-0.5, 0.5]}}, 'grayscale': {'weight': 0.5, 'type': 'RandomGrayscale', 'kwargs': {'p': 1.0}}, 'shadow': {'weight': 0.8, 'type': 'RandomShadow', 'kwargs': {'num_shadows': [1, 2], 'intensity': [0.4, 0.7], 'blur_sigma': [4.0, 20.0]}}, 'highlight': {'weight': 0.5, 'type': 'RandomHighlight', 'kwargs': {'num_highlights': [0, 1], 'intensity': [0.2, 0.5], 'sigma': [20.0, 60.0]}}, 'gamma': {'weight': 0.7, 'type': 'RandomGamma', 'kwargs': {'gamma': [0.6, 1.4]}}, 'blur': {'weight': 0.0, 'type': 'GaussianBlur', 'kwargs': {'kernel_size': [3, 3], 'sigma': [0.1, 1.5]}}, 'jpeg': {'weight': 0.0, 'type': 'RandomJPEG', 'kwargs': {'quality': [60, 95]}}, 'crop': {'weight': 0.5, 'type': 'RandomCropPreserveSize', 'kwargs': {'scale': [0.97, 1.0], 'ratio': [0.99, 1.01]}}, 'affine': {'weight': 0.0, 'type': 'RandomAffine', 'kwargs': {'degrees': [-5.0, 5.0], 'translate': [0.05, 0.05]}}, 'sharpness': {'weight': 1.0, 'type': 'SharpnessJitter', 'kwargs': {'sharpness': [0.5, 1.5]}}}}, 'revision': None, 'use_imagenet_stats': True, 'video_backend': 'pyav', 'return_uint8': False, 'streaming': False}, 'env': None, 'policy': {'type': 'diffusion', 'n_obs_steps': 2, 'input_features': {'observation.state': {'type': , 'shape': [6]}, 'observation.images.front': {'type': , 'shape': [3, 480, 640]}}, 'output_features': {'action': {'type': , 'shape': [6]}}, 'device': 'cuda', 'use_amp': False, 'use_peft': False, 'push_to_hub': False, 'repo_id': None, 'private': None, 'tags': None, 'license': None, 'pretrained_path': '/home/shadeform/Desktop/robot_learning/models/checkpoints/diffusion_580_new_dataset_dino/200000/pretrained_model', 'horizon': 16, 'n_action_steps': 8, 'normalization_mapping': {'VISUAL': , 'STATE': , 'ACTION': }, 'drop_n_last_frames': 7, 'vision_backbone_type': 'dinov2', 'vision_encoder_name': 'facebook/dinov2-small', 'freeze_vision_encoder': True, 'vision_backbone': 'resnet18', 'resize_shape': [224, 224], 'crop_ratio': 1.0, 'crop_shape': None, 'crop_is_random': True, 'pretrained_backbone_weights': 'ResNet18_Weights.IMAGENET1K_V1', 'use_group_norm': False, 'spatial_softmax_num_keypoints': 32, 'vit_pool_type': 'spatial_softmax', 'vit_feature_dim': 512, 'use_separate_rgb_encoder_per_camera': True, 'down_dims': [512, 1024, 2048], 'kernel_size': 5, 'n_groups': 8, 'diffusion_step_embed_dim': 128, 'use_film_scale_modulation': True, 'noise_scheduler_type': 'DDPM', 'num_train_timesteps': 100, 'beta_schedule': 'squaredcos_cap_v2', 'beta_start': 0.0001, 'beta_end': 0.02, 'prediction_type': 'epsilon', 'clip_sample': True, 'clip_sample_range': 1.0, 'num_inference_steps': 100, 'compile_model': False, 'compile_mode': 'reduce-overhead', 'do_mask_loss_for_padding': False, 'optimizer_lr': 1e-05, 'optimizer_betas': [0.95, 0.999], 'optimizer_eps': 1e-08, 'optimizer_weight_decay': 1e-06, 'scheduler_name': 'cosine', 'scheduler_warmup_steps': 100}, 'reward_model': None, 'output_dir': '/home/shadeform/Desktop/robot_learning/outputs/train/diffusion_specialized_eval1', 'job_name': 'diffusion_specialized_eval1', 'resume': False, 'seed': 1000, 'cudnn_deterministic': False, 'num_workers': 4, 'batch_size': 32, 'prefetch_factor': 4, 'persistent_workers': True, 'steps': 30000, 'eval_freq': 0, 'log_freq': 20, 'tolerance_s': 0.0001, 'save_checkpoint': True, 'save_freq': 5000, 'use_policy_training_preset': True, 'optimizer': {'type': 'adam', 'lr': 1e-05, 'weight_decay': 1e-06, 'grad_clip_norm': 10.0, 'betas': [0.95, 0.999], 'eps': 1e-08}, 'scheduler': {'type': 'diffuser', 'num_warmup_steps': 100, 'name': 'cosine'}, 'eval': {'n_episodes': 50, 'batch_size': 11, 'use_async_envs': True}, 'wandb': {'enable': True, 'disable_artifact': False, 'project': 'lerobot', 'entity': None, 'notes': None, 'run_id': None, 'mode': None, 'add_tags': True}, 'peft': None, 'sample_weighting': None, 'rename_map': {}, 'checkpoint_path': None, '_wandb': {}} +2026-05-19 01:11:48,343 INFO MainThread:32539 [wandb_init.py:init():892] starting backend +2026-05-19 01:11:48,558 INFO MainThread:32539 [wandb_init.py:init():895] sending inform_init request +2026-05-19 01:11:48,561 INFO MainThread:32539 [wandb_init.py:init():903] backend started and connected +2026-05-19 01:11:48,564 INFO MainThread:32539 [wandb_init.py:init():973] updated telemetry +2026-05-19 01:11:48,569 INFO MainThread:32539 [wandb_init.py:init():997] communicating run to backend with 90.0 second timeout +2026-05-19 01:11:49,150 INFO MainThread:32539 [wandb_init.py:init():1042] starting run threads in backend +2026-05-19 01:11:49,225 INFO MainThread:32539 [wandb_run.py:_console_start():2529] atexit reg +2026-05-19 01:11:49,225 INFO MainThread:32539 [wandb_run.py:_redirect():2377] redirect: wrap_raw +2026-05-19 01:11:49,226 INFO MainThread:32539 [wandb_run.py:_redirect():2446] Wrapping output streams. +2026-05-19 01:11:49,226 INFO MainThread:32539 [wandb_run.py:_redirect():2469] Redirects installed. +2026-05-19 01:11:49,230 INFO MainThread:32539 [wandb_init.py:init():1082] run started, returning control to user process +2026-05-19 02:12:45,882 INFO wandb-AsyncioManager-main:32539 [service_client.py:_forward_responses():94] Reached EOF. +2026-05-19 02:12:45,882 INFO wandb-AsyncioManager-main:32539 [mailbox.py:close():154] Closing mailbox, abandoning 2 handles. diff --git a/checkpoints/diffusion_specialized_new_dataset_580/wandb/run-20260519_011148-d8akc176/files/config.yaml b/checkpoints/diffusion_specialized_new_dataset_580/wandb/run-20260519_011148-d8akc176/files/config.yaml new file mode 100644 index 0000000000000000000000000000000000000000..41c6d9b163edcfa5ab0f11682c40f3a1365b7caa --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/wandb/run-20260519_011148-d8akc176/files/config.yaml @@ -0,0 +1,351 @@ +_wandb: + value: + cli_version: 0.24.2 + e: + x3jk0td9akckfmhe6zf899m82gqt1ey3: + args: + - --policy.path=/home/shadeform/Desktop/robot_learning/models/checkpoints/diffusion_580_new_dataset_dino/200000/pretrained_model/ + - --dataset.repo_id=local/act_collected_episodes + - --dataset.root=/home/shadeform/Desktop/robot_learning/base_new_dataset_134 + - --dataset.video_backend=pyav + - --policy.device=cuda + - --policy.push_to_hub=false + - --policy.freeze_vision_encoder=true + - --policy.optimizer_lr=1e-5 + - --policy.scheduler_warmup_steps=100 + - --output_dir=/home/shadeform/Desktop/robot_learning/outputs/train/diffusion_specialized_eval1 + - --job_name=diffusion_specialized_eval1 + - --batch_size=32 + - --steps=30000 + - --num_workers=4 + - --log_freq=20 + - --save_freq=5000 + - --eval_freq=0 + - --wandb.enable=True + codePath: .venv/bin/lerobot-train + codePathLocal: .venv/bin/lerobot-train + cpu_count: 16 + cpu_count_logical: 16 + cudaVersion: "13.0" + disk: + /: + total: "1055573327872" + used: "44265787392" + executable: /home/shadeform/Desktop/robot_learning/lerobot/.venv/bin/python3 + git: + commit: 8d23fd47055bfd22999a0aa8504b2db2a224760e + remote: https://github.com/michavol/lerobot.git + gpu: NVIDIA A100-SXM4-80GB + gpu_count: 1 + gpu_nvidia: + - architecture: Ampere + cudaCores: 6912 + memoryTotal: "85899345920" + name: NVIDIA A100-SXM4-80GB + uuid: GPU-4daed4a6-5610-593e-ff8b-288aa879a882 + host: brev-8nneacbnr + memory: + total: "126711091200" + os: Linux-6.8.0-90-generic-x86_64-with-glibc2.35 + program: /home/shadeform/Desktop/robot_learning/lerobot/.venv/bin/lerobot-train + python: CPython 3.12.13 + root: /home/shadeform/Desktop/robot_learning/outputs/train/diffusion_specialized_eval1 + startedAt: "2026-05-19T01:11:48.341609Z" + writerId: x3jk0td9akckfmhe6zf899m82gqt1ey3 + m: [] + python_version: 3.12.13 + t: + "1": + - 1 + - 11 + - 41 + - 49 + - 51 + - 71 + - 83 + "2": + - 1 + - 11 + - 41 + - 49 + - 51 + - 71 + - 83 + "3": + - 13 + - 15 + - 16 + - 61 + "4": 3.12.13 + "5": 0.24.2 + "6": 5.5.4 + "10": + - 21 + "12": 0.24.2 + "13": linux-x86_64 +batch_size: + value: 32 +checkpoint_path: + value: null +cudnn_deterministic: + value: false +dataset: + value: + episodes: null + image_transforms: + enable: false + max_num_transforms: 3 + random_order: false + same_cloth_color: false + tfs: + affine: + kwargs: + degrees: + - -5 + - 5 + translate: + - 0.05 + - 0.05 + type: RandomAffine + weight: 0 + blur: + kwargs: + kernel_size: + - 3 + - 3 + sigma: + - 0.1 + - 1.5 + type: GaussianBlur + weight: 0 + color_jitter: + kwargs: + brightness: + - 0.7 + - 1.3 + contrast: + - 0.7 + - 1.3 + hue: + - -0.5 + - 0.5 + saturation: + - 0.4 + - 1.6 + type: ColorJitter + weight: 1.5 + crop: + kwargs: + ratio: + - 0.99 + - 1.01 + scale: + - 0.97 + - 1 + type: RandomCropPreserveSize + weight: 0.5 + gamma: + kwargs: + gamma: + - 0.6 + - 1.4 + type: RandomGamma + weight: 0.7 + grayscale: + kwargs: + p: 1 + type: RandomGrayscale + weight: 0.5 + highlight: + kwargs: + intensity: + - 0.2 + - 0.5 + num_highlights: + - 0 + - 1 + sigma: + - 20 + - 60 + type: RandomHighlight + weight: 0.5 + jpeg: + kwargs: + quality: + - 60 + - 95 + type: RandomJPEG + weight: 0 + shadow: + kwargs: + blur_sigma: + - 4 + - 20 + intensity: + - 0.4 + - 0.7 + num_shadows: + - 1 + - 2 + type: RandomShadow + weight: 0.8 + sharpness: + kwargs: + sharpness: + - 0.5 + - 1.5 + type: SharpnessJitter + weight: 1 + repo_id: local/act_collected_episodes + return_uint8: false + revision: null + root: /home/shadeform/Desktop/robot_learning/base_new_dataset_134 + streaming: false + use_imagenet_stats: true + video_backend: pyav +env: + value: null +eval: + value: + batch_size: 11 + n_episodes: 50 + use_async_envs: true +eval_freq: + value: 0 +job_name: + value: diffusion_specialized_eval1 +log_freq: + value: 20 +num_workers: + value: 4 +optimizer: + value: + betas: + - 0.95 + - 0.999 + eps: 1e-08 + grad_clip_norm: 10 + lr: 1e-05 + type: adam + weight_decay: 1e-06 +output_dir: + value: /home/shadeform/Desktop/robot_learning/outputs/train/diffusion_specialized_eval1 +peft: + value: null +persistent_workers: + value: true +policy: + value: + beta_end: 0.02 + beta_schedule: squaredcos_cap_v2 + beta_start: 0.0001 + clip_sample: true + clip_sample_range: 1 + compile_mode: reduce-overhead + compile_model: false + crop_is_random: true + crop_ratio: 1 + crop_shape: null + device: cuda + diffusion_step_embed_dim: 128 + do_mask_loss_for_padding: false + down_dims: + - 512 + - 1024 + - 2048 + drop_n_last_frames: 7 + freeze_vision_encoder: true + horizon: 16 + input_features: + observation.images.front: + shape: + - 3 + - 480 + - 640 + type: VISUAL + observation.state: + shape: + - 6 + type: STATE + kernel_size: 5 + license: null + n_action_steps: 8 + n_groups: 8 + n_obs_steps: 2 + noise_scheduler_type: DDPM + normalization_mapping: + ACTION: MIN_MAX + STATE: MIN_MAX + VISUAL: MEAN_STD + num_inference_steps: 100 + num_train_timesteps: 100 + optimizer_betas: + - 0.95 + - 0.999 + optimizer_eps: 1e-08 + optimizer_lr: 1e-05 + optimizer_weight_decay: 1e-06 + output_features: + action: + shape: + - 6 + type: ACTION + prediction_type: epsilon + pretrained_backbone_weights: ResNet18_Weights.IMAGENET1K_V1 + pretrained_path: /home/shadeform/Desktop/robot_learning/models/checkpoints/diffusion_580_new_dataset_dino/200000/pretrained_model + private: null + push_to_hub: false + repo_id: null + resize_shape: + - 224 + - 224 + scheduler_name: cosine + scheduler_warmup_steps: 100 + spatial_softmax_num_keypoints: 32 + tags: null + type: diffusion + use_amp: false + use_film_scale_modulation: true + use_group_norm: false + use_peft: false + use_separate_rgb_encoder_per_camera: true + vision_backbone: resnet18 + vision_backbone_type: dinov2 + vision_encoder_name: facebook/dinov2-small + vit_feature_dim: 512 + vit_pool_type: spatial_softmax +prefetch_factor: + value: 4 +resume: + value: false +reward_model: + value: null +sample_weighting: + value: null +save_checkpoint: + value: true +save_freq: + value: 5000 +scheduler: + value: + name: cosine + num_warmup_steps: 100 + type: diffuser +seed: + value: 1000 +steps: + value: 30000 +tolerance_s: + value: 0.0001 +use_policy_training_preset: + value: true +wandb: + value: + add_tags: true + disable_artifact: false + enable: true + entity: null + mode: null + notes: null + project: lerobot + run_id: null diff --git a/checkpoints/diffusion_specialized_new_dataset_580/wandb/run-20260519_011148-d8akc176/files/output.log b/checkpoints/diffusion_specialized_new_dataset_580/wandb/run-20260519_011148-d8akc176/files/output.log new file mode 100644 index 0000000000000000000000000000000000000000..efd03d03d497b3d2f03fdd3dad9fd6971dc20b83 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/wandb/run-20260519_011148-d8akc176/files/output.log @@ -0,0 +1,1526 @@ +INFO 2026-05-19 01:11:49 db_utils.py:121 Logs will be synced with wandb. +INFO 2026-05-19 01:11:49 db_utils.py:122 Track this run --> https://wandb.ai/romainguntz-eth-z-rich/lerobot/runs/d8akc176 +INFO 2026-05-19 01:11:49 ot_train.py:236 Creating dataset +INFO 2026-05-19 01:11:49 eo_utils.py:110 Using video codec: libsvtav1 +INFO 2026-05-19 01:11:49 ot_train.py:270 Creating policy +config.json: 100%|███████████████████████████████████████████████████████| 547/547 [00:00<00:00, 2.16MB/s] +model.safetensors: 100%|██████████████████████████████████████████████| 88.2M/88.2M [00:00<00:00, 108MB/s] +Loading weights: 100%|████████████████████████████████████████████████| 223/223 [00:00<00:00, 4996.77it/s] +Loading weights from local directory +INFO 2026-05-19 01:11:52 ot_train.py:347 Creating optimizer and scheduler +INFO 2026-05-19 01:11:52 ot_train.py:374 Output dir: /home/shadeform/Desktop/robot_learning/outputs/train/diffusion_specialized_eval1 +INFO 2026-05-19 01:11:52 ot_train.py:381 cfg.steps=30000 (30K) +INFO 2026-05-19 01:11:52 ot_train.py:382 dataset.num_frames=80087 (80K) +INFO 2026-05-19 01:11:52 ot_train.py:383 dataset.num_episodes=134 +INFO 2026-05-19 01:11:52 ot_train.py:386 Effective batch size: 32 x 1 = 32 +INFO 2026-05-19 01:11:52 ot_train.py:387 num_learnable_params=251772134 (252M) +INFO 2026-05-19 01:11:52 ot_train.py:388 num_total_params=273828710 (274M) +Training: 0%| | 0/30000 [00:00@: use of closed network connection","id":"1(@)"} +{"time":"2026-05-19T02:13:15.042045159Z","level":"INFO","msg":"handleInformTeardown: server shutdown complete","id":"1(@)"} +{"time":"2026-05-19T02:13:15.042075977Z","level":"INFO","msg":"connection: ManageConnectionData: connection closed","id":"1(@)"} +{"time":"2026-05-19T02:13:15.042092778Z","level":"INFO","msg":"server is closed"} diff --git a/checkpoints/diffusion_specialized_new_dataset_580/wandb/run-20260519_011148-d8akc176/logs/debug-internal.log b/checkpoints/diffusion_specialized_new_dataset_580/wandb/run-20260519_011148-d8akc176/logs/debug-internal.log new file mode 100644 index 0000000000000000000000000000000000000000..af748f54846f59ce5637a2d4c1dffb5228f28570 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/wandb/run-20260519_011148-d8akc176/logs/debug-internal.log @@ -0,0 +1,11 @@ +{"time":"2026-05-19T01:11:48.564061586Z","level":"INFO","msg":"stream: starting","core version":"0.24.2"} +{"time":"2026-05-19T01:11:48.736699273Z","level":"INFO","msg":"stream: created new stream","id":"d8akc176"} +{"time":"2026-05-19T01:11:48.736865196Z","level":"INFO","msg":"handler: started","stream_id":"d8akc176"} +{"time":"2026-05-19T01:11:48.736955636Z","level":"INFO","msg":"stream: started","id":"d8akc176"} +{"time":"2026-05-19T01:11:48.736985033Z","level":"INFO","msg":"writer: started","stream_id":"d8akc176"} +{"time":"2026-05-19T01:11:48.73705247Z","level":"INFO","msg":"sender: started","stream_id":"d8akc176"} +{"time":"2026-05-19T02:12:45.882199691Z","level":"INFO","msg":"stream: closing","id":"d8akc176"} +{"time":"2026-05-19T02:13:14.660395438Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"} +{"time":"2026-05-19T02:13:15.039868032Z","level":"INFO","msg":"handler: closed","stream_id":"d8akc176"} +{"time":"2026-05-19T02:13:15.039996616Z","level":"INFO","msg":"sender: closed","stream_id":"d8akc176"} +{"time":"2026-05-19T02:13:15.040009169Z","level":"INFO","msg":"stream: closed","id":"d8akc176"} diff --git a/checkpoints/diffusion_specialized_new_dataset_580/wandb/run-20260519_011148-d8akc176/logs/debug.log b/checkpoints/diffusion_specialized_new_dataset_580/wandb/run-20260519_011148-d8akc176/logs/debug.log new file mode 100644 index 0000000000000000000000000000000000000000..5a3b2d2cf9eef6bb783b15a0083aa34b32464a47 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/wandb/run-20260519_011148-d8akc176/logs/debug.log @@ -0,0 +1,21 @@ +2026-05-19 01:11:48,342 INFO MainThread:32539 [wandb_setup.py:_flush():81] Current SDK version is 0.24.2 +2026-05-19 01:11:48,342 INFO MainThread:32539 [wandb_setup.py:_flush():81] Configure stats pid to 32539 +2026-05-19 01:11:48,342 INFO MainThread:32539 [wandb_setup.py:_flush():81] Loading settings from environment variables +2026-05-19 01:11:48,342 INFO MainThread:32539 [wandb_init.py:setup_run_log_directory():717] Logging user logs to /home/shadeform/Desktop/robot_learning/outputs/train/diffusion_specialized_eval1/wandb/run-20260519_011148-d8akc176/logs/debug.log +2026-05-19 01:11:48,342 INFO MainThread:32539 [wandb_init.py:setup_run_log_directory():718] Logging internal logs to /home/shadeform/Desktop/robot_learning/outputs/train/diffusion_specialized_eval1/wandb/run-20260519_011148-d8akc176/logs/debug-internal.log +2026-05-19 01:11:48,342 INFO MainThread:32539 [wandb_init.py:init():844] calling init triggers +2026-05-19 01:11:48,343 INFO MainThread:32539 [wandb_init.py:init():849] wandb.init called with sweep_config: {} +config: {'dataset': {'repo_id': 'local/act_collected_episodes', 'root': '/home/shadeform/Desktop/robot_learning/base_new_dataset_134', 'episodes': None, 'image_transforms': {'enable': False, 'max_num_transforms': 3, 'random_order': False, 'same_cloth_color': False, 'tfs': {'color_jitter': {'weight': 1.5, 'type': 'ColorJitter', 'kwargs': {'brightness': [0.7, 1.3], 'contrast': [0.7, 1.3], 'saturation': [0.4, 1.6], 'hue': [-0.5, 0.5]}}, 'grayscale': {'weight': 0.5, 'type': 'RandomGrayscale', 'kwargs': {'p': 1.0}}, 'shadow': {'weight': 0.8, 'type': 'RandomShadow', 'kwargs': {'num_shadows': [1, 2], 'intensity': [0.4, 0.7], 'blur_sigma': [4.0, 20.0]}}, 'highlight': {'weight': 0.5, 'type': 'RandomHighlight', 'kwargs': {'num_highlights': [0, 1], 'intensity': [0.2, 0.5], 'sigma': [20.0, 60.0]}}, 'gamma': {'weight': 0.7, 'type': 'RandomGamma', 'kwargs': {'gamma': [0.6, 1.4]}}, 'blur': {'weight': 0.0, 'type': 'GaussianBlur', 'kwargs': {'kernel_size': [3, 3], 'sigma': [0.1, 1.5]}}, 'jpeg': {'weight': 0.0, 'type': 'RandomJPEG', 'kwargs': {'quality': [60, 95]}}, 'crop': {'weight': 0.5, 'type': 'RandomCropPreserveSize', 'kwargs': {'scale': [0.97, 1.0], 'ratio': [0.99, 1.01]}}, 'affine': {'weight': 0.0, 'type': 'RandomAffine', 'kwargs': {'degrees': [-5.0, 5.0], 'translate': [0.05, 0.05]}}, 'sharpness': {'weight': 1.0, 'type': 'SharpnessJitter', 'kwargs': {'sharpness': [0.5, 1.5]}}}}, 'revision': None, 'use_imagenet_stats': True, 'video_backend': 'pyav', 'return_uint8': False, 'streaming': False}, 'env': None, 'policy': {'type': 'diffusion', 'n_obs_steps': 2, 'input_features': {'observation.state': {'type': , 'shape': [6]}, 'observation.images.front': {'type': , 'shape': [3, 480, 640]}}, 'output_features': {'action': {'type': , 'shape': [6]}}, 'device': 'cuda', 'use_amp': False, 'use_peft': False, 'push_to_hub': False, 'repo_id': None, 'private': None, 'tags': None, 'license': None, 'pretrained_path': '/home/shadeform/Desktop/robot_learning/models/checkpoints/diffusion_580_new_dataset_dino/200000/pretrained_model', 'horizon': 16, 'n_action_steps': 8, 'normalization_mapping': {'VISUAL': , 'STATE': , 'ACTION': }, 'drop_n_last_frames': 7, 'vision_backbone_type': 'dinov2', 'vision_encoder_name': 'facebook/dinov2-small', 'freeze_vision_encoder': True, 'vision_backbone': 'resnet18', 'resize_shape': [224, 224], 'crop_ratio': 1.0, 'crop_shape': None, 'crop_is_random': True, 'pretrained_backbone_weights': 'ResNet18_Weights.IMAGENET1K_V1', 'use_group_norm': False, 'spatial_softmax_num_keypoints': 32, 'vit_pool_type': 'spatial_softmax', 'vit_feature_dim': 512, 'use_separate_rgb_encoder_per_camera': True, 'down_dims': [512, 1024, 2048], 'kernel_size': 5, 'n_groups': 8, 'diffusion_step_embed_dim': 128, 'use_film_scale_modulation': True, 'noise_scheduler_type': 'DDPM', 'num_train_timesteps': 100, 'beta_schedule': 'squaredcos_cap_v2', 'beta_start': 0.0001, 'beta_end': 0.02, 'prediction_type': 'epsilon', 'clip_sample': True, 'clip_sample_range': 1.0, 'num_inference_steps': 100, 'compile_model': False, 'compile_mode': 'reduce-overhead', 'do_mask_loss_for_padding': False, 'optimizer_lr': 1e-05, 'optimizer_betas': [0.95, 0.999], 'optimizer_eps': 1e-08, 'optimizer_weight_decay': 1e-06, 'scheduler_name': 'cosine', 'scheduler_warmup_steps': 100}, 'reward_model': None, 'output_dir': '/home/shadeform/Desktop/robot_learning/outputs/train/diffusion_specialized_eval1', 'job_name': 'diffusion_specialized_eval1', 'resume': False, 'seed': 1000, 'cudnn_deterministic': False, 'num_workers': 4, 'batch_size': 32, 'prefetch_factor': 4, 'persistent_workers': True, 'steps': 30000, 'eval_freq': 0, 'log_freq': 20, 'tolerance_s': 0.0001, 'save_checkpoint': True, 'save_freq': 5000, 'use_policy_training_preset': True, 'optimizer': {'type': 'adam', 'lr': 1e-05, 'weight_decay': 1e-06, 'grad_clip_norm': 10.0, 'betas': [0.95, 0.999], 'eps': 1e-08}, 'scheduler': {'type': 'diffuser', 'num_warmup_steps': 100, 'name': 'cosine'}, 'eval': {'n_episodes': 50, 'batch_size': 11, 'use_async_envs': True}, 'wandb': {'enable': True, 'disable_artifact': False, 'project': 'lerobot', 'entity': None, 'notes': None, 'run_id': None, 'mode': None, 'add_tags': True}, 'peft': None, 'sample_weighting': None, 'rename_map': {}, 'checkpoint_path': None, '_wandb': {}} +2026-05-19 01:11:48,343 INFO MainThread:32539 [wandb_init.py:init():892] starting backend +2026-05-19 01:11:48,558 INFO MainThread:32539 [wandb_init.py:init():895] sending inform_init request +2026-05-19 01:11:48,561 INFO MainThread:32539 [wandb_init.py:init():903] backend started and connected +2026-05-19 01:11:48,564 INFO MainThread:32539 [wandb_init.py:init():973] updated telemetry +2026-05-19 01:11:48,569 INFO MainThread:32539 [wandb_init.py:init():997] communicating run to backend with 90.0 second timeout +2026-05-19 01:11:49,150 INFO MainThread:32539 [wandb_init.py:init():1042] starting run threads in backend +2026-05-19 01:11:49,225 INFO MainThread:32539 [wandb_run.py:_console_start():2529] atexit reg +2026-05-19 01:11:49,225 INFO MainThread:32539 [wandb_run.py:_redirect():2377] redirect: wrap_raw +2026-05-19 01:11:49,226 INFO MainThread:32539 [wandb_run.py:_redirect():2446] Wrapping output streams. +2026-05-19 01:11:49,226 INFO MainThread:32539 [wandb_run.py:_redirect():2469] Redirects installed. +2026-05-19 01:11:49,230 INFO MainThread:32539 [wandb_init.py:init():1082] run started, returning control to user process +2026-05-19 02:12:45,882 INFO wandb-AsyncioManager-main:32539 [service_client.py:_forward_responses():94] Reached EOF. +2026-05-19 02:12:45,882 INFO wandb-AsyncioManager-main:32539 [mailbox.py:close():154] Closing mailbox, abandoning 2 handles. diff --git a/checkpoints/diffusion_specialized_new_dataset_580/wandb/run-20260519_011148-d8akc176/run-d8akc176.wandb b/checkpoints/diffusion_specialized_new_dataset_580/wandb/run-20260519_011148-d8akc176/run-d8akc176.wandb new file mode 100644 index 0000000000000000000000000000000000000000..c84809ce277b94d2836db5aa545cacc6dc6ba130 --- /dev/null +++ b/checkpoints/diffusion_specialized_new_dataset_580/wandb/run-20260519_011148-d8akc176/run-d8akc176.wandb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08a26262acf008f697e51f81096238c0b312bec675154fc9478f0c9a9895e73a +size 5017212