yuta0x89 committed on
Commit
4f2b242
·
verified ·
1 Parent(s): 05fa785

Upload folder using huggingface_hub

Browse files
README.md ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - model_hub_mixin
4
+ - pytorch_model_hub_mixin
5
+ ---
6
+
7
+ This model has been pushed to the Hub using the [PyTorchModelHubMixin](https://huggingface.co/docs/huggingface_hub/package_reference/mixins#huggingface_hub.PyTorchModelHubMixin) integration:
8
+ - Library: https://huggingface.co/robotics-diffusion-transformer/rdt-1b
9
+ - Docs: [More Information Needed]
checkpoint-100/README.md ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - model_hub_mixin
4
+ - pytorch_model_hub_mixin
5
+ ---
6
+
7
+ This model has been pushed to the Hub using the [PyTorchModelHubMixin](https://huggingface.co/docs/huggingface_hub/package_reference/mixins#huggingface_hub.PyTorchModelHubMixin) integration:
8
+ - Library: https://huggingface.co/robotics-diffusion-transformer/rdt-1b
9
+ - Docs: [More Information Needed]
checkpoint-100/config.json ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "action_dim": 128,
3
+ "ema": {
4
+ "inv_gamma": 1.0,
5
+ "max_value": 0.9999,
6
+ "min_value": 0.0,
7
+ "power": 0.75,
8
+ "update_after_step": 0
9
+ },
10
+ "img_adaptor": "mlp2x_gelu",
11
+ "img_cond_len": 4374,
12
+ "img_pos_embed_config": [
13
+ [
14
+ "image",
15
+ [
16
+ 2,
17
+ 3,
18
+ -729
19
+ ]
20
+ ]
21
+ ],
22
+ "img_token_dim": 1152,
23
+ "lang_adaptor": "mlp2x_gelu",
24
+ "lang_pos_embed_config": [
25
+ [
26
+ "lang",
27
+ -1024
28
+ ]
29
+ ],
30
+ "lang_token_dim": 4096,
31
+ "max_lang_cond_len": 1024,
32
+ "noise_scheduler": {
33
+ "beta_schedule": "squaredcos_cap_v2",
34
+ "clip_sample": false,
35
+ "num_inference_timesteps": 5,
36
+ "num_train_timesteps": 1000,
37
+ "prediction_type": "sample",
38
+ "type": "ddpm"
39
+ },
40
+ "pred_horizon": 64,
41
+ "rdt": {
42
+ "cond_pos_embed_type": "multimodal",
43
+ "depth": 28,
44
+ "hidden_size": 2048,
45
+ "num_heads": 32
46
+ },
47
+ "state_adaptor": "mlp3x_gelu",
48
+ "state_token_dim": 128
49
+ }
checkpoint-100/model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d1fc7d36a1e9696cb003879baa3f6b98aec063a440eca406c2cde6ca52f263f
3
+ size 2512832968
checkpoint-100/optimizer.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a02e4e45cc23d6110d919712036826c139685e98d7200e31ad57f336f7de6237
3
+ size 5026055309
checkpoint-100/pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc97fc23d09fdf6376ccf26fd65f57710d7b675a96c3c35ecbc31e4ea5a72f9f
3
+ size 2513008267
checkpoint-100/random_states_0.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9acc0c01d36765357863588613423d5a48fcfc8dbdbb5521b32c8e04fe486505
3
+ size 16513
checkpoint-100/random_states_1.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d86066f1f6262a935176342587055a2d9ba50a676ce5bf19aacf5afab43a8154
3
+ size 16449
checkpoint-100/random_states_2.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d7ad37ffe3f56c37d1f4b8a988b1c86848a159be35969c287ed34f5de3af4205
3
+ size 16513
checkpoint-100/random_states_3.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccb54702b1a118dbfa147b8156bff5f6a2152f7d725dcc09f86b7b275d15885f
3
+ size 16513
checkpoint-100/random_states_4.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32fc4d606a43952410a86cd9fba2b9f92a0c16547e39e9b81b006090060709a5
3
+ size 16513
checkpoint-100/random_states_5.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e5794f947108456ae5199b48ab6042f4b8664dbe52f0123a36aae40be967e630
3
+ size 16513
checkpoint-100/random_states_6.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f18981771fe0f852dff0004f22bc7c2d462af0c5b2ccdf0e486b8e6c84f33b3d
3
+ size 16449
checkpoint-100/random_states_7.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf1b2d2f825c634258dbf7082f5495988a7ebfd72a20161962cf365c07b240ea
3
+ size 16513
checkpoint-100/scheduler.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4475372fbf2e3da6d4807a0dff26b2fa33c10c5343d8d1571e5c893836d6c7ca
3
+ size 1401
config.json ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "action_dim": 128,
3
+ "ema": {
4
+ "inv_gamma": 1.0,
5
+ "max_value": 0.9999,
6
+ "min_value": 0.0,
7
+ "power": 0.75,
8
+ "update_after_step": 0
9
+ },
10
+ "img_adaptor": "mlp2x_gelu",
11
+ "img_cond_len": 4374,
12
+ "img_pos_embed_config": [
13
+ [
14
+ "image",
15
+ [
16
+ 2,
17
+ 3,
18
+ -729
19
+ ]
20
+ ]
21
+ ],
22
+ "img_token_dim": 1152,
23
+ "lang_adaptor": "mlp2x_gelu",
24
+ "lang_pos_embed_config": [
25
+ [
26
+ "lang",
27
+ -1024
28
+ ]
29
+ ],
30
+ "lang_token_dim": 4096,
31
+ "max_lang_cond_len": 1024,
32
+ "noise_scheduler": {
33
+ "beta_schedule": "squaredcos_cap_v2",
34
+ "clip_sample": false,
35
+ "num_inference_timesteps": 5,
36
+ "num_train_timesteps": 1000,
37
+ "prediction_type": "sample",
38
+ "type": "ddpm"
39
+ },
40
+ "pred_horizon": 64,
41
+ "rdt": {
42
+ "cond_pos_embed_type": "multimodal",
43
+ "depth": 28,
44
+ "hidden_size": 2048,
45
+ "num_heads": 32
46
+ },
47
+ "state_adaptor": "mlp3x_gelu",
48
+ "state_token_dim": 128
49
+ }
logs/roboticDiffusionTransformer/1761750657.8426015/events.out.tfevents.1761750657.14002ff7b0c2.229585.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45f9d3df8e6f8c5f6f5ff5f8f5f7a2e134a7b11ba0ec9e50bfaf4dcac1e33391
3
+ size 2767
logs/roboticDiffusionTransformer/1761750657.8457227/hparams.yml ADDED
@@ -0,0 +1,49 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ adam_beta1: 0.9
2
+ adam_beta2: 0.999
3
+ adam_epsilon: 1.0e-08
4
+ adam_weight_decay: 0.01
5
+ allow_tf32: false
6
+ alpha: 0.9
7
+ cam_ext_mask_prob: -1.0
8
+ checkpointing_period: 10
9
+ checkpoints_total_limit: 4
10
+ cond_mask_prob: 0.1
11
+ config_path: configs/base.yaml
12
+ dataloader_num_workers: 8
13
+ dataset_type: finetune
14
+ deepspeed: null
15
+ gradient_accumulation_steps: 1
16
+ gradient_checkpointing: false
17
+ hub_model_id: null
18
+ hub_token: null
19
+ image_aug: true
20
+ learning_rate: 0.0001
21
+ load_from_hdf5: true
22
+ local_rank: 0
23
+ logging_dir: logs
24
+ lr_num_cycles: 1
25
+ lr_power: 1.0
26
+ lr_scheduler: constant
27
+ lr_warmup_steps: 500
28
+ max_grad_norm: 1.0
29
+ max_train_steps: 100
30
+ mixed_precision: bf16
31
+ num_sample_batches: 2
32
+ num_train_epochs: 1
33
+ output_dir: checkpoints/20251029150953
34
+ precomp_lang_embed: false
35
+ pretrained_model_name_or_path: /work/bmb/hf_models/OpenDriveLab-org/rdt-iros-manipulation-challenge-baseline/awb-pretrained/
36
+ pretrained_text_encoder_name_or_path: /work/bmb/hf_models/google/t5-v1_1-xxl
37
+ pretrained_vision_encoder_name_or_path: /work/bmb/hf_models/google/siglip-so400m-patch14-384
38
+ push_to_hub: false
39
+ recipe: 10task
40
+ report_to: all
41
+ resume_from_checkpoint: null
42
+ sample_batch_size: 32
43
+ sample_period: 5
44
+ scale_lr: false
45
+ seed: null
46
+ set_grads_to_none: false
47
+ state_noise_snr: 40.0
48
+ train_batch_size: 16
49
+ use_8bit_adam: false
logs/roboticDiffusionTransformer/events.out.tfevents.1761750655.14002ff7b0c2.229585.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4aa2a59eaf2cbba1571320d4f0338c0327dc148d82e7831f2602c5202dcb2db0
3
+ size 12968
pytorch_model.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bc97fc23d09fdf6376ccf26fd65f57710d7b675a96c3c35ecbc31e4ea5a72f9f
3
+ size 2513008267