ry-5 committed on Apr 9

Commit

88304e9

verified ·

1 Parent(s): 2a4e638

Remove intermediate checkpoints, keep final model only

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

checkpoint-10000/config.json +0 -70
checkpoint-10000/embodiment_id.json +0 -11
checkpoint-10000/experiment_cfg/conf.yaml +0 -206
checkpoint-10000/experiment_cfg/config.yaml +0 -239
checkpoint-10000/experiment_cfg/dataset_statistics.json +0 -149
checkpoint-10000/experiment_cfg/final_model_config.json +0 -54
checkpoint-10000/experiment_cfg/final_processor_config.json +0 -0
checkpoint-10000/model-00001-of-00002.safetensors +0 -3
checkpoint-10000/model-00002-of-00002.safetensors +0 -3
checkpoint-10000/model.safetensors.index.json +0 -0
checkpoint-10000/optimizer.pt +0 -3
checkpoint-10000/processor_config.json +0 -455
checkpoint-10000/rng_state.pth +0 -3
checkpoint-10000/scheduler.pt +0 -3
checkpoint-10000/statistics.json +0 -0
checkpoint-10000/trainer_state.json +0 -0
checkpoint-10000/training_args.bin +0 -3
checkpoint-10000/wandb_config.json +0 -1
checkpoint-15000/config.json +0 -70
checkpoint-15000/embodiment_id.json +0 -11
checkpoint-15000/experiment_cfg/conf.yaml +0 -206
checkpoint-15000/experiment_cfg/config.yaml +0 -239
checkpoint-15000/experiment_cfg/dataset_statistics.json +0 -149
checkpoint-15000/experiment_cfg/final_model_config.json +0 -54
checkpoint-15000/experiment_cfg/final_processor_config.json +0 -0
checkpoint-15000/model-00001-of-00002.safetensors +0 -3
checkpoint-15000/model-00002-of-00002.safetensors +0 -3
checkpoint-15000/model.safetensors.index.json +0 -0
checkpoint-15000/optimizer.pt +0 -3
checkpoint-15000/processor_config.json +0 -455
checkpoint-15000/rng_state.pth +0 -3
checkpoint-15000/scheduler.pt +0 -3
checkpoint-15000/statistics.json +0 -0
checkpoint-15000/trainer_state.json +0 -0
checkpoint-15000/training_args.bin +0 -3
checkpoint-15000/wandb_config.json +0 -1
checkpoint-20000/config.json +0 -70
checkpoint-20000/embodiment_id.json +0 -11
checkpoint-20000/experiment_cfg/conf.yaml +0 -206
checkpoint-20000/experiment_cfg/config.yaml +0 -239
checkpoint-20000/experiment_cfg/dataset_statistics.json +0 -149
checkpoint-20000/experiment_cfg/final_model_config.json +0 -54
checkpoint-20000/experiment_cfg/final_processor_config.json +0 -0
checkpoint-20000/model-00001-of-00002.safetensors +0 -3
checkpoint-20000/model-00002-of-00002.safetensors +0 -3
checkpoint-20000/model.safetensors.index.json +0 -0
checkpoint-20000/optimizer.pt +0 -3
checkpoint-20000/processor_config.json +0 -455
checkpoint-20000/rng_state.pth +0 -3
checkpoint-20000/scheduler.pt +0 -3

checkpoint-10000/config.json DELETED Viewed

@@ -1,70 +0,0 @@
-{
-  "action_horizon": 50,
-  "add_pos_embed": true,
-  "apply_sincos_state_encoding": true,
-  "architectures": [
-    "Gr00tN1d6"
-  ],
-  "attn_dropout": 0.2,
-  "attn_implementation": null,
-  "backbone_embedding_dim": 2048,
-  "backbone_model_type": "eagle",
-  "backbone_trainable_params_fp32": true,
-  "collator_overwrite_image_inputs": false,
-  "color_jitter_params": {
-    "brightness": 0.1,
-    "contrast": 0.1,
-    "hue": 0.1,
-    "saturation": 0.1
-  },
-  "crop_fraction": 0.95,
-  "diffusion_model_cfg": {
-    "attention_head_dim": 48,
-    "dropout": 0.2,
-    "final_dropout": true,
-    "interleave_self_attention": true,
-    "norm_type": "ada_norm",
-    "num_attention_heads": 32,
-    "num_layers": 32,
-    "output_dim": 1024,
-    "positional_embeddings": null
-  },
-  "eagle_collator": true,
-  "formalize_language": true,
-  "gemma_collator": false,
-  "hidden_size": 1024,
-  "image_crop_size": null,
-  "image_target_size": null,
-  "input_embedding_dim": 1536,
-  "load_bf16": true,
-  "max_action_dim": 128,
-  "max_num_embodiments": 32,
-  "max_seq_len": 1024,
-  "max_state_dim": 128,
-  "model_dtype": "bfloat16",
-  "model_name": "nvidia/Eagle-Block2A-2B-v2",
-  "model_type": "Gr00tN1d6",
-  "noise_beta_alpha": 1.5,
-  "noise_beta_beta": 1.0,
-  "noise_s": 0.999,
-  "num_inference_timesteps": 4,
-  "num_timestep_buckets": 1000,
-  "random_rotation_angle": null,
-  "reproject_vision": false,
-  "select_layer": 16,
-  "shortest_image_edge": 256,
-  "state_dropout_prob": 0.0,
-  "torch_dtype": "bfloat16",
-  "transformers_version": "4.51.3",
-  "tune_diffusion_model": true,
-  "tune_llm": false,
-  "tune_projector": true,
-  "tune_top_llm_layers": 4,
-  "tune_visual": false,
-  "tune_vlln": true,
-  "use_albumentations_transforms": true,
-  "use_alternate_vl_dit": true,
-  "use_flash_attention": true,
-  "use_relative_action": true,
-  "use_vlln": true
-}

checkpoint-10000/embodiment_id.json DELETED Viewed

@@ -1,11 +0,0 @@
-{
-  "robocasa_panda_omron": 13,
-  "gr1": 20,
-  "behavior_r1_pro": 24,
-  "unitree_g1": 8,
-  "oxe_google": 0,
-  "oxe_widowx": 1,
-  "libero_panda": 2,
-  "oxe_droid": 16,
-  "new_embodiment": 10
-}

checkpoint-10000/experiment_cfg/conf.yaml DELETED Viewed

@@ -1,206 +0,0 @@
-load_config_path: null
-model:
-  model_type: Gr00tN1d6
-  model_dtype: bfloat16
-  model_name: nvidia/Eagle-Block2A-2B-v2
-  backbone_model_type: eagle
-  model_revision: null
-  tune_top_llm_layers: 4
-  backbone_embedding_dim: 2048
-  tune_llm: false
-  tune_visual: false
-  select_layer: 16
-  reproject_vision: false
-  use_flash_attention: true
-  load_bf16: false
-  collator_overwrite_image_inputs: false
-  eagle_collator: true
-  backbone_trainable_params_fp32: true
-  image_crop_size: null
-  image_target_size: null
-  shortest_image_edge: 256
-  crop_fraction: 0.95
-  random_rotation_angle: null
-  color_jitter_params: null
-  use_albumentations_transforms: true
-  extra_augmentation_config: null
-  formalize_language: true
-  apply_sincos_state_encoding: false
-  use_relative_action: true
-  max_state_dim: 29
-  max_action_dim: 29
-  action_horizon: 16
-  hidden_size: 1024
-  input_embedding_dim: 1536
-  add_pos_embed: true
-  attn_dropout: 0.2
-  use_vlln: true
-  max_seq_len: 1024
-  use_alternate_vl_dit: true
-  attend_text_every_n_blocks: 2
-  diffusion_model_cfg:
-    positional_embeddings: null
-    num_layers: 32
-    num_attention_heads: 32
-    attention_head_dim: 48
-    norm_type: ada_norm
-    dropout: 0.2
-    final_dropout: true
-    output_dim: 1024
-    interleave_self_attention: true
-  num_inference_timesteps: 4
-  noise_beta_alpha: 1.5
-  noise_beta_beta: 1.0
-  noise_s: 0.999
-  num_timestep_buckets: 1000
-  tune_projector: true
-  tune_diffusion_model: true
-  tune_vlln: true
-  state_dropout_prob: 0.0
-  state_additive_noise_scale: 0.0
-  max_num_embodiments: 32
-data:
-  datasets:
-  - dataset_paths:
-    - ./cherry_data
-    embodiment_tag: new_embodiment
-    mix_ratio: 1.0
-    dataset_type: physical_embodiment
-    val_dataset_path: null
-  modality_configs:
-    new_embodiment:
-      video:
-        delta_indices:
-        - 0
-        modality_keys:
-        - cam_base
-        - cam_wrist
-        sin_cos_embedding_keys: null
-        mean_std_embedding_keys: null
-        action_configs: null
-      state:
-        delta_indices:
-        - 0
-        modality_keys:
-        - arm
-        - gripper
-        sin_cos_embedding_keys: null
-        mean_std_embedding_keys: null
-        action_configs: null
-      action:
-        delta_indices:
-        - 0
-        - 1
-        - 2
-        - 3
-        - 4
-        - 5
-        - 6
-        - 7
-        - 8
-        - 9
-        - 10
-        - 11
-        - 12
-        - 13
-        - 14
-        - 15
-        modality_keys:
-        - arm
-        - gripper
-        sin_cos_embedding_keys: null
-        mean_std_embedding_keys: null
-        action_configs:
-        - rep: ABSOLUTE
-          type: NON_EEF
-          format: DEFAULT
-          state_key: null
-        - rep: ABSOLUTE
-          type: NON_EEF
-          format: DEFAULT
-          state_key: null
-      language:
-        delta_indices:
-        - 0
-        modality_keys:
-        - annotation.human.task_description
-        sin_cos_embedding_keys: null
-        mean_std_embedding_keys: null
-        action_configs: null
-  download_cache: false
-  shard_size: 1024
-  episode_sampling_rate: 0.1
-  num_shards_per_epoch: 100000
-  override_pretraining_statistics: false
-  mode: single_turn
-  random_chop: 0.0
-  mock_dataset_mode: false
-  shuffle: true
-  seed: 42
-  multiprocessing_context: fork
-  allow_padding: false
-  subsample_ratio: 1.0
-  image_crop_size:
-  - 244
-  - 244
-  image_target_size:
-  - 224
-  - 224
-  video_backend: decord
-training:
-  output_dir: ./outputs/fr5_cherry
-  experiment_name: null
-  max_steps: 20000
-  global_batch_size: 32
-  batch_size: null
-  gradient_accumulation_steps: 1
-  learning_rate: 0.0001
-  lr_scheduler_type: cosine
-  weight_decay: 1.0e-05
-  warmup_ratio: 0.05
-  warmup_steps: 0
-  max_grad_norm: 1.0
-  optim: adamw_torch
-  start_from_checkpoint: ./pretrained_models/GR00T-N1.6-3B
-  tf32: true
-  fp16: false
-  bf16: true
-  eval_bf16: true
-  logging_steps: 10
-  save_steps: 5000
-  save_total_limit: 5
-  save_vl_model: false
-  upload_checkpoints: false
-  upload_every: 1000
-  upload_last_n_checkpoints: 5
-  max_concurrent_uploads: 2
-  eval_strategy: 'no'
-  eval_steps: 500
-  eval_set_split_ratio: 0.1
-  eval_batch_size: 2
-  save_best_eval_metric_name: ''
-  save_best_eval_metric_greater_is_better: true
-  deepspeed_stage: 2
-  gradient_checkpointing: false
-  transformers_trust_remote_code: true
-  transformers_local_files_only: false
-  transformers_cache_dir: null
-  transformers_access_token: null
-  use_ddp: false
-  ddp_bucket_cap_mb: 100
-  num_gpus: 1
-  dataloader_num_workers: 2
-  remove_unused_columns: false
-  use_wandb: false
-  wandb_project: finetune-gr00t-n1d6
-  enable_profiling: false
-  max_retries: 3
-  assert_loss_less_than: null
-  add_rl_callback: false
-  enable_open_loop_eval: false
-  open_loop_eval_traj_ids:
-  - 0
-  open_loop_eval_steps_per_traj: 100
-  open_loop_eval_plot_indices: null
-max_steps: 20000
-save_steps: 5000

checkpoint-10000/experiment_cfg/config.yaml DELETED Viewed

@@ -1,239 +0,0 @@
-!!python/object:gr00t.configs.base_config.Config
-data: !!python/object:gr00t.configs.data.data_config.DataConfig
-  allow_padding: false
-  datasets:
-  - !!python/object:gr00t.configs.data.data_config.SingleDatasetConfig
-    dataset_paths:
-    - ./cherry_data
-    dataset_type: physical_embodiment
-    embodiment_tag: new_embodiment
-    mix_ratio: 1.0
-    val_dataset_path: null
-  download_cache: false
-  episode_sampling_rate: 0.1
-  image_crop_size:
-  - 244
-  - 244
-  image_target_size:
-  - 224
-  - 224
-  mock_dataset_mode: false
-  modality_configs:
-    new_embodiment:
-      action: !!python/object:gr00t.data.types.ModalityConfig
-        action_configs:
-        - !!python/object:gr00t.data.types.ActionConfig
-          format: &id001 !!python/object/apply:gr00t.data.types.ActionFormat
-          - default
-          rep: &id002 !!python/object/apply:gr00t.data.types.ActionRepresentation
-          - absolute
-          state_key: null
-          type: &id003 !!python/object/apply:gr00t.data.types.ActionType
-          - non_eef
-        - !!python/object:gr00t.data.types.ActionConfig
-          format: *id001
-          rep: *id002
-          state_key: null
-          type: *id003
-        delta_indices:
-        - 0
-        - 1
-        - 2
-        - 3
-        - 4
-        - 5
-        - 6
-        - 7
-        - 8
-        - 9
-        - 10
-        - 11
-        - 12
-        - 13
-        - 14
-        - 15
-        mean_std_embedding_keys: null
-        modality_keys:
-        - arm
-        - gripper
-        sin_cos_embedding_keys: null
-      language: !!python/object:gr00t.data.types.ModalityConfig
-        action_configs: null
-        delta_indices:
-        - 0
-        mean_std_embedding_keys: null
-        modality_keys:
-        - annotation.human.task_description
-        sin_cos_embedding_keys: null
-      state: !!python/object:gr00t.data.types.ModalityConfig
-        action_configs: null
-        delta_indices:
-        - 0
-        mean_std_embedding_keys: null
-        modality_keys:
-        - arm
-        - gripper
-        sin_cos_embedding_keys: null
-      video: !!python/object:gr00t.data.types.ModalityConfig
-        action_configs: null
-        delta_indices:
-        - 0
-        mean_std_embedding_keys: null
-        modality_keys:
-        - cam_base
-        - cam_wrist
-        sin_cos_embedding_keys: null
-  mode: single_turn
-  multiprocessing_context: fork
-  num_shards_per_epoch: 100000
-  override_pretraining_statistics: false
-  random_chop: 0.0
-  seed: 42
-  shard_size: 1024
-  shuffle: true
-  subsample_ratio: 1.0
-  video_backend: decord
-load_config_path: null
-model: !!python/object:gr00t.configs.model.gr00t_n1d6.Gr00tN1d6Config
-  _attn_implementation_autoset: false
-  _attn_implementation_internal: null
-  _commit_hash: null
-  _name_or_path: ''
-  add_cross_attention: false
-  architectures: null
-  backbone_model_type: eagle
-  backbone_trainable_params_fp32: true
-  bad_words_ids: null
-  begin_suppress_tokens: null
-  bos_token_id: null
-  chunk_size_feed_forward: 0
-  color_jitter_params: null
-  cross_attention_hidden_size: null
-  decoder_start_token_id: null
-  diffusion_model_cfg:
-    attention_head_dim: 48
-    dropout: 0.2
-    final_dropout: true
-    interleave_self_attention: true
-    norm_type: ada_norm
-    num_attention_heads: 32
-    num_layers: 32
-    output_dim: 1024
-    positional_embeddings: null
-  diversity_penalty: 0.0
-  do_sample: false
-  eagle_collator: true
-  early_stopping: false
-  encoder_no_repeat_ngram_size: 0
-  eos_token_id: null
-  exponential_decay_length_penalty: null
-  extra_augmentation_config: null
-  finetuning_task: null
-  forced_bos_token_id: null
-  forced_eos_token_id: null
-  id2label:
-    0: LABEL_0
-    1: LABEL_1
-  is_decoder: false
-  is_encoder_decoder: false
-  label2id:
-    LABEL_0: 0
-    LABEL_1: 1
-  length_penalty: 1.0
-  load_bf16: false
-  max_length: 20
-  min_length: 0
-  model_name: nvidia/Eagle-Block2A-2B-v2
-  no_repeat_ngram_size: 0
-  num_beam_groups: 1
-  num_beams: 1
-  num_return_sequences: 1
-  output_attentions: false
-  output_hidden_states: false
-  output_scores: false
-  pad_token_id: null
-  prefix: null
-  problem_type: null
-  pruned_heads: {}
-  random_rotation_angle: null
-  remove_invalid_values: false
-  repetition_penalty: 1.0
-  reproject_vision: false
-  return_dict: true
-  return_dict_in_generate: false
-  sep_token_id: null
-  state_dropout_prob: 0.0
-  suppress_tokens: null
-  task_specific_params: null
-  temperature: 1.0
-  tf_legacy_loss: false
-  tie_encoder_decoder: false
-  tie_word_embeddings: true
-  tokenizer_class: null
-  top_k: 50
-  top_p: 1.0
-  torch_dtype: null
-  torchscript: false
-  transformers_version: null
-  tune_diffusion_model: true
-  tune_llm: false
-  tune_projector: true
-  tune_visual: false
-  typical_p: 1.0
-  use_bfloat16: false
-  use_relative_action: true
-training: !!python/object:gr00t.configs.training.training_config.TrainingConfig
-  add_rl_callback: false
-  assert_loss_less_than: null
-  batch_size: null
-  bf16: true
-  dataloader_num_workers: 2
-  ddp_bucket_cap_mb: 100
-  deepspeed_stage: 2
-  enable_open_loop_eval: false
-  enable_profiling: false
-  eval_batch_size: 2
-  eval_bf16: true
-  eval_set_split_ratio: 0.1
-  eval_steps: 500
-  eval_strategy: 'no'
-  experiment_name: null
-  fp16: false
-  global_batch_size: 32
-  gradient_accumulation_steps: 1
-  gradient_checkpointing: false
-  learning_rate: 0.0001
-  logging_steps: 10
-  lr_scheduler_type: cosine
-  max_concurrent_uploads: 2
-  max_grad_norm: 1.0
-  max_retries: 3
-  max_steps: 20000
-  num_gpus: 1
-  open_loop_eval_plot_indices: null
-  open_loop_eval_steps_per_traj: 100
-  open_loop_eval_traj_ids:
-  - 0
-  optim: adamw_torch
-  output_dir: ./outputs/fr5_cherry
-  remove_unused_columns: false
-  save_best_eval_metric_greater_is_better: true
-  save_best_eval_metric_name: ''
-  save_steps: 5000
-  save_total_limit: 5
-  save_vl_model: false
-  start_from_checkpoint: ./pretrained_models/GR00T-N1.6-3B
-  tf32: true
-  transformers_access_token: null
-  transformers_cache_dir: null
-  transformers_local_files_only: false
-  transformers_trust_remote_code: true
-  upload_checkpoints: false
-  upload_every: 1000
-  upload_last_n_checkpoints: 5
-  use_ddp: false
-  use_wandb: false
-  wandb_project: finetune-gr00t-n1d6
-  warmup_ratio: 0.05
-  warmup_steps: 0
-  weight_decay: 1.0e-05

checkpoint-10000/experiment_cfg/dataset_statistics.json DELETED Viewed

@@ -1,149 +0,0 @@
-{
-  "new_embodiment": {
-    "state": {
-      "arm": {
-        "min": [
-          0.4818978011608124,
-          -1.687173843383789,
-          0.62826007604599,
-          -2.6761701107025146,
-          -1.8431425094604492,
-          -0.5678880214691162
-        ],
-        "max": [
-          0.7935351133346558,
-          -1.014952301979065,
-          1.8637524843215942,
-          -1.0820374488830566,
-          -1.4455490112304688,
-          0.3115537762641907
-        ],
-        "mean": [
-          0.6489784717559814,
-          -1.3269319534301758,
-          1.356391429901123,
-          -1.804563045501709,
-          -1.619696021080017,
-          -0.07974076271057129
-        ],
-        "std": [
-          0.053538445383310186,
-          0.1604488044977188,
-          0.2438623011112213,
-          0.22075510025024414,
-          0.07333532720804177,
-          0.10092151165008545
-        ],
-        "q01": [
-          0.5197953635454178,
-          -1.6432996988296509,
-          0.8626433879137039,
-          -2.5542680168151857,
-          -1.8000394713878631,
-          -0.37301090329885483
-        ],
-        "q99": [
-          0.7509180748462676,
-          -1.0879072868824005,
-          1.7959050333499906,
-          -1.252977850437165,
-          -1.4705305182933812,
-          0.2933953133225437
-        ]
-      },
-      "gripper": {
-        "min": [
-          0.0
-        ],
-        "max": [
-          1.0
-        ],
-        "mean": [
-          0.7650123238563538
-        ],
-        "std": [
-          0.39907386898994446
-        ],
-        "q01": [
-          0.0
-        ],
-        "q99": [
-          1.0
-        ]
-      }
-    },
-    "action": {
-      "arm": {
-        "min": [
-          0.4818978011608124,
-          -1.687173843383789,
-          0.62826007604599,
-          -2.6573522090911865,
-          -1.8431425094604492,
-          -0.5678880214691162
-        ],
-        "max": [
-          0.7935351133346558,
-          -1.014952301979065,
-          1.8637524843215942,
-          -1.0820374488830566,
-          -1.4455490112304688,
-          0.3115537762641907
-        ],
-        "mean": [
-          0.6489997506141663,
-          -1.326717495918274,
-          1.355955958366394,
-          -1.8026670217514038,
-          -1.6199865341186523,
-          -0.07982920855283737
-        ],
-        "std": [
-          0.05358240380883204,
-          0.16021256148815155,
-          0.243374302983284,
-          0.2178075611591339,
-          0.07321629673242531,
-          0.10097639262676239
-        ],
-        "q01": [
-          0.5197953635454178,
-          -1.6432996988296509,
-          0.8625765931606293,
-          -2.53433034658432,
-          -1.8000823378562927,
-          -0.37301090329885483
-        ],
-        "q99": [
-          0.7509180748462676,
-          -1.0879072868824005,
-          1.7849992513656616,
-          -1.2526323044300085,
-          -1.4705633461475374,
-          0.2933953133225437
-        ]
-      },
-      "gripper": {
-        "min": [
-          0.0
-        ],
-        "max": [
-          1.0
-        ],
-        "mean": [
-          0.7650123238563538
-        ],
-        "std": [
-          0.39907386898994446
-        ],
-        "q01": [
-          0.0
-        ],
-        "q99": [
-          1.0
-        ]
-      }
-    },
-    "relative_action": {}
-  }
-}

checkpoint-10000/experiment_cfg/final_model_config.json DELETED Viewed

@@ -1,54 +0,0 @@
-{
-  "model_type": "Gr00tN1d6",
-  "model_dtype": "bfloat16",
-  "model_name": "nvidia/Eagle-Block2A-2B-v2",
-  "backbone_model_type": "eagle",
-  "model_revision": null,
-  "tune_top_llm_layers": 4,
-  "backbone_embedding_dim": 2048,
-  "tune_llm": false,
-  "tune_visual": false,
-  "select_layer": 16,
-  "reproject_vision": false,
-  "use_flash_attention": true,
-  "load_bf16": true,
-  "collator_overwrite_image_inputs": false,
-  "eagle_collator": true,
-  "backbone_trainable_params_fp32": true,
-  "extra_augmentation_config": null,
-  "apply_sincos_state_encoding": true,
-  "use_relative_action": true,
-  "max_state_dim": 128,
-  "max_action_dim": 128,
-  "action_horizon": 50,
-  "hidden_size": 1024,
-  "input_embedding_dim": 1536,
-  "add_pos_embed": true,
-  "attn_dropout": 0.2,
-  "use_vlln": true,
-  "max_seq_len": 1024,
-  "use_alternate_vl_dit": true,
-  "attend_text_every_n_blocks": 2,
-  "diffusion_model_cfg": {
-    "attention_head_dim": 48,
-    "dropout": 0.2,
-    "final_dropout": true,
-    "interleave_self_attention": true,
-    "norm_type": "ada_norm",
-    "num_attention_heads": 32,
-    "num_layers": 32,
-    "output_dim": 1024,
-    "positional_embeddings": null
-  },
-  "num_inference_timesteps": 4,
-  "noise_beta_alpha": 1.5,
-  "noise_beta_beta": 1.0,
-  "noise_s": 0.999,
-  "num_timestep_buckets": 1000,
-  "tune_projector": true,
-  "tune_diffusion_model": true,
-  "tune_vlln": true,
-  "state_dropout_prob": 0.0,
-  "state_additive_noise_scale": 0.0,
-  "max_num_embodiments": 32
-}

checkpoint-10000/experiment_cfg/final_processor_config.json DELETED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-10000/model-00001-of-00002.safetensors DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:a22551925e5bb41c48ebb3cd8533566607a4e966f51d34097f53fbe937a91659
-size 4990120184

checkpoint-10000/model-00002-of-00002.safetensors DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:01a8b9f9243a6606b220e9ecfdf9c90271caecbf6a218d878817c602c0be7a3e
-size 4823190320

checkpoint-10000/model.safetensors.index.json DELETED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-10000/optimizer.pt DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:f1daa28f457b70c4bbcb6ef25875f17b75f9c587aee1da4f54bc2f8a7177d9af
-size 12960193762

checkpoint-10000/processor_config.json DELETED Viewed

@@ -1,455 +0,0 @@
-{
-  "processor_class": "Gr00tN1d6Processor",
-  "processor_kwargs": {
-    "modality_configs": {
-      "behavior_r1_pro": {
-        "video": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "observation.images.rgb.head_256_256",
-            "observation.images.rgb.left_wrist_256_256",
-            "observation.images.rgb.right_wrist_256_256"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        },
-        "state": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "robot_pos",
-            "robot_ori_cos",
-            "robot_ori_sin",
-            "robot_2d_ori",
-            "robot_2d_ori_cos",
-            "robot_2d_ori_sin",
-            "robot_lin_vel",
-            "robot_ang_vel",
-            "arm_left_qpos",
-            "arm_left_qpos_sin",
-            "arm_left_qpos_cos",
-            "eef_left_pos",
-            "eef_left_quat",
-            "gripper_left_qpos",
-            "arm_right_qpos",
-            "arm_right_qpos_sin",
-            "arm_right_qpos_cos",
-            "eef_right_pos",
-            "eef_right_quat",
-            "gripper_right_qpos",
-            "trunk_qpos"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        },
-        "action": {
-          "delta_indices": [
-            0,
-            1,
-            2,
-            3,
-            4,
-            5,
-            6,
-            7,
-            8,
-            9,
-            10,
-            11,
-            12,
-            13,
-            14,
-            15,
-            16,
-            17,
-            18,
-            19,
-            20,
-            21,
-            22,
-            23,
-            24,
-            25,
-            26,
-            27,
-            28,
-            29,
-            30,
-            31
-          ],
-          "modality_keys": [
-            "base",
-            "torso",
-            "left_arm",
-            "left_gripper",
-            "right_arm",
-            "right_gripper"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": [
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "RELATIVE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": "trunk_qpos"
-            },
-            {
-              "rep": "RELATIVE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": "arm_left_qpos"
-            },
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "RELATIVE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": "arm_right_qpos"
-            },
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            }
-          ]
-        },
-        "language": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "annotation.human.coarse_action"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        }
-      },
-      "gr1": {
-        "video": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "ego_view_bg_crop_pad_res256_freq20"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        },
-        "state": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "left_arm",
-            "right_arm",
-            "left_hand",
-            "right_hand",
-            "waist"
-          ],
-          "sin_cos_embedding_keys": [
-            "left_arm",
-            "right_arm",
-            "left_hand",
-            "right_hand",
-            "waist"
-          ],
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        },
-        "action": {
-          "delta_indices": [
-            0,
-            1,
-            2,
-            3,
-            4,
-            5,
-            6,
-            7,
-            8,
-            9,
-            10,
-            11,
-            12,
-            13,
-            14,
-            15
-          ],
-          "modality_keys": [
-            "left_arm",
-            "right_arm",
-            "left_hand",
-            "right_hand",
-            "waist"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": [
-            {
-              "rep": "RELATIVE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "RELATIVE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "RELATIVE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "RELATIVE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            }
-          ]
-        },
-        "language": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "task"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        }
-      },
-      "robocasa_panda_omron": {
-        "video": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "res256_image_side_0",
-            "res256_image_side_1",
-            "res256_image_wrist_0"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        },
-        "state": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "end_effector_position_relative",
-            "end_effector_rotation_relative",
-            "gripper_qpos",
-            "base_position",
-            "base_rotation"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        },
-        "action": {
-          "delta_indices": [
-            0,
-            1,
-            2,
-            3,
-            4,
-            5,
-            6,
-            7,
-            8,
-            9,
-            10,
-            11,
-            12,
-            13,
-            14,
-            15
-          ],
-          "modality_keys": [
-            "end_effector_position",
-            "end_effector_rotation",
-            "gripper_close",
-            "base_motion",
-            "control_mode"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": [
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            }
-          ]
-        },
-        "language": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "annotation.human.action.task_description"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        }
-      },
-      "new_embodiment": {
-        "video": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "cam_base",
-            "cam_wrist"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        },
-        "state": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "arm",
-            "gripper"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        },
-        "action": {
-          "delta_indices": [
-            0,
-            1,
-            2,
-            3,
-            4,
-            5,
-            6,
-            7,
-            8,
-            9,
-            10,
-            11,
-            12,
-            13,
-            14,
-            15
-          ],
-          "modality_keys": [
-            "arm",
-            "gripper"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": [
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            }
-          ]
-        },
-        "language": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "annotation.human.task_description"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        }
-      }
-    },
-    "image_crop_size": null,
-    "image_target_size": null,
-    "use_albumentations": true,
-    "random_rotation_angle": null,
-    "color_jitter_params": {
-      "brightness": 0.3,
-      "contrast": 0.4,
-      "saturation": 0.5,
-      "hue": 0.08
-    },
-    "shortest_image_edge": 256,
-    "crop_fraction": 0.95,
-    "model_name": "nvidia/Eagle-Block2A-2B-v2",
-    "model_type": "eagle",
-    "formalize_language": true,
-    "max_state_dim": 128,
-    "max_action_dim": 128,
-    "max_action_horizon": 50,
-    "use_percentiles": false,
-    "clip_outliers": true,
-    "apply_sincos_state_encoding": true,
-    "use_relative_action": true
-  }
-}

checkpoint-10000/rng_state.pth DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:3f5ea38e8fe73fc84868ec3e6011e3571a59e9595fe7e6de70a21b520b40798f
-size 14645

checkpoint-10000/scheduler.pt DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:9793ce798c508501a83c7de96591494637b8ee20bbad166324a3caeddb4cdc8e
-size 1465

checkpoint-10000/statistics.json DELETED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-10000/trainer_state.json DELETED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-10000/training_args.bin DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:49cf1bb9160fba423ccdd2dae7d9b40228772dd15a3fb17d44a4fd07f7818f45
-size 5713

checkpoint-10000/wandb_config.json DELETED Viewed

	@@ -1 +0,0 @@
1	- {"project": "finetune-gr00t-n1d6", "run_id": "fr5_cherry"}

checkpoint-15000/config.json DELETED Viewed

@@ -1,70 +0,0 @@
-{
-  "action_horizon": 50,
-  "add_pos_embed": true,
-  "apply_sincos_state_encoding": true,
-  "architectures": [
-    "Gr00tN1d6"
-  ],
-  "attn_dropout": 0.2,
-  "attn_implementation": null,
-  "backbone_embedding_dim": 2048,
-  "backbone_model_type": "eagle",
-  "backbone_trainable_params_fp32": true,
-  "collator_overwrite_image_inputs": false,
-  "color_jitter_params": {
-    "brightness": 0.1,
-    "contrast": 0.1,
-    "hue": 0.1,
-    "saturation": 0.1
-  },
-  "crop_fraction": 0.95,
-  "diffusion_model_cfg": {
-    "attention_head_dim": 48,
-    "dropout": 0.2,
-    "final_dropout": true,
-    "interleave_self_attention": true,
-    "norm_type": "ada_norm",
-    "num_attention_heads": 32,
-    "num_layers": 32,
-    "output_dim": 1024,
-    "positional_embeddings": null
-  },
-  "eagle_collator": true,
-  "formalize_language": true,
-  "gemma_collator": false,
-  "hidden_size": 1024,
-  "image_crop_size": null,
-  "image_target_size": null,
-  "input_embedding_dim": 1536,
-  "load_bf16": true,
-  "max_action_dim": 128,
-  "max_num_embodiments": 32,
-  "max_seq_len": 1024,
-  "max_state_dim": 128,
-  "model_dtype": "bfloat16",
-  "model_name": "nvidia/Eagle-Block2A-2B-v2",
-  "model_type": "Gr00tN1d6",
-  "noise_beta_alpha": 1.5,
-  "noise_beta_beta": 1.0,
-  "noise_s": 0.999,
-  "num_inference_timesteps": 4,
-  "num_timestep_buckets": 1000,
-  "random_rotation_angle": null,
-  "reproject_vision": false,
-  "select_layer": 16,
-  "shortest_image_edge": 256,
-  "state_dropout_prob": 0.0,
-  "torch_dtype": "bfloat16",
-  "transformers_version": "4.51.3",
-  "tune_diffusion_model": true,
-  "tune_llm": false,
-  "tune_projector": true,
-  "tune_top_llm_layers": 4,
-  "tune_visual": false,
-  "tune_vlln": true,
-  "use_albumentations_transforms": true,
-  "use_alternate_vl_dit": true,
-  "use_flash_attention": true,
-  "use_relative_action": true,
-  "use_vlln": true
-}

checkpoint-15000/embodiment_id.json DELETED Viewed

@@ -1,11 +0,0 @@
-{
-  "robocasa_panda_omron": 13,
-  "gr1": 20,
-  "behavior_r1_pro": 24,
-  "unitree_g1": 8,
-  "oxe_google": 0,
-  "oxe_widowx": 1,
-  "libero_panda": 2,
-  "oxe_droid": 16,
-  "new_embodiment": 10
-}

checkpoint-15000/experiment_cfg/conf.yaml DELETED Viewed

@@ -1,206 +0,0 @@
-load_config_path: null
-model:
-  model_type: Gr00tN1d6
-  model_dtype: bfloat16
-  model_name: nvidia/Eagle-Block2A-2B-v2
-  backbone_model_type: eagle
-  model_revision: null
-  tune_top_llm_layers: 4
-  backbone_embedding_dim: 2048
-  tune_llm: false
-  tune_visual: false
-  select_layer: 16
-  reproject_vision: false
-  use_flash_attention: true
-  load_bf16: false
-  collator_overwrite_image_inputs: false
-  eagle_collator: true
-  backbone_trainable_params_fp32: true
-  image_crop_size: null
-  image_target_size: null
-  shortest_image_edge: 256
-  crop_fraction: 0.95
-  random_rotation_angle: null
-  color_jitter_params: null
-  use_albumentations_transforms: true
-  extra_augmentation_config: null
-  formalize_language: true
-  apply_sincos_state_encoding: false
-  use_relative_action: true
-  max_state_dim: 29
-  max_action_dim: 29
-  action_horizon: 16
-  hidden_size: 1024
-  input_embedding_dim: 1536
-  add_pos_embed: true
-  attn_dropout: 0.2
-  use_vlln: true
-  max_seq_len: 1024
-  use_alternate_vl_dit: true
-  attend_text_every_n_blocks: 2
-  diffusion_model_cfg:
-    positional_embeddings: null
-    num_layers: 32
-    num_attention_heads: 32
-    attention_head_dim: 48
-    norm_type: ada_norm
-    dropout: 0.2
-    final_dropout: true
-    output_dim: 1024
-    interleave_self_attention: true
-  num_inference_timesteps: 4
-  noise_beta_alpha: 1.5
-  noise_beta_beta: 1.0
-  noise_s: 0.999
-  num_timestep_buckets: 1000
-  tune_projector: true
-  tune_diffusion_model: true
-  tune_vlln: true
-  state_dropout_prob: 0.0
-  state_additive_noise_scale: 0.0
-  max_num_embodiments: 32
-data:
-  datasets:
-  - dataset_paths:
-    - ./cherry_data
-    embodiment_tag: new_embodiment
-    mix_ratio: 1.0
-    dataset_type: physical_embodiment
-    val_dataset_path: null
-  modality_configs:
-    new_embodiment:
-      video:
-        delta_indices:
-        - 0
-        modality_keys:
-        - cam_base
-        - cam_wrist
-        sin_cos_embedding_keys: null
-        mean_std_embedding_keys: null
-        action_configs: null
-      state:
-        delta_indices:
-        - 0
-        modality_keys:
-        - arm
-        - gripper
-        sin_cos_embedding_keys: null
-        mean_std_embedding_keys: null
-        action_configs: null
-      action:
-        delta_indices:
-        - 0
-        - 1
-        - 2
-        - 3
-        - 4
-        - 5
-        - 6
-        - 7
-        - 8
-        - 9
-        - 10
-        - 11
-        - 12
-        - 13
-        - 14
-        - 15
-        modality_keys:
-        - arm
-        - gripper
-        sin_cos_embedding_keys: null
-        mean_std_embedding_keys: null
-        action_configs:
-        - rep: ABSOLUTE
-          type: NON_EEF
-          format: DEFAULT
-          state_key: null
-        - rep: ABSOLUTE
-          type: NON_EEF
-          format: DEFAULT
-          state_key: null
-      language:
-        delta_indices:
-        - 0
-        modality_keys:
-        - annotation.human.task_description
-        sin_cos_embedding_keys: null
-        mean_std_embedding_keys: null
-        action_configs: null
-  download_cache: false
-  shard_size: 1024
-  episode_sampling_rate: 0.1
-  num_shards_per_epoch: 100000
-  override_pretraining_statistics: false
-  mode: single_turn
-  random_chop: 0.0
-  mock_dataset_mode: false
-  shuffle: true
-  seed: 42
-  multiprocessing_context: fork
-  allow_padding: false
-  subsample_ratio: 1.0
-  image_crop_size:
-  - 244
-  - 244
-  image_target_size:
-  - 224
-  - 224
-  video_backend: decord
-training:
-  output_dir: ./outputs/fr5_cherry
-  experiment_name: null
-  max_steps: 20000
-  global_batch_size: 32
-  batch_size: null
-  gradient_accumulation_steps: 1
-  learning_rate: 0.0001
-  lr_scheduler_type: cosine
-  weight_decay: 1.0e-05
-  warmup_ratio: 0.05
-  warmup_steps: 0
-  max_grad_norm: 1.0
-  optim: adamw_torch
-  start_from_checkpoint: ./pretrained_models/GR00T-N1.6-3B
-  tf32: true
-  fp16: false
-  bf16: true
-  eval_bf16: true
-  logging_steps: 10
-  save_steps: 5000
-  save_total_limit: 5
-  save_vl_model: false
-  upload_checkpoints: false
-  upload_every: 1000
-  upload_last_n_checkpoints: 5
-  max_concurrent_uploads: 2
-  eval_strategy: 'no'
-  eval_steps: 500
-  eval_set_split_ratio: 0.1
-  eval_batch_size: 2
-  save_best_eval_metric_name: ''
-  save_best_eval_metric_greater_is_better: true
-  deepspeed_stage: 2
-  gradient_checkpointing: false
-  transformers_trust_remote_code: true
-  transformers_local_files_only: false
-  transformers_cache_dir: null
-  transformers_access_token: null
-  use_ddp: false
-  ddp_bucket_cap_mb: 100
-  num_gpus: 1
-  dataloader_num_workers: 2
-  remove_unused_columns: false
-  use_wandb: false
-  wandb_project: finetune-gr00t-n1d6
-  enable_profiling: false
-  max_retries: 3
-  assert_loss_less_than: null
-  add_rl_callback: false
-  enable_open_loop_eval: false
-  open_loop_eval_traj_ids:
-  - 0
-  open_loop_eval_steps_per_traj: 100
-  open_loop_eval_plot_indices: null
-max_steps: 20000
-save_steps: 5000

checkpoint-15000/experiment_cfg/config.yaml DELETED Viewed

@@ -1,239 +0,0 @@
-!!python/object:gr00t.configs.base_config.Config
-data: !!python/object:gr00t.configs.data.data_config.DataConfig
-  allow_padding: false
-  datasets:
-  - !!python/object:gr00t.configs.data.data_config.SingleDatasetConfig
-    dataset_paths:
-    - ./cherry_data
-    dataset_type: physical_embodiment
-    embodiment_tag: new_embodiment
-    mix_ratio: 1.0
-    val_dataset_path: null
-  download_cache: false
-  episode_sampling_rate: 0.1
-  image_crop_size:
-  - 244
-  - 244
-  image_target_size:
-  - 224
-  - 224
-  mock_dataset_mode: false
-  modality_configs:
-    new_embodiment:
-      action: !!python/object:gr00t.data.types.ModalityConfig
-        action_configs:
-        - !!python/object:gr00t.data.types.ActionConfig
-          format: &id001 !!python/object/apply:gr00t.data.types.ActionFormat
-          - default
-          rep: &id002 !!python/object/apply:gr00t.data.types.ActionRepresentation
-          - absolute
-          state_key: null
-          type: &id003 !!python/object/apply:gr00t.data.types.ActionType
-          - non_eef
-        - !!python/object:gr00t.data.types.ActionConfig
-          format: *id001
-          rep: *id002
-          state_key: null
-          type: *id003
-        delta_indices:
-        - 0
-        - 1
-        - 2
-        - 3
-        - 4
-        - 5
-        - 6
-        - 7
-        - 8
-        - 9
-        - 10
-        - 11
-        - 12
-        - 13
-        - 14
-        - 15
-        mean_std_embedding_keys: null
-        modality_keys:
-        - arm
-        - gripper
-        sin_cos_embedding_keys: null
-      language: !!python/object:gr00t.data.types.ModalityConfig
-        action_configs: null
-        delta_indices:
-        - 0
-        mean_std_embedding_keys: null
-        modality_keys:
-        - annotation.human.task_description
-        sin_cos_embedding_keys: null
-      state: !!python/object:gr00t.data.types.ModalityConfig
-        action_configs: null
-        delta_indices:
-        - 0
-        mean_std_embedding_keys: null
-        modality_keys:
-        - arm
-        - gripper
-        sin_cos_embedding_keys: null
-      video: !!python/object:gr00t.data.types.ModalityConfig
-        action_configs: null
-        delta_indices:
-        - 0
-        mean_std_embedding_keys: null
-        modality_keys:
-        - cam_base
-        - cam_wrist
-        sin_cos_embedding_keys: null
-  mode: single_turn
-  multiprocessing_context: fork
-  num_shards_per_epoch: 100000
-  override_pretraining_statistics: false
-  random_chop: 0.0
-  seed: 42
-  shard_size: 1024
-  shuffle: true
-  subsample_ratio: 1.0
-  video_backend: decord
-load_config_path: null
-model: !!python/object:gr00t.configs.model.gr00t_n1d6.Gr00tN1d6Config
-  _attn_implementation_autoset: false
-  _attn_implementation_internal: null
-  _commit_hash: null
-  _name_or_path: ''
-  add_cross_attention: false
-  architectures: null
-  backbone_model_type: eagle
-  backbone_trainable_params_fp32: true
-  bad_words_ids: null
-  begin_suppress_tokens: null
-  bos_token_id: null
-  chunk_size_feed_forward: 0
-  color_jitter_params: null
-  cross_attention_hidden_size: null
-  decoder_start_token_id: null
-  diffusion_model_cfg:
-    attention_head_dim: 48
-    dropout: 0.2
-    final_dropout: true
-    interleave_self_attention: true
-    norm_type: ada_norm
-    num_attention_heads: 32
-    num_layers: 32
-    output_dim: 1024
-    positional_embeddings: null
-  diversity_penalty: 0.0
-  do_sample: false
-  eagle_collator: true
-  early_stopping: false
-  encoder_no_repeat_ngram_size: 0
-  eos_token_id: null
-  exponential_decay_length_penalty: null
-  extra_augmentation_config: null
-  finetuning_task: null
-  forced_bos_token_id: null
-  forced_eos_token_id: null
-  id2label:
-    0: LABEL_0
-    1: LABEL_1
-  is_decoder: false
-  is_encoder_decoder: false
-  label2id:
-    LABEL_0: 0
-    LABEL_1: 1
-  length_penalty: 1.0
-  load_bf16: false
-  max_length: 20
-  min_length: 0
-  model_name: nvidia/Eagle-Block2A-2B-v2
-  no_repeat_ngram_size: 0
-  num_beam_groups: 1
-  num_beams: 1
-  num_return_sequences: 1
-  output_attentions: false
-  output_hidden_states: false
-  output_scores: false
-  pad_token_id: null
-  prefix: null
-  problem_type: null
-  pruned_heads: {}
-  random_rotation_angle: null
-  remove_invalid_values: false
-  repetition_penalty: 1.0
-  reproject_vision: false
-  return_dict: true
-  return_dict_in_generate: false
-  sep_token_id: null
-  state_dropout_prob: 0.0
-  suppress_tokens: null
-  task_specific_params: null
-  temperature: 1.0
-  tf_legacy_loss: false
-  tie_encoder_decoder: false
-  tie_word_embeddings: true
-  tokenizer_class: null
-  top_k: 50
-  top_p: 1.0
-  torch_dtype: null
-  torchscript: false
-  transformers_version: null
-  tune_diffusion_model: true
-  tune_llm: false
-  tune_projector: true
-  tune_visual: false
-  typical_p: 1.0
-  use_bfloat16: false
-  use_relative_action: true
-training: !!python/object:gr00t.configs.training.training_config.TrainingConfig
-  add_rl_callback: false
-  assert_loss_less_than: null
-  batch_size: null
-  bf16: true
-  dataloader_num_workers: 2
-  ddp_bucket_cap_mb: 100
-  deepspeed_stage: 2
-  enable_open_loop_eval: false
-  enable_profiling: false
-  eval_batch_size: 2
-  eval_bf16: true
-  eval_set_split_ratio: 0.1
-  eval_steps: 500
-  eval_strategy: 'no'
-  experiment_name: null
-  fp16: false
-  global_batch_size: 32
-  gradient_accumulation_steps: 1
-  gradient_checkpointing: false
-  learning_rate: 0.0001
-  logging_steps: 10
-  lr_scheduler_type: cosine
-  max_concurrent_uploads: 2
-  max_grad_norm: 1.0
-  max_retries: 3
-  max_steps: 20000
-  num_gpus: 1
-  open_loop_eval_plot_indices: null
-  open_loop_eval_steps_per_traj: 100
-  open_loop_eval_traj_ids:
-  - 0
-  optim: adamw_torch
-  output_dir: ./outputs/fr5_cherry
-  remove_unused_columns: false
-  save_best_eval_metric_greater_is_better: true
-  save_best_eval_metric_name: ''
-  save_steps: 5000
-  save_total_limit: 5
-  save_vl_model: false
-  start_from_checkpoint: ./pretrained_models/GR00T-N1.6-3B
-  tf32: true
-  transformers_access_token: null
-  transformers_cache_dir: null
-  transformers_local_files_only: false
-  transformers_trust_remote_code: true
-  upload_checkpoints: false
-  upload_every: 1000
-  upload_last_n_checkpoints: 5
-  use_ddp: false
-  use_wandb: false
-  wandb_project: finetune-gr00t-n1d6
-  warmup_ratio: 0.05
-  warmup_steps: 0
-  weight_decay: 1.0e-05

checkpoint-15000/experiment_cfg/dataset_statistics.json DELETED Viewed

@@ -1,149 +0,0 @@
-{
-  "new_embodiment": {
-    "state": {
-      "arm": {
-        "min": [
-          0.4818978011608124,
-          -1.687173843383789,
-          0.62826007604599,
-          -2.6761701107025146,
-          -1.8431425094604492,
-          -0.5678880214691162
-        ],
-        "max": [
-          0.7935351133346558,
-          -1.014952301979065,
-          1.8637524843215942,
-          -1.0820374488830566,
-          -1.4455490112304688,
-          0.3115537762641907
-        ],
-        "mean": [
-          0.6489784717559814,
-          -1.3269319534301758,
-          1.356391429901123,
-          -1.804563045501709,
-          -1.619696021080017,
-          -0.07974076271057129
-        ],
-        "std": [
-          0.053538445383310186,
-          0.1604488044977188,
-          0.2438623011112213,
-          0.22075510025024414,
-          0.07333532720804177,
-          0.10092151165008545
-        ],
-        "q01": [
-          0.5197953635454178,
-          -1.6432996988296509,
-          0.8626433879137039,
-          -2.5542680168151857,
-          -1.8000394713878631,
-          -0.37301090329885483
-        ],
-        "q99": [
-          0.7509180748462676,
-          -1.0879072868824005,
-          1.7959050333499906,
-          -1.252977850437165,
-          -1.4705305182933812,
-          0.2933953133225437
-        ]
-      },
-      "gripper": {
-        "min": [
-          0.0
-        ],
-        "max": [
-          1.0
-        ],
-        "mean": [
-          0.7650123238563538
-        ],
-        "std": [
-          0.39907386898994446
-        ],
-        "q01": [
-          0.0
-        ],
-        "q99": [
-          1.0
-        ]
-      }
-    },
-    "action": {
-      "arm": {
-        "min": [
-          0.4818978011608124,
-          -1.687173843383789,
-          0.62826007604599,
-          -2.6573522090911865,
-          -1.8431425094604492,
-          -0.5678880214691162
-        ],
-        "max": [
-          0.7935351133346558,
-          -1.014952301979065,
-          1.8637524843215942,
-          -1.0820374488830566,
-          -1.4455490112304688,
-          0.3115537762641907
-        ],
-        "mean": [
-          0.6489997506141663,
-          -1.326717495918274,
-          1.355955958366394,
-          -1.8026670217514038,
-          -1.6199865341186523,
-          -0.07982920855283737
-        ],
-        "std": [
-          0.05358240380883204,
-          0.16021256148815155,
-          0.243374302983284,
-          0.2178075611591339,
-          0.07321629673242531,
-          0.10097639262676239
-        ],
-        "q01": [
-          0.5197953635454178,
-          -1.6432996988296509,
-          0.8625765931606293,
-          -2.53433034658432,
-          -1.8000823378562927,
-          -0.37301090329885483
-        ],
-        "q99": [
-          0.7509180748462676,
-          -1.0879072868824005,
-          1.7849992513656616,
-          -1.2526323044300085,
-          -1.4705633461475374,
-          0.2933953133225437
-        ]
-      },
-      "gripper": {
-        "min": [
-          0.0
-        ],
-        "max": [
-          1.0
-        ],
-        "mean": [
-          0.7650123238563538
-        ],
-        "std": [
-          0.39907386898994446
-        ],
-        "q01": [
-          0.0
-        ],
-        "q99": [
-          1.0
-        ]
-      }
-    },
-    "relative_action": {}
-  }
-}

checkpoint-15000/experiment_cfg/final_model_config.json DELETED Viewed

@@ -1,54 +0,0 @@
-{
-  "model_type": "Gr00tN1d6",
-  "model_dtype": "bfloat16",
-  "model_name": "nvidia/Eagle-Block2A-2B-v2",
-  "backbone_model_type": "eagle",
-  "model_revision": null,
-  "tune_top_llm_layers": 4,
-  "backbone_embedding_dim": 2048,
-  "tune_llm": false,
-  "tune_visual": false,
-  "select_layer": 16,
-  "reproject_vision": false,
-  "use_flash_attention": true,
-  "load_bf16": true,
-  "collator_overwrite_image_inputs": false,
-  "eagle_collator": true,
-  "backbone_trainable_params_fp32": true,
-  "extra_augmentation_config": null,
-  "apply_sincos_state_encoding": true,
-  "use_relative_action": true,
-  "max_state_dim": 128,
-  "max_action_dim": 128,
-  "action_horizon": 50,
-  "hidden_size": 1024,
-  "input_embedding_dim": 1536,
-  "add_pos_embed": true,
-  "attn_dropout": 0.2,
-  "use_vlln": true,
-  "max_seq_len": 1024,
-  "use_alternate_vl_dit": true,
-  "attend_text_every_n_blocks": 2,
-  "diffusion_model_cfg": {
-    "attention_head_dim": 48,
-    "dropout": 0.2,
-    "final_dropout": true,
-    "interleave_self_attention": true,
-    "norm_type": "ada_norm",
-    "num_attention_heads": 32,
-    "num_layers": 32,
-    "output_dim": 1024,
-    "positional_embeddings": null
-  },
-  "num_inference_timesteps": 4,
-  "noise_beta_alpha": 1.5,
-  "noise_beta_beta": 1.0,
-  "noise_s": 0.999,
-  "num_timestep_buckets": 1000,
-  "tune_projector": true,
-  "tune_diffusion_model": true,
-  "tune_vlln": true,
-  "state_dropout_prob": 0.0,
-  "state_additive_noise_scale": 0.0,
-  "max_num_embodiments": 32
-}

checkpoint-15000/experiment_cfg/final_processor_config.json DELETED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-15000/model-00001-of-00002.safetensors DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:1b2b93b15f33bd8ea70ac7f6b11aa60c56788947162d6ae00dd1987457f54da3
-size 4990120184

checkpoint-15000/model-00002-of-00002.safetensors DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:d9be8fde5f5ace47b89e78e8cbea6a0b5494abb99ac6350affb66f53c7fc7c68
-size 4823190320

checkpoint-15000/model.safetensors.index.json DELETED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-15000/optimizer.pt DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:018072403772e39d83a35fb933559eaf88901e875bf632858002d7b78a84a344
-size 12960193762

checkpoint-15000/processor_config.json DELETED Viewed

@@ -1,455 +0,0 @@
-{
-  "processor_class": "Gr00tN1d6Processor",
-  "processor_kwargs": {
-    "modality_configs": {
-      "behavior_r1_pro": {
-        "video": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "observation.images.rgb.head_256_256",
-            "observation.images.rgb.left_wrist_256_256",
-            "observation.images.rgb.right_wrist_256_256"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        },
-        "state": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "robot_pos",
-            "robot_ori_cos",
-            "robot_ori_sin",
-            "robot_2d_ori",
-            "robot_2d_ori_cos",
-            "robot_2d_ori_sin",
-            "robot_lin_vel",
-            "robot_ang_vel",
-            "arm_left_qpos",
-            "arm_left_qpos_sin",
-            "arm_left_qpos_cos",
-            "eef_left_pos",
-            "eef_left_quat",
-            "gripper_left_qpos",
-            "arm_right_qpos",
-            "arm_right_qpos_sin",
-            "arm_right_qpos_cos",
-            "eef_right_pos",
-            "eef_right_quat",
-            "gripper_right_qpos",
-            "trunk_qpos"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        },
-        "action": {
-          "delta_indices": [
-            0,
-            1,
-            2,
-            3,
-            4,
-            5,
-            6,
-            7,
-            8,
-            9,
-            10,
-            11,
-            12,
-            13,
-            14,
-            15,
-            16,
-            17,
-            18,
-            19,
-            20,
-            21,
-            22,
-            23,
-            24,
-            25,
-            26,
-            27,
-            28,
-            29,
-            30,
-            31
-          ],
-          "modality_keys": [
-            "base",
-            "torso",
-            "left_arm",
-            "left_gripper",
-            "right_arm",
-            "right_gripper"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": [
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "RELATIVE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": "trunk_qpos"
-            },
-            {
-              "rep": "RELATIVE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": "arm_left_qpos"
-            },
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "RELATIVE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": "arm_right_qpos"
-            },
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            }
-          ]
-        },
-        "language": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "annotation.human.coarse_action"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        }
-      },
-      "gr1": {
-        "video": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "ego_view_bg_crop_pad_res256_freq20"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        },
-        "state": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "left_arm",
-            "right_arm",
-            "left_hand",
-            "right_hand",
-            "waist"
-          ],
-          "sin_cos_embedding_keys": [
-            "left_arm",
-            "right_arm",
-            "left_hand",
-            "right_hand",
-            "waist"
-          ],
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        },
-        "action": {
-          "delta_indices": [
-            0,
-            1,
-            2,
-            3,
-            4,
-            5,
-            6,
-            7,
-            8,
-            9,
-            10,
-            11,
-            12,
-            13,
-            14,
-            15
-          ],
-          "modality_keys": [
-            "left_arm",
-            "right_arm",
-            "left_hand",
-            "right_hand",
-            "waist"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": [
-            {
-              "rep": "RELATIVE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "RELATIVE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "RELATIVE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "RELATIVE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            }
-          ]
-        },
-        "language": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "task"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        }
-      },
-      "robocasa_panda_omron": {
-        "video": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "res256_image_side_0",
-            "res256_image_side_1",
-            "res256_image_wrist_0"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        },
-        "state": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "end_effector_position_relative",
-            "end_effector_rotation_relative",
-            "gripper_qpos",
-            "base_position",
-            "base_rotation"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        },
-        "action": {
-          "delta_indices": [
-            0,
-            1,
-            2,
-            3,
-            4,
-            5,
-            6,
-            7,
-            8,
-            9,
-            10,
-            11,
-            12,
-            13,
-            14,
-            15
-          ],
-          "modality_keys": [
-            "end_effector_position",
-            "end_effector_rotation",
-            "gripper_close",
-            "base_motion",
-            "control_mode"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": [
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            }
-          ]
-        },
-        "language": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "annotation.human.action.task_description"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        }
-      },
-      "new_embodiment": {
-        "video": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "cam_base",
-            "cam_wrist"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        },
-        "state": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "arm",
-            "gripper"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        },
-        "action": {
-          "delta_indices": [
-            0,
-            1,
-            2,
-            3,
-            4,
-            5,
-            6,
-            7,
-            8,
-            9,
-            10,
-            11,
-            12,
-            13,
-            14,
-            15
-          ],
-          "modality_keys": [
-            "arm",
-            "gripper"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": [
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            }
-          ]
-        },
-        "language": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "annotation.human.task_description"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        }
-      }
-    },
-    "image_crop_size": null,
-    "image_target_size": null,
-    "use_albumentations": true,
-    "random_rotation_angle": null,
-    "color_jitter_params": {
-      "brightness": 0.3,
-      "contrast": 0.4,
-      "saturation": 0.5,
-      "hue": 0.08
-    },
-    "shortest_image_edge": 256,
-    "crop_fraction": 0.95,
-    "model_name": "nvidia/Eagle-Block2A-2B-v2",
-    "model_type": "eagle",
-    "formalize_language": true,
-    "max_state_dim": 128,
-    "max_action_dim": 128,
-    "max_action_horizon": 50,
-    "use_percentiles": false,
-    "clip_outliers": true,
-    "apply_sincos_state_encoding": true,
-    "use_relative_action": true
-  }
-}

checkpoint-15000/rng_state.pth DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:292427e64b7e1ca74d7fc55bdd4f7612064cd77b7dcb6cf568f0be95dfd5152b
-size 14645

checkpoint-15000/scheduler.pt DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:ee0ce25fd589eb0fbcffab63bcc2e2a86e5fb56630601b06b6bc1e425539b706
-size 1465

checkpoint-15000/statistics.json DELETED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-15000/trainer_state.json DELETED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-15000/training_args.bin DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:49cf1bb9160fba423ccdd2dae7d9b40228772dd15a3fb17d44a4fd07f7818f45
-size 5713

checkpoint-15000/wandb_config.json DELETED Viewed

	@@ -1 +0,0 @@
1	- {"project": "finetune-gr00t-n1d6", "run_id": "fr5_cherry"}

checkpoint-20000/config.json DELETED Viewed

@@ -1,70 +0,0 @@
-{
-  "action_horizon": 50,
-  "add_pos_embed": true,
-  "apply_sincos_state_encoding": true,
-  "architectures": [
-    "Gr00tN1d6"
-  ],
-  "attn_dropout": 0.2,
-  "attn_implementation": null,
-  "backbone_embedding_dim": 2048,
-  "backbone_model_type": "eagle",
-  "backbone_trainable_params_fp32": true,
-  "collator_overwrite_image_inputs": false,
-  "color_jitter_params": {
-    "brightness": 0.1,
-    "contrast": 0.1,
-    "hue": 0.1,
-    "saturation": 0.1
-  },
-  "crop_fraction": 0.95,
-  "diffusion_model_cfg": {
-    "attention_head_dim": 48,
-    "dropout": 0.2,
-    "final_dropout": true,
-    "interleave_self_attention": true,
-    "norm_type": "ada_norm",
-    "num_attention_heads": 32,
-    "num_layers": 32,
-    "output_dim": 1024,
-    "positional_embeddings": null
-  },
-  "eagle_collator": true,
-  "formalize_language": true,
-  "gemma_collator": false,
-  "hidden_size": 1024,
-  "image_crop_size": null,
-  "image_target_size": null,
-  "input_embedding_dim": 1536,
-  "load_bf16": true,
-  "max_action_dim": 128,
-  "max_num_embodiments": 32,
-  "max_seq_len": 1024,
-  "max_state_dim": 128,
-  "model_dtype": "bfloat16",
-  "model_name": "nvidia/Eagle-Block2A-2B-v2",
-  "model_type": "Gr00tN1d6",
-  "noise_beta_alpha": 1.5,
-  "noise_beta_beta": 1.0,
-  "noise_s": 0.999,
-  "num_inference_timesteps": 4,
-  "num_timestep_buckets": 1000,
-  "random_rotation_angle": null,
-  "reproject_vision": false,
-  "select_layer": 16,
-  "shortest_image_edge": 256,
-  "state_dropout_prob": 0.0,
-  "torch_dtype": "bfloat16",
-  "transformers_version": "4.51.3",
-  "tune_diffusion_model": true,
-  "tune_llm": false,
-  "tune_projector": true,
-  "tune_top_llm_layers": 4,
-  "tune_visual": false,
-  "tune_vlln": true,
-  "use_albumentations_transforms": true,
-  "use_alternate_vl_dit": true,
-  "use_flash_attention": true,
-  "use_relative_action": true,
-  "use_vlln": true
-}

checkpoint-20000/embodiment_id.json DELETED Viewed

@@ -1,11 +0,0 @@
-{
-  "robocasa_panda_omron": 13,
-  "gr1": 20,
-  "behavior_r1_pro": 24,
-  "unitree_g1": 8,
-  "oxe_google": 0,
-  "oxe_widowx": 1,
-  "libero_panda": 2,
-  "oxe_droid": 16,
-  "new_embodiment": 10
-}

checkpoint-20000/experiment_cfg/conf.yaml DELETED Viewed

@@ -1,206 +0,0 @@
-load_config_path: null
-model:
-  model_type: Gr00tN1d6
-  model_dtype: bfloat16
-  model_name: nvidia/Eagle-Block2A-2B-v2
-  backbone_model_type: eagle
-  model_revision: null
-  tune_top_llm_layers: 4
-  backbone_embedding_dim: 2048
-  tune_llm: false
-  tune_visual: false
-  select_layer: 16
-  reproject_vision: false
-  use_flash_attention: true
-  load_bf16: false
-  collator_overwrite_image_inputs: false
-  eagle_collator: true
-  backbone_trainable_params_fp32: true
-  image_crop_size: null
-  image_target_size: null
-  shortest_image_edge: 256
-  crop_fraction: 0.95
-  random_rotation_angle: null
-  color_jitter_params: null
-  use_albumentations_transforms: true
-  extra_augmentation_config: null
-  formalize_language: true
-  apply_sincos_state_encoding: false
-  use_relative_action: true
-  max_state_dim: 29
-  max_action_dim: 29
-  action_horizon: 16
-  hidden_size: 1024
-  input_embedding_dim: 1536
-  add_pos_embed: true
-  attn_dropout: 0.2
-  use_vlln: true
-  max_seq_len: 1024
-  use_alternate_vl_dit: true
-  attend_text_every_n_blocks: 2
-  diffusion_model_cfg:
-    positional_embeddings: null
-    num_layers: 32
-    num_attention_heads: 32
-    attention_head_dim: 48
-    norm_type: ada_norm
-    dropout: 0.2
-    final_dropout: true
-    output_dim: 1024
-    interleave_self_attention: true
-  num_inference_timesteps: 4
-  noise_beta_alpha: 1.5
-  noise_beta_beta: 1.0
-  noise_s: 0.999
-  num_timestep_buckets: 1000
-  tune_projector: true
-  tune_diffusion_model: true
-  tune_vlln: true
-  state_dropout_prob: 0.0
-  state_additive_noise_scale: 0.0
-  max_num_embodiments: 32
-data:
-  datasets:
-  - dataset_paths:
-    - ./cherry_data
-    embodiment_tag: new_embodiment
-    mix_ratio: 1.0
-    dataset_type: physical_embodiment
-    val_dataset_path: null
-  modality_configs:
-    new_embodiment:
-      video:
-        delta_indices:
-        - 0
-        modality_keys:
-        - cam_base
-        - cam_wrist
-        sin_cos_embedding_keys: null
-        mean_std_embedding_keys: null
-        action_configs: null
-      state:
-        delta_indices:
-        - 0
-        modality_keys:
-        - arm
-        - gripper
-        sin_cos_embedding_keys: null
-        mean_std_embedding_keys: null
-        action_configs: null
-      action:
-        delta_indices:
-        - 0
-        - 1
-        - 2
-        - 3
-        - 4
-        - 5
-        - 6
-        - 7
-        - 8
-        - 9
-        - 10
-        - 11
-        - 12
-        - 13
-        - 14
-        - 15
-        modality_keys:
-        - arm
-        - gripper
-        sin_cos_embedding_keys: null
-        mean_std_embedding_keys: null
-        action_configs:
-        - rep: ABSOLUTE
-          type: NON_EEF
-          format: DEFAULT
-          state_key: null
-        - rep: ABSOLUTE
-          type: NON_EEF
-          format: DEFAULT
-          state_key: null
-      language:
-        delta_indices:
-        - 0
-        modality_keys:
-        - annotation.human.task_description
-        sin_cos_embedding_keys: null
-        mean_std_embedding_keys: null
-        action_configs: null
-  download_cache: false
-  shard_size: 1024
-  episode_sampling_rate: 0.1
-  num_shards_per_epoch: 100000
-  override_pretraining_statistics: false
-  mode: single_turn
-  random_chop: 0.0
-  mock_dataset_mode: false
-  shuffle: true
-  seed: 42
-  multiprocessing_context: fork
-  allow_padding: false
-  subsample_ratio: 1.0
-  image_crop_size:
-  - 244
-  - 244
-  image_target_size:
-  - 224
-  - 224
-  video_backend: decord
-training:
-  output_dir: ./outputs/fr5_cherry
-  experiment_name: null
-  max_steps: 20000
-  global_batch_size: 32
-  batch_size: null
-  gradient_accumulation_steps: 1
-  learning_rate: 0.0001
-  lr_scheduler_type: cosine
-  weight_decay: 1.0e-05
-  warmup_ratio: 0.05
-  warmup_steps: 0
-  max_grad_norm: 1.0
-  optim: adamw_torch
-  start_from_checkpoint: ./pretrained_models/GR00T-N1.6-3B
-  tf32: true
-  fp16: false
-  bf16: true
-  eval_bf16: true
-  logging_steps: 10
-  save_steps: 5000
-  save_total_limit: 5
-  save_vl_model: false
-  upload_checkpoints: false
-  upload_every: 1000
-  upload_last_n_checkpoints: 5
-  max_concurrent_uploads: 2
-  eval_strategy: 'no'
-  eval_steps: 500
-  eval_set_split_ratio: 0.1
-  eval_batch_size: 2
-  save_best_eval_metric_name: ''
-  save_best_eval_metric_greater_is_better: true
-  deepspeed_stage: 2
-  gradient_checkpointing: false
-  transformers_trust_remote_code: true
-  transformers_local_files_only: false
-  transformers_cache_dir: null
-  transformers_access_token: null
-  use_ddp: false
-  ddp_bucket_cap_mb: 100
-  num_gpus: 1
-  dataloader_num_workers: 2
-  remove_unused_columns: false
-  use_wandb: false
-  wandb_project: finetune-gr00t-n1d6
-  enable_profiling: false
-  max_retries: 3
-  assert_loss_less_than: null
-  add_rl_callback: false
-  enable_open_loop_eval: false
-  open_loop_eval_traj_ids:
-  - 0
-  open_loop_eval_steps_per_traj: 100
-  open_loop_eval_plot_indices: null
-max_steps: 20000
-save_steps: 5000

checkpoint-20000/experiment_cfg/config.yaml DELETED Viewed

@@ -1,239 +0,0 @@
-!!python/object:gr00t.configs.base_config.Config
-data: !!python/object:gr00t.configs.data.data_config.DataConfig
-  allow_padding: false
-  datasets:
-  - !!python/object:gr00t.configs.data.data_config.SingleDatasetConfig
-    dataset_paths:
-    - ./cherry_data
-    dataset_type: physical_embodiment
-    embodiment_tag: new_embodiment
-    mix_ratio: 1.0
-    val_dataset_path: null
-  download_cache: false
-  episode_sampling_rate: 0.1
-  image_crop_size:
-  - 244
-  - 244
-  image_target_size:
-  - 224
-  - 224
-  mock_dataset_mode: false
-  modality_configs:
-    new_embodiment:
-      action: !!python/object:gr00t.data.types.ModalityConfig
-        action_configs:
-        - !!python/object:gr00t.data.types.ActionConfig
-          format: &id001 !!python/object/apply:gr00t.data.types.ActionFormat
-          - default
-          rep: &id002 !!python/object/apply:gr00t.data.types.ActionRepresentation
-          - absolute
-          state_key: null
-          type: &id003 !!python/object/apply:gr00t.data.types.ActionType
-          - non_eef
-        - !!python/object:gr00t.data.types.ActionConfig
-          format: *id001
-          rep: *id002
-          state_key: null
-          type: *id003
-        delta_indices:
-        - 0
-        - 1
-        - 2
-        - 3
-        - 4
-        - 5
-        - 6
-        - 7
-        - 8
-        - 9
-        - 10
-        - 11
-        - 12
-        - 13
-        - 14
-        - 15
-        mean_std_embedding_keys: null
-        modality_keys:
-        - arm
-        - gripper
-        sin_cos_embedding_keys: null
-      language: !!python/object:gr00t.data.types.ModalityConfig
-        action_configs: null
-        delta_indices:
-        - 0
-        mean_std_embedding_keys: null
-        modality_keys:
-        - annotation.human.task_description
-        sin_cos_embedding_keys: null
-      state: !!python/object:gr00t.data.types.ModalityConfig
-        action_configs: null
-        delta_indices:
-        - 0
-        mean_std_embedding_keys: null
-        modality_keys:
-        - arm
-        - gripper
-        sin_cos_embedding_keys: null
-      video: !!python/object:gr00t.data.types.ModalityConfig
-        action_configs: null
-        delta_indices:
-        - 0
-        mean_std_embedding_keys: null
-        modality_keys:
-        - cam_base
-        - cam_wrist
-        sin_cos_embedding_keys: null
-  mode: single_turn
-  multiprocessing_context: fork
-  num_shards_per_epoch: 100000
-  override_pretraining_statistics: false
-  random_chop: 0.0
-  seed: 42
-  shard_size: 1024
-  shuffle: true
-  subsample_ratio: 1.0
-  video_backend: decord
-load_config_path: null
-model: !!python/object:gr00t.configs.model.gr00t_n1d6.Gr00tN1d6Config
-  _attn_implementation_autoset: false
-  _attn_implementation_internal: null
-  _commit_hash: null
-  _name_or_path: ''
-  add_cross_attention: false
-  architectures: null
-  backbone_model_type: eagle
-  backbone_trainable_params_fp32: true
-  bad_words_ids: null
-  begin_suppress_tokens: null
-  bos_token_id: null
-  chunk_size_feed_forward: 0
-  color_jitter_params: null
-  cross_attention_hidden_size: null
-  decoder_start_token_id: null
-  diffusion_model_cfg:
-    attention_head_dim: 48
-    dropout: 0.2
-    final_dropout: true
-    interleave_self_attention: true
-    norm_type: ada_norm
-    num_attention_heads: 32
-    num_layers: 32
-    output_dim: 1024
-    positional_embeddings: null
-  diversity_penalty: 0.0
-  do_sample: false
-  eagle_collator: true
-  early_stopping: false
-  encoder_no_repeat_ngram_size: 0
-  eos_token_id: null
-  exponential_decay_length_penalty: null
-  extra_augmentation_config: null
-  finetuning_task: null
-  forced_bos_token_id: null
-  forced_eos_token_id: null
-  id2label:
-    0: LABEL_0
-    1: LABEL_1
-  is_decoder: false
-  is_encoder_decoder: false
-  label2id:
-    LABEL_0: 0
-    LABEL_1: 1
-  length_penalty: 1.0
-  load_bf16: false
-  max_length: 20
-  min_length: 0
-  model_name: nvidia/Eagle-Block2A-2B-v2
-  no_repeat_ngram_size: 0
-  num_beam_groups: 1
-  num_beams: 1
-  num_return_sequences: 1
-  output_attentions: false
-  output_hidden_states: false
-  output_scores: false
-  pad_token_id: null
-  prefix: null
-  problem_type: null
-  pruned_heads: {}
-  random_rotation_angle: null
-  remove_invalid_values: false
-  repetition_penalty: 1.0
-  reproject_vision: false
-  return_dict: true
-  return_dict_in_generate: false
-  sep_token_id: null
-  state_dropout_prob: 0.0
-  suppress_tokens: null
-  task_specific_params: null
-  temperature: 1.0
-  tf_legacy_loss: false
-  tie_encoder_decoder: false
-  tie_word_embeddings: true
-  tokenizer_class: null
-  top_k: 50
-  top_p: 1.0
-  torch_dtype: null
-  torchscript: false
-  transformers_version: null
-  tune_diffusion_model: true
-  tune_llm: false
-  tune_projector: true
-  tune_visual: false
-  typical_p: 1.0
-  use_bfloat16: false
-  use_relative_action: true
-training: !!python/object:gr00t.configs.training.training_config.TrainingConfig
-  add_rl_callback: false
-  assert_loss_less_than: null
-  batch_size: null
-  bf16: true
-  dataloader_num_workers: 2
-  ddp_bucket_cap_mb: 100
-  deepspeed_stage: 2
-  enable_open_loop_eval: false
-  enable_profiling: false
-  eval_batch_size: 2
-  eval_bf16: true
-  eval_set_split_ratio: 0.1
-  eval_steps: 500
-  eval_strategy: 'no'
-  experiment_name: null
-  fp16: false
-  global_batch_size: 32
-  gradient_accumulation_steps: 1
-  gradient_checkpointing: false
-  learning_rate: 0.0001
-  logging_steps: 10
-  lr_scheduler_type: cosine
-  max_concurrent_uploads: 2
-  max_grad_norm: 1.0
-  max_retries: 3
-  max_steps: 20000
-  num_gpus: 1
-  open_loop_eval_plot_indices: null
-  open_loop_eval_steps_per_traj: 100
-  open_loop_eval_traj_ids:
-  - 0
-  optim: adamw_torch
-  output_dir: ./outputs/fr5_cherry
-  remove_unused_columns: false
-  save_best_eval_metric_greater_is_better: true
-  save_best_eval_metric_name: ''
-  save_steps: 5000
-  save_total_limit: 5
-  save_vl_model: false
-  start_from_checkpoint: ./pretrained_models/GR00T-N1.6-3B
-  tf32: true
-  transformers_access_token: null
-  transformers_cache_dir: null
-  transformers_local_files_only: false
-  transformers_trust_remote_code: true
-  upload_checkpoints: false
-  upload_every: 1000
-  upload_last_n_checkpoints: 5
-  use_ddp: false
-  use_wandb: false
-  wandb_project: finetune-gr00t-n1d6
-  warmup_ratio: 0.05
-  warmup_steps: 0
-  weight_decay: 1.0e-05

checkpoint-20000/experiment_cfg/dataset_statistics.json DELETED Viewed

@@ -1,149 +0,0 @@
-{
-  "new_embodiment": {
-    "state": {
-      "arm": {
-        "min": [
-          0.4818978011608124,
-          -1.687173843383789,
-          0.62826007604599,
-          -2.6761701107025146,
-          -1.8431425094604492,
-          -0.5678880214691162
-        ],
-        "max": [
-          0.7935351133346558,
-          -1.014952301979065,
-          1.8637524843215942,
-          -1.0820374488830566,
-          -1.4455490112304688,
-          0.3115537762641907
-        ],
-        "mean": [
-          0.6489784717559814,
-          -1.3269319534301758,
-          1.356391429901123,
-          -1.804563045501709,
-          -1.619696021080017,
-          -0.07974076271057129
-        ],
-        "std": [
-          0.053538445383310186,
-          0.1604488044977188,
-          0.2438623011112213,
-          0.22075510025024414,
-          0.07333532720804177,
-          0.10092151165008545
-        ],
-        "q01": [
-          0.5197953635454178,
-          -1.6432996988296509,
-          0.8626433879137039,
-          -2.5542680168151857,
-          -1.8000394713878631,
-          -0.37301090329885483
-        ],
-        "q99": [
-          0.7509180748462676,
-          -1.0879072868824005,
-          1.7959050333499906,
-          -1.252977850437165,
-          -1.4705305182933812,
-          0.2933953133225437
-        ]
-      },
-      "gripper": {
-        "min": [
-          0.0
-        ],
-        "max": [
-          1.0
-        ],
-        "mean": [
-          0.7650123238563538
-        ],
-        "std": [
-          0.39907386898994446
-        ],
-        "q01": [
-          0.0
-        ],
-        "q99": [
-          1.0
-        ]
-      }
-    },
-    "action": {
-      "arm": {
-        "min": [
-          0.4818978011608124,
-          -1.687173843383789,
-          0.62826007604599,
-          -2.6573522090911865,
-          -1.8431425094604492,
-          -0.5678880214691162
-        ],
-        "max": [
-          0.7935351133346558,
-          -1.014952301979065,
-          1.8637524843215942,
-          -1.0820374488830566,
-          -1.4455490112304688,
-          0.3115537762641907
-        ],
-        "mean": [
-          0.6489997506141663,
-          -1.326717495918274,
-          1.355955958366394,
-          -1.8026670217514038,
-          -1.6199865341186523,
-          -0.07982920855283737
-        ],
-        "std": [
-          0.05358240380883204,
-          0.16021256148815155,
-          0.243374302983284,
-          0.2178075611591339,
-          0.07321629673242531,
-          0.10097639262676239
-        ],
-        "q01": [
-          0.5197953635454178,
-          -1.6432996988296509,
-          0.8625765931606293,
-          -2.53433034658432,
-          -1.8000823378562927,
-          -0.37301090329885483
-        ],
-        "q99": [
-          0.7509180748462676,
-          -1.0879072868824005,
-          1.7849992513656616,
-          -1.2526323044300085,
-          -1.4705633461475374,
-          0.2933953133225437
-        ]
-      },
-      "gripper": {
-        "min": [
-          0.0
-        ],
-        "max": [
-          1.0
-        ],
-        "mean": [
-          0.7650123238563538
-        ],
-        "std": [
-          0.39907386898994446
-        ],
-        "q01": [
-          0.0
-        ],
-        "q99": [
-          1.0
-        ]
-      }
-    },
-    "relative_action": {}
-  }
-}

checkpoint-20000/experiment_cfg/final_model_config.json DELETED Viewed

@@ -1,54 +0,0 @@
-{
-  "model_type": "Gr00tN1d6",
-  "model_dtype": "bfloat16",
-  "model_name": "nvidia/Eagle-Block2A-2B-v2",
-  "backbone_model_type": "eagle",
-  "model_revision": null,
-  "tune_top_llm_layers": 4,
-  "backbone_embedding_dim": 2048,
-  "tune_llm": false,
-  "tune_visual": false,
-  "select_layer": 16,
-  "reproject_vision": false,
-  "use_flash_attention": true,
-  "load_bf16": true,
-  "collator_overwrite_image_inputs": false,
-  "eagle_collator": true,
-  "backbone_trainable_params_fp32": true,
-  "extra_augmentation_config": null,
-  "apply_sincos_state_encoding": true,
-  "use_relative_action": true,
-  "max_state_dim": 128,
-  "max_action_dim": 128,
-  "action_horizon": 50,
-  "hidden_size": 1024,
-  "input_embedding_dim": 1536,
-  "add_pos_embed": true,
-  "attn_dropout": 0.2,
-  "use_vlln": true,
-  "max_seq_len": 1024,
-  "use_alternate_vl_dit": true,
-  "attend_text_every_n_blocks": 2,
-  "diffusion_model_cfg": {
-    "attention_head_dim": 48,
-    "dropout": 0.2,
-    "final_dropout": true,
-    "interleave_self_attention": true,
-    "norm_type": "ada_norm",
-    "num_attention_heads": 32,
-    "num_layers": 32,
-    "output_dim": 1024,
-    "positional_embeddings": null
-  },
-  "num_inference_timesteps": 4,
-  "noise_beta_alpha": 1.5,
-  "noise_beta_beta": 1.0,
-  "noise_s": 0.999,
-  "num_timestep_buckets": 1000,
-  "tune_projector": true,
-  "tune_diffusion_model": true,
-  "tune_vlln": true,
-  "state_dropout_prob": 0.0,
-  "state_additive_noise_scale": 0.0,
-  "max_num_embodiments": 32
-}

checkpoint-20000/experiment_cfg/final_processor_config.json DELETED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-20000/model-00001-of-00002.safetensors DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:e567773ecb7739580072e23d2cf32c20483faa087d934138f85f3e9f717ef54c
-size 4990120184

checkpoint-20000/model-00002-of-00002.safetensors DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:a82b8434c44a16ff46ed3ac65a9082e15ef327779100bf4e7ac0633f694dc1dc
-size 4823190320

checkpoint-20000/model.safetensors.index.json DELETED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-20000/optimizer.pt DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:a4808f6a3470dddc484424c6c3648b3b4b808e96ea886a0505ea84dcea913924
-size 12960193762

checkpoint-20000/processor_config.json DELETED Viewed

@@ -1,455 +0,0 @@
-{
-  "processor_class": "Gr00tN1d6Processor",
-  "processor_kwargs": {
-    "modality_configs": {
-      "behavior_r1_pro": {
-        "video": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "observation.images.rgb.head_256_256",
-            "observation.images.rgb.left_wrist_256_256",
-            "observation.images.rgb.right_wrist_256_256"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        },
-        "state": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "robot_pos",
-            "robot_ori_cos",
-            "robot_ori_sin",
-            "robot_2d_ori",
-            "robot_2d_ori_cos",
-            "robot_2d_ori_sin",
-            "robot_lin_vel",
-            "robot_ang_vel",
-            "arm_left_qpos",
-            "arm_left_qpos_sin",
-            "arm_left_qpos_cos",
-            "eef_left_pos",
-            "eef_left_quat",
-            "gripper_left_qpos",
-            "arm_right_qpos",
-            "arm_right_qpos_sin",
-            "arm_right_qpos_cos",
-            "eef_right_pos",
-            "eef_right_quat",
-            "gripper_right_qpos",
-            "trunk_qpos"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        },
-        "action": {
-          "delta_indices": [
-            0,
-            1,
-            2,
-            3,
-            4,
-            5,
-            6,
-            7,
-            8,
-            9,
-            10,
-            11,
-            12,
-            13,
-            14,
-            15,
-            16,
-            17,
-            18,
-            19,
-            20,
-            21,
-            22,
-            23,
-            24,
-            25,
-            26,
-            27,
-            28,
-            29,
-            30,
-            31
-          ],
-          "modality_keys": [
-            "base",
-            "torso",
-            "left_arm",
-            "left_gripper",
-            "right_arm",
-            "right_gripper"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": [
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "RELATIVE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": "trunk_qpos"
-            },
-            {
-              "rep": "RELATIVE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": "arm_left_qpos"
-            },
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "RELATIVE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": "arm_right_qpos"
-            },
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            }
-          ]
-        },
-        "language": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "annotation.human.coarse_action"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        }
-      },
-      "gr1": {
-        "video": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "ego_view_bg_crop_pad_res256_freq20"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        },
-        "state": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "left_arm",
-            "right_arm",
-            "left_hand",
-            "right_hand",
-            "waist"
-          ],
-          "sin_cos_embedding_keys": [
-            "left_arm",
-            "right_arm",
-            "left_hand",
-            "right_hand",
-            "waist"
-          ],
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        },
-        "action": {
-          "delta_indices": [
-            0,
-            1,
-            2,
-            3,
-            4,
-            5,
-            6,
-            7,
-            8,
-            9,
-            10,
-            11,
-            12,
-            13,
-            14,
-            15
-          ],
-          "modality_keys": [
-            "left_arm",
-            "right_arm",
-            "left_hand",
-            "right_hand",
-            "waist"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": [
-            {
-              "rep": "RELATIVE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "RELATIVE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "RELATIVE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "RELATIVE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            }
-          ]
-        },
-        "language": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "task"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        }
-      },
-      "robocasa_panda_omron": {
-        "video": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "res256_image_side_0",
-            "res256_image_side_1",
-            "res256_image_wrist_0"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        },
-        "state": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "end_effector_position_relative",
-            "end_effector_rotation_relative",
-            "gripper_qpos",
-            "base_position",
-            "base_rotation"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        },
-        "action": {
-          "delta_indices": [
-            0,
-            1,
-            2,
-            3,
-            4,
-            5,
-            6,
-            7,
-            8,
-            9,
-            10,
-            11,
-            12,
-            13,
-            14,
-            15
-          ],
-          "modality_keys": [
-            "end_effector_position",
-            "end_effector_rotation",
-            "gripper_close",
-            "base_motion",
-            "control_mode"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": [
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            }
-          ]
-        },
-        "language": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "annotation.human.action.task_description"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        }
-      },
-      "new_embodiment": {
-        "video": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "cam_base",
-            "cam_wrist"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        },
-        "state": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "arm",
-            "gripper"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        },
-        "action": {
-          "delta_indices": [
-            0,
-            1,
-            2,
-            3,
-            4,
-            5,
-            6,
-            7,
-            8,
-            9,
-            10,
-            11,
-            12,
-            13,
-            14,
-            15
-          ],
-          "modality_keys": [
-            "arm",
-            "gripper"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": [
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            },
-            {
-              "rep": "ABSOLUTE",
-              "type": "NON_EEF",
-              "format": "DEFAULT",
-              "state_key": null
-            }
-          ]
-        },
-        "language": {
-          "delta_indices": [
-            0
-          ],
-          "modality_keys": [
-            "annotation.human.task_description"
-          ],
-          "sin_cos_embedding_keys": null,
-          "mean_std_embedding_keys": null,
-          "action_configs": null
-        }
-      }
-    },
-    "image_crop_size": null,
-    "image_target_size": null,
-    "use_albumentations": true,
-    "random_rotation_angle": null,
-    "color_jitter_params": {
-      "brightness": 0.3,
-      "contrast": 0.4,
-      "saturation": 0.5,
-      "hue": 0.08
-    },
-    "shortest_image_edge": 256,
-    "crop_fraction": 0.95,
-    "model_name": "nvidia/Eagle-Block2A-2B-v2",
-    "model_type": "eagle",
-    "formalize_language": true,
-    "max_state_dim": 128,
-    "max_action_dim": 128,
-    "max_action_horizon": 50,
-    "use_percentiles": false,
-    "clip_outliers": true,
-    "apply_sincos_state_encoding": true,
-    "use_relative_action": true
-  }
-}

checkpoint-20000/rng_state.pth DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:675751298697509e109188026494482b1da89c72d7a1ba3abec2e498516d2755
-size 14645

checkpoint-20000/scheduler.pt DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:7fa802a80def971b73ec74284a6aa44d0b2ea101bd38ed41a3b1c1a0b4001f00
-size 1465