Robometer-4B-LIBERO-No-Fail

aliangdw committed on Feb 16

Commit

cf7160c

verified ·

1 Parent(s): d022de6

Update config.yaml

Files changed (1)

config.yaml CHANGED Viewed

@@ -18,8 +18,6 @@ custom_eval:
   reward_alignment:
   - libero_pi0_no_fail
   reward_alignment_max_trajectories: 10
-  similarity_score:
-  - aliangdw_metaworld_metaworld_eval
   subsample_n_frames: null
   use_frame_steps: true
 data:
@@ -46,8 +44,6 @@ data:
   max_trajectories: -1
   min_frames_per_trajectory: 1
   min_success: 0.5
-  n_wrong_tasks: 5
-  num_bins: 10
   partial_success_threshold: 0.2
   predict_last_frame_partial_progress: false
   preference_strategy_ratio:
@@ -72,14 +68,9 @@ data:
   seed: 42
   shuffle: true
   shuffle_progress_frames: false
-  similarity_strategy_ratio:
-  - 1.0
-  - 1.0
-  - 1.0
   train_datasets:
   - libero_pi0_no_fail
   traj_same_source_prob: 0.5
-  use_data_source_balance: false
   use_multi_image: true
   use_per_frame_progress_token: true
 debug: false
@@ -131,7 +122,6 @@ model:
   train_language_model: true
   train_preference_head: true
   train_progress_head: true
-  train_similarity_head: false
   train_success_head: false
   train_vision_encoder: false
   trust_remote_code: true
@@ -183,8 +173,6 @@ training:
   per_device_eval_batch_size: 64
   per_device_train_batch_size: 64
   predict_pref_progress: true
-  predict_pref_sim: false
-  predict_sim_progress: false
   prediction_loss_only: true
   remove_unused_columns: false
   resume_from_checkpoint: null

   reward_alignment:
   - libero_pi0_no_fail
   reward_alignment_max_trajectories: 10
   subsample_n_frames: null
   use_frame_steps: true
 data:
   max_trajectories: -1
   min_frames_per_trajectory: 1
   min_success: 0.5
   partial_success_threshold: 0.2
   predict_last_frame_partial_progress: false
   preference_strategy_ratio:
   seed: 42
   shuffle: true
   shuffle_progress_frames: false
   train_datasets:
   - libero_pi0_no_fail
   traj_same_source_prob: 0.5
   use_multi_image: true
   use_per_frame_progress_token: true
 debug: false
   train_language_model: true
   train_preference_head: true
   train_progress_head: true
   train_success_head: false
   train_vision_encoder: false
   trust_remote_code: true
   per_device_eval_batch_size: 64
   per_device_train_batch_size: 64
   predict_pref_progress: true
   prediction_loss_only: true
   remove_unused_columns: false
   resume_from_checkpoint: null