Upload config.yaml with huggingface_hub
Browse files
- config.yaml +6 -6
config.yaml
CHANGED
|
@@ -10,12 +10,12 @@ custom_eval:
|
|
| 10 |
num_examples_per_quality_pr: 5
|
| 11 |
num_partial_successes: 5
|
| 12 |
policy_ranking:
|
| 13 |
-
-
|
| 14 |
policy_ranking_max_tasks: 100
|
| 15 |
quality_preference:
|
| 16 |
- mw
|
| 17 |
reward_alignment:
|
| 18 |
-
-
|
| 19 |
reward_alignment_max_trajectories: 10
|
| 20 |
similarity_score:
|
| 21 |
- aliangdw_metaworld_metaworld_eval
|
|
@@ -34,7 +34,7 @@ data:
|
|
| 34 |
dataset_success_cutoff_file: rfm/data/dataset_success_cutoff.txt
|
| 35 |
dataset_type: rfm
|
| 36 |
eval_datasets:
|
| 37 |
-
-
|
| 38 |
eval_subset_size: null
|
| 39 |
fps: 10
|
| 40 |
load_embeddings: false
|
|
@@ -74,7 +74,7 @@ data:
|
|
| 74 |
- 1.0
|
| 75 |
- 1.0
|
| 76 |
train_datasets:
|
| 77 |
-
-
|
| 78 |
traj_same_source_prob: 0.5
|
| 79 |
use_data_source_balance: true
|
| 80 |
use_multi_image: true
|
|
@@ -100,7 +100,7 @@ logging:
|
|
| 100 |
save_processor: true
|
| 101 |
wandb_entity: clvr
|
| 102 |
wandb_mode: null
|
| 103 |
-
wandb_notes: libero
|
| 104 |
wandb_project: rfm
|
| 105 |
loss:
|
| 106 |
predict_last_frame_progress: false
|
|
@@ -157,7 +157,7 @@ training:
|
|
| 157 |
do_eval: true
|
| 158 |
eval_steps: 500
|
| 159 |
evaluation_strategy: steps
|
| 160 |
-
exp_name:
|
| 161 |
fp16: false
|
| 162 |
gradient_accumulation_steps: 1
|
| 163 |
gradient_checkpointing: true
|
|
|
|
| 10 |
num_examples_per_quality_pr: 5
|
| 11 |
num_partial_successes: 5
|
| 12 |
policy_ranking:
|
| 13 |
+
- libero_pi0_no_fail
|
| 14 |
policy_ranking_max_tasks: 100
|
| 15 |
quality_preference:
|
| 16 |
- mw
|
| 17 |
reward_alignment:
|
| 18 |
+
- libero_pi0_no_fail
|
| 19 |
reward_alignment_max_trajectories: 10
|
| 20 |
similarity_score:
|
| 21 |
- aliangdw_metaworld_metaworld_eval
|
|
|
|
| 34 |
dataset_success_cutoff_file: rfm/data/dataset_success_cutoff.txt
|
| 35 |
dataset_type: rfm
|
| 36 |
eval_datasets:
|
| 37 |
+
- libero_pi0_no_fail
|
| 38 |
eval_subset_size: null
|
| 39 |
fps: 10
|
| 40 |
load_embeddings: false
|
|
|
|
| 74 |
- 1.0
|
| 75 |
- 1.0
|
| 76 |
train_datasets:
|
| 77 |
+
- libero_pi0_no_fail
|
| 78 |
traj_same_source_prob: 0.5
|
| 79 |
use_data_source_balance: true
|
| 80 |
use_multi_image: true
|
|
|
|
| 100 |
save_processor: true
|
| 101 |
wandb_entity: clvr
|
| 102 |
wandb_mode: null
|
| 103 |
+
wandb_notes: libero prog only
|
| 104 |
wandb_project: rfm
|
| 105 |
loss:
|
| 106 |
predict_last_frame_progress: false
|
|
|
|
| 157 |
do_eval: true
|
| 158 |
eval_steps: 500
|
| 159 |
evaluation_strategy: steps
|
| 160 |
+
exp_name: libero_ablation_prog_pref_4frames_fixeddata
|
| 161 |
fp16: false
|
| 162 |
gradient_accumulation_steps: 1
|
| 163 |
gradient_checkpointing: true
|