aliangdw committed on
Commit
45d0131
·
verified ·
1 Parent(s): cbb9b12

Upload config.yaml with huggingface_hub

Browse files
Files changed (1) hide show
  1. config.yaml +6 -6
config.yaml CHANGED
@@ -10,12 +10,12 @@ custom_eval:
10
  num_examples_per_quality_pr: 5
11
  num_partial_successes: 5
12
  policy_ranking:
13
- - libero
14
  policy_ranking_max_tasks: 100
15
  quality_preference:
16
  - mw
17
  reward_alignment:
18
- - libero
19
  reward_alignment_max_trajectories: 10
20
  similarity_score:
21
  - aliangdw_metaworld_metaworld_eval
@@ -34,7 +34,7 @@ data:
34
  dataset_success_cutoff_file: rfm/data/dataset_success_cutoff.txt
35
  dataset_type: rfm
36
  eval_datasets:
37
- - libero
38
  eval_subset_size: null
39
  fps: 10
40
  load_embeddings: false
@@ -74,7 +74,7 @@ data:
74
  - 1.0
75
  - 1.0
76
  train_datasets:
77
- - libero
78
  traj_same_source_prob: 0.5
79
  use_data_source_balance: true
80
  use_multi_image: true
@@ -100,7 +100,7 @@ logging:
100
  save_processor: true
101
  wandb_entity: clvr
102
  wandb_mode: null
103
- wandb_notes: libero prog_pref_fail only
104
  wandb_project: rfm
105
  loss:
106
  predict_last_frame_progress: false
@@ -157,7 +157,7 @@ training:
157
  do_eval: true
158
  eval_steps: 500
159
  evaluation_strategy: steps
160
- exp_name: libero_90_prog_pref_4frames_fixdata
161
  fp16: false
162
  gradient_accumulation_steps: 1
163
  gradient_checkpointing: true
 
10
  num_examples_per_quality_pr: 5
11
  num_partial_successes: 5
12
  policy_ranking:
13
+ - libero_pi0_no_fail
14
  policy_ranking_max_tasks: 100
15
  quality_preference:
16
  - mw
17
  reward_alignment:
18
+ - libero_pi0_no_fail
19
  reward_alignment_max_trajectories: 10
20
  similarity_score:
21
  - aliangdw_metaworld_metaworld_eval
 
34
  dataset_success_cutoff_file: rfm/data/dataset_success_cutoff.txt
35
  dataset_type: rfm
36
  eval_datasets:
37
+ - libero_pi0_no_fail
38
  eval_subset_size: null
39
  fps: 10
40
  load_embeddings: false
 
74
  - 1.0
75
  - 1.0
76
  train_datasets:
77
+ - libero_pi0_no_fail
78
  traj_same_source_prob: 0.5
79
  use_data_source_balance: true
80
  use_multi_image: true
 
100
  save_processor: true
101
  wandb_entity: clvr
102
  wandb_mode: null
103
+ wandb_notes: libero prog only
104
  wandb_project: rfm
105
  loss:
106
  predict_last_frame_progress: false
 
157
  do_eval: true
158
  eval_steps: 500
159
  evaluation_strategy: steps
160
+ exp_name: libero_ablation_prog_pref_4frames_fixeddata
161
  fp16: false
162
  gradient_accumulation_steps: 1
163
  gradient_checkpointing: true