gyung committed on
Commit
4d33679
·
verified ·
1 Parent(s): 6480e48

Add files using upload-large-folder tool

Browse files
Files changed (23) hide show
  1. .gitattributes +9 -0
  2. stage2b-hrm-full-nocap-extra-epoch1-step350000/all_config.yaml +46 -0
  3. stage2b-hrm-full-nocap-extra-epoch1-step350000/carry_step_350000.0.pt +3 -0
  4. stage2b-hrm-full-nocap-extra-epoch1-step350000/carry_step_350000.1.pt +3 -0
  5. stage2b-hrm-full-nocap-extra-epoch1-step350000/carry_step_350000.2.pt +3 -0
  6. stage2b-hrm-full-nocap-extra-epoch1-step350000/carry_step_350000.3.pt +3 -0
  7. stage2b-hrm-full-nocap-extra-epoch1-step350000/carry_step_350000.4.pt +3 -0
  8. stage2b-hrm-full-nocap-extra-epoch1-step350000/carry_step_350000.5.pt +3 -0
  9. stage2b-hrm-full-nocap-extra-epoch1-step350000/carry_step_350000.6.pt +3 -0
  10. stage2b-hrm-full-nocap-extra-epoch1-step350000/carry_step_350000.7.pt +3 -0
  11. stage2b-hrm-full-nocap-extra-epoch1-step350000/fsdp2_step_350000/.metadata +3 -0
  12. stage2b-hrm-full-nocap-extra-epoch1-step350000/fsdp2_step_350000/__0_0.distcp +3 -0
  13. stage2b-hrm-full-nocap-extra-epoch1-step350000/fsdp2_step_350000/__1_0.distcp +3 -0
  14. stage2b-hrm-full-nocap-extra-epoch1-step350000/fsdp2_step_350000/__2_0.distcp +3 -0
  15. stage2b-hrm-full-nocap-extra-epoch1-step350000/fsdp2_step_350000/__3_0.distcp +3 -0
  16. stage2b-hrm-full-nocap-extra-epoch1-step350000/fsdp2_step_350000/__4_0.distcp +3 -0
  17. stage2b-hrm-full-nocap-extra-epoch1-step350000/fsdp2_step_350000/__5_0.distcp +3 -0
  18. stage2b-hrm-full-nocap-extra-epoch1-step350000/fsdp2_step_350000/__6_0.distcp +3 -0
  19. stage2b-hrm-full-nocap-extra-epoch1-step350000/fsdp2_step_350000/__7_0.distcp +3 -0
  20. stage2b-hrm-full-nocap-extra-epoch1-step350000/latest_checkpoint.txt +1 -0
  21. stage2b-hrm-full-nocap-extra-epoch1-step350000/step_350000_info.json +8 -0
  22. stage2b-hrm-full-nocap-extra-epoch1-step350000/train_metadata.yaml +13 -0
  23. stage2b-hrm-full-nocap-extra-epoch1-step350000/upload_manifest.json +1 -0
.gitattributes CHANGED
@@ -438,3 +438,12 @@ stage2b-hrm-full-nocap-extra-epoch1-step340000/fsdp2_step_340000/__5_0.distcp fi
438
  stage2b-hrm-full-nocap-extra-epoch1-step340000/fsdp2_step_340000/__4_0.distcp filter=lfs diff=lfs merge=lfs -text
439
  stage2b-hrm-full-nocap-extra-epoch1-step340000/fsdp2_step_340000/__7_0.distcp filter=lfs diff=lfs merge=lfs -text
440
  stage2b-hrm-full-nocap-extra-epoch1-step340000/fsdp2_step_340000/__6_0.distcp filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
438
  stage2b-hrm-full-nocap-extra-epoch1-step340000/fsdp2_step_340000/__4_0.distcp filter=lfs diff=lfs merge=lfs -text
439
  stage2b-hrm-full-nocap-extra-epoch1-step340000/fsdp2_step_340000/__7_0.distcp filter=lfs diff=lfs merge=lfs -text
440
  stage2b-hrm-full-nocap-extra-epoch1-step340000/fsdp2_step_340000/__6_0.distcp filter=lfs diff=lfs merge=lfs -text
441
+ stage2b-hrm-full-nocap-extra-epoch1-step350000/fsdp2_step_350000/__0_0.distcp filter=lfs diff=lfs merge=lfs -text
442
+ stage2b-hrm-full-nocap-extra-epoch1-step350000/fsdp2_step_350000/__1_0.distcp filter=lfs diff=lfs merge=lfs -text
443
+ stage2b-hrm-full-nocap-extra-epoch1-step350000/fsdp2_step_350000/__7_0.distcp filter=lfs diff=lfs merge=lfs -text
444
+ stage2b-hrm-full-nocap-extra-epoch1-step350000/fsdp2_step_350000/.metadata filter=lfs diff=lfs merge=lfs -text
445
+ stage2b-hrm-full-nocap-extra-epoch1-step350000/fsdp2_step_350000/__4_0.distcp filter=lfs diff=lfs merge=lfs -text
446
+ stage2b-hrm-full-nocap-extra-epoch1-step350000/fsdp2_step_350000/__3_0.distcp filter=lfs diff=lfs merge=lfs -text
447
+ stage2b-hrm-full-nocap-extra-epoch1-step350000/fsdp2_step_350000/__2_0.distcp filter=lfs diff=lfs merge=lfs -text
448
+ stage2b-hrm-full-nocap-extra-epoch1-step350000/fsdp2_step_350000/__5_0.distcp filter=lfs diff=lfs merge=lfs -text
449
+ stage2b-hrm-full-nocap-extra-epoch1-step350000/fsdp2_step_350000/__6_0.distcp filter=lfs diff=lfs merge=lfs -text
stage2b-hrm-full-nocap-extra-epoch1-step350000/all_config.yaml ADDED
@@ -0,0 +1,46 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ arch:
2
+ H_cycles: 2
3
+ H_override: {}
4
+ L_cycles: 3
5
+ bp_max_steps: 5
6
+ bp_warmup_ratio: 0.2
7
+ expansion: 4
8
+ half_layers: true
9
+ head: lm_head@LMHead
10
+ hidden_size: 1536
11
+ init_type: lecun_normal
12
+ n_layers: 32
13
+ name: baselines.hrm_nocarry_bp_warmup@HierarchicalReasoningModel
14
+ norm_eps: 1.0e-06
15
+ norm_type: pre
16
+ num_heads: 12
17
+ pos_emb_type: rope
18
+ rope_theta: 10000.0
19
+ beta1: 0.9
20
+ beta2: 0.95
21
+ checkpoint_interval: 1
22
+ checkpoint_keep_last: 2
23
+ checkpoint_path: /home/work/.data/hrm_text_checkpoints/KoHRM-Text-1.4B-stage2b-hrm-full-nocap-extra-epoch1-gbs180
24
+ checkpoint_step_interval: 10000
25
+ data:
26
+ path: /home/work/.data/hrm_text_prepared/koterm_hrm_cleaned_full_nocap_extra_epochs_1_3_v1
27
+ target_only: true
28
+ ema: 0.9999
29
+ epochs: 1
30
+ fwd_bwd_dtype: bfloat16
31
+ global_batch_size: 180224
32
+ log_interval: 5
33
+ lr: 0.00022
34
+ lr_min_ratio: 1.0
35
+ lr_warmup_steps: 2000
36
+ project_name: KoHRM-Text
37
+ resume_epoch: null
38
+ resume_from: /home/work/.data/hrm_text_checkpoints/KoHRM-Text-1.4B-stage1b-hrm-fastcap-repeat-gbs180
39
+ resume_step: null
40
+ resume_step_offset: 317814
41
+ run_name: KoHRM-Text-1.4B-stage2b-hrm-full-nocap-extra-epoch1
42
+ seed: 0
43
+ skip_batches: 0
44
+ total_steps_override: 465000
45
+ weight_decay: 0.1
46
+ weights_only_resume_from_ema: false
stage2b-hrm-full-nocap-extra-epoch1-step350000/carry_step_350000.0.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7299bc96e73980dd4a0640f3d60582e6a025c99d3a5fce58c000bde11db71674
3
+ size 1333
stage2b-hrm-full-nocap-extra-epoch1-step350000/carry_step_350000.1.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f5df4f59854bd81b2f0fc070e1edbfbbeeb982bfdb481f5741895de443b1ecf
3
+ size 1333
stage2b-hrm-full-nocap-extra-epoch1-step350000/carry_step_350000.2.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df48d21428d85ead3bea3c5620bfd6b194d5c51b6d1e5e45062776c333ac38ff
3
+ size 1333
stage2b-hrm-full-nocap-extra-epoch1-step350000/carry_step_350000.3.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3898e9f1c8883c913244d9ca230b1c516a468f66c02040562e0c88c9a9ba80e5
3
+ size 1333
stage2b-hrm-full-nocap-extra-epoch1-step350000/carry_step_350000.4.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a682c70123ac24dbee9067857da700cd30226518a7bc63b530d1aca76c8a9013
3
+ size 1333
stage2b-hrm-full-nocap-extra-epoch1-step350000/carry_step_350000.5.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:697dba7246e640fc8fc77274cc3e9a12a408c4f4b04a9efe5fadb746016e5112
3
+ size 1333
stage2b-hrm-full-nocap-extra-epoch1-step350000/carry_step_350000.6.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4abfddc2b5dcba51602dcd3927451bd62a06bea99decc4c573d127ff62735c1
3
+ size 1333
stage2b-hrm-full-nocap-extra-epoch1-step350000/carry_step_350000.7.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8c2c6796a82591ae6621a4c870ef6981a076865196f0fe099c4151c97578dfed
3
+ size 1333
stage2b-hrm-full-nocap-extra-epoch1-step350000/fsdp2_step_350000/.metadata ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a69f8b9a973145921d18913023e3ed7c8d7f169eac61dbb4e6351aeb89f50b3e
3
+ size 983820
stage2b-hrm-full-nocap-extra-epoch1-step350000/fsdp2_step_350000/__0_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cea5a7278a5101f04d093df05d6504e96b76f6b4a3087b7e9f733e72fbff456a
3
+ size 2769065329
stage2b-hrm-full-nocap-extra-epoch1-step350000/fsdp2_step_350000/__1_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7e87ca0f0a20dddb9823f78a9de8f905f126a75cb5bab3bc9232473d74876e6f
3
+ size 2769090643
stage2b-hrm-full-nocap-extra-epoch1-step350000/fsdp2_step_350000/__2_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6ece4e62d49599fca89d1370806b8ead450b58d75de68b1bc1aecc1ad4a18c2
3
+ size 2769090643
stage2b-hrm-full-nocap-extra-epoch1-step350000/fsdp2_step_350000/__3_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:20176e96bffc984c71189b0603aaba4b854a7d26a8fe51459492966acf7b38a5
3
+ size 2769090643
stage2b-hrm-full-nocap-extra-epoch1-step350000/fsdp2_step_350000/__4_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a9d5bd360daab8f2d21d13aef37d16efc986d090d324a85e4a1371375b898cfa
3
+ size 2769090643
stage2b-hrm-full-nocap-extra-epoch1-step350000/fsdp2_step_350000/__5_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39ac4f3052fbc6142ba00ce497882982d3edff7b2914ad7da933cbad7b6f3691
3
+ size 2769090643
stage2b-hrm-full-nocap-extra-epoch1-step350000/fsdp2_step_350000/__6_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b24f37048f61feac88eb6288febd6eaf6d19294ea75349b2126b91d22b48437c
3
+ size 2769091588
stage2b-hrm-full-nocap-extra-epoch1-step350000/fsdp2_step_350000/__7_0.distcp ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a025454944fbc460bece2cb85822d809a9b316516f9d5ddaab50e95b6dacb22a
3
+ size 2769098756
stage2b-hrm-full-nocap-extra-epoch1-step350000/latest_checkpoint.txt ADDED
@@ -0,0 +1 @@
 
 
1
+ step_350000
stage2b-hrm-full-nocap-extra-epoch1-step350000/step_350000_info.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "tag": "step_350000",
3
+ "global_step": 350000,
4
+ "stage_start_step": 317814,
5
+ "skip_batches_hint": 32186,
6
+ "data_path": "/home/work/.data/hrm_text_prepared/koterm_hrm_cleaned_full_nocap_extra_epochs_1_3_v1",
7
+ "global_batch_size": 180224
8
+ }
stage2b-hrm-full-nocap-extra-epoch1-step350000/train_metadata.yaml ADDED
@@ -0,0 +1,13 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ max_seq_len: 4096
2
+ tokenizer_info:
3
+ boq: <|im_start|>
4
+ condition_mapping:
5
+ cot: <|object_ref_end|>
6
+ direct: <|object_ref_start|>
7
+ noisy: <|quad_start|>
8
+ synth: <|quad_end|>
9
+ eoa: <|box_end|>
10
+ eoq: <|im_end|>
11
+ tokenizer_path: /home/work/.data/huggingface/trained_tokenizers/hrm-ko-terminal-131k-v1/tokenizer.json
12
+ total_length: 14553638506
13
+ vocab_size: 131072
stage2b-hrm-full-nocap-extra-epoch1-step350000/upload_manifest.json ADDED
@@ -0,0 +1 @@
 
 
1
+ stage2b-hrm-full-nocap-extra-epoch1 step_350000 raw resume checkpoint