andyjzhao commited on
Commit
15ab5f5
·
verified ·
1 Parent(s): 3353078

Upload folder using huggingface_hub

Browse files
checkpoint-10/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c17840d339873628ec2a78a677ab2cbfbb5c03e76c940568a60226f2ea00041e
3
  size 558664971
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:14a29e212fc47cc100a5939f53c8bc3fa3c1a0212a2361c7ac7adc996862b4d8
3
  size 558664971
checkpoint-10/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:228064a54d4acf279d2af574895d2df9fe663db84d793900c7543edeb6586b58
3
  size 279336283
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7515af91c686d7f835331022de9decd37f02f6407e09e7741288c45b234df983
3
  size 279336283
checkpoint-10/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_global_step": 10,
3
- "best_metric": 1.698420053510286e+17,
4
  "best_model_checkpoint": "/network/scratch/j/jianan.zhao/DNAFM/output/gencode_human_12.8k_12800/CKPT_DEBUG/checkpoint-10",
5
- "epoch": 0.0014184397163120568,
6
  "eval_steps": 10,
7
  "global_step": 10,
8
  "is_hyper_param_search": false,
@@ -12,60 +12,60 @@
12
  {
13
  "comp/rl_weight": 0.03,
14
  "comp/strictness": 0.0,
15
- "epoch": 0.0014184397163120568,
16
- "grad_norm": 904.2174682617188,
17
- "loss": 144.6514,
18
- "loss_ce": 54.04480743408203,
19
- "loss_region": 0.1044125035405159,
20
- "loss_total": 54.14921951293945,
21
  "lr": 2.20454076850486e-05,
22
- "router/selected_tokens_s0": 22.09375,
23
  "router/selected_tokens_s1": 1.0,
24
  "step": 10,
25
- "tokens_trained": 0.01638272
26
  },
27
  {
28
- "epoch": 0.0014184397163120568,
29
- "eval_ppl": 1.698420053510286e+17,
30
- "eval_runtime": 1.7385,
31
  "step": 10,
32
- "tokens_trained": 0.01638272
33
  },
34
  {
35
- "epoch": 0.0014184397163120568,
36
  "eval_F": 7.813110399249941e-05,
37
- "eval_F_cds": 2.439649178448139e-05,
38
  "eval_F_dig": 7.813110399249941e-05,
39
- "eval_F_exon": 6.169412055031155e-05,
40
- "eval_F_intron": 8.631567698207511e-05,
41
- "eval_F_nig": 8.867784676802712e-05,
42
- "eval_F_promoter": 2.898993785611503e-05,
43
- "eval_F_utr": 0.00013418766144453016,
44
- "eval_G": 0.00021740636410105978,
45
- "eval_G_cds": 0.00017406325095451275,
46
- "eval_G_dig": 0.00015412581061020393,
47
- "eval_G_exon": 0.00024593300789684745,
48
- "eval_G_intron": 0.000209744205032615,
49
- "eval_G_nig": 0.0001933390126892979,
50
- "eval_G_promoter": 0.000290331756895652,
51
- "eval_G_utr": 0.0002710944576302459,
52
  "eval_avg_bp_per_token": 12799.0,
53
- "eval_bp_per_token/cds": 40989.5,
54
  "eval_bp_per_token/dig": 12799.0,
55
- "eval_bp_per_token/exon": 16209.0,
56
- "eval_bp_per_token/intron": 11585.380952380952,
57
- "eval_bp_per_token/nig": 11276.77358490566,
58
- "eval_bp_per_token/promoter": 34494.72727272727,
59
- "eval_bp_per_token/utr": 7452.25,
60
- "eval_ppl_cds": 2.889123597693874e+19,
61
- "eval_ppl_dig": 3.430802770811005e+17,
62
- "eval_ppl_exon": 4.6340490808362584e+16,
63
- "eval_ppl_intron": 9.889931203838952e+16,
64
- "eval_ppl_nig": 3.3020604346559384e+16,
65
- "eval_ppl_promoter": 7.55131215186589e+19,
66
- "eval_ppl_utr": 1.4233813097089611e+17,
67
  "step": 10,
68
- "tokens_trained": 0.01638272
69
  }
70
  ],
71
  "logging_steps": 10,
 
1
  {
2
  "best_global_step": 10,
3
+ "best_metric": 1.1411666197284078e+18,
4
  "best_model_checkpoint": "/network/scratch/j/jianan.zhao/DNAFM/output/gencode_human_12.8k_12800/CKPT_DEBUG/checkpoint-10",
5
+ "epoch": 0.00035457220863028757,
6
  "eval_steps": 10,
7
  "global_step": 10,
8
  "is_hyper_param_search": false,
 
12
  {
13
  "comp/rl_weight": 0.03,
14
  "comp/strictness": 0.0,
15
+ "epoch": 0.00035457220863028757,
16
+ "grad_norm": 1104.44580078125,
17
+ "loss": 146.6099,
18
+ "loss_ce": 54.38197326660156,
19
+ "loss_region": 0.10671775788068771,
20
+ "loss_total": 54.48868942260742,
21
  "lr": 2.20454076850486e-05,
22
+ "router/selected_tokens_s0": 22.71875,
23
  "router/selected_tokens_s1": 1.0,
24
  "step": 10,
25
+ "tokens_trained": 0.00409568
26
  },
27
  {
28
+ "epoch": 0.00035457220863028757,
29
+ "eval_ppl": 1.1411666197284078e+18,
30
+ "eval_runtime": 7.5718,
31
  "step": 10,
32
+ "tokens_trained": 0.00409568
33
  },
34
  {
35
+ "epoch": 0.00035457220863028757,
36
  "eval_F": 7.813110399249941e-05,
37
+ "eval_F_cds": 4.744345662481978e-05,
38
  "eval_F_dig": 7.813110399249941e-05,
39
+ "eval_F_exon": 6.977782739756614e-05,
40
+ "eval_F_intron": 8.580132276805985e-05,
41
+ "eval_F_nig": 8.365496566708533e-05,
42
+ "eval_F_promoter": 4.770454407466195e-05,
43
+ "eval_F_utr": 7.9026626119178e-05,
44
+ "eval_G": 0.00018249983824419877,
45
+ "eval_G_cds": 0.0001800133237040688,
46
+ "eval_G_dig": 0.00018303075842513738,
47
+ "eval_G_exon": 0.00019645910961166313,
48
+ "eval_G_intron": 0.00018081985788333596,
49
+ "eval_G_nig": 0.00017549950537569102,
50
+ "eval_G_promoter": 0.00019468167686080247,
51
+ "eval_G_utr": 0.00019923581984270775,
52
  "eval_avg_bp_per_token": 12799.0,
53
+ "eval_bp_per_token/cds": 21077.722222222223,
54
  "eval_bp_per_token/dig": 12799.0,
55
+ "eval_bp_per_token/exon": 14331.2,
56
+ "eval_bp_per_token/intron": 11654.831973898858,
57
+ "eval_bp_per_token/nig": 11953.86301369863,
58
+ "eval_bp_per_token/promoter": 20962.363636363636,
59
+ "eval_bp_per_token/utr": 12653.962962962964,
60
+ "eval_ppl_cds": 3.4552045457243275e+20,
61
+ "eval_ppl_dig": 1.0972195397037683e+17,
62
+ "eval_ppl_exon": 3.635291150333688e+18,
63
+ "eval_ppl_intron": 4.403435383603975e+17,
64
+ "eval_ppl_nig": 1.714937073151653e+17,
65
+ "eval_ppl_promoter": 2.442053915928566e+20,
66
+ "eval_ppl_utr": 6.521360367361032e+17,
67
  "step": 10,
68
+ "tokens_trained": 0.00409568
69
  }
70
  ],
71
  "logging_steps": 10,
checkpoint-10/training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:912c85f83733bc75ddebd721c1bb21205af4115ec87e6bbd7790ca686f00482a
3
  size 5969
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:41cc3ab09601671003ffee48a30ae9c578b1fa64cc5e7591626680344f1fa2b0
3
  size 5969