Upload folder using huggingface_hub
Browse files
checkpoint-10/optimizer.pt
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 558664971
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e8f737755e1707c54316203052f6ac69bc0a137a55a150363b1621beebab104d
|
| 3 |
size 558664971
|
checkpoint-10/pytorch_model.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 279336283
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:747ed44a38f676c73bc39fa8323ac7f34af0ad201fe4147bcfaaff3ea4362fcf
|
| 3 |
size 279336283
|
checkpoint-10/rng_state.pth
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c0a94dcd39eccd1603ad876bde99a39ec9194a931682980ebefe91dd918a3493
|
| 3 |
+
size 16359
|
checkpoint-10/trainer_state.json
CHANGED
|
@@ -1,7 +1,7 @@
|
|
| 1 |
{
|
| 2 |
"best_global_step": 10,
|
| 3 |
-
"best_metric":
|
| 4 |
-
"best_model_checkpoint": "/
|
| 5 |
"epoch": 0.00035457220863028757,
|
| 6 |
"eval_steps": 10,
|
| 7 |
"global_step": 10,
|
|
@@ -13,57 +13,57 @@
|
|
| 13 |
"comp/rl_weight": 0.03,
|
| 14 |
"comp/strictness": 0.0,
|
| 15 |
"epoch": 0.00035457220863028757,
|
| 16 |
-
"grad_norm":
|
| 17 |
-
"loss":
|
| 18 |
-
"loss_ce":
|
| 19 |
-
"loss_region": 0.
|
| 20 |
-
"loss_total":
|
| 21 |
"lr": 2.20454076850486e-05,
|
| 22 |
-
"router/selected_tokens_s0":
|
| 23 |
-
"router/selected_tokens_s1":
|
| 24 |
"step": 10,
|
| 25 |
"tokens_trained": 0.00409568
|
| 26 |
},
|
| 27 |
{
|
| 28 |
"epoch": 0.00035457220863028757,
|
| 29 |
-
"eval_ppl":
|
| 30 |
-
"eval_runtime":
|
| 31 |
"step": 10,
|
| 32 |
"tokens_trained": 0.00409568
|
| 33 |
},
|
| 34 |
{
|
| 35 |
"epoch": 0.00035457220863028757,
|
| 36 |
-
"eval_F":
|
| 37 |
-
"eval_F_cds":
|
| 38 |
-
"eval_F_dig":
|
| 39 |
-
"eval_F_exon":
|
| 40 |
-
"eval_F_intron":
|
| 41 |
-
"eval_F_nig":
|
| 42 |
-
"eval_F_promoter":
|
| 43 |
-
"eval_F_utr":
|
| 44 |
-
"eval_G": 0.
|
| 45 |
-
"eval_G_cds": 0.
|
| 46 |
-
"eval_G_dig": 0.
|
| 47 |
-
"eval_G_exon": 0.
|
| 48 |
-
"eval_G_intron": 0.
|
| 49 |
-
"eval_G_nig": 0.
|
| 50 |
-
"eval_G_promoter": 0.
|
| 51 |
-
"eval_G_utr": 0.
|
| 52 |
-
"eval_avg_bp_per_token":
|
| 53 |
-
"eval_bp_per_token/cds":
|
| 54 |
-
"eval_bp_per_token/dig":
|
| 55 |
-
"eval_bp_per_token/exon":
|
| 56 |
-
"eval_bp_per_token/intron":
|
| 57 |
-
"eval_bp_per_token/nig":
|
| 58 |
-
"eval_bp_per_token/promoter":
|
| 59 |
-
"eval_bp_per_token/utr":
|
| 60 |
-
"eval_ppl_cds":
|
| 61 |
-
"eval_ppl_dig":
|
| 62 |
-
"eval_ppl_exon":
|
| 63 |
-
"eval_ppl_intron":
|
| 64 |
-
"eval_ppl_nig":
|
| 65 |
-
"eval_ppl_promoter":
|
| 66 |
-
"eval_ppl_utr":
|
| 67 |
"step": 10,
|
| 68 |
"tokens_trained": 0.00409568
|
| 69 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"best_global_step": 10,
|
| 3 |
+
"best_metric": 9.153268951196861e+22,
|
| 4 |
+
"best_model_checkpoint": "/gpfs/scratch/guoh/DNAFM/output/gencode_human_12.8k_12800/CKPT_DEBUG/checkpoint-10",
|
| 5 |
"epoch": 0.00035457220863028757,
|
| 6 |
"eval_steps": 10,
|
| 7 |
"global_step": 10,
|
|
|
|
| 13 |
"comp/rl_weight": 0.03,
|
| 14 |
"comp/strictness": 0.0,
|
| 15 |
"epoch": 0.00035457220863028757,
|
| 16 |
+
"grad_norm": 1504.030029296875,
|
| 17 |
+
"loss": 87.8092,
|
| 18 |
+
"loss_ce": 59.68216323852539,
|
| 19 |
+
"loss_region": 0.0935576930642128,
|
| 20 |
+
"loss_total": 59.77572250366211,
|
| 21 |
"lr": 2.20454076850486e-05,
|
| 22 |
+
"router/selected_tokens_s0": 793.03125,
|
| 23 |
+
"router/selected_tokens_s1": 148.84375,
|
| 24 |
"step": 10,
|
| 25 |
"tokens_trained": 0.00409568
|
| 26 |
},
|
| 27 |
{
|
| 28 |
"epoch": 0.00035457220863028757,
|
| 29 |
+
"eval_ppl": 9.153268951196861e+22,
|
| 30 |
+
"eval_runtime": 4.9797,
|
| 31 |
"step": 10,
|
| 32 |
"tokens_trained": 0.00409568
|
| 33 |
},
|
| 34 |
{
|
| 35 |
"epoch": 0.00035457220863028757,
|
| 36 |
+
"eval_F": 0.00177827022776477,
|
| 37 |
+
"eval_F_cds": 0.003658417655291659,
|
| 38 |
+
"eval_F_dig": 0.0012045211865510327,
|
| 39 |
+
"eval_F_exon": 0.0016746678575415876,
|
| 40 |
+
"eval_F_intron": 0.001447564894073858,
|
| 41 |
+
"eval_F_nig": 0.0013862277187481856,
|
| 42 |
+
"eval_F_promoter": 0.0033154658131890054,
|
| 43 |
+
"eval_F_utr": 0.0016332169397963454,
|
| 44 |
+
"eval_G": 0.011702613646642867,
|
| 45 |
+
"eval_G_cds": 0.023833423264492,
|
| 46 |
+
"eval_G_dig": 0.009547610734562596,
|
| 47 |
+
"eval_G_exon": 0.01037959719586171,
|
| 48 |
+
"eval_G_intron": 0.008864032313383523,
|
| 49 |
+
"eval_G_nig": 0.008525809138569675,
|
| 50 |
+
"eval_G_promoter": 0.02530388628896865,
|
| 51 |
+
"eval_G_utr": 0.010295956315471365,
|
| 52 |
+
"eval_avg_bp_per_token": 562.3442288953848,
|
| 53 |
+
"eval_bp_per_token/cds": 273.34221902017293,
|
| 54 |
+
"eval_bp_per_token/dig": 830.2054054054054,
|
| 55 |
+
"eval_bp_per_token/exon": 597.1333333333333,
|
| 56 |
+
"eval_bp_per_token/intron": 690.8153161864243,
|
| 57 |
+
"eval_bp_per_token/nig": 721.3821989528795,
|
| 58 |
+
"eval_bp_per_token/promoter": 301.61674296926094,
|
| 59 |
+
"eval_bp_per_token/utr": 612.2885304659499,
|
| 60 |
+
"eval_ppl_cds": 6.414658338854343e+21,
|
| 61 |
+
"eval_ppl_dig": 4.0669318513627916e+21,
|
| 62 |
+
"eval_ppl_exon": 2.4904150523692485e+23,
|
| 63 |
+
"eval_ppl_intron": 1.535523404049312e+23,
|
| 64 |
+
"eval_ppl_nig": 7.19246164907062e+23,
|
| 65 |
+
"eval_ppl_promoter": 1.0487349115377585e+21,
|
| 66 |
+
"eval_ppl_utr": 3.14597976396868e+23,
|
| 67 |
"step": 10,
|
| 68 |
"tokens_trained": 0.00409568
|
| 69 |
}
|
checkpoint-10/training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 5969
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:faf9107e8232f8c02d0de570892b7fdd717781cc6eb0d429077eedff87e08462
|
| 3 |
size 5969
|