msj19 committed on
Commit
bf12bef
·
verified ·
1 Parent(s): 92a859c

Add files using upload-large-folder tool

Browse files
Files changed (15) hide show
  1. .gitattributes +11 -0
  2. retnet-1.3B-100B/based_fda/ checkpoint_name____mnt__jfzn__msj__retnet-1.3B-100B_based_fda.jsonl +3 -0
  3. retnet-1.3B-100B/based_nq_2048/ checkpoint_name____mnt__jfzn__msj__download_model__retnet-1.3B-100B_based_nq_2048.jsonl +3 -0
  4. retnet-1.3B-100B/based_nq_2048/ checkpoint_name____mnt__jfzn__msj__retnet-1.3B-100B_based_nq_2048.jsonl +3 -0
  5. retnet-1.3B-100B/based_squad/ checkpoint_name____mnt__jfzn__msj__download_model__retnet-1.3B-100B_based_squad.jsonl +3 -0
  6. retnet-1.3B-100B/based_squad/ checkpoint_name____mnt__jfzn__msj__retnet-1.3B-100B_based_squad.jsonl +3 -0
  7. transformer-1.3B-100B/based_fda/ checkpoint_name____mnt__jfzn__msj__download_model__transformer-1.3B-100B_based_fda.jsonl +3 -0
  8. transformer-1.3B-100B/based_fda/ checkpoint_name____mnt__jfzn__msj__transformer-1.3B-100B_based_fda.jsonl +3 -0
  9. transformer-1.3B-100B/based_nq_2048/ checkpoint_name____mnt__jfzn__msj__download_model__transformer-1.3B-100B_based_nq_2048.jsonl +3 -0
  10. transformer-1.3B-100B/based_nq_2048/ checkpoint_name____mnt__jfzn__msj__transformer-1.3B-100B_based_nq_2048.jsonl +3 -0
  11. transformer-1.3B-100B/based_squad/ checkpoint_name____mnt__jfzn__msj__download_model__transformer-1.3B-100B_based_squad.jsonl +3 -0
  12. transformer-1.3B-100B/based_squad/ checkpoint_name____mnt__jfzn__msj__transformer-1.3B-100B_based_squad.jsonl +3 -0
  13. transformer-1.3B-100B/based_swde/ checkpoint_name____mnt__jfzn__msj__transformer-1.3B-100B_based_swde.jsonl +0 -0
  14. transformer-1.3B-100B/based_triviaqa/ checkpoint_name____mnt__jfzn__msj__transformer-1.3B-100B_based_triviaqa.jsonl +0 -0
  15. transformer-1.3B-100B/based_triviaqa/results.json +55 -0
.gitattributes CHANGED
@@ -49,3 +49,14 @@ hgrn2-1.3B-100B/based_fda/[[:space:]]checkpoint_name____mnt__jfzn__msj__download
49
  hgrn2-1.3B-100B/based_nq_2048/[[:space:]]checkpoint_name____mnt__jfzn__msj__download_model__hgrn2-1.3B-100B_based_nq_2048.jsonl filter=lfs diff=lfs merge=lfs -text
50
  hgrn2-1.3B-100B/based_squad/[[:space:]]checkpoint_name____mnt__jfzn__msj__download_model__hgrn2-1.3B-100B_based_squad.jsonl filter=lfs diff=lfs merge=lfs -text
51
  retnet-1.3B-100B/based_fda/[[:space:]]checkpoint_name____mnt__jfzn__msj__download_model__retnet-1.3B-100B_based_fda.jsonl filter=lfs diff=lfs merge=lfs -text
 
 
 
 
 
 
 
 
 
 
 
 
49
  hgrn2-1.3B-100B/based_nq_2048/[[:space:]]checkpoint_name____mnt__jfzn__msj__download_model__hgrn2-1.3B-100B_based_nq_2048.jsonl filter=lfs diff=lfs merge=lfs -text
50
  hgrn2-1.3B-100B/based_squad/[[:space:]]checkpoint_name____mnt__jfzn__msj__download_model__hgrn2-1.3B-100B_based_squad.jsonl filter=lfs diff=lfs merge=lfs -text
51
  retnet-1.3B-100B/based_fda/[[:space:]]checkpoint_name____mnt__jfzn__msj__download_model__retnet-1.3B-100B_based_fda.jsonl filter=lfs diff=lfs merge=lfs -text
52
+ retnet-1.3B-100B/based_fda/[[:space:]]checkpoint_name____mnt__jfzn__msj__retnet-1.3B-100B_based_fda.jsonl filter=lfs diff=lfs merge=lfs -text
53
+ retnet-1.3B-100B/based_nq_2048/[[:space:]]checkpoint_name____mnt__jfzn__msj__download_model__retnet-1.3B-100B_based_nq_2048.jsonl filter=lfs diff=lfs merge=lfs -text
54
+ retnet-1.3B-100B/based_nq_2048/[[:space:]]checkpoint_name____mnt__jfzn__msj__retnet-1.3B-100B_based_nq_2048.jsonl filter=lfs diff=lfs merge=lfs -text
55
+ retnet-1.3B-100B/based_squad/[[:space:]]checkpoint_name____mnt__jfzn__msj__download_model__retnet-1.3B-100B_based_squad.jsonl filter=lfs diff=lfs merge=lfs -text
56
+ retnet-1.3B-100B/based_squad/[[:space:]]checkpoint_name____mnt__jfzn__msj__retnet-1.3B-100B_based_squad.jsonl filter=lfs diff=lfs merge=lfs -text
57
+ transformer-1.3B-100B/based_fda/[[:space:]]checkpoint_name____mnt__jfzn__msj__download_model__transformer-1.3B-100B_based_fda.jsonl filter=lfs diff=lfs merge=lfs -text
58
+ transformer-1.3B-100B/based_fda/[[:space:]]checkpoint_name____mnt__jfzn__msj__transformer-1.3B-100B_based_fda.jsonl filter=lfs diff=lfs merge=lfs -text
59
+ transformer-1.3B-100B/based_nq_2048/[[:space:]]checkpoint_name____mnt__jfzn__msj__download_model__transformer-1.3B-100B_based_nq_2048.jsonl filter=lfs diff=lfs merge=lfs -text
60
+ transformer-1.3B-100B/based_nq_2048/[[:space:]]checkpoint_name____mnt__jfzn__msj__transformer-1.3B-100B_based_nq_2048.jsonl filter=lfs diff=lfs merge=lfs -text
61
+ transformer-1.3B-100B/based_squad/[[:space:]]checkpoint_name____mnt__jfzn__msj__download_model__transformer-1.3B-100B_based_squad.jsonl filter=lfs diff=lfs merge=lfs -text
62
+ transformer-1.3B-100B/based_squad/[[:space:]]checkpoint_name____mnt__jfzn__msj__transformer-1.3B-100B_based_squad.jsonl filter=lfs diff=lfs merge=lfs -text
retnet-1.3B-100B/based_fda/ checkpoint_name____mnt__jfzn__msj__retnet-1.3B-100B_based_fda.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1926925f2840097db0fe990c2b5e11f13324f9c7bfde7d3f9512a8289e2ee4eb
3
+ size 14171353
retnet-1.3B-100B/based_nq_2048/ checkpoint_name____mnt__jfzn__msj__download_model__retnet-1.3B-100B_based_nq_2048.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4b4ff4042a7ff6a8fc8d145014a7855f34e8323cd321a3ce0123227c03339af
3
+ size 41001635
retnet-1.3B-100B/based_nq_2048/ checkpoint_name____mnt__jfzn__msj__retnet-1.3B-100B_based_nq_2048.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e2666be797d8d33e29a9ac1c7385a60f28ce65e4e8493fbb507f85ade0e66d1
3
+ size 41337513
retnet-1.3B-100B/based_squad/ checkpoint_name____mnt__jfzn__msj__download_model__retnet-1.3B-100B_based_squad.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aad0d024eff64c8e48b55da997604e712c4f90167c8f320f3cea1ca432767a17
3
+ size 14930884
retnet-1.3B-100B/based_squad/ checkpoint_name____mnt__jfzn__msj__retnet-1.3B-100B_based_squad.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56c6b7cba182dec8ec19c08ac928bbc6fd04b455cfbbbe63c2587d1eb62a4a2d
3
+ size 14079972
transformer-1.3B-100B/based_fda/ checkpoint_name____mnt__jfzn__msj__download_model__transformer-1.3B-100B_based_fda.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cf7c1f275c2f4ff58d4b049acb2d100f8e172b488bc25a695dbd3a3dcded3978
3
+ size 14174515
transformer-1.3B-100B/based_fda/ checkpoint_name____mnt__jfzn__msj__transformer-1.3B-100B_based_fda.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d1e9269d688db011bf3a4c75de3de165e9c7c6491a40188a8cfa339d8aaf9fbf
3
+ size 14474221
transformer-1.3B-100B/based_nq_2048/ checkpoint_name____mnt__jfzn__msj__download_model__transformer-1.3B-100B_based_nq_2048.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3f0f80f593482eba938129cf798118cd643bcab3c682bd0c47c9aaa0158ff54
3
+ size 40983751
transformer-1.3B-100B/based_nq_2048/ checkpoint_name____mnt__jfzn__msj__transformer-1.3B-100B_based_nq_2048.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:195b60849fb130d21cf7a39d095d95d42a850a1d4c96994eea2a019e376390c3
3
+ size 41916071
transformer-1.3B-100B/based_squad/ checkpoint_name____mnt__jfzn__msj__download_model__transformer-1.3B-100B_based_squad.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:08874dee3322c50b55ec6eb364dd7b915cd02a322ecfa26d81996ab9758e706a
3
+ size 14987974
transformer-1.3B-100B/based_squad/ checkpoint_name____mnt__jfzn__msj__transformer-1.3B-100B_based_squad.jsonl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7be1f93c9f06169dec7e21f5683c9d4fefc38e91a79a88cbe0de116ed7c29a5d
3
+ size 14990478
transformer-1.3B-100B/based_swde/ checkpoint_name____mnt__jfzn__msj__transformer-1.3B-100B_based_swde.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
transformer-1.3B-100B/based_triviaqa/ checkpoint_name____mnt__jfzn__msj__transformer-1.3B-100B_based_triviaqa.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
transformer-1.3B-100B/based_triviaqa/results.json ADDED
@@ -0,0 +1,55 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "results": {
3
+ "based_triviaqa": {
4
+ "exact,none": 1.481042654028436,
5
+ "exact_stderr,none": "N/A",
6
+ "f1,none": 8.155291191508606,
7
+ "f1_stderr,none": "N/A",
8
+ "contains,none": 0.5811611374407583,
9
+ "contains_stderr,none": "N/A",
10
+ "alias": "based_triviaqa"
11
+ }
12
+ },
13
+ "configs": {
14
+ "based_triviaqa": {
15
+ "description": "",
16
+ "target_delimiter": " ",
17
+ "fewshot_delimiter": "\n\n",
18
+ "num_fewshot": 0,
19
+ "output_type": "generate_until",
20
+ "generation_kwargs": {
21
+ "until": [
22
+ "\n\n"
23
+ ],
24
+ "do_sample": false
25
+ },
26
+ "repeats": 1,
27
+ "should_decontaminate": false,
28
+ "metadata": {
29
+ "version": "default"
30
+ }
31
+ }
32
+ },
33
+ "versions": {
34
+ "based_triviaqa": "default"
35
+ },
36
+ "n-shot": {
37
+ "based_triviaqa": 0
38
+ },
39
+ "config": {
40
+ "model": "lm_eval_model",
41
+ "model_args": " checkpoint_name=/mnt/jfzn/msj/download_model/transformer-1.3B-100B",
42
+ "batch_size": "8",
43
+ "batch_sizes": [],
44
+ "device": "cuda:0",
45
+ "use_cache": null,
46
+ "limit": null,
47
+ "bootstrap_iters": 100000,
48
+ "gen_kwargs": null
49
+ },
50
+ "git_hash": null,
51
+ "context_length": 2000,
52
+ "answer_length": 48,
53
+ "cutting_context": true,
54
+ "decode_mode": "default"
55
+ }