Add files using upload-large-folder tool
Browse files- .gitattributes +11 -0
- retnet-1.3B-100B/based_fda/ checkpoint_name____mnt__jfzn__msj__retnet-1.3B-100B_based_fda.jsonl +3 -0
- retnet-1.3B-100B/based_nq_2048/ checkpoint_name____mnt__jfzn__msj__download_model__retnet-1.3B-100B_based_nq_2048.jsonl +3 -0
- retnet-1.3B-100B/based_nq_2048/ checkpoint_name____mnt__jfzn__msj__retnet-1.3B-100B_based_nq_2048.jsonl +3 -0
- retnet-1.3B-100B/based_squad/ checkpoint_name____mnt__jfzn__msj__download_model__retnet-1.3B-100B_based_squad.jsonl +3 -0
- retnet-1.3B-100B/based_squad/ checkpoint_name____mnt__jfzn__msj__retnet-1.3B-100B_based_squad.jsonl +3 -0
- transformer-1.3B-100B/based_fda/ checkpoint_name____mnt__jfzn__msj__download_model__transformer-1.3B-100B_based_fda.jsonl +3 -0
- transformer-1.3B-100B/based_fda/ checkpoint_name____mnt__jfzn__msj__transformer-1.3B-100B_based_fda.jsonl +3 -0
- transformer-1.3B-100B/based_nq_2048/ checkpoint_name____mnt__jfzn__msj__download_model__transformer-1.3B-100B_based_nq_2048.jsonl +3 -0
- transformer-1.3B-100B/based_nq_2048/ checkpoint_name____mnt__jfzn__msj__transformer-1.3B-100B_based_nq_2048.jsonl +3 -0
- transformer-1.3B-100B/based_squad/ checkpoint_name____mnt__jfzn__msj__download_model__transformer-1.3B-100B_based_squad.jsonl +3 -0
- transformer-1.3B-100B/based_squad/ checkpoint_name____mnt__jfzn__msj__transformer-1.3B-100B_based_squad.jsonl +3 -0
- transformer-1.3B-100B/based_swde/ checkpoint_name____mnt__jfzn__msj__transformer-1.3B-100B_based_swde.jsonl +0 -0
- transformer-1.3B-100B/based_triviaqa/ checkpoint_name____mnt__jfzn__msj__transformer-1.3B-100B_based_triviaqa.jsonl +0 -0
- transformer-1.3B-100B/based_triviaqa/results.json +55 -0
.gitattributes
CHANGED
|
@@ -49,3 +49,14 @@ hgrn2-1.3B-100B/based_fda/[[:space:]]checkpoint_name____mnt__jfzn__msj__download
|
|
| 49 |
hgrn2-1.3B-100B/based_nq_2048/[[:space:]]checkpoint_name____mnt__jfzn__msj__download_model__hgrn2-1.3B-100B_based_nq_2048.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 50 |
hgrn2-1.3B-100B/based_squad/[[:space:]]checkpoint_name____mnt__jfzn__msj__download_model__hgrn2-1.3B-100B_based_squad.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 51 |
retnet-1.3B-100B/based_fda/[[:space:]]checkpoint_name____mnt__jfzn__msj__download_model__retnet-1.3B-100B_based_fda.jsonl filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 49 |
hgrn2-1.3B-100B/based_nq_2048/[[:space:]]checkpoint_name____mnt__jfzn__msj__download_model__hgrn2-1.3B-100B_based_nq_2048.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 50 |
hgrn2-1.3B-100B/based_squad/[[:space:]]checkpoint_name____mnt__jfzn__msj__download_model__hgrn2-1.3B-100B_based_squad.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 51 |
retnet-1.3B-100B/based_fda/[[:space:]]checkpoint_name____mnt__jfzn__msj__download_model__retnet-1.3B-100B_based_fda.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 52 |
+
retnet-1.3B-100B/based_fda/[[:space:]]checkpoint_name____mnt__jfzn__msj__retnet-1.3B-100B_based_fda.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 53 |
+
retnet-1.3B-100B/based_nq_2048/[[:space:]]checkpoint_name____mnt__jfzn__msj__download_model__retnet-1.3B-100B_based_nq_2048.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 54 |
+
retnet-1.3B-100B/based_nq_2048/[[:space:]]checkpoint_name____mnt__jfzn__msj__retnet-1.3B-100B_based_nq_2048.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 55 |
+
retnet-1.3B-100B/based_squad/[[:space:]]checkpoint_name____mnt__jfzn__msj__download_model__retnet-1.3B-100B_based_squad.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 56 |
+
retnet-1.3B-100B/based_squad/[[:space:]]checkpoint_name____mnt__jfzn__msj__retnet-1.3B-100B_based_squad.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 57 |
+
transformer-1.3B-100B/based_fda/[[:space:]]checkpoint_name____mnt__jfzn__msj__download_model__transformer-1.3B-100B_based_fda.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 58 |
+
transformer-1.3B-100B/based_fda/[[:space:]]checkpoint_name____mnt__jfzn__msj__transformer-1.3B-100B_based_fda.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 59 |
+
transformer-1.3B-100B/based_nq_2048/[[:space:]]checkpoint_name____mnt__jfzn__msj__download_model__transformer-1.3B-100B_based_nq_2048.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 60 |
+
transformer-1.3B-100B/based_nq_2048/[[:space:]]checkpoint_name____mnt__jfzn__msj__transformer-1.3B-100B_based_nq_2048.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 61 |
+
transformer-1.3B-100B/based_squad/[[:space:]]checkpoint_name____mnt__jfzn__msj__download_model__transformer-1.3B-100B_based_squad.jsonl filter=lfs diff=lfs merge=lfs -text
|
| 62 |
+
transformer-1.3B-100B/based_squad/[[:space:]]checkpoint_name____mnt__jfzn__msj__transformer-1.3B-100B_based_squad.jsonl filter=lfs diff=lfs merge=lfs -text
|
retnet-1.3B-100B/based_fda/ checkpoint_name____mnt__jfzn__msj__retnet-1.3B-100B_based_fda.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1926925f2840097db0fe990c2b5e11f13324f9c7bfde7d3f9512a8289e2ee4eb
|
| 3 |
+
size 14171353
|
retnet-1.3B-100B/based_nq_2048/ checkpoint_name____mnt__jfzn__msj__download_model__retnet-1.3B-100B_based_nq_2048.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b4b4ff4042a7ff6a8fc8d145014a7855f34e8323cd321a3ce0123227c03339af
|
| 3 |
+
size 41001635
|
retnet-1.3B-100B/based_nq_2048/ checkpoint_name____mnt__jfzn__msj__retnet-1.3B-100B_based_nq_2048.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6e2666be797d8d33e29a9ac1c7385a60f28ce65e4e8493fbb507f85ade0e66d1
|
| 3 |
+
size 41337513
|
retnet-1.3B-100B/based_squad/ checkpoint_name____mnt__jfzn__msj__download_model__retnet-1.3B-100B_based_squad.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aad0d024eff64c8e48b55da997604e712c4f90167c8f320f3cea1ca432767a17
|
| 3 |
+
size 14930884
|
retnet-1.3B-100B/based_squad/ checkpoint_name____mnt__jfzn__msj__retnet-1.3B-100B_based_squad.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:56c6b7cba182dec8ec19c08ac928bbc6fd04b455cfbbbe63c2587d1eb62a4a2d
|
| 3 |
+
size 14079972
|
transformer-1.3B-100B/based_fda/ checkpoint_name____mnt__jfzn__msj__download_model__transformer-1.3B-100B_based_fda.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cf7c1f275c2f4ff58d4b049acb2d100f8e172b488bc25a695dbd3a3dcded3978
|
| 3 |
+
size 14174515
|
transformer-1.3B-100B/based_fda/ checkpoint_name____mnt__jfzn__msj__transformer-1.3B-100B_based_fda.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d1e9269d688db011bf3a4c75de3de165e9c7c6491a40188a8cfa339d8aaf9fbf
|
| 3 |
+
size 14474221
|
transformer-1.3B-100B/based_nq_2048/ checkpoint_name____mnt__jfzn__msj__download_model__transformer-1.3B-100B_based_nq_2048.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b3f0f80f593482eba938129cf798118cd643bcab3c682bd0c47c9aaa0158ff54
|
| 3 |
+
size 40983751
|
transformer-1.3B-100B/based_nq_2048/ checkpoint_name____mnt__jfzn__msj__transformer-1.3B-100B_based_nq_2048.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:195b60849fb130d21cf7a39d095d95d42a850a1d4c96994eea2a019e376390c3
|
| 3 |
+
size 41916071
|
transformer-1.3B-100B/based_squad/ checkpoint_name____mnt__jfzn__msj__download_model__transformer-1.3B-100B_based_squad.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:08874dee3322c50b55ec6eb364dd7b915cd02a322ecfa26d81996ab9758e706a
|
| 3 |
+
size 14987974
|
transformer-1.3B-100B/based_squad/ checkpoint_name____mnt__jfzn__msj__transformer-1.3B-100B_based_squad.jsonl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7be1f93c9f06169dec7e21f5683c9d4fefc38e91a79a88cbe0de116ed7c29a5d
|
| 3 |
+
size 14990478
|
transformer-1.3B-100B/based_swde/ checkpoint_name____mnt__jfzn__msj__transformer-1.3B-100B_based_swde.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
transformer-1.3B-100B/based_triviaqa/ checkpoint_name____mnt__jfzn__msj__transformer-1.3B-100B_based_triviaqa.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
transformer-1.3B-100B/based_triviaqa/results.json
ADDED
|
@@ -0,0 +1,55 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"results": {
|
| 3 |
+
"based_triviaqa": {
|
| 4 |
+
"exact,none": 1.481042654028436,
|
| 5 |
+
"exact_stderr,none": "N/A",
|
| 6 |
+
"f1,none": 8.155291191508606,
|
| 7 |
+
"f1_stderr,none": "N/A",
|
| 8 |
+
"contains,none": 0.5811611374407583,
|
| 9 |
+
"contains_stderr,none": "N/A",
|
| 10 |
+
"alias": "based_triviaqa"
|
| 11 |
+
}
|
| 12 |
+
},
|
| 13 |
+
"configs": {
|
| 14 |
+
"based_triviaqa": {
|
| 15 |
+
"description": "",
|
| 16 |
+
"target_delimiter": " ",
|
| 17 |
+
"fewshot_delimiter": "\n\n",
|
| 18 |
+
"num_fewshot": 0,
|
| 19 |
+
"output_type": "generate_until",
|
| 20 |
+
"generation_kwargs": {
|
| 21 |
+
"until": [
|
| 22 |
+
"\n\n"
|
| 23 |
+
],
|
| 24 |
+
"do_sample": false
|
| 25 |
+
},
|
| 26 |
+
"repeats": 1,
|
| 27 |
+
"should_decontaminate": false,
|
| 28 |
+
"metadata": {
|
| 29 |
+
"version": "default"
|
| 30 |
+
}
|
| 31 |
+
}
|
| 32 |
+
},
|
| 33 |
+
"versions": {
|
| 34 |
+
"based_triviaqa": "default"
|
| 35 |
+
},
|
| 36 |
+
"n-shot": {
|
| 37 |
+
"based_triviaqa": 0
|
| 38 |
+
},
|
| 39 |
+
"config": {
|
| 40 |
+
"model": "lm_eval_model",
|
| 41 |
+
"model_args": " checkpoint_name=/mnt/jfzn/msj/download_model/transformer-1.3B-100B",
|
| 42 |
+
"batch_size": "8",
|
| 43 |
+
"batch_sizes": [],
|
| 44 |
+
"device": "cuda:0",
|
| 45 |
+
"use_cache": null,
|
| 46 |
+
"limit": null,
|
| 47 |
+
"bootstrap_iters": 100000,
|
| 48 |
+
"gen_kwargs": null
|
| 49 |
+
},
|
| 50 |
+
"git_hash": null,
|
| 51 |
+
"context_length": 2000,
|
| 52 |
+
"answer_length": 48,
|
| 53 |
+
"cutting_context": true,
|
| 54 |
+
"decode_mode": "default"
|
| 55 |
+
}
|