Add files using upload-large-folder tool
Browse files- base_checkpoints/d20/model_021400.pt +3 -0
- chatsft_checkpoints/d20/meta_000700.json +14 -0
- eval_bundle/eval_data/language_understanding/hellaswag.jsonl +0 -0
- eval_bundle/eval_data/symbolic_problem_solving/agi_eval_lsat_ar.jsonl +0 -0
- eval_bundle/eval_data/symbolic_problem_solving/bigbench_repeat_copy_logic.jsonl +32 -0
- eval_bundle/eval_data/symbolic_problem_solving/math_qa.jsonl +0 -0
- eval_bundle/eval_data/symbolic_problem_solving/math_simple_soln.jsonl +0 -0
- eval_bundle/eval_data/world_knowledge/mmlu.jsonl +0 -0
- eval_bundle/eval_data/world_knowledge/mmlu_expand.jsonl +0 -0
- mid_checkpoints/d20/meta_000809.json +29 -0
- mid_checkpoints/d20/model_000809.pt +3 -0
base_checkpoints/d20/model_021400.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fd2e8749a51ac2c0be8214d16213805f6346b85a1369af2b1a3b394d984ec439
|
| 3 |
+
size 2076230219
|
chatsft_checkpoints/d20/meta_000700.json
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"step": 700,
|
| 3 |
+
"val_loss": 1.0105494260787964,
|
| 4 |
+
"mmlu_acc": 0.3203125,
|
| 5 |
+
"arc_easy_acc": 0.33203125,
|
| 6 |
+
"model_config": {
|
| 7 |
+
"sequence_len": 2048,
|
| 8 |
+
"vocab_size": 65536,
|
| 9 |
+
"n_layer": 20,
|
| 10 |
+
"n_head": 10,
|
| 11 |
+
"n_kv_head": 10,
|
| 12 |
+
"n_embd": 1280
|
| 13 |
+
}
|
| 14 |
+
}
|
eval_bundle/eval_data/language_understanding/hellaswag.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
eval_bundle/eval_data/symbolic_problem_solving/agi_eval_lsat_ar.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
eval_bundle/eval_data/symbolic_problem_solving/bigbench_repeat_copy_logic.jsonl
ADDED
|
@@ -0,0 +1,32 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{"context": "repeat with logic:\n\nQ: A watermelon has seven seeds. Repeat they're delicious once for every seed\nA:", "continuation": "they're delicious they're delicious they're delicious they're delicious they're delicious they're delicious they're delicious"}
|
| 2 |
+
{"context": "repeat with logic:\n\nQ: say python twice and data once, and then repeat all of this three times.\nA:", "continuation": "python python data python python data python python data"}
|
| 3 |
+
{"context": "repeat with logic:\n\nQ: output if you teach a person to fish you will three times\nA:", "continuation": "if you teach a person to fish you will if you teach a person to fish you will if you teach a person to fish you will"}
|
| 4 |
+
{"context": "repeat with logic:\n\nQ: repeat election to the council three times, but after every other word say cool\nA:", "continuation": "election to cool the council cool election to cool the council cool election to cool the council cool"}
|
| 5 |
+
{"context": "repeat with logic:\n\nQ: say pickup a pound of green beans twice, replacing a pound with a bunch for even times and a handful for odd\nA:", "continuation": "pickup a handful of green beans pickup a bunch of green beans"}
|
| 6 |
+
{"context": "repeat with logic:\n\nQ: Output carbon pricing is an four times, but in the middle also say interesting concept\nA:", "continuation": "carbon pricing is an carbon pricing is an interesting concept carbon pricing is an carbon pricing is an"}
|
| 7 |
+
{"context": "repeat with logic:\n\nQ: say hello world five times, but don't say world every even time\nA:", "continuation": "hello world hello hello world hello hello world"}
|
| 8 |
+
{"context": "repeat with logic:\n\nQ: Print logic eleven times, but after the 3rd and 8th also say true\nA:", "continuation": "logic logic logic true logic logic logic logic logic true logic logic logic"}
|
| 9 |
+
{"context": "repeat with logic:\n\nQ: say fish are healthy twice\nA:", "continuation": "fish are healthy fish are healthy"}
|
| 10 |
+
{"context": "repeat with logic:\n\nQ: Seven times please repeat The School of Music\nA:", "continuation": "The School of Music The School of Music The School of Music The School of Music The School of Music The School of Music The School of Music"}
|
| 11 |
+
{"context": "repeat with logic:\n\nQ: repeat the phrase the administrative district three times, and say the phrase hello world after the second time\nA:", "continuation": "the administrative district the administrative district hello world the administrative district"}
|
| 12 |
+
{"context": "repeat with logic:\n\nQ: repeat whole note quarter note quarter note quarter note twice\nA:", "continuation": "whole note quarter note quarter note quarter note whole note quarter note quarter note quarter note"}
|
| 13 |
+
{"context": "repeat with logic:\n\nQ: Say the letters of the alphabet in capital letters, but only the odd ones\nA:", "continuation": "A C E G I K M O Q S U W Y"}
|
| 14 |
+
{"context": "repeat with logic:\n\nQ: Repeat historic church building twice, but after every word also say wow\nA:", "continuation": "historic wow church wow building wow historic wow church wow building wow"}
|
| 15 |
+
{"context": "repeat with logic:\n\nQ: repeat a woodchuck chucks lots of wood two times, but replace lots with five pounds the first time and two tons the second time\nA:", "continuation": "a woodchuck chucks five pounds of wood a woodchuck chucks two tons of wood"}
|
| 16 |
+
{"context": "repeat with logic:\n\nQ: Three times please repeat The School of Music, and before the first time say Who plays the bass loud?\nA:", "continuation": "Who plays the bass loud? The School of Music The School of Music The School of Music"}
|
| 17 |
+
{"context": "repeat with logic:\n\nQ: Say the days of the week but only the weekend days, two times\nA:", "continuation": "Saturday Sunday Saturday Sunday"}
|
| 18 |
+
{"context": "repeat with logic:\n\nQ: repeat the word cat four times. After the second time, also say the word meow.\nA:", "continuation": "cat cat meow cat cat"}
|
| 19 |
+
{"context": "repeat with logic:\n\nQ: Twice repeat inhabitants in the urban area and then three times live in walking distance\nA:", "continuation": "inhabitants in the urban area inhabitants in the urban area live in walking distance live in walking distance live in walking distance"}
|
| 20 |
+
{"context": "repeat with logic:\n\nQ: ask a genus of plants in what family? four times. after the fourth time say The happy family\nA:", "continuation": "a genus of plants in what family? a genus of plants in what family? a genus of plants in what family? a genus of plants in what family? The happy family"}
|
| 21 |
+
{"context": "repeat with logic:\n\nQ: Repeat the word dog four times, but halfway through also say woof\nA:", "continuation": "dog dog woof dog dog"}
|
| 22 |
+
{"context": "repeat with logic:\n\nQ: say the village has a population five times, and after odd times add larger than California\nA:", "continuation": "the village has a population larger than California the village has a population the village has a population larger than California the village has a population the village has a population larger than California"}
|
| 23 |
+
{"context": "repeat with logic:\n\nQ: Repeat cheese seven times; every third say whiz\nA:", "continuation": "cheese cheese cheese whiz cheese cheese cheese whiz cheese"}
|
| 24 |
+
{"context": "repeat with logic:\n\nQ: Repeat all the world seven times, and after every second time add is a stage.\nA:", "continuation": "all the world all the world is a stage all the world all the world is a stage all the world all the world is a stage all the world"}
|
| 25 |
+
{"context": "repeat with logic:\n\nQ: Repeat the phrase all cars eat gas four times. On the odd times, drop words that start with vowels\nA:", "continuation": "cars gas all cars eat gas cars gas all cars eat gas"}
|
| 26 |
+
{"context": "repeat with logic:\n\nQ: Say hungry three times, then hippo two times, then feed me four times\nA:", "continuation": "hungry hungry hungry hippo hippo feed me feed me feed me feed me"}
|
| 27 |
+
{"context": "repeat with logic:\n\nQ: A strawberry has three leaves. Say wish I had some chocolate for every odd leaf\nA:", "continuation": "wish I had some chocolate wish I had some chocolate"}
|
| 28 |
+
{"context": "repeat with logic:\n\nQ: Say the botanical gardens are five times. If the time divides evenly by two add beautiful, or by three add wonderful. Otherwise say great.\nA:", "continuation": "the botanical gardens are great the botanical gardens are beautiful the botanical gardens are wonderful the botanical gardens are beautiful the botanical gardens are great"}
|
| 29 |
+
{"context": "repeat with logic:\n\nQ: Repeat cat five times. After each time, also say mouse\nA:", "continuation": "cat mouse cat mouse cat mouse cat mouse cat mouse"}
|
| 30 |
+
{"context": "repeat with logic:\n\nQ: say all work and no play makes three times, but every even time add Jack and odd time add Jill\nA:", "continuation": "all work and no play makes Jill all work and no play makes Jack all work and no play makes Jill"}
|
| 31 |
+
{"context": "repeat with logic:\n\nQ: Repeat 5 times hello world\nA:", "continuation": "hello world hello world hello world hello world hello world"}
|
| 32 |
+
{"context": "repeat with logic:\n\nQ: Repeat squiggly line twice after the phrase can you draw\nA:", "continuation": "can you draw squiggly line squiggly line"}
|
eval_bundle/eval_data/symbolic_problem_solving/math_qa.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
eval_bundle/eval_data/symbolic_problem_solving/math_simple_soln.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
eval_bundle/eval_data/world_knowledge/mmlu.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
eval_bundle/eval_data/world_knowledge/mmlu_expand.jsonl
ADDED
|
The diff for this file is too large to render.
See raw diff
|
|
|
mid_checkpoints/d20/meta_000809.json
ADDED
|
@@ -0,0 +1,29 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"step": 809,
|
| 3 |
+
"val_bpb": 0.3952791820903297,
|
| 4 |
+
"model_config": {
|
| 5 |
+
"sequence_len": 2048,
|
| 6 |
+
"vocab_size": 65536,
|
| 7 |
+
"n_layer": 20,
|
| 8 |
+
"n_head": 10,
|
| 9 |
+
"n_kv_head": 10,
|
| 10 |
+
"n_embd": 1280
|
| 11 |
+
},
|
| 12 |
+
"user_config": {
|
| 13 |
+
"run": "fal-mid",
|
| 14 |
+
"device_type": "",
|
| 15 |
+
"dtype": "bfloat16",
|
| 16 |
+
"num_iterations": -1,
|
| 17 |
+
"max_seq_len": 2048,
|
| 18 |
+
"device_batch_size": 32,
|
| 19 |
+
"unembedding_lr": 0.004,
|
| 20 |
+
"embedding_lr": 0.2,
|
| 21 |
+
"matrix_lr": 0.02,
|
| 22 |
+
"init_lr_frac": 1.0,
|
| 23 |
+
"weight_decay": 0.0,
|
| 24 |
+
"eval_every": 150,
|
| 25 |
+
"eval_tokens": 10485760,
|
| 26 |
+
"total_batch_size": 524288,
|
| 27 |
+
"dry_run": 0
|
| 28 |
+
}
|
| 29 |
+
}
|
mid_checkpoints/d20/model_000809.pt
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:331c589a962cbe831f2f13543d7d3090a31f6277a15c67cd2d5396b9b73bd4d4
|
| 3 |
+
size 2076230219
|