ttj commited on
Commit
67a101a
·
verified ·
1 Parent(s): 85a524c

Add files using upload-large-folder tool

Browse files
base_checkpoints/d20/model_021400.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd2e8749a51ac2c0be8214d16213805f6346b85a1369af2b1a3b394d984ec439
3
+ size 2076230219
chatsft_checkpoints/d20/meta_000700.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "step": 700,
3
+ "val_loss": 1.0105494260787964,
4
+ "mmlu_acc": 0.3203125,
5
+ "arc_easy_acc": 0.33203125,
6
+ "model_config": {
7
+ "sequence_len": 2048,
8
+ "vocab_size": 65536,
9
+ "n_layer": 20,
10
+ "n_head": 10,
11
+ "n_kv_head": 10,
12
+ "n_embd": 1280
13
+ }
14
+ }
eval_bundle/eval_data/language_understanding/hellaswag.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
eval_bundle/eval_data/symbolic_problem_solving/agi_eval_lsat_ar.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
eval_bundle/eval_data/symbolic_problem_solving/bigbench_repeat_copy_logic.jsonl ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {"context": "repeat with logic:\n\nQ: A watermelon has seven seeds. Repeat they're delicious once for every seed\nA:", "continuation": "they're delicious they're delicious they're delicious they're delicious they're delicious they're delicious they're delicious"}
2
+ {"context": "repeat with logic:\n\nQ: say python twice and data once, and then repeat all of this three times.\nA:", "continuation": "python python data python python data python python data"}
3
+ {"context": "repeat with logic:\n\nQ: output if you teach a person to fish you will three times\nA:", "continuation": "if you teach a person to fish you will if you teach a person to fish you will if you teach a person to fish you will"}
4
+ {"context": "repeat with logic:\n\nQ: repeat election to the council three times, but after every other word say cool\nA:", "continuation": "election to cool the council cool election to cool the council cool election to cool the council cool"}
5
+ {"context": "repeat with logic:\n\nQ: say pickup a pound of green beans twice, replacing a pound with a bunch for even times and a handful for odd\nA:", "continuation": "pickup a handful of green beans pickup a bunch of green beans"}
6
+ {"context": "repeat with logic:\n\nQ: Output carbon pricing is an four times, but in the middle also say interesting concept\nA:", "continuation": "carbon pricing is an carbon pricing is an interesting concept carbon pricing is an carbon pricing is an"}
7
+ {"context": "repeat with logic:\n\nQ: say hello world five times, but don't say world every even time\nA:", "continuation": "hello world hello hello world hello hello world"}
8
+ {"context": "repeat with logic:\n\nQ: Print logic eleven times, but after the 3rd and 8th also say true\nA:", "continuation": "logic logic logic true logic logic logic logic logic true logic logic logic"}
9
+ {"context": "repeat with logic:\n\nQ: say fish are healthy twice\nA:", "continuation": "fish are healthy fish are healthy"}
10
+ {"context": "repeat with logic:\n\nQ: Seven times please repeat The School of Music\nA:", "continuation": "The School of Music The School of Music The School of Music The School of Music The School of Music The School of Music The School of Music"}
11
+ {"context": "repeat with logic:\n\nQ: repeat the phrase the administrative district three times, and say the phrase hello world after the second time\nA:", "continuation": "the administrative district the administrative district hello world the administrative district"}
12
+ {"context": "repeat with logic:\n\nQ: repeat whole note quarter note quarter note quarter note twice\nA:", "continuation": "whole note quarter note quarter note quarter note whole note quarter note quarter note quarter note"}
13
+ {"context": "repeat with logic:\n\nQ: Say the letters of the alphabet in capital letters, but only the odd ones\nA:", "continuation": "A C E G I K M O Q S U W Y"}
14
+ {"context": "repeat with logic:\n\nQ: Repeat historic church building twice, but after every word also say wow\nA:", "continuation": "historic wow church wow building wow historic wow church wow building wow"}
15
+ {"context": "repeat with logic:\n\nQ: repeat a woodchuck chucks lots of wood two times, but replace lots with five pounds the first time and two tons the second time\nA:", "continuation": "a woodchuck chucks five pounds of wood a woodchuck chucks two tons of wood"}
16
+ {"context": "repeat with logic:\n\nQ: Three times please repeat The School of Music, and before the first time say Who plays the bass loud?\nA:", "continuation": "Who plays the bass loud? The School of Music The School of Music The School of Music"}
17
+ {"context": "repeat with logic:\n\nQ: Say the days of the week but only the weekend days, two times\nA:", "continuation": "Saturday Sunday Saturday Sunday"}
18
+ {"context": "repeat with logic:\n\nQ: repeat the word cat four times. After the second time, also say the word meow.\nA:", "continuation": "cat cat meow cat cat"}
19
+ {"context": "repeat with logic:\n\nQ: Twice repeat inhabitants in the urban area and then three times live in walking distance\nA:", "continuation": "inhabitants in the urban area inhabitants in the urban area live in walking distance live in walking distance live in walking distance"}
20
+ {"context": "repeat with logic:\n\nQ: ask a genus of plants in what family? four times. after the fourth time say The happy family\nA:", "continuation": "a genus of plants in what family? a genus of plants in what family? a genus of plants in what family? a genus of plants in what family? The happy family"}
21
+ {"context": "repeat with logic:\n\nQ: Repeat the word dog four times, but halfway through also say woof\nA:", "continuation": "dog dog woof dog dog"}
22
+ {"context": "repeat with logic:\n\nQ: say the village has a population five times, and after odd times add larger than California\nA:", "continuation": "the village has a population larger than California the village has a population the village has a population larger than California the village has a population the village has a population larger than California"}
23
+ {"context": "repeat with logic:\n\nQ: Repeat cheese seven times; every third say whiz\nA:", "continuation": "cheese cheese cheese whiz cheese cheese cheese whiz cheese"}
24
+ {"context": "repeat with logic:\n\nQ: Repeat all the world seven times, and after every second time add is a stage.\nA:", "continuation": "all the world all the world is a stage all the world all the world is a stage all the world all the world is a stage all the world"}
25
+ {"context": "repeat with logic:\n\nQ: Repeat the phrase all cars eat gas four times. On the odd times, drop words that start with vowels\nA:", "continuation": "cars gas all cars eat gas cars gas all cars eat gas"}
26
+ {"context": "repeat with logic:\n\nQ: Say hungry three times, then hippo two times, then feed me four times\nA:", "continuation": "hungry hungry hungry hippo hippo feed me feed me feed me feed me"}
27
+ {"context": "repeat with logic:\n\nQ: A strawberry has three leaves. Say wish I had some chocolate for every odd leaf\nA:", "continuation": "wish I had some chocolate wish I had some chocolate"}
28
+ {"context": "repeat with logic:\n\nQ: Say the botanical gardens are five times. If the time divides evenly by two add beautiful, or by three add wonderful. Otherwise say great.\nA:", "continuation": "the botanical gardens are great the botanical gardens are beautiful the botanical gardens are wonderful the botanical gardens are beautiful the botanical gardens are great"}
29
+ {"context": "repeat with logic:\n\nQ: Repeat cat five times. After each time, also say mouse\nA:", "continuation": "cat mouse cat mouse cat mouse cat mouse cat mouse"}
30
+ {"context": "repeat with logic:\n\nQ: say all work and no play makes three times, but every even time add Jack and odd time add Jill\nA:", "continuation": "all work and no play makes Jill all work and no play makes Jack all work and no play makes Jill"}
31
+ {"context": "repeat with logic:\n\nQ: Repeat 5 times hello world\nA:", "continuation": "hello world hello world hello world hello world hello world"}
32
+ {"context": "repeat with logic:\n\nQ: Repeat squiggly line twice after the phrase can you draw\nA:", "continuation": "can you draw squiggly line squiggly line"}
eval_bundle/eval_data/symbolic_problem_solving/math_qa.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
eval_bundle/eval_data/symbolic_problem_solving/math_simple_soln.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
eval_bundle/eval_data/world_knowledge/mmlu.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
eval_bundle/eval_data/world_knowledge/mmlu_expand.jsonl ADDED
The diff for this file is too large to render. See raw diff
 
mid_checkpoints/d20/meta_000809.json ADDED
@@ -0,0 +1,29 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "step": 809,
3
+ "val_bpb": 0.3952791820903297,
4
+ "model_config": {
5
+ "sequence_len": 2048,
6
+ "vocab_size": 65536,
7
+ "n_layer": 20,
8
+ "n_head": 10,
9
+ "n_kv_head": 10,
10
+ "n_embd": 1280
11
+ },
12
+ "user_config": {
13
+ "run": "fal-mid",
14
+ "device_type": "",
15
+ "dtype": "bfloat16",
16
+ "num_iterations": -1,
17
+ "max_seq_len": 2048,
18
+ "device_batch_size": 32,
19
+ "unembedding_lr": 0.004,
20
+ "embedding_lr": 0.2,
21
+ "matrix_lr": 0.02,
22
+ "init_lr_frac": 1.0,
23
+ "weight_decay": 0.0,
24
+ "eval_every": 150,
25
+ "eval_tokens": 10485760,
26
+ "total_batch_size": 524288,
27
+ "dry_run": 0
28
+ }
29
+ }
mid_checkpoints/d20/model_000809.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:331c589a962cbe831f2f13543d7d3090a31f6277a15c67cd2d5396b9b73bd4d4
3
+ size 2076230219