Upload inference_step13015680_2026-03-13T10-48-12Z.json with huggingface_hub
Browse files
inference_step13015680_2026-03-13T10-48-12Z.json
ADDED
|
@@ -0,0 +1,16 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"step": 13015680,
|
| 3 |
+
"timestamp": "2026-03-13T10-48-12Z",
|
| 4 |
+
"checkpoint": "pretrain_step13015680.pt",
|
| 5 |
+
"tokens_trained": "~11.7B/35B (33.4%)",
|
| 6 |
+
"ar_samples": [
|
| 7 |
+
{"prompt": "The meaning of life is", "output": "associatedwiththebrain.[citationneeded]In2021,anEpileptiformgyringinEarthreleasedthefirstknownepilepticseizureofspatialelectroencephalography..."},
|
| 8 |
+
{"prompt": "Once upon a time", "output": ",itwasreportedthatthesameday,thesamedaywassubsequentlyspentbytheRazakarsandBuddhisttookcontroloftheirjourneystotheRazakars.[citationneeded]..."},
|
| 9 |
+
{"prompt": "Mathematics is important because", "output": "it'snotthebest-knowntreatmentforpeople.[citationneeded]Inresponse,someofthesegmentsarealsoreferredtoas..."}
|
| 10 |
+
],
|
| 11 |
+
"sat_samples": [
|
| 12 |
+
{"prompt": "The quick brown [MASK] jumps over the lazy dog", "output": "ateomeerminformastberichsoftftintdefshardscentviewenKallE21unbbbbbavb... (garbled subword fragments)"},
|
| 13 |
+
{"prompt": "Paris is the [MASK] of France", "output": "ermomeateinfichormsoftardsastberdefviewfoundftritot21intwhichatutelenavf... (garbled subword fragments)"}
|
| 14 |
+
],
|
| 15 |
+
"notes": "AR: English words but no spaces, heavy Wikipedia/citation contamination, repetitive. SAT: still garbled subword fragments, no improvement from earlier checks."
|
| 16 |
+
}
|