Update evaluation_stats.json via script
Browse files- evaluation_stats.json +12 -12
evaluation_stats.json
CHANGED
|
@@ -1,6 +1,5 @@
|
|
| 1 |
{
|
| 2 |
"perplexity_history": [
|
| 3 |
-
291.82647705078125,
|
| 4 |
291.81048583984375,
|
| 5 |
291.7937927246094,
|
| 6 |
291.7740173339844,
|
|
@@ -19,19 +18,20 @@
|
|
| 19 |
291.5338439941406,
|
| 20 |
291.50592041015625,
|
| 21 |
291.4782409667969,
|
| 22 |
-
291.44378662109375
|
|
|
|
| 23 |
],
|
| 24 |
"last_examples": {
|
| 25 |
-
"Story Continuation": "
|
| 26 |
-
"Simple Instruction": "
|
| 27 |
-
"Creative Prompt": "\
|
| 28 |
-
"Question Answering (Basic)": "
|
| 29 |
-
"Code Generation (Simple Python)": "
|
| 30 |
-
"Reasoning (Simple)": "The
|
| 31 |
},
|
| 32 |
-
"last_update_time": "2025-05-08
|
| 33 |
-
"datasets_processed_count":
|
| 34 |
-
"texts_processed_count":
|
| 35 |
-
"tokens_processed_count":
|
| 36 |
"lighteval_results": {}
|
| 37 |
}
|
|
|
|
| 1 |
{
|
| 2 |
"perplexity_history": [
|
|
|
|
| 3 |
291.81048583984375,
|
| 4 |
291.7937927246094,
|
| 5 |
291.7740173339844,
|
|
|
|
| 18 |
291.5338439941406,
|
| 19 |
291.50592041015625,
|
| 20 |
291.4782409667969,
|
| 21 |
+
291.44378662109375,
|
| 22 |
+
289.20306396484375
|
| 23 |
],
|
| 24 |
"last_examples": {
|
| 25 |
+
"Story Continuation": "How do I get the best picture of what we have now?\nI am getting a lot of awesome photos that can be amazing! Thanks for sharing!!!\nMonday!!!!!!!!! Thanks for all!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!\nSorry this is not the time!!!!!!\nHi guys!!!!",
|
| 26 |
+
"Simple Instruction": "I have been trying to make progress and challenges? What about my biography?\nI wanted to be very creative! I would love to go back to work with myself, but not too much effort or lessons than others, but it helps me feel better when we try to find ourselves happy patients will get a little bit more information on what I want here.",
|
| 27 |
+
"Creative Prompt": "We are pleased to announce the launch of the first prototype projector is bringing us to Mars Earth.\nThe mission is to be launching our new spacecrafts, which will come up with the launch of Marscraftia SpaceXicon Spacecraft and asteroid orbital spacecraft.\nWe have a mission to make Earthcraft asteroids through NASA Earth Day\u2122",
|
| 28 |
+
"Question Answering (Basic)": "As an example we've been using the same pattern threaded threading patches of new threads that can be removed from thread threads. These thread threads were used to thread thread thread threads removed them onto thread threads or thread threads. It is threadbare threads thread threads thread thread thread threads for thread thread thread threads when thread thread threads thread thread threadbone thread thread threads thread",
|
| 29 |
+
"Code Generation (Simple Python)": "We are looking forward to seeing us in the future today! This is one of our favourite gameplaying gameplayers! We have been lucky enough to play this game when we come back to the point where we need to learn how to get started, but what happens after we gotta go.\nWe had a great day ahead of time. It was fun",
|
| 30 |
+
"Reasoning (Simple)": "The time of day we were trying to get our latest updates. It\u2019s been amazed because we are going to see all the way upcoming events happening in Europe but hopefully we know some new people have lost their lives!\nIn recent years as they go on to see what happens when we are doing.\nThe biggest event has been so far away from the start"
|
| 31 |
},
|
| 32 |
+
"last_update_time": "2025-05-08 15:36:17 UTC",
|
| 33 |
+
"datasets_processed_count": 1,
|
| 34 |
+
"texts_processed_count": 6,
|
| 35 |
+
"tokens_processed_count": 3072,
|
| 36 |
"lighteval_results": {}
|
| 37 |
}
|