Upload Token-Choice-NoLB_retrain_results.json with huggingface_hub
Browse files
Token-Choice-NoLB_retrain_results.json
CHANGED
|
@@ -1,19 +1,19 @@
|
|
| 1 |
{
|
| 2 |
"model_name": "Token-Choice-NoLB",
|
| 3 |
"train_losses": [
|
| 4 |
-
1.
|
| 5 |
-
1.
|
| 6 |
],
|
| 7 |
"val_losses": [
|
| 8 |
-
1.
|
| 9 |
-
1.
|
| 10 |
],
|
| 11 |
"retrain_epochs": 2,
|
| 12 |
"retrain_samples": 1000,
|
| 13 |
"original_model": "AKG2/sparse-moe-Token-Choice-NoLB",
|
| 14 |
"target_repo": "J10Official/sparse-moe-Token-Choice-NoLB",
|
| 15 |
-
"final_train_loss": 1.
|
| 16 |
-
"final_val_loss": 1.
|
| 17 |
"total_epochs": 2,
|
| 18 |
"account_info": {
|
| 19 |
"source_account": "AKG2",
|
|
|
|
| 1 |
{
|
| 2 |
"model_name": "Token-Choice-NoLB",
|
| 3 |
"train_losses": [
|
| 4 |
+
1.505009480885097,
|
| 5 |
+
1.4836681816313002
|
| 6 |
],
|
| 7 |
"val_losses": [
|
| 8 |
+
1.7107005669520452,
|
| 9 |
+
1.7021628801639264
|
| 10 |
],
|
| 11 |
"retrain_epochs": 2,
|
| 12 |
"retrain_samples": 1000,
|
| 13 |
"original_model": "AKG2/sparse-moe-Token-Choice-NoLB",
|
| 14 |
"target_repo": "J10Official/sparse-moe-Token-Choice-NoLB",
|
| 15 |
+
"final_train_loss": 1.4836681816313002,
|
| 16 |
+
"final_val_loss": 1.7021628801639264,
|
| 17 |
"total_epochs": 2,
|
| 18 |
"account_info": {
|
| 19 |
"source_account": "AKG2",
|