Upload add_sub_sorl_v1_abs30_K1_10K_1L2H256d
Browse files
add_sub_sorl_v1_abs30_K1_10K_1L2H256d/train_config.json
CHANGED
|
@@ -70,14 +70,14 @@
|
|
| 70 |
"n_params": 78706688,
|
| 71 |
"run_name": "add_sub_sorl_v1_abs30_K1_10K_1L2H256d",
|
| 72 |
"git_commit": "17e935f460a7f9595b705c1d614101a6b0e520f7",
|
| 73 |
-
"timestamp": "2026-04-14T06:
|
| 74 |
"tokenizer": "Qwen/Qwen3-0.6B",
|
| 75 |
"dataset_repo": "thoughtworks/arithmetic-sorl-data",
|
| 76 |
"dataset_config": "add_sub_6digit",
|
| 77 |
"model_repo": "thoughtworks/arithmetic-sorl",
|
| 78 |
"trainer_version": "v1",
|
| 79 |
-
"wandb_run_id": "
|
| 80 |
-
"wandb_url": "https://wandb.ai/nlp_and_interpretability/sorl-arithmetic/runs/
|
| 81 |
"final_accuracy": 0.004166666666666667,
|
| 82 |
"sft_accuracy": 0.00375,
|
| 83 |
"eval_method": "ArithmeticEvaluator"
|
|
|
|
| 70 |
"n_params": 78706688,
|
| 71 |
"run_name": "add_sub_sorl_v1_abs30_K1_10K_1L2H256d",
|
| 72 |
"git_commit": "17e935f460a7f9595b705c1d614101a6b0e520f7",
|
| 73 |
+
"timestamp": "2026-04-14T06:43:49.081569+00:00",
|
| 74 |
"tokenizer": "Qwen/Qwen3-0.6B",
|
| 75 |
"dataset_repo": "thoughtworks/arithmetic-sorl-data",
|
| 76 |
"dataset_config": "add_sub_6digit",
|
| 77 |
"model_repo": "thoughtworks/arithmetic-sorl",
|
| 78 |
"trainer_version": "v1",
|
| 79 |
+
"wandb_run_id": "of7o17e5",
|
| 80 |
+
"wandb_url": "https://wandb.ai/nlp_and_interpretability/sorl-arithmetic/runs/of7o17e5",
|
| 81 |
"final_accuracy": 0.004166666666666667,
|
| 82 |
"sft_accuracy": 0.00375,
|
| 83 |
"eval_method": "ArithmeticEvaluator"
|