Periodic upload
Browse files- README.md +4 -4
- model.safetensors +1 -1
- special_tokens_map.json +7 -1
- tokenizer.json +1 -10
- training.log +11 -0
README.md
CHANGED
|
@@ -9,7 +9,7 @@ library_name: transformers
|
|
| 9 |
|
| 10 |
## Progreso de Entrenamiento
|
| 11 |
|
| 12 |
-
- **Datasets procesados:**
|
| 13 |
-
- **Ejemplos de texto procesados:**
|
| 14 |
-
- **Tokens procesados:**
|
| 15 |
-
- **Última subida:** 2025-05-06 14:
|
|
|
|
| 9 |
|
| 10 |
## Progreso de Entrenamiento
|
| 11 |
|
| 12 |
+
- **Datasets procesados:** 3.0
|
| 13 |
+
- **Ejemplos de texto procesados:** 9.0
|
| 14 |
+
- **Tokens procesados:** 4434.0
|
| 15 |
+
- **Última subida:** 2025-05-06 14:32:12 UTC
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 51957256
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:5ec694330f318cc4748e5749da1919ab636e66c0dbdcbd15b60aae6061228e77
|
| 3 |
size 51957256
|
special_tokens_map.json
CHANGED
|
@@ -13,7 +13,13 @@
|
|
| 13 |
"rstrip": false,
|
| 14 |
"single_word": false
|
| 15 |
},
|
| 16 |
-
"pad_token":
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 17 |
"unk_token": {
|
| 18 |
"content": "<unk>",
|
| 19 |
"lstrip": false,
|
|
|
|
| 13 |
"rstrip": false,
|
| 14 |
"single_word": false
|
| 15 |
},
|
| 16 |
+
"pad_token": {
|
| 17 |
+
"content": "</s>",
|
| 18 |
+
"lstrip": false,
|
| 19 |
+
"normalized": true,
|
| 20 |
+
"rstrip": false,
|
| 21 |
+
"single_word": false
|
| 22 |
+
},
|
| 23 |
"unk_token": {
|
| 24 |
"content": "<unk>",
|
| 25 |
"lstrip": false,
|
tokenizer.json
CHANGED
|
@@ -6,16 +6,7 @@
|
|
| 6 |
"strategy": "LongestFirst",
|
| 7 |
"stride": 0
|
| 8 |
},
|
| 9 |
-
"padding":
|
| 10 |
-
"strategy": {
|
| 11 |
-
"Fixed": 512
|
| 12 |
-
},
|
| 13 |
-
"direction": "Left",
|
| 14 |
-
"pad_to_multiple_of": null,
|
| 15 |
-
"pad_id": 2,
|
| 16 |
-
"pad_type_id": 0,
|
| 17 |
-
"pad_token": "</s>"
|
| 18 |
-
},
|
| 19 |
"added_tokens": [
|
| 20 |
{
|
| 21 |
"id": 0,
|
|
|
|
| 6 |
"strategy": "LongestFirst",
|
| 7 |
"stride": 0
|
| 8 |
},
|
| 9 |
+
"padding": null,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 10 |
"added_tokens": [
|
| 11 |
{
|
| 12 |
"id": 0,
|
training.log
CHANGED
|
@@ -7,3 +7,14 @@
|
|
| 7 |
2025-05-06 16:30:41,433 INFO: HTTP Request: HEAD http://localhost:7860/ "HTTP/1.1 200 OK"
|
| 8 |
2025-05-06 16:31:07,974 INFO: Fetched 379843 datasets to process.
|
| 9 |
2025-05-06 16:31:08,585 INFO: Preparing data for nvidia/Nemotron-CrossThink, config: default
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 7 |
2025-05-06 16:30:41,433 INFO: HTTP Request: HEAD http://localhost:7860/ "HTTP/1.1 200 OK"
|
| 8 |
2025-05-06 16:31:07,974 INFO: Fetched 379843 datasets to process.
|
| 9 |
2025-05-06 16:31:08,585 INFO: Preparing data for nvidia/Nemotron-CrossThink, config: default
|
| 10 |
+
2025-05-06 16:31:12,688 INFO: Upload successful.
|
| 11 |
+
2025-05-06 16:31:12,688 INFO: Preparing data for nvidia/OpenMathReasoning, config: default
|
| 12 |
+
2025-05-06 16:31:14,303 INFO: Starting model update for nvidia/Nemotron-CrossThink, config: default
|
| 13 |
+
2025-05-06 16:31:17,591 INFO: Finished training and saved model/tokenizer for nvidia/Nemotron-CrossThink config default
|
| 14 |
+
2025-05-06 16:31:17,595 ERROR: Error in background_training_loop task scheduling: local variable 'merged_model' referenced before assignment
|
| 15 |
+
2025-05-06 16:31:17,970 INFO: Preparing data for nvidia/OpenCodeReasoning, config: split_0
|
| 16 |
+
2025-05-06 16:31:18,439 INFO: Starting model update for nvidia/OpenMathReasoning, config: default
|
| 17 |
+
2025-05-06 16:31:21,695 INFO: Finished training and saved model/tokenizer for nvidia/OpenMathReasoning config default
|
| 18 |
+
2025-05-06 16:31:21,776 ERROR: Failed to get configs for rajpurkarlab/ReXGradient-160K: Dataset 'rajpurkarlab/ReXGradient-160K' is a gated dataset on the Hub. Visit the dataset page at https://huggingface.co/datasets/rajpurkarlab/ReXGradient-160K to ask for access.
|
| 19 |
+
2025-05-06 16:31:29,921 INFO: Starting model update for nvidia/OpenCodeReasoning, config: split_0
|
| 20 |
+
2025-05-06 16:31:39,156 INFO: Finished training and saved model/tokenizer for nvidia/OpenCodeReasoning config split_0
|