jnjj committed on
Commit
5614daa
·
verified ·
1 Parent(s): a2a12c0

Periodic upload

Browse files
Files changed (5) hide show
  1. README.md +4 -4
  2. model.safetensors +1 -1
  3. special_tokens_map.json +7 -1
  4. tokenizer.json +1 -10
  5. training.log +11 -0
README.md CHANGED
@@ -9,7 +9,7 @@ library_name: transformers
9
 
10
  ## Progreso de Entrenamiento
11
 
12
- - **Datasets procesados:** 0.0
13
- - **Ejemplos de texto procesados:** 0.0
14
- - **Tokens procesados:** 0.0
15
- - **Última subida:** 2025-05-06 14:31:08 UTC
 
9
 
10
  ## Progreso de Entrenamiento
11
 
12
+ - **Datasets procesados:** 3.0
13
+ - **Ejemplos de texto procesados:** 9.0
14
+ - **Tokens procesados:** 4434.0
15
+ - **Última subida:** 2025-05-06 14:32:12 UTC
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ee3ef577587882ee849f7128857a15ba4dd2c5885c6d189bf033b15f343182f5
3
  size 51957256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ec694330f318cc4748e5749da1919ab636e66c0dbdcbd15b60aae6061228e77
3
  size 51957256
special_tokens_map.json CHANGED
@@ -13,7 +13,13 @@
13
  "rstrip": false,
14
  "single_word": false
15
  },
16
- "pad_token": "</s>",
 
 
 
 
 
 
17
  "unk_token": {
18
  "content": "<unk>",
19
  "lstrip": false,
 
13
  "rstrip": false,
14
  "single_word": false
15
  },
16
+ "pad_token": {
17
+ "content": "</s>",
18
+ "lstrip": false,
19
+ "normalized": true,
20
+ "rstrip": false,
21
+ "single_word": false
22
+ },
23
  "unk_token": {
24
  "content": "<unk>",
25
  "lstrip": false,
tokenizer.json CHANGED
@@ -6,16 +6,7 @@
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
- "padding": {
10
- "strategy": {
11
- "Fixed": 512
12
- },
13
- "direction": "Left",
14
- "pad_to_multiple_of": null,
15
- "pad_id": 2,
16
- "pad_type_id": 0,
17
- "pad_token": "</s>"
18
- },
19
  "added_tokens": [
20
  {
21
  "id": 0,
 
6
  "strategy": "LongestFirst",
7
  "stride": 0
8
  },
9
+ "padding": null,
 
 
 
 
 
 
 
 
 
10
  "added_tokens": [
11
  {
12
  "id": 0,
training.log CHANGED
@@ -7,3 +7,14 @@
7
  2025-05-06 16:30:41,433 INFO: HTTP Request: HEAD http://localhost:7860/ "HTTP/1.1 200 OK"
8
  2025-05-06 16:31:07,974 INFO: Fetched 379843 datasets to process.
9
  2025-05-06 16:31:08,585 INFO: Preparing data for nvidia/Nemotron-CrossThink, config: default
 
 
 
 
 
 
 
 
 
 
 
 
7
  2025-05-06 16:30:41,433 INFO: HTTP Request: HEAD http://localhost:7860/ "HTTP/1.1 200 OK"
8
  2025-05-06 16:31:07,974 INFO: Fetched 379843 datasets to process.
9
  2025-05-06 16:31:08,585 INFO: Preparing data for nvidia/Nemotron-CrossThink, config: default
10
+ 2025-05-06 16:31:12,688 INFO: Upload successful.
11
+ 2025-05-06 16:31:12,688 INFO: Preparing data for nvidia/OpenMathReasoning, config: default
12
+ 2025-05-06 16:31:14,303 INFO: Starting model update for nvidia/Nemotron-CrossThink, config: default
13
+ 2025-05-06 16:31:17,591 INFO: Finished training and saved model/tokenizer for nvidia/Nemotron-CrossThink config default
14
+ 2025-05-06 16:31:17,595 ERROR: Error in background_training_loop task scheduling: local variable 'merged_model' referenced before assignment
15
+ 2025-05-06 16:31:17,970 INFO: Preparing data for nvidia/OpenCodeReasoning, config: split_0
16
+ 2025-05-06 16:31:18,439 INFO: Starting model update for nvidia/OpenMathReasoning, config: default
17
+ 2025-05-06 16:31:21,695 INFO: Finished training and saved model/tokenizer for nvidia/OpenMathReasoning config default
18
+ 2025-05-06 16:31:21,776 ERROR: Failed to get configs for rajpurkarlab/ReXGradient-160K: Dataset 'rajpurkarlab/ReXGradient-160K' is a gated dataset on the Hub. Visit the dataset page at https://huggingface.co/datasets/rajpurkarlab/ReXGradient-160K to ask for access.
19
+ 2025-05-06 16:31:29,921 INFO: Starting model update for nvidia/OpenCodeReasoning, config: split_0
20
+ 2025-05-06 16:31:39,156 INFO: Finished training and saved model/tokenizer for nvidia/OpenCodeReasoning config split_0