Periodic upload
Browse files- README.md +4 -4
- model.safetensors +1 -1
- training.log +59 -0
README.md
CHANGED
|
@@ -9,7 +9,7 @@ library_name: transformers
|
|
| 9 |
|
| 10 |
## Progreso de Entrenamiento
|
| 11 |
|
| 12 |
-
- **Datasets procesados:**
|
| 13 |
-
- **Ejemplos de texto procesados:**
|
| 14 |
-
- **Tokens procesados:**
|
| 15 |
-
- **Última subida:** 2025-05-06 14:
|
|
|
|
| 9 |
|
| 10 |
## Progreso de Entrenamiento
|
| 11 |
|
| 12 |
+
- **Datasets procesados:** 9.0
|
| 13 |
+
- **Ejemplos de texto procesados:** 27.0
|
| 14 |
+
- **Tokens procesados:** 10676.0
|
| 15 |
+
- **Última subida:** 2025-05-06 14:34:18 UTC
|
model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 51957256
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:260d4fa77856dc2ee64e872ada25b5c99b1b68cd1da1ef8bfa558f36fbb2e4ae
|
| 3 |
size 51957256
|
training.log
CHANGED
|
@@ -81,3 +81,62 @@ Traceback (most recent call last):
|
|
| 81 |
File "pyarrow/error.pxi", line 155, in pyarrow.lib.pyarrow_internal_check_status
|
| 82 |
File "pyarrow/error.pxi", line 92, in pyarrow.lib.check_status
|
| 83 |
pyarrow.lib.ArrowInvalid: JSON parse error: Invalid value. in row 0
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 81 |
File "pyarrow/error.pxi", line 155, in pyarrow.lib.pyarrow_internal_check_status
|
| 82 |
File "pyarrow/error.pxi", line 92, in pyarrow.lib.check_status
|
| 83 |
pyarrow.lib.ArrowInvalid: JSON parse error: Invalid value. in row 0
|
| 84 |
+
2025-05-06 16:33:18,163 INFO: Upload successful.
|
| 85 |
+
2025-05-06 16:33:22,552 INFO: Preparing data for Eureka-Lab/PHYBench, config: default
|
| 86 |
+
2025-05-06 16:33:22,655 INFO: Preparing data for nyuuzyou/svgfind, config: default
|
| 87 |
+
2025-05-06 16:33:24,226 INFO: Starting model update for Eureka-Lab/PHYBench, config: default
|
| 88 |
+
2025-05-06 16:33:25,829 ERROR: Error during data preparation for nyuuzyou/svgfind config default: Compression type zstd not supported
|
| 89 |
+
Traceback (most recent call last):
|
| 90 |
+
File "/home/user/app/app.py", line 233, in process_and_train
|
| 91 |
+
first_item = await asyncio.to_thread(lambda: next(iter(train_ds_instance), None))
|
| 92 |
+
File "/usr/local/lib/python3.10/asyncio/threads.py", line 25, in to_thread
|
| 93 |
+
return await loop.run_in_executor(None, func_call)
|
| 94 |
+
File "/usr/local/lib/python3.10/concurrent/futures/thread.py", line 58, in run
|
| 95 |
+
result = self.fn(*self.args, **self.kwargs)
|
| 96 |
+
File "/home/user/app/app.py", line 233, in <lambda>
|
| 97 |
+
first_item = await asyncio.to_thread(lambda: next(iter(train_ds_instance), None))
|
| 98 |
+
File "/usr/local/lib/python3.10/site-packages/datasets/iterable_dataset.py", line 2266, in __iter__
|
| 99 |
+
for key, example in ex_iterable:
|
| 100 |
+
File "/usr/local/lib/python3.10/site-packages/datasets/iterable_dataset.py", line 222, in __iter__
|
| 101 |
+
for key_example in islice(self.generate_examples_fn(**gen_kwags), shard_example_idx_start, None):
|
| 102 |
+
File "/usr/local/lib/python3.10/site-packages/datasets/packaged_modules/generator/generator.py", line 33, in _generate_examples
|
| 103 |
+
yield from enumerate(self.config.generator(**gen_kwargs))
|
| 104 |
+
File "/home/user/app/app.py", line 214, in gen_data_for_cfg
|
| 105 |
+
for ex in dataset_split:
|
| 106 |
+
File "/usr/local/lib/python3.10/site-packages/datasets/iterable_dataset.py", line 2266, in __iter__
|
| 107 |
+
for key, example in ex_iterable:
|
| 108 |
+
File "/usr/local/lib/python3.10/site-packages/datasets/iterable_dataset.py", line 302, in __iter__
|
| 109 |
+
for key, pa_table in self.generate_tables_fn(**gen_kwags):
|
| 110 |
+
File "/usr/local/lib/python3.10/site-packages/datasets/packaged_modules/json/json.py", line 99, in _generate_tables
|
| 111 |
+
for file_idx, file in enumerate(itertools.chain.from_iterable(files)):
|
| 112 |
+
File "/usr/local/lib/python3.10/site-packages/datasets/utils/track.py", line 49, in __iter__
|
| 113 |
+
for x in self.generator(*self.args):
|
| 114 |
+
File "/usr/local/lib/python3.10/site-packages/datasets/utils/file_utils.py", line 1366, in _iter_from_urlpaths
|
| 115 |
+
elif xisdir(urlpath, download_config=download_config):
|
| 116 |
+
File "/usr/local/lib/python3.10/site-packages/datasets/utils/file_utils.py", line 799, in xisdir
|
| 117 |
+
return fs.isdir(inner_path)
|
| 118 |
+
File "/usr/local/lib/python3.10/site-packages/fsspec/spec.py", line 701, in isdir
|
| 119 |
+
return self.info(path)["type"] == "directory"
|
| 120 |
+
File "/usr/local/lib/python3.10/site-packages/fsspec/archive.py", line 40, in info
|
| 121 |
+
self._get_dirs()
|
| 122 |
+
File "/usr/local/lib/python3.10/site-packages/datasets/filesystems/compression.py", line 66, in _get_dirs
|
| 123 |
+
f = {**self._open_with_fsspec().fs.info(self.fo), "name": self.uncompressed_name}
|
| 124 |
+
File "/usr/local/lib/python3.10/site-packages/fsspec/core.py", line 491, in open
|
| 125 |
+
out = open_files(
|
| 126 |
+
File "/usr/local/lib/python3.10/site-packages/fsspec/core.py", line 314, in open_files
|
| 127 |
+
[
|
| 128 |
+
File "/usr/local/lib/python3.10/site-packages/fsspec/core.py", line 315, in <listcomp>
|
| 129 |
+
OpenFile(
|
| 130 |
+
File "/usr/local/lib/python3.10/site-packages/fsspec/core.py", line 78, in __init__
|
| 131 |
+
self.compression = get_compression(path, compression)
|
| 132 |
+
File "/usr/local/lib/python3.10/site-packages/fsspec/core.py", line 544, in get_compression
|
| 133 |
+
raise ValueError(f"Compression type {compression} not supported")
|
| 134 |
+
ValueError: Compression type zstd not supported
|
| 135 |
+
2025-05-06 16:33:27,737 INFO: Finished training and saved model/tokenizer for Eureka-Lab/PHYBench config default
|
| 136 |
+
2025-05-06 16:33:27,738 ERROR: Error in background_training_loop task scheduling: local variable 'merged_model' referenced before assignment
|
| 137 |
+
2025-05-06 16:33:28,089 INFO: Preparing data for FreedomIntelligence/medical-o1-reasoning-SFT, config: en
|
| 138 |
+
2025-05-06 16:33:28,153 INFO: Preparing data for BramVanroy/CommonCrawl-CreativeCommons, config: v1
|
| 139 |
+
2025-05-06 16:33:32,653 INFO: Starting model update for FreedomIntelligence/medical-o1-reasoning-SFT, config: en
|
| 140 |
+
2025-05-06 16:33:36,683 INFO: Finished training and saved model/tokenizer for FreedomIntelligence/medical-o1-reasoning-SFT config en
|
| 141 |
+
2025-05-06 16:33:36,683 INFO: Starting model update for BramVanroy/CommonCrawl-CreativeCommons, config: v1
|
| 142 |
+
2025-05-06 16:33:38,967 INFO: Finished training and saved model/tokenizer for BramVanroy/CommonCrawl-CreativeCommons config v1
|