rahul7star commited on
Commit
342360f
Β·
verified Β·
1 Parent(s): 5e2ce82

Chatterbox fine-tuned model + logs

Browse files
Files changed (1) hide show
  1. training.log +475 -161
training.log CHANGED
@@ -5,199 +5,513 @@ Resolved paths:
5
 
6
  Starting training...
7
 
8
- 02/10/2026 03:45:28 - INFO - __main__ - Training/evaluation parameters CustomTrainingArguments(
9
- accelerator_config={'split_batches': False, 'dispatch_batches': None, 'even_batches': True, 'use_seedable_sampler': True, 'non_blocking': False, 'gradient_accumulation_kwargs': None, 'use_configured_state': False},
10
- adam_beta1=0.9,
11
- adam_beta2=0.999,
12
- adam_epsilon=1e-08,
13
- auto_find_batch_size=False,
14
- average_tokens_across_devices=True,
15
- batch_eval_metrics=False,
16
- bf16=False,
17
- bf16_full_eval=False,
18
- data_seed=None,
19
- dataloader_drop_last=False,
20
- dataloader_num_workers=8,
21
- dataloader_persistent_workers=False,
22
- dataloader_pin_memory=False,
23
- dataloader_prefetch_factor=None,
24
- ddp_backend=None,
25
- ddp_broadcast_buffers=None,
26
- ddp_bucket_cap_mb=None,
27
- ddp_find_unused_parameters=None,
28
- ddp_timeout=1800,
29
- debug=[],
30
- deepspeed=None,
31
- disable_tqdm=False,
32
- do_eval=True,
33
- do_predict=False,
34
- do_train=True,
35
- early_stopping_patience=None,
36
- enable_jit_checkpoint=False,
37
- eval_accumulation_steps=None,
38
- eval_delay=0,
39
- eval_do_concat_batches=True,
40
- eval_on_start=True,
41
- eval_steps=2,
42
- eval_strategy=IntervalStrategy.STEPS,
43
- eval_use_gather_object=False,
44
- fp16=True,
45
- fp16_full_eval=False,
46
- fsdp=[],
47
- fsdp_config={'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False},
48
- full_determinism=False,
49
- gradient_accumulation_steps=1,
50
- gradient_checkpointing=False,
51
- gradient_checkpointing_kwargs=None,
52
- greater_is_better=None,
53
- group_by_length=False,
54
- hub_always_push=False,
55
- hub_model_id=None,
56
- hub_private_repo=None,
57
- hub_revision=None,
58
- hub_strategy=HubStrategy.EVERY_SAVE,
59
- hub_token=<HUB_TOKEN>,
60
- ignore_data_skip=False,
61
- include_for_metrics=[],
62
- include_num_input_tokens_seen=no,
63
- label_names=['labels_speech'],
64
- label_smoothing_factor=0.0,
65
- learning_rate=5e-05,
66
- length_column_name=length,
67
- liger_kernel_config=None,
68
- load_best_model_at_end=False,
69
- local_rank=-1,
70
- log_level=passive,
71
- log_level_replica=warning,
72
- log_on_each_node=True,
73
- logging_dir=None,
74
- logging_first_step=False,
75
- logging_nan_inf_filter=True,
76
- logging_steps=1.0,
77
- logging_strategy=IntervalStrategy.STEPS,
78
- lr_scheduler_kwargs=None,
79
- lr_scheduler_type=SchedulerType.LINEAR,
80
- max_grad_norm=1.0,
81
- max_steps=-1,
82
- metric_for_best_model=None,
83
- neftune_noise_alpha=None,
84
- num_train_epochs=1.0,
85
- optim=OptimizerNames.ADAMW_TORCH_FUSED,
86
- optim_args=None,
87
- optim_target_modules=None,
88
- output_dir=/app/checkpoints/v1,
89
- parallelism_config=None,
90
- per_device_eval_batch_size=8,
91
- per_device_train_batch_size=1,
92
- prediction_loss_only=False,
93
- project=huggingface,
94
- push_to_hub=False,
95
- remove_unused_columns=True,
96
- report_to=['tensorboard'],
97
- restore_callback_states_from_checkpoint=False,
98
- resume_from_checkpoint=None,
99
- run_name=None,
100
- save_on_each_node=False,
101
- save_only_model=False,
102
- save_steps=1.0,
103
- save_strategy=SaveStrategy.STEPS,
104
- save_total_limit=1,
105
- seed=42,
106
- skip_memory_metrics=True,
107
- tf32=None,
108
- torch_compile=False,
109
- torch_compile_backend=None,
110
- torch_compile_mode=None,
111
- torch_empty_cache_steps=None,
112
- trackio_space_id=trackio,
113
- use_cache=False,
114
- use_cpu=False,
115
- use_liger_kernel=False,
116
- warmup_ratio=None,
117
- warmup_steps=1.0,
118
- weight_decay=0.0,
119
- )
120
- 02/10/2026 03:45:28 - INFO - __main__ - Model parameters ModelArguments(model_name_or_path='/app/hf_cache/models--ResembleAI--chatterbox/snapshots/05e904af2b5c7f8e482687a9d7336c5c824467d9', local_model_dir=None, cache_dir=None, freeze_voice_encoder=True, freeze_s3gen=True)
121
- 02/10/2026 03:45:28 - INFO - __main__ - Data parameters DataArguments(language='hi', dataset_dir=None, metadata_file=None, dataset_name='rahul7star/hindi-speech-dataset', dataset_config_name=None, train_split_name='train', eval_split_name='validation', text_column_name='transcript', audio_column_name='audio', max_text_len=256, max_speech_len=800, audio_prompt_duration_s=3.0, eval_split_size=0.0002, preprocessing_num_workers=None, ignore_verifications=False)
122
- 02/10/2026 03:45:28 - INFO - __main__ - Loading ChatterboxTTS model...
123
- 02/10/2026 03:45:28 - INFO - __main__ - Loading model from Hugging Face Hub: /app/hf_cache/models--ResembleAI--chatterbox/snapshots/05e904af2b5c7f8e482687a9d7336c5c824467d9
124
- 02/10/2026 03:45:28 - WARNING - __main__ - Could not download ve.safetensors from /app/hf_cache/models--ResembleAI--chatterbox/snapshots/05e904af2b5c7f8e482687a9d7336c5c824467d9: Repo id must be in the form 'repo_name' or 'namespace/repo_name': '/app/hf_cache/models--ResembleAI--chatterbox/snapshots/05e904af2b5c7f8e482687a9d7336c5c824467d9'. Use `repo_type` argument if needed..
125
- 02/10/2026 03:45:28 - WARNING - __main__ - Could not download t3_mtl23ls_v2.safetensors from /app/hf_cache/models--ResembleAI--chatterbox/snapshots/05e904af2b5c7f8e482687a9d7336c5c824467d9: Repo id must be in the form 'repo_name' or 'namespace/repo_name': '/app/hf_cache/models--ResembleAI--chatterbox/snapshots/05e904af2b5c7f8e482687a9d7336c5c824467d9'. Use `repo_type` argument if needed..
126
- 02/10/2026 03:45:28 - WARNING - __main__ - Could not download s3gen.safetensors from /app/hf_cache/models--ResembleAI--chatterbox/snapshots/05e904af2b5c7f8e482687a9d7336c5c824467d9: Repo id must be in the form 'repo_name' or 'namespace/repo_name': '/app/hf_cache/models--ResembleAI--chatterbox/snapshots/05e904af2b5c7f8e482687a9d7336c5c824467d9'. Use `repo_type` argument if needed..
127
- 02/10/2026 03:45:28 - WARNING - __main__ - Could not download mtl_tokenizer.json from /app/hf_cache/models--ResembleAI--chatterbox/snapshots/05e904af2b5c7f8e482687a9d7336c5c824467d9: Repo id must be in the form 'repo_name' or 'namespace/repo_name': '/app/hf_cache/models--ResembleAI--chatterbox/snapshots/05e904af2b5c7f8e482687a9d7336c5c824467d9'. Use `repo_type` argument if needed..
128
- 02/10/2026 03:45:28 - INFO - __main__ - conds.pt not found on Hub or failed to download for this model.
129
- 02/10/2026 03:45:28 - INFO - httpx - HTTP Request: GET https://huggingface.co/api/models/ResembleAI/chatterbox/revision/main "HTTP/1.1 200 OK"
130
 
131
 
132
- Downloading (incomplete total...): 0.00B [00:00, ?B/s]
 
133
 
134
- Fetching 5 files: 0%| | 0/5 [00:00<?, ?it/s]02/10/2026 03:45:28 - INFO - httpx - HTTP Request: HEAD https://huggingface.co/ResembleAI/chatterbox/resolve/05e904af2b5c7f8e482687a9d7336c5c824467d9/conds.pt "HTTP/1.1 302 Found"
135
- 02/10/2026 03:45:28 - INFO - httpx - HTTP Request: HEAD https://huggingface.co/ResembleAI/chatterbox/resolve/05e904af2b5c7f8e482687a9d7336c5c824467d9/grapheme_mtl_merged_expanded_v1.json "HTTP/1.1 307 Temporary Redirect"
136
- 02/10/2026 03:45:28 - INFO - httpx - HTTP Request: HEAD https://huggingface.co/ResembleAI/chatterbox/resolve/05e904af2b5c7f8e482687a9d7336c5c824467d9/s3gen.pt "HTTP/1.1 302 Found"
137
- 02/10/2026 03:45:28 - INFO - httpx - HTTP Request: HEAD https://huggingface.co/ResembleAI/chatterbox/resolve/05e904af2b5c7f8e482687a9d7336c5c824467d9/ve.pt "HTTP/1.1 302 Found"
138
- 02/10/2026 03:45:28 - INFO - httpx - HTTP Request: HEAD https://huggingface.co/ResembleAI/chatterbox/resolve/05e904af2b5c7f8e482687a9d7336c5c824467d9/t3_mtl23ls_v2.safetensors "HTTP/1.1 302 Found"
139
- 02/10/2026 03:45:28 - INFO - httpx - HTTP Request: GET https://huggingface.co/api/models/ResembleAI/chatterbox/xet-read-token/05e904af2b5c7f8e482687a9d7336c5c824467d9 "HTTP/1.1 200 OK"
140
 
 
141
 
142
- Downloading (incomplete total...): 0%| | 0.00/107k [00:00<?, ?B/s]02/10/2026 03:45:28 - INFO - httpx - HTTP Request: HEAD https://huggingface.co/api/resolve-cache/models/ResembleAI/chatterbox/05e904af2b5c7f8e482687a9d7336c5c824467d9/grapheme_mtl_merged_expanded_v1.json "HTTP/1.1 200 OK"
143
- 02/10/2026 03:45:28 - INFO - httpx - HTTP Request: GET https://huggingface.co/api/models/ResembleAI/chatterbox/xet-read-token/05e904af2b5c7f8e482687a9d7336c5c824467d9 "HTTP/1.1 200 OK"
144
 
 
145
 
146
- Downloading (incomplete total...): 0%| | 0.00/5.81M [00:00<?, ?B/s]02/10/2026 03:45:28 - INFO - httpx - HTTP Request: GET https://huggingface.co/api/models/ResembleAI/chatterbox/xet-read-token/05e904af2b5c7f8e482687a9d7336c5c824467d9 "HTTP/1.1 200 OK"
147
 
 
148
 
149
- Downloading (incomplete total...): 0%| | 0.00/1.06G [00:00<?, ?B/s]02/10/2026 03:45:28 - INFO - httpx - HTTP Request: GET https://huggingface.co/api/models/ResembleAI/chatterbox/xet-read-token/05e904af2b5c7f8e482687a9d7336c5c824467d9 "HTTP/1.1 200 OK"
 
150
 
 
151
 
152
- Downloading (incomplete total...): 0%| | 0.00/3.21G [00:00<?, ?B/s]02/10/2026 03:45:28 - INFO - httpx - HTTP Request: GET https://huggingface.co/api/resolve-cache/models/ResembleAI/chatterbox/05e904af2b5c7f8e482687a9d7336c5c824467d9/grapheme_mtl_merged_expanded_v1.json "HTTP/1.1 200 OK"
153
 
 
 
154
 
155
- Downloading (incomplete total...): 0%| | 0.00/3.21G [00:00<?, ?B/s]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
156
 
157
- Downloading (incomplete total...): 0%| | 13.5M/3.21G [00:01<07:02, 7.56MB/s]
158
 
159
- Downloading (incomplete total...): 3%|β–Ž | 80.6M/3.21G [00:04<02:36, 19.9MB/s]
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
160
 
161
- Downloading (incomplete total...): 7%|β–‹ | 215M/3.21G [00:05<01:06, 45.2MB/s] 
162
 
163
- Downloading (incomplete total...): 9%|β–‰ | 282M/3.21G [00:07<01:07, 43.1MB/s]
164
 
165
- Downloading (incomplete total...): 23%|β–ˆβ–ˆβ–Ž | 743M/3.21G [00:08<00:17, 142MB/s] 
166
 
167
- Downloading (incomplete total...): 50%|β–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 1.59G/3.21G [00:09<00:05, 308MB/s]
168
 
169
- Fetching 5 files: 60%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 3/5 [00:10<00:06, 3.44s/it]
170
 
171
- Downloading (incomplete total...): 73%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 2.35G/3.21G [00:10<00:02, 424MB/s]
172
- Fetching 5 files: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 5/5 [00:11<00:00, 2.22s/it]
173
 
174
 
175
- Download complete: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 3.21G/3.21G [00:11<00:00, 424MB/s] 
176
- Download complete: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 3.21G/3.21G [00:16<00:00, 189MB/s]
177
  /usr/local/lib/python3.13/site-packages/diffusers/models/lora.py:393: FutureWarning: `LoRACompatibleLinear` is deprecated and will be removed in version 1.0.0. Use of `LoRACompatibleLinear` is deprecated. Please switch to PEFT backend by installing PEFT: `pip install peft`.
178
  deprecate("LoRACompatibleLinear", "1.0.0", deprecation_message)
179
- 02/10/2026 03:45:46 - INFO - root - input frame rate=25
180
- 02/10/2026 03:45:47 - INFO - httpx - HTTP Request: HEAD https://huggingface.co/ResembleAI/chatterbox/resolve/main/Cangjie5_TC.json "HTTP/1.1 307 Temporary Redirect"
181
- 02/10/2026 03:45:47 - INFO - httpx - HTTP Request: HEAD https://huggingface.co/api/resolve-cache/models/ResembleAI/chatterbox/05e904af2b5c7f8e482687a9d7336c5c824467d9/Cangjie5_TC.json "HTTP/1.1 200 OK"
182
- 02/10/2026 03:45:47 - INFO - httpx - HTTP Request: GET https://huggingface.co/api/resolve-cache/models/ResembleAI/chatterbox/05e904af2b5c7f8e482687a9d7336c5c824467d9/Cangjie5_TC.json "HTTP/1.1 200 OK"
183
 
184
 
185
  Cangjie5_TC.json: 0%| | 0.00/1.92M [00:00<?, ?B/s]
186
- Cangjie5_TC.json: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.92M/1.92M [00:00<00:00, 19.7MB/s]
187
  Downloading: "https://github.com/explosion/spacy-pkuseg/releases/download/v0.0.26/spacy_ontonotes.zip" to /root/.pkuseg/spacy_ontonotes.zip
188
 
189
 
190
  0%| | 0/34567143 [00:00<?, ?it/s]
191
- 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 34567143/34567143 [00:00<00:00, 164494667.16it/s]
192
- 02/10/2026 03:45:49 - INFO - __main__ - Voice Encoder frozen.
193
- 02/10/2026 03:45:49 - INFO - __main__ - S3Gen model frozen.
194
- 02/10/2026 03:45:49 - INFO - __main__ - T3 model set to trainable.
195
- 02/10/2026 03:45:49 - INFO - __main__ - Loading and processing dataset...
196
  Traceback (most recent call last):
197
- File "/app/chatterbox-multilingual-finetuning/src/finetune_t3.py", line 860, in <module>
198
  main()
199
  ~~~~^^
200
- File "/app/chatterbox-multilingual-finetuning/src/finetune_t3.py", line 651, in main
201
- train_hf_dataset = train_hf_dataset.map(decode_audio)
202
- ^^^^^^^^^^^^^^^^
203
- UnboundLocalError: cannot access local variable 'train_hf_dataset' where it is not associated with a value
 
 
 
 
 
5
 
6
  Starting training...
7
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
8
 
9
 
10
+ README.md: 0%| | 0.00/591 [00:00<?, ?B/s]
11
+ README.md: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 591/591 [00:00<00:00, 3.34MB/s]
12
 
13
+ Downloading data: 0%| | 0/36 [00:00<?, ?files/s]
 
 
 
 
 
14
 
15
+ data/train-00000-of-00036.parquet: 0%| | 0.00/1.77G [00:00<?, ?B/s]
16
 
17
+ data/train-00000-of-00036.parquet: 0%| | 11.6k/1.77G [00:01<44:03:44, 11.1kB/s]
 
18
 
19
+ data/train-00000-of-00036.parquet: 11%|β–ˆβ– | 203M/1.77G [00:02<00:13, 117MB/s] 
20
 
21
+ data/train-00000-of-00036.parquet: 34%|β–ˆβ–ˆβ–ˆβ– | 598M/1.77G [00:03<00:04, 243MB/s]
22
 
23
+ data/train-00000-of-00036.parquet: 59%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 1.04G/1.77G [00:04<00:02, 319MB/s]
24
 
25
+ data/train-00000-of-00036.parquet: 86%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 1.52G/1.77G [00:05<00:00, 376MB/s]
26
+ data/train-00000-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.77G/1.77G [00:05<00:00, 336MB/s]
27
 
28
+ Downloading data: 3%|β–Ž | 1/36 [00:05<03:05, 5.31s/files]
29
 
30
+ data/train-00001-of-00036.parquet: 0%| | 0.00/496M [00:00<?, ?B/s]
31
 
32
+ data/train-00001-of-00036.parquet: 5%|▍ | 23.6M/496M [00:01<00:20, 23.6MB/s]
33
+ data/train-00001-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 496M/496M [00:01<00:00, 263MB/s]
34
 
35
+ Downloading data: 6%|β–Œ | 2/36 [00:07<01:52, 3.31s/files]
36
+
37
+ data/train-00002-of-00036.parquet: 0%| | 0.00/461M [00:00<?, ?B/s]
38
+
39
+ data/train-00002-of-00036.parquet: 15%|β–ˆβ– | 68.8M/461M [00:01<00:05, 68.6MB/s]
40
+ data/train-00002-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆοΏ½οΏ½οΏ½| 461M/461M [00:01<00:00, 251MB/s]
41
+
42
+ Downloading data: 8%|β–Š | 3/36 [00:09<01:27, 2.65s/files]
43
+
44
+ data/train-00003-of-00036.parquet: 0%| | 0.00/372M [00:00<?, ?B/s]
45
+
46
+ data/train-00003-of-00036.parquet: 10%|β–ˆ | 37.5M/372M [00:01<00:08, 37.5MB/s]
47
+ data/train-00003-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 372M/372M [00:01<00:00, 214MB/s]
48
+
49
+ Downloading data: 11%|β–ˆ | 4/36 [00:10<01:13, 2.30s/files]
50
+
51
+ data/train-00004-of-00036.parquet: 0%| | 0.00/373M [00:00<?, ?B/s]
52
+
53
+ data/train-00004-of-00036.parquet: 10%|β–ˆ | 39.0M/373M [00:01<00:08, 38.8MB/s]
54
+ data/train-00004-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 373M/373M [00:01<00:00, 231MB/s]
55
+
56
+ Downloading data: 14%|β–ˆβ– | 5/36 [00:12<01:03, 2.06s/files]
57
+
58
+ data/train-00005-of-00036.parquet: 0%| | 0.00/841M [00:00<?, ?B/s]
59
+
60
+ data/train-00005-of-00036.parquet: 5%|▍ | 39.4M/841M [00:01<00:20, 39.4MB/s]
61
+
62
+ data/train-00005-of-00036.parquet: 39%|β–ˆβ–ˆβ–ˆβ–‰ | 330M/841M [00:02<00:02, 187MB/s] 
63
+
64
+ data/train-00005-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 841M/841M [00:03<00:00, 286MB/s]
65
+ data/train-00005-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 841M/841M [00:03<00:00, 249MB/s]
66
+
67
+ Downloading data: 17%|β–ˆβ–‹ | 6/36 [00:15<01:15, 2.52s/files]
68
+
69
+ data/train-00006-of-00036.parquet: 0%| | 0.00/837M [00:00<?, ?B/s]
70
+
71
+ data/train-00006-of-00036.parquet: 3%|β–Ž | 29.3M/837M [00:01<00:27, 29.2MB/s]
72
+
73
+ data/train-00006-of-00036.parquet: 39%|β–ˆβ–ˆβ–ˆβ–‰ | 325M/837M [00:02<00:02, 186MB/s] 
74
+
75
+ data/train-00006-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 837M/837M [00:03<00:00, 310MB/s]
76
+ data/train-00006-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 837M/837M [00:03<00:00, 264MB/s]
77
+
78
+ Downloading data: 19%|β–ˆβ–‰ | 7/36 [00:19<01:19, 2.74s/files]
79
+
80
+ data/train-00007-of-00036.parquet: 0%| | 0.00/618M [00:00<?, ?B/s]
81
+
82
+ data/train-00007-of-00036.parquet: 5%|▍ | 28.5M/618M [00:01<00:20, 28.4MB/s]
83
+
84
+ data/train-00007-of-00036.parquet: 53%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 328M/618M [00:02<00:01, 187MB/s] 
85
+
86
+ data/train-00007-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 618M/618M [00:03<00:00, 203MB/s]
87
+ data/train-00007-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 618M/618M [00:03<00:00, 185MB/s]
88
+
89
+ Downloading data: 22%|β–ˆβ–ˆβ– | 8/36 [00:22<01:22, 2.94s/files]
90
+
91
+ data/train-00008-of-00036.parquet: 0%| | 0.00/415M [00:00<?, ?B/s]
92
+
93
+ data/train-00008-of-00036.parquet: 7%|β–‹ | 30.4M/415M [00:01<00:12, 30.4MB/s]
94
+ data/train-00008-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 415M/415M [00:01<00:00, 247MB/s]
95
+
96
+ Downloading data: 25%|β–ˆβ–ˆβ–Œ | 9/36 [00:24<01:08, 2.55s/files]
97
+
98
+ data/train-00009-of-00036.parquet: 0%| | 0.00/303M [00:00<?, ?B/s]
99
+
100
+ data/train-00009-of-00036.parquet: 4%|▍ | 12.7M/303M [00:01<00:23, 12.6MB/s]
101
+ data/train-00009-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 303M/303M [00:01<00:00, 196MB/s]
102
+
103
+ Downloading data: 28%|β–ˆβ–ˆβ–Š | 10/36 [00:25<00:58, 2.25s/files]
104
+
105
+ data/train-00010-of-00036.parquet: 0%| | 0.00/341M [00:00<?, ?B/s]
106
+
107
+ data/train-00010-of-00036.parquet: 20%|β–ˆβ–‰ | 67.3M/341M [00:01<00:04, 66.8MB/s]
108
+
109
+ data/train-00010-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 341M/341M [00:02<00:00, 180MB/s] 
110
+ data/train-00010-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 341M/341M [00:02<00:00, 163MB/s]
111
+
112
+ Downloading data: 31%|β–ˆβ–ˆβ–ˆ | 11/36 [00:27<00:55, 2.21s/files]
113
+
114
+ data/train-00011-of-00036.parquet: 0%| | 0.00/440M [00:00<?, ?B/s]
115
+
116
+ data/train-00011-of-00036.parquet: 5%|▍ | 19.9M/440M [00:01<00:21, 19.9MB/s]
117
+
118
+ data/train-00011-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 440M/440M [00:02<00:00, 253MB/s] 
119
+ data/train-00011-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 440M/440M [00:02<00:00, 218MB/s]
120
+
121
+ Downloading data: 33%|β–ˆβ–ˆβ–ˆβ–Ž | 12/36 [00:29<00:52, 2.17s/files]
122
+
123
+ data/train-00012-of-00036.parquet: 0%| | 0.00/412M [00:00<?, ?B/s]
124
+
125
+ data/train-00012-of-00036.parquet: 18%|β–ˆβ–Š | 74.7M/412M [00:01<00:04, 74.5MB/s]
126
+ data/train-00012-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 412M/412M [00:01<00:00, 283MB/s]
127
+
128
+ Downloading data: 36%|β–ˆβ–ˆβ–ˆβ–Œ | 13/36 [00:31<00:45, 1.96s/files]
129
+
130
+ data/train-00013-of-00036.parquet: 0%| | 0.00/397M [00:00<?, ?B/s]
131
+
132
+ data/train-00013-of-00036.parquet: 14%|β–ˆβ– | 55.0M/397M [00:01<00:06, 54.3MB/s]
133
+ data/train-00013-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 397M/397M [00:01<00:00, 261MB/s]
134
+
135
+ Downloading data: 39%|β–ˆβ–ˆβ–ˆβ–‰ | 14/36 [00:32<00:40, 1.84s/files]
136
+
137
+ data/train-00014-of-00036.parquet: 0%| | 0.00/397M [00:00<?, ?B/s]
138
+
139
+ data/train-00014-of-00036.parquet: 7%|β–‹ | 28.0M/397M [00:01<00:13, 27.9MB/s]
140
+
141
+ data/train-00014-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 397M/397M [00:02<00:00, 185MB/s] 
142
+ data/train-00014-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 397M/397M [00:02<00:00, 165MB/s]
143
+
144
+ Downloading data: 42%|β–ˆβ–ˆβ–ˆβ–ˆβ– | 15/36 [00:35<00:42, 2.02s/files]
145
+
146
+ data/train-00015-of-00036.parquet: 0%| | 0.00/389M [00:00<?, ?B/s]
147
+
148
+ data/train-00015-of-00036.parquet: 7%|β–‹ | 26.6M/389M [00:01<00:13, 26.6MB/s]
149
+
150
+ data/train-00015-of-00036.parquet: 83%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 322M/389M [00:02<00:00, 177MB/s] 
151
+ data/train-00015-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 389M/389M [00:02<00:00, 177MB/s]
152
+
153
+ Downloading data: 44%|β–ˆβ–ˆβ–ˆβ–ˆβ– | 16/36 [00:37<00:41, 2.08s/files]
154
+
155
+ data/train-00016-of-00036.parquet: 0%| | 0.00/384M [00:00<?, ?B/s]
156
+
157
+ data/train-00016-of-00036.parquet: 11%|β–ˆβ– | 43.8M/384M [00:01<00:07, 43.7MB/s]
158
+
159
+ data/train-00016-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 384M/384M [00:02<00:00, 218MB/s] 
160
+ data/train-00016-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 384M/384M [00:02<00:00, 192MB/s]
161
+
162
+ Downloading data: 47%|β–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 17/36 [00:39<00:39, 2.06s/files]
163
+
164
+ data/train-00017-of-00036.parquet: 0%| | 0.00/441M [00:00<?, ?B/s]
165
+
166
+ data/train-00017-of-00036.parquet: 3%|β–Ž | 14.5M/441M [00:01<00:29, 14.5MB/s]
167
+
168
+ data/train-00017-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 441M/441M [00:02<00:00, 229MB/s] 
169
+ data/train-00017-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 441M/441M [00:02<00:00, 200MB/s]
170
+
171
+ Downloading data: 50%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 18/36 [00:41<00:38, 2.11s/files]
172
+
173
+ data/train-00018-of-00036.parquet: 0%| | 0.00/571M [00:00<?, ?B/s]
174
+
175
+ data/train-00018-of-00036.parquet: 4%|▍ | 24.9M/571M [00:01<00:22, 24.8MB/s]
176
+
177
+ data/train-00018-of-00036.parquet: 88%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 504M/571M [00:02<00:00, 290MB/s] 
178
+ data/train-00018-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 571M/571M [00:03<00:00, 188MB/s]
179
+
180
+ Downloading data: 53%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 19/36 [00:44<00:40, 2.40s/files]
181
+
182
+ data/train-00019-of-00036.parquet: 0%| | 0.00/413M [00:00<?, ?B/s]
183
+
184
+ data/train-00019-of-00036.parquet: 10%|β–ˆ | 41.5M/413M [00:01<00:08, 41.5MB/s]
185
+ data/train-00019-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 413M/413M [00:01<00:00, 211MB/s]
186
+
187
+ Downloading data: 56%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 20/36 [00:46<00:36, 2.27s/files]
188
+
189
+ data/train-00020-of-00036.parquet: 0%| | 0.00/417M [00:00<?, ?B/s]
190
+
191
+ data/train-00020-of-00036.parquet: 8%|β–Š | 34.8M/417M [00:01<00:11, 34.6MB/s]
192
+ data/train-00020-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 417M/417M [00:01<00:00, 234MB/s]
193
+
194
+ Downloading data: 58%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 21/36 [00:48<00:32, 2.14s/files]
195
+
196
+ data/train-00021-of-00036.parquet: 0%| | 0.00/401M [00:00<?, ?B/s]
197
+
198
+ data/train-00021-of-00036.parquet: 0%| | 26.6k/401M [00:01<4:29:15, 24.8kB/s]
199
+
200
+ data/train-00021-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 401M/401M [00:02<00:00, 189MB/s] 
201
+ data/train-00021-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 401M/401M [00:02<00:00, 164MB/s]
202
+
203
+ Downloading data: 61%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 22/36 [00:51<00:31, 2.24s/files]
204
+
205
+ data/train-00022-of-00036.parquet: 0%| | 0.00/373M [00:00<?, ?B/s]
206
+
207
+ data/train-00022-of-00036.parquet: 4%|▍ | 14.0M/373M [00:01<00:25, 14.0MB/s]
208
+ data/train-00022-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 373M/373M [00:01<00:00, 214MB/s]
209
+
210
+ Downloading data: 64%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 23/36 [00:52<00:27, 2.09s/files]
211
+
212
+ data/train-00023-of-00036.parquet: 0%| | 0.00/374M [00:00<?, ?B/s]
213
+
214
+ data/train-00023-of-00036.parquet: 0%| | 30.4k/374M [00:01<3:31:02, 29.5kB/s]
215
+
216
+ data/train-00023-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 374M/374M [00:02<00:00, 210MB/s] 
217
+ data/train-00023-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 374M/374M [00:02<00:00, 179MB/s]
218
+
219
+ Downloading data: 67%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 24/36 [00:55<00:25, 2.11s/files]
220
+
221
+ data/train-00024-of-00036.parquet: 0%| | 0.00/531M [00:00<?, ?B/s]
222
+
223
+ data/train-00024-of-00036.parquet: 4%|▍ | 21.0M/531M [00:01<00:24, 21.0MB/s]
224
+
225
+ data/train-00024-of-00036.parquet: 73%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 386M/531M [00:02<00:00, 223MB/s] 
226
+ data/train-00024-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 531M/531M [00:02<00:00, 190MB/s]
227
+
228
+ Downloading data: 69%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 25/36 [00:57<00:25, 2.32s/files]
229
+
230
+ data/train-00025-of-00036.parquet: 0%| | 0.00/542M [00:00<?, ?B/s]
231
+
232
+ data/train-00025-of-00036.parquet: 6%|β–Œ | 33.2M/542M [00:01<00:15, 33.2MB/s]
233
+
234
+ data/train-00025-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 542M/542M [00:02<00:00, 212MB/s] 
235
+ data/train-00025-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 542M/542M [00:02<00:00, 193MB/s]
236
+
237
+ Downloading data: 72%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 26/36 [01:00<00:24, 2.48s/files]
238
+
239
+ data/train-00026-of-00036.parquet: 0%| | 0.00/434M [00:00<?, ?B/s]
240
+
241
+ data/train-00026-of-00036.parquet: 8%|β–Š | 36.0M/434M [00:01<00:11, 35.5MB/s]
242
+
243
+ data/train-00026-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 434M/434M [00:02<00:00, 200MB/s] 
244
+ data/train-00026-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 434M/434M [00:02<00:00, 179MB/s]
245
+
246
+ Downloading data: 75%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 27/36 [01:03<00:22, 2.47s/files]
247
+
248
+ data/train-00027-of-00036.parquet: 0%| | 0.00/366M [00:00<?, ?B/s]
249
+
250
+ data/train-00027-of-00036.parquet: 8%|β–Š | 29.6M/366M [00:01<00:11, 29.6MB/s]
251
+ data/train-00027-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 366M/366M [00:01<00:00, 202MB/s]
252
+
253
+ Downloading data: 78%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 28/36 [01:05<00:18, 2.28s/files]
254
+
255
+ data/train-00028-of-00036.parquet: 0%| | 0.00/374M [00:00<?, ?B/s]
256
+
257
+ data/train-00028-of-00036.parquet: 8%|β–Š | 29.5M/374M [00:01<00:11, 29.4MB/s]
258
+ data/train-00028-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 374M/374M [00:01<00:00, 225MB/s]
259
+
260
+ Downloading data: 81%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 29/36 [01:06<00:14, 2.10s/files]
261
+
262
+ data/train-00029-of-00036.parquet: 0%| | 0.00/402M [00:00<?, ?B/s]
263
+
264
+ data/train-00029-of-00036.parquet: 5%|β–Œ | 21.8M/402M [00:01<00:17, 21.8MB/s]
265
+ data/train-00029-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 402M/402M [00:01<00:00, 231MB/s]
266
+
267
+ Downloading data: 83%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 30/36 [01:08<00:12, 2.00s/files]
268
 
269
+ data/train-00030-of-00036.parquet: 0%| | 0.00/400M [00:00<?, ?B/s]
270
 
271
+ data/train-00030-of-00036.parquet: 3%|β–Ž | 12.8M/400M [00:01<00:30, 12.8MB/s]
272
+
273
+ data/train-00030-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 400M/400M [00:02<00:00, 199MB/s] 
274
+ data/train-00030-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 400M/400M [00:02<00:00, 175MB/s]
275
+
276
+ Downloading data: 86%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 31/36 [01:10<00:10, 2.09s/files]
277
+
278
+ data/train-00031-of-00036.parquet: 0%| | 0.00/382M [00:00<?, ?B/s]
279
+
280
+ data/train-00031-of-00036.parquet: 2%|▏ | 7.72M/382M [00:01<00:48, 7.70MB/s]
281
+ data/train-00031-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 382M/382M [00:01<00:00, 209MB/s]
282
+
283
+ Downloading data: 89%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 32/36 [01:12<00:08, 2.02s/files]
284
+
285
+ data/train-00032-of-00036.parquet: 0%| | 0.00/380M [00:00<?, ?B/s]
286
+
287
+ data/train-00032-of-00036.parquet: 5%|▍ | 18.4M/380M [00:01<00:19, 18.4MB/s]
288
+ data/train-00032-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 380M/380M [00:01<00:00, 196MB/s]
289
+
290
+ Downloading data: 92%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–| 33/36 [01:14<00:06, 2.00s/files]
291
+
292
+ data/train-00033-of-00036.parquet: 0%| | 0.00/376M [00:00<?, ?B/s]
293
+
294
+ data/train-00033-of-00036.parquet: 1%| | 3.43M/376M [00:01<01:48, 3.42MB/s]
295
+ data/train-00033-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 376M/376M [00:01<00:00, 201MB/s]
296
+
297
+ Downloading data: 94%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–| 34/36 [01:16<00:03, 1.97s/files]
298
+
299
+ data/train-00034-of-00036.parquet: 0%| | 0.00/372M [00:00<?, ?B/s]
300
+
301
+ data/train-00034-of-00036.parquet: 4%|▍ | 14.3M/372M [00:01<00:25, 14.3MB/s]
302
+ data/train-00034-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 372M/372M [00:01<00:00, 220MB/s]
303
+
304
+ Downloading data: 97%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹| 35/36 [01:18<00:01, 1.90s/files]
305
+
306
+ data/train-00035-of-00036.parquet: 0%| | 0.00/373M [00:00<?, ?B/s]
307
+
308
+ data/train-00035-of-00036.parquet: 5%|β–Œ | 19.1M/373M [00:01<00:18, 19.1MB/s]
309
+ data/train-00035-of-00036.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 373M/373M [00:01<00:00, 207MB/s]
310
+
311
+ Downloading data: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 36/36 [01:20<00:00, 1.87s/files]
312
+ Downloading data: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 36/36 [01:20<00:00, 2.22s/files]
313
+
314
+
315
+ data/validation-00000-of-00001.parquet: 0%| | 0.00/162M [00:00<?, ?B/s]
316
+
317
+ data/validation-00000-of-00001.parquet: 37%|β–ˆβ–ˆβ–ˆβ–‹ | 59.3M/162M [00:01<00:01, 59.2MB/s]
318
+ data/validation-00000-of-00001.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 162M/162M [00:01<00:00, 137MB/s]
319
+
320
+
321
+ data/test-00000-of-00001.parquet: 0%| | 0.00/306M [00:00<?, ?B/s]
322
+
323
+ data/test-00000-of-00001.parquet: 3%|β–Ž | 10.7M/306M [00:01<00:27, 10.6MB/s]
324
+
325
+ data/test-00000-of-00001.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 306M/306M [00:02<00:00, 169MB/s] 
326
+ data/test-00000-of-00001.parquet: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 306M/306M [00:02<00:00, 147MB/s]
327
+
328
+
329
+ Generating train split: 0%| | 0/145152 [00:00<?, ? examples/s]
330
+
331
+ Generating train split: 0%| | 200/145152 [00:01<15:32, 155.47 examples/s]
332
+
333
+ Generating train split: 0%| | 500/145152 [00:02<11:15, 214.23 examples/s]
334
+
335
+ Generating train split: 1%| | 800/145152 [00:03<11:05, 216.89 examples/s]
336
+
337
+ Generating train split: 1%| | 1100/145152 [00:05<10:52, 220.70 examples/s]
338
+
339
+ Generating train split: 1%| | 1400/145152 [00:06<10:16, 233.33 examples/s]
340
+
341
+ Generating train split: 1%| | 1700/145152 [00:07<09:57, 240.15 examples/s]
342
+
343
+ Generating train split: 1%|▏ | 2000/145152 [00:08<10:01, 238.10 examples/s]
344
+
345
+ Generating train split: 3%|β–Ž | 4132/145152 [00:09<03:14, 725.45 examples/s]
346
+
347
+ Generating train split: 4%|▍ | 6232/145152 [00:10<02:08, 1085.02 examples/s]
348
+
349
+ Generating train split: 6%|β–Œ | 8264/145152 [00:11<01:42, 1339.46 examples/s]
350
+
351
+ Generating train split: 7%|β–‹ | 10464/145152 [00:13<01:25, 1570.42 examples/s]
352
+
353
+ Generating train split: 9%|β–‰ | 13296/145152 [00:14<01:09, 1890.88 examples/s]
354
+
355
+ Generating train split: 11%|β–ˆβ– | 16428/145152 [00:15<00:58, 2186.18 examples/s]
356
+
357
+ Generating train split: 13%|β–ˆβ–Ž | 19428/145152 [00:16<00:53, 2362.66 examples/s]
358
+
359
+ Generating train split: 15%|β–ˆβ–Œ | 21860/145152 [00:17<01:02, 1973.51 examples/s]
360
+
361
+ Generating train split: 17%|β–ˆβ–‹ | 23960/145152 [00:19<01:12, 1665.91 examples/s]
362
+
363
+ Generating train split: 18%|β–ˆβ–Š | 25792/145152 [00:21<01:18, 1518.35 examples/s]
364
+
365
+ Generating train split: 19%|β–ˆβ–‰ | 27492/145152 [00:22<01:22, 1419.11 examples/s]
366
+
367
+ Generating train split: 20%|β–ˆβ–‰ | 29024/145152 [00:24<01:24, 1366.99 examples/s]
368
+
369
+ Generating train split: 21%|β–ˆβ–ˆ | 30824/145152 [00:25<01:17, 1466.19 examples/s]
370
+
371
+ Generating train split: 22%|β–ˆβ–ˆβ– | 32656/145152 [00:26<01:13, 1522.14 examples/s]
372
+
373
+ Generating train split: 24%|β–ˆβ–ˆβ– | 34956/145152 [00:27<01:04, 1712.43 examples/s]
374
+
375
+ Generating train split: 26%|β–ˆβ–ˆβ–‹ | 38288/145152 [00:28<00:50, 2132.95 examples/s]
376
+
377
+ Generating train split: 29%|β–ˆβ–ˆβ–Š | 41520/145152 [00:29<00:42, 2427.94 examples/s]
378
+
379
+ Generating train split: 31%|β–ˆβ–ˆβ–ˆ | 44452/145152 [00:30<00:39, 2559.95 examples/s]
380
+
381
+ Generating train split: 33%|β–ˆβ–ˆβ–ˆβ–Ž | 47352/145152 [00:31<00:39, 2462.75 examples/s]
382
+
383
+ Generating train split: 34%|β–ˆβ–ˆβ–ˆβ– | 49884/145152 [00:32<00:39, 2422.60 examples/s]
384
+
385
+ Generating train split: 36%|β–ˆβ–ˆβ–ˆβ–Œ | 52516/145152 [00:33<00:37, 2463.02 examples/s]
386
+
387
+ Generating train split: 38%|β–ˆβ–ˆβ–ˆβ–Š | 55116/145152 [00:34<00:36, 2479.32 examples/s]
388
+
389
+ Generating train split: 40%|β–ˆβ–ˆβ–ˆβ–‰ | 57948/145152 [00:35<00:34, 2503.63 examples/s]
390
+
391
+ Generating train split: 42%|β–ˆβ–ˆβ–ˆβ–ˆβ– | 60580/145152 [00:36<00:33, 2535.19 examples/s]
392
+
393
+ Generating train split: 44%|β–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 63480/145152 [00:37<00:31, 2569.53 examples/s]
394
+
395
+ Generating train split: 46%|β–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 66312/145152 [00:38<00:30, 2618.17 examples/s]
396
+
397
+ Generating train split: 48%|β–ˆβ–ˆβ–ˆβ–ˆβ–Š | 69144/145152 [00:39<00:28, 2639.65 examples/s]
398
+
399
+ Generating train split: 49%|β–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 71844/145152 [00:40<00:28, 2603.44 examples/s]
400
+
401
+ Generating train split: 51%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 74576/145152 [00:42<00:30, 2323.08 examples/s]
402
+
403
+ Generating train split: 53%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 77208/145152 [00:43<00:30, 2210.35 examples/s]
404
+
405
+ Generating train split: 55%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 79908/145152 [00:44<00:28, 2308.45 examples/s]
406
+
407
+ Generating train split: 57%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 82440/145152 [00:45<00:26, 2367.41 examples/s]
408
+
409
+ Generating train split: 59%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 85272/145152 [00:46<00:24, 2422.16 examples/s]
410
+
411
+ Generating train split: 61%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 87972/145152 [00:47<00:23, 2469.83 examples/s]
412
+
413
+ Generating train split: 63%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 90804/145152 [00:49<00:21, 2544.65 examples/s]
414
+
415
+ Generating train split: 65%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 93636/145152 [00:50<00:19, 2622.46 examples/s]
416
+
417
+ Generating train split: 67%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 96636/145152 [00:51<00:17, 2724.14 examples/s]
418
+
419
+ Generating train split: 69%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Š | 99468/145152 [00:52<00:18, 2430.66 examples/s]
420
+
421
+ Generating train split: 70%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 102000/145152 [00:53<00:19, 2238.26 examples/s]
422
+
423
+ Generating train split: 72%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 104400/145152 [00:55<00:19, 2133.52 examples/s]
424
+
425
+ Generating train split: 74%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 106832/145152 [00:56<00:18, 2089.83 examples/s]
426
+
427
+ Generating train split: 76%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 109764/145152 [00:57<00:15, 2273.20 examples/s]
428
+
429
+ Generating train split: 78%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆοΏ½οΏ½οΏ½β–Š | 112764/145152 [00:58<00:13, 2438.22 examples/s]
430
+
431
+ Generating train split: 80%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 115596/145152 [00:59<00:11, 2516.56 examples/s]
432
+
433
+ Generating train split: 82%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 118428/145152 [01:00<00:10, 2533.33 examples/s]
434
+
435
+ Generating train split: 84%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž | 121260/145152 [01:01<00:09, 2546.56 examples/s]
436
+
437
+ Generating train split: 85%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ | 123960/145152 [01:02<00:08, 2580.24 examples/s]
438
+
439
+ Generating train split: 87%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹ | 126792/145152 [01:03<00:07, 2620.04 examples/s]
440
+
441
+ Generating train split: 89%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰ | 129624/145152 [01:04<00:05, 2663.67 examples/s]
442
+
443
+ Generating train split: 91%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–| 132624/145152 [01:05<00:04, 2705.80 examples/s]
444
+
445
+ Generating train split: 93%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Ž| 135456/145152 [01:06<00:03, 2734.67 examples/s]
446
+
447
+ Generating train split: 95%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–Œ| 138588/145152 [01:07<00:02, 2775.60 examples/s]
448
+
449
+ Generating train split: 97%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‹| 141420/145152 [01:08<00:01, 2784.34 examples/s]
450
+
451
+ Generating train split: 99%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–‰| 144420/145152 [01:10<00:00, 2815.47 examples/s]
452
+ Generating train split: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 145152/145152 [01:10<00:00, 2068.64 examples/s]
453
+
454
+
455
+ Generating validation split: 0%| | 0/239 [00:00<?, ? examples/s]
456
+ Generating validation split: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 239/239 [00:00<00:00, 271.32 examples/s]
457
+
458
+
459
+ Generating test split: 0%| | 0/418 [00:00<?, ? examples/s]
460
+
461
+ Generating test split: 48%|β–ˆβ–ˆβ–ˆβ–ˆβ–Š | 200/418 [00:01<00:01, 151.91 examples/s]
462
+ Generating test split: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 418/418 [00:01<00:00, 235.25 examples/s]
463
+
464
+
465
+ Downloading (incomplete total...): 0.00B [00:00, ?B/s]
466
+
467
+ Fetching 5 files: 0%| | 0/5 [00:00<?, ?it/s]
468
+
469
+ Downloading (incomplete total...): 0%| | 0.00/5.70M [00:00<?, ?B/s]
470
+
471
+ Downloading (incomplete total...): 0%| | 0.00/5.81M [00:00<?, ?B/s]
472
+
473
+ Downloading (incomplete total...): 0%| | 0.00/2.15G [00:00<?, ?B/s]
474
+
475
+ Downloading (incomplete total...): 0%| | 0.00/3.21G [00:00<?, ?B/s]
476
+
477
+ Downloading (incomplete total...): 0%| | 0.00/3.21G [00:00<?, ?B/s]
478
 
479
+ Downloading (incomplete total...): 0%| | 13.5M/3.21G [00:01<04:28, 11.9MB/s]
480
 
481
+ Downloading (incomplete total...): 2%|▏ | 64.6M/3.21G [00:08<07:11, 7.29MB/s]
482
 
483
+ Downloading (incomplete total...): 4%|▍ | 132M/3.21G [00:09<03:16, 15.7MB/s] 
484
 
485
+ Downloading (incomplete total...): 23%|β–ˆβ–ˆβ–Ž | 748M/3.21G [00:10<00:21, 115MB/s] 
486
 
487
+ Downloading (incomplete total...): 62%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ– | 2.00G/3.21G [00:11<00:03, 331MB/s]
488
 
489
+ Fetching 5 files: 60%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ | 3/5 [00:12<00:08, 4.05s/it]
490
+ Fetching 5 files: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 5/5 [00:12<00:00, 2.54s/it]
491
 
492
 
493
+ Download complete: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 3.21G/3.21G [00:12<00:00, 331MB/s] 
494
+ Download complete: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 3.21G/3.21G [00:13<00:00, 244MB/s]
495
  /usr/local/lib/python3.13/site-packages/diffusers/models/lora.py:393: FutureWarning: `LoRACompatibleLinear` is deprecated and will be removed in version 1.0.0. Use of `LoRACompatibleLinear` is deprecated. Please switch to PEFT backend by installing PEFT: `pip install peft`.
496
  deprecate("LoRACompatibleLinear", "1.0.0", deprecation_message)
 
 
 
 
497
 
498
 
499
  Cangjie5_TC.json: 0%| | 0.00/1.92M [00:00<?, ?B/s]
500
+ Cangjie5_TC.json: 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 1.92M/1.92M [00:00<00:00, 42.7MB/s]
501
  Downloading: "https://github.com/explosion/spacy-pkuseg/releases/download/v0.0.26/spacy_ontonotes.zip" to /root/.pkuseg/spacy_ontonotes.zip
502
 
503
 
504
  0%| | 0/34567143 [00:00<?, ?it/s]
505
+ 100%|β–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆβ–ˆ| 34567143/34567143 [00:00<00:00, 172484889.55it/s]
 
 
 
 
506
  Traceback (most recent call last):
507
+ File "/app/chatterbox-multilingual-finetuning/src/finetune_t3.py", line 570, in <module>
508
  main()
509
  ~~~~^^
510
+ File "/app/chatterbox-multilingual-finetuning/src/finetune_t3.py", line 549, in main
511
+ text_pad_token_id=t3_config.start_text_token,
512
+ ^^^^^^^^^^^^^^^^^^^^^^^^^^
513
+ File "/usr/local/lib/python3.13/site-packages/torch/nn/modules/module.py", line 1965, in __getattr__
514
+ raise AttributeError(
515
+ f"'{type(self).__name__}' object has no attribute '{name}'"
516
+ )
517
+ AttributeError: 'T3' object has no attribute 'start_text_token'