Upload cnets.py with huggingface_hub
Browse files
cnets.py
CHANGED
|
@@ -668,14 +668,10 @@ class Model(nn.Module):
|
|
| 668 |
|
| 669 |
|
| 670 |
|
| 671 |
-
|
| 672 |
-
|
| 673 |
-
chunks = [dataset[i:i +
|
| 674 |
-
|
| 675 |
-
# 创建进程池
|
| 676 |
-
with multiprocessing.Pool(num_processes) as pool:
|
| 677 |
-
# 并行处理数据块
|
| 678 |
-
results = pool.map(process_data, chunks)
|
| 679 |
|
| 680 |
# 合并结果
|
| 681 |
token_dict = merge_dicts(results)
|
|
|
|
| 668 |
|
| 669 |
|
| 670 |
|
| 671 |
+
# Process data sequentially to avoid DeepSpeed pickle issues
|
| 672 |
+
# (multiprocessing.Pool cannot pickle torch.distributed ProcessGroup)
|
| 673 |
+
chunks = [dataset[i:i + len(dataset)] for i in range(0, len(dataset), len(dataset))]
|
| 674 |
+
results = [process_data(chunk) for chunk in chunks]
|
|
|
|
|
|
|
|
|
|
|
|
|
| 675 |
|
| 676 |
# 合并结果
|
| 677 |
token_dict = merge_dicts(results)
|