|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
from collections import OrderedDict |
|
|
from batchgenerators.utilities.file_and_folder_operations import * |
|
|
import shutil |
|
|
import numpy as np |
|
|
from sklearn.model_selection import KFold |
|
|
|
|
|
|
|
|
def convert_to_submission(source_dir, target_dir): |
|
|
niftis = subfiles(source_dir, join=False, suffix=".nii.gz") |
|
|
patientids = np.unique([i[:10] for i in niftis]) |
|
|
maybe_mkdir_p(target_dir) |
|
|
for p in patientids: |
|
|
files_of_that_patient = subfiles(source_dir, prefix=p, suffix=".nii.gz", join=False) |
|
|
assert len(files_of_that_patient) |
|
|
files_of_that_patient.sort() |
|
|
|
|
|
shutil.copy(join(source_dir, files_of_that_patient[0]), join(target_dir, p + "_ED.nii.gz")) |
|
|
shutil.copy(join(source_dir, files_of_that_patient[1]), join(target_dir, p + "_ES.nii.gz")) |
|
|
|
|
|
|
|
|
if __name__ == "__main__": |
|
|
folder = "/media/fabian/My Book/datasets/ACDC/training" |
|
|
folder_test = "/media/fabian/My Book/datasets/ACDC/testing/testing" |
|
|
out_folder = "/media/fabian/My Book/MedicalDecathlon/MedicalDecathlon_raw_splitted/Task027_ACDC" |
|
|
|
|
|
maybe_mkdir_p(join(out_folder, "imagesTr")) |
|
|
maybe_mkdir_p(join(out_folder, "imagesTs")) |
|
|
maybe_mkdir_p(join(out_folder, "labelsTr")) |
|
|
|
|
|
|
|
|
all_train_files = [] |
|
|
patient_dirs_train = subfolders(folder, prefix="patient") |
|
|
for p in patient_dirs_train: |
|
|
current_dir = p |
|
|
data_files_train = [i for i in subfiles(current_dir, suffix=".nii.gz") if i.find("_gt") == -1 and i.find("_4d") == -1] |
|
|
corresponding_seg_files = [i[:-7] + "_gt.nii.gz" for i in data_files_train] |
|
|
for d, s in zip(data_files_train, corresponding_seg_files): |
|
|
patient_identifier = d.split("/")[-1][:-7] |
|
|
all_train_files.append(patient_identifier + "_0000.nii.gz") |
|
|
shutil.copy(d, join(out_folder, "imagesTr", patient_identifier + "_0000.nii.gz")) |
|
|
shutil.copy(s, join(out_folder, "labelsTr", patient_identifier + ".nii.gz")) |
|
|
|
|
|
|
|
|
all_test_files = [] |
|
|
patient_dirs_test = subfolders(folder_test, prefix="patient") |
|
|
for p in patient_dirs_test: |
|
|
current_dir = p |
|
|
data_files_test = [i for i in subfiles(current_dir, suffix=".nii.gz") if i.find("_gt") == -1 and i.find("_4d") == -1] |
|
|
for d in data_files_test: |
|
|
patient_identifier = d.split("/")[-1][:-7] |
|
|
all_test_files.append(patient_identifier + "_0000.nii.gz") |
|
|
shutil.copy(d, join(out_folder, "imagesTs", patient_identifier + "_0000.nii.gz")) |
|
|
|
|
|
|
|
|
json_dict = OrderedDict() |
|
|
json_dict['name'] = "ACDC" |
|
|
json_dict['description'] = "cardias cine MRI segmentation" |
|
|
json_dict['tensorImageSize'] = "4D" |
|
|
json_dict['reference'] = "see ACDC challenge" |
|
|
json_dict['licence'] = "see ACDC challenge" |
|
|
json_dict['release'] = "0.0" |
|
|
json_dict['modality'] = { |
|
|
"0": "MRI", |
|
|
} |
|
|
json_dict['labels'] = { |
|
|
"0": "background", |
|
|
"1": "RV", |
|
|
"2": "MLV", |
|
|
"3": "LVC" |
|
|
} |
|
|
json_dict['numTraining'] = len(all_train_files) |
|
|
json_dict['numTest'] = len(all_test_files) |
|
|
json_dict['training'] = [{'image': "./imagesTr/%s.nii.gz" % i.split("/")[-1][:-12], "label": "./labelsTr/%s.nii.gz" % i.split("/")[-1][:-12]} for i in |
|
|
all_train_files] |
|
|
json_dict['test'] = ["./imagesTs/%s.nii.gz" % i.split("/")[-1][:-12] for i in all_test_files] |
|
|
|
|
|
save_json(json_dict, os.path.join(out_folder, "dataset.json")) |
|
|
|
|
|
|
|
|
splits = [] |
|
|
patients = np.unique([i[:10] for i in all_train_files]) |
|
|
patientids = [i[:-12] for i in all_train_files] |
|
|
|
|
|
kf = KFold(5, True, 12345) |
|
|
for tr, val in kf.split(patients): |
|
|
splits.append(OrderedDict()) |
|
|
tr_patients = patients[tr] |
|
|
splits[-1]['train'] = [i[:-12] for i in all_train_files if i[:10] in tr_patients] |
|
|
val_patients = patients[val] |
|
|
splits[-1]['val'] = [i[:-12] for i in all_train_files if i[:10] in val_patients] |
|
|
|
|
|
save_pickle(splits, "/media/fabian/nnunet/Task027_ACDC/splits_final.pkl") |