# import scanpy as sc # # file_path = '/scDifformer/data/240412_test/raw_h5ad/zheng68k_fold0_test.h5ad' # # adata = sc.read_h5ad(file_path) # adata[:3, :3].to_df().to_excel('/scDifformer/data/240412_test/data_info/h5ad_info.xlsx') # import loompy # # file_path = '/scDifformer/data/240412_test/looms/zheng68k_fold0_test.loom' # # # 使用loompy连接loom文件 # with loompy.connect(file_path) as ds: # # # 打印所有的列属性(column attributes, 即细胞元数据) # print("\nColumn:") # for key, val in ds.ca.items(): # print(f"{key}: {val}") # # # 打印所有的行属性(row attributes, 即基因元数据) # print("\nRow:") # for key, val in ds.ra.items(): # print(f"{key}: {val}") # # # 打印矩阵的一部分(例如,前5个基因和前5个细胞的表达量) # print("\nData matrix:") # matrix_slice = ds[:, :5] # 获取所有基因在前5个细胞中的表达量 # print(matrix_slice) # import pickle # # file_path = '/scDifformer/data/240412_test/material/gene_median_dictionary.pkl' # # with open(file_path, 'rb') as file: # data = pickle.load(file) # # print(data) # import pickle # # file_path = '/scDifformer/data/240412_test/material/token_dictionary.pkl' # # with open(file_path, 'rb') as file: # data = pickle.load(file) # # print(data) from datasets import load_from_disk file_path = '/scDifformer/data/240412_test/output_directory_run/geneformer_run.dataset' ds = load_from_disk(file_path) print(ds[:3])