allenxiao's picture
Upload 17 files
8081b08 verified
# import scanpy as sc
#
# file_path = '/scDifformer/data/240412_test/raw_h5ad/zheng68k_fold0_test.h5ad'
#
# adata = sc.read_h5ad(file_path)
# adata[:3, :3].to_df().to_excel('/scDifformer/data/240412_test/data_info/h5ad_info.xlsx')
# import loompy
#
# file_path = '/scDifformer/data/240412_test/looms/zheng68k_fold0_test.loom'
#
# # 使用loompy连接loom文件
# with loompy.connect(file_path) as ds:
#
# # 打印所有的列属性(column attributes, 即细胞元数据)
# print("\nColumn:")
# for key, val in ds.ca.items():
# print(f"{key}: {val}")
#
# # 打印所有的行属性(row attributes, 即基因元数据)
# print("\nRow:")
# for key, val in ds.ra.items():
# print(f"{key}: {val}")
#
# # 打印矩阵的一部分(例如,前5个基因和前5个细胞的表达量)
# print("\nData matrix:")
# matrix_slice = ds[:, :5] # 获取所有基因在前5个细胞中的表达量
# print(matrix_slice)
# import pickle
#
# file_path = '/scDifformer/data/240412_test/material/gene_median_dictionary.pkl'
#
# with open(file_path, 'rb') as file:
# data = pickle.load(file)
#
# print(data)
# import pickle
#
# file_path = '/scDifformer/data/240412_test/material/token_dictionary.pkl'
#
# with open(file_path, 'rb') as file:
# data = pickle.load(file)
#
# print(data)
from datasets import load_from_disk
file_path = '/scDifformer/data/240412_test/output_directory_run/geneformer_run.dataset'
ds = load_from_disk(file_path)
print(ds[:3])