Tokenization fixed
Browse files
- tokenization_nicheformer.py +11 -3
tokenization_nicheformer.py
CHANGED
|
@@ -290,9 +290,17 @@ class NicheformerTokenizer(PreTrainedTokenizer):
|
|
| 290 |
X = adata.X
|
| 291 |
|
| 292 |
# Get metadata for special tokens
|
| 293 |
-
|
| 294 |
-
|
| 295 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 296 |
|
| 297 |
print(f"Modality: {modality}")
|
| 298 |
print(f"Species: {species}")
|
|
|
|
| 290 |
X = adata.X
|
| 291 |
|
| 292 |
# Get metadata for special tokens
|
| 293 |
+
# Print column types
|
| 294 |
+
print("\nColumn types:")
|
| 295 |
+
if 'modality' in adata.obs.columns:
|
| 296 |
+
print(f"modality type: {type(adata.obs['modality'])} with dtype: {adata.obs['modality'].dtype}")
|
| 297 |
+
if 'specie' in adata.obs.columns:
|
| 298 |
+
print(f"specie type: {type(adata.obs['specie'])} with dtype: {adata.obs['specie'].dtype}")
|
| 299 |
+
if 'assay' in adata.obs.columns:
|
| 300 |
+
print(f"assay type: {type(adata.obs['assay'])} with dtype: {adata.obs['assay'].dtype}")
|
| 301 |
+
modality = adata.obs['modality'] if 'modality' in adata.obs.columns else None
|
| 302 |
+
species = adata.obs['specie'] if 'specie' in adata.obs.columns else None
|
| 303 |
+
technology = adata.obs['assay'] if 'assay' in adata.obs.columns else None
|
| 304 |
|
| 305 |
print(f"Modality: {modality}")
|
| 306 |
print(f"Species: {species}")
|