Update README.md
Browse files
README.md
CHANGED
|
@@ -16,13 +16,19 @@ Mapping gene networks requires large amounts of transcriptomic data to learn the
|
|
| 16 |
from tdc.model_server.tokenizers.geneformer import GeneformerTokenizer
|
| 17 |
from tdc import tdc_hf_interface
|
| 18 |
import torch
|
| 19 |
-
# Retrieve anndata object. Then,
|
| 20 |
tokenizer = GeneformerTokenizer()
|
| 21 |
x = tokenizer.tokenize_cell_vectors(adata,
|
| 22 |
ensembl_id="feature_id",
|
| 23 |
ncounts="n_measured_vars")
|
| 24 |
cells, _ = x
|
| 25 |
input_tensor = torch.tensor(cells) # note that you may need to pad or perform other custom data processing
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 26 |
attention_mask = torch.tensor(
|
| 27 |
[[x[0] != 0, x[1] != 0] for x in input_tensor]) # here we assume we used 0/False as a special padding token
|
| 28 |
outputs = model(batch,
|
|
|
|
| 16 |
from tdc.model_server.tokenizers.geneformer import GeneformerTokenizer
|
| 17 |
from tdc import tdc_hf_interface
|
| 18 |
import torch
|
| 19 |
+
# Retrieve anndata object. Then, tokenize
|
| 20 |
tokenizer = GeneformerTokenizer()
|
| 21 |
x = tokenizer.tokenize_cell_vectors(adata,
|
| 22 |
ensembl_id="feature_id",
|
| 23 |
ncounts="n_measured_vars")
|
| 24 |
cells, _ = x
|
| 25 |
input_tensor = torch.tensor(cells) # note that you may need to pad or perform other custom data processing
|
| 26 |
+
|
| 27 |
+
# retrieve model
|
| 28 |
+
geneformer = tdc_hf_interface("Geneformer")
|
| 29 |
+
model = geneformer.load()
|
| 30 |
+
|
| 31 |
+
# run inference
|
| 32 |
attention_mask = torch.tensor(
|
| 33 |
[[x[0] != 0, x[1] != 0] for x in input_tensor]) # here we assume we used 0/False as a special padding token
|
| 34 |
outputs = model(batch,
|