krkawzq committed on
Commit
91fd45d
·
verified ·
1 Parent(s): 47547cc

Upload folder using huggingface_hub

Browse files
Files changed (4) hide show
  1. README.md +22 -3
  2. args.json +43 -0
  3. best_model.pt +3 -0
  4. vocab.json +0 -0
README.md CHANGED
@@ -1,3 +1,22 @@
1
- ---
2
- license: mit
3
- ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ library_name: perturblab
3
+ tags:
4
+ - biology
5
+ - genomics
6
+ - scgpt
7
+ license: mit
8
+ base_model: bowang-lab/scGPT
9
+ ---
10
+
11
+ # scgpt-brain
12
+
13
+ ## Model Description
14
+ These model weights were originally downloaded from the [bowang-lab/scGPT](https://github.com/bowang-lab/scGPT) repository.
15
+ They have been re-uploaded here for ease of use with the `perturblab` library.
16
+
17
+ ## Source
18
+ - **Original Repository**: [https://github.com/bowang-lab/scGPT](https://github.com/bowang-lab/scGPT)
19
+ - **Paper**: [scGPT: toward building a foundation model for single-cell multi-omics using generative AI](https://www.nature.com/articles/s41592-024-02201-0)
20
+
21
+ ## Usage
22
+ Intended for internal use with the PerturbLab framework.
args.json ADDED
@@ -0,0 +1,43 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "data_source": "/scratch/ssd004/datasets/cellxgene/scb_strict/brain/all_counts",
3
+ "save_dir": "./save/cellxgene_census_brain-May19-02-00-2023",
4
+ "load_model": null,
5
+ "n_hvg": null,
6
+ "valid_size_or_ratio": 0.03,
7
+ "vocab_path": "/scratch/ssd004/datasets/cellxgene/scFormer/scformer/tokenizer/default_census_vocab.json",
8
+ "pad_token": "<pad>",
9
+ "input_style": "binned",
10
+ "input_emb_style": "continuous",
11
+ "n_bins": 51,
12
+ "max_seq_len": 1200,
13
+ "training_tasks": "both",
14
+ "mask_ratio": [
15
+ 0.25,
16
+ 0.5,
17
+ 0.75
18
+ ],
19
+ "trunc_by_sample": true,
20
+ "local_rank": 0,
21
+ "batch_size": 32,
22
+ "eval_batch_size": 64,
23
+ "grad_accu_steps": 1,
24
+ "epochs": 6,
25
+ "lr": 0.0001,
26
+ "scheduler_interval": 100,
27
+ "scheduler_factor": 0.99,
28
+ "warmup_ratio_or_step": 10000.0,
29
+ "no_cls": true,
30
+ "no_cce": true,
31
+ "fp16": true,
32
+ "fast_transformer": true,
33
+ "nlayers": 12,
34
+ "nheads": 8,
35
+ "embsize": 512,
36
+ "d_hid": 512,
37
+ "dropout": 0.2,
38
+ "n_layers_cls": 3,
39
+ "log_interval": 6000,
40
+ "save_interval": 18000,
41
+ "mask_value": -1,
42
+ "pad_value": -2
43
+ }
best_model.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf2cf7dce9867f8174ad5186c0692d5a8fed41786ab44f4a3f9b736e066dbff8
3
+ size 205385258
vocab.json ADDED
The diff for this file is too large to render. See raw diff