weililab
/

pertTF-small

Model card Files Files and versions

yqsu95 committed on Feb 5

Commit

a3b3df8

·

verified ·

1 Parent(s): d95d398

Push model using huggingface_hub.

Files changed (3) hide show

README.md +6 -11
config.json +6 -6
training_config.json +32 -1

README.md CHANGED Viewed

@@ -1,15 +1,10 @@
 ---
-language: en
-license: mit
 tags:
-- pytorch
-- pertTF
 ---
-# pertTF small
-This is model files for pertTF small
-## Usage
-```python
-model = HFPerturbationTFModel.from_pretrained('weililab/pertTF-small')

 ---
 tags:
+- model_hub_mixin
+- pytorch_model_hub_mixin
 ---
+This model has been pushed to the Hub using the [PyTorchModelHubMixin](https://huggingface.co/docs/huggingface_hub/package_reference/mixins#huggingface_hub.PyTorchModelHubMixin) integration:
+- Code: [More Information Needed]
+- Paper: [More Information Needed]
+- Docs: [More Information Needed]

config.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "cell_emb_style": "cls",
-  "d_hid": null,
-  "d_model": 32,
   "do_dab": false,
-  "do_mvc": false,
   "domain_spec_batchnorm": false,
   "dropout": 0.1,
   "ecs_threshold": 0.7,
@@ -12,8 +12,8 @@
   "input_emb_style": "continuous",
   "mvc_decoder_style": "inner product",
   "n_bins": 51,
-  "n_cls": 1,
-  "n_pert": 1,
   "n_ps": 1,
   "nhead": 4,
   "nlayers": 4,
@@ -29,6 +29,6 @@
   "pred_lochness_next": false,
   "ps_decoder2_nlayer": 3,
   "use_batch_labels": false,
-  "use_fast_transformer": false,
   "vocab": null
 }

 {
   "cell_emb_style": "cls",
+  "d_hid": 64,
+  "d_model": 64,
   "do_dab": false,
+  "do_mvc": true,
   "domain_spec_batchnorm": false,
   "dropout": 0.1,
   "ecs_threshold": 0.7,
   "input_emb_style": "continuous",
   "mvc_decoder_style": "inner product",
   "n_bins": 51,
+  "n_cls": 20,
+  "n_pert": 40,
   "n_ps": 1,
   "nhead": 4,
   "nlayers": 4,
   "pred_lochness_next": false,
   "ps_decoder2_nlayer": 3,
   "use_batch_labels": false,
+  "use_fast_transformer": true,
   "vocab": null
 }

training_config.json CHANGED Viewed

@@ -49,5 +49,36 @@
   "hvg_col": "highly_variable",
   "mvc_masked_train": true,
   "max_seq_len": 3001,
-  "pad_value": -2
 }

   "hvg_col": "highly_variable",
   "mvc_masked_train": true,
   "max_seq_len": 3001,
+  "n_pert": 40,
+  "nlayers_pert": 4,
+  "n_ps": 1,
+  "ntoken": 36604,
+  "d_model": 64,
+  "nhead": 4,
+  "d_hid": 64,
+  "nlayers": 4,
+  "nlayers_cls": 3,
+  "n_cls": 20,
+  "vocab": null,
+  "dropout": 0.1,
+  "pad_token": "<pad>",
+  "pad_value": -2,
+  "do_mvc": true,
+  "do_dab": false,
+  "use_batch_labels": false,
+  "num_batch_labels": null,
+  "domain_spec_batchnorm": false,
+  "input_emb_style": "continuous",
+  "n_bins": 51,
+  "cell_emb_style": "cls",
+  "mvc_decoder_style": "inner product",
+  "ecs_threshold": 0.7,
+  "explicit_zero_prob": true,
+  "use_fast_transformer": true,
+  "fast_transformer_backend": "flash",
+  "pre_norm": false,
+  "pred_lochness_next": false,
+  "ps_decoder2_nlayer": 3,
+  "pert_pad_id": null,
+  "pert_dim": null
 }