Push model using huggingface_hub.

Files changed (3) hide show

README.md CHANGED Viewed

@@ -1,16 +1,10 @@
 ---
-language: en
-license: mit
 tags:
-- pytorch
-- pertTF
-- perturbation
 ---
-# pertTF perturbation model (tiny, mvc_only)
-These are the model files for pertTF (tiny), trained for perturbation prediction with all losses turned on (5k HVGs).
-## Usage
-```python
-model = HFPerturbationTFModel.from_pretrained('weililab/pert_5k_alltask')

 ---
 tags:
+- model_hub_mixin
+- pytorch_model_hub_mixin
 ---
+This model has been pushed to the Hub using the [PyTorchModelHubMixin](https://huggingface.co/docs/huggingface_hub/package_reference/mixins#huggingface_hub.PyTorchModelHubMixin) integration:
+- Code: [More Information Needed]
+- Paper: [More Information Needed]
+- Docs: [More Information Needed]

config.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "cell_emb_style": "cls",
-  "d_hid": null,
   "d_model": 32,
   "do_dab": false,
-  "do_mvc": false,
   "domain_spec_batchnorm": false,
   "dropout": 0.1,
   "ecs_threshold": 0.7,
@@ -12,8 +12,8 @@
   "input_emb_style": "continuous",
   "mvc_decoder_style": "inner product",
   "n_bins": 51,
-  "n_cls": 1,
-  "n_pert": 1,
   "n_ps": 1,
   "nhead": 4,
   "nlayers": 2,
@@ -29,6 +29,6 @@
   "pred_lochness_next": false,
   "ps_decoder2_nlayer": 3,
   "use_batch_labels": false,
-  "use_fast_transformer": false,
   "vocab": null
 }

 {
   "cell_emb_style": "cls",
+  "d_hid": 32,
   "d_model": 32,
   "do_dab": false,
+  "do_mvc": true,
   "domain_spec_batchnorm": false,
   "dropout": 0.1,
   "ecs_threshold": 0.7,
   "input_emb_style": "continuous",
   "mvc_decoder_style": "inner product",
   "n_bins": 51,
+  "n_cls": 19,
+  "n_pert": 9854,
   "n_ps": 1,
   "nhead": 4,
   "nlayers": 2,
   "pred_lochness_next": false,
   "ps_decoder2_nlayer": 3,
   "use_batch_labels": false,
+  "use_fast_transformer": true,
   "vocab": null
 }

training_config.json CHANGED Viewed

@@ -51,5 +51,36 @@
   "hvg_col": "highly_variable",
   "mvc_masked_train": true,
   "max_seq_len": 4001,
-  "pad_value": -2
 }

   "hvg_col": "highly_variable",
   "mvc_masked_train": true,
   "max_seq_len": 4001,
+  "n_pert": 9854,
+  "nlayers_pert": 4,
+  "n_ps": 1,
+  "ntoken": 5057,
+  "d_model": 32,
+  "nhead": 4,
+  "d_hid": 32,
+  "nlayers": 2,
+  "nlayers_cls": 3,
+  "n_cls": 19,
+  "vocab": null,
+  "dropout": 0.1,
+  "pad_token": "<pad>",
+  "pad_value": -2,
+  "do_mvc": true,
+  "do_dab": false,
+  "use_batch_labels": false,
+  "num_batch_labels": null,
+  "domain_spec_batchnorm": false,
+  "input_emb_style": "continuous",
+  "n_bins": 51,
+  "cell_emb_style": "cls",
+  "mvc_decoder_style": "inner product",
+  "ecs_threshold": 0.7,
+  "explicit_zero_prob": true,
+  "use_fast_transformer": true,
+  "fast_transformer_backend": "flash",
+  "pre_norm": false,
+  "pred_lochness_next": false,
+  "ps_decoder2_nlayer": 3,
+  "pert_pad_id": null,
+  "pert_dim": null
 }