Push model using huggingface_hub.

Files changed (3)

README.md CHANGED Viewed

@@ -1,16 +1,10 @@
 ---
-language: en
-license: mit
 tags:
-- pytorch
-- pertTF
-- perturbation
 ---
-# pertTF lochness score prediction model
-These are the model files for pertTF (tiny), trained for lochness score prediction.
-## Usage
-```python
-model = HFPerturbationTFModel.from_pretrained('weililab/pertTF_virtual_screen_lochness')

 ---
 tags:
+- model_hub_mixin
+- pytorch_model_hub_mixin
 ---
+This model has been pushed to the Hub using the [PyTorchModelHubMixin](https://huggingface.co/docs/huggingface_hub/package_reference/mixins#huggingface_hub.PyTorchModelHubMixin) integration:
+- Code: [More Information Needed]
+- Paper: [More Information Needed]
+- Docs: [More Information Needed]

config.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "cell_emb_style": "cls",
-  "d_hid": null,
   "d_model": 32,
   "do_dab": false,
   "do_mvc": true,
@@ -12,9 +12,9 @@
   "input_emb_style": "continuous",
   "mvc_decoder_style": "inner product",
   "n_bins": 0,
-  "n_cls": 1,
-  "n_pert": 1,
-  "n_ps": 1,
   "nhead": 4,
   "nlayers": 2,
   "nlayers_cls": 3,

 {
   "cell_emb_style": "cls",
+  "d_hid": 32,
   "d_model": 32,
   "do_dab": false,
   "do_mvc": true,
   "input_emb_style": "continuous",
   "mvc_decoder_style": "inner product",
   "n_bins": 0,
+  "n_cls": 14,
+  "n_pert": 9854,
+  "n_ps": 23,
   "nhead": 4,
   "nlayers": 2,
   "nlayers_cls": 3,

training_config.json CHANGED Viewed

@@ -10,9 +10,6 @@
   "dab_weight": 0.0,
   "this_weight": 1.0,
   "next_weight": 0.0,
-  "pad_token": "<pad>",
-  "mask_token": "<mask>",
-  "cls_token": "<cls>",
   "n_rounds": 10,
   "next_cell_pred_type": "lochness",
   "ecs_weight": 1.0,
@@ -48,5 +45,36 @@
   "fix_nonzero_prop": false,
   "nonzero_prop": 0.9,
   "max_seq_len": 3001,
-  "pad_value": -2
 }

   "dab_weight": 0.0,
   "this_weight": 1.0,
   "next_weight": 0.0,
   "n_rounds": 10,
   "next_cell_pred_type": "lochness",
   "ecs_weight": 1.0,
   "fix_nonzero_prop": false,
   "nonzero_prop": 0.9,
   "max_seq_len": 3001,
+  "n_pert": 9854,
+  "nlayers_pert": 3,
+  "n_ps": 23,
+  "ntoken": 5014,
+  "d_model": 32,
+  "nhead": 4,
+  "d_hid": 32,
+  "nlayers": 2,
+  "nlayers_cls": 3,
+  "n_cls": 14,
+  "vocab": null,
+  "dropout": 0.4,
+  "pad_token": "<pad>",
+  "pad_value": -2,
+  "do_mvc": true,
+  "do_dab": false,
+  "use_batch_labels": false,
+  "num_batch_labels": null,
+  "domain_spec_batchnorm": false,
+  "input_emb_style": "continuous",
+  "n_bins": 0,
+  "cell_emb_style": "cls",
+  "mvc_decoder_style": "inner product",
+  "ecs_threshold": 0.7,
+  "explicit_zero_prob": true,
+  "use_fast_transformer": true,
+  "fast_transformer_backend": "flash",
+  "pre_norm": false,
+  "pred_lochness_next": 100,
+  "ps_decoder2_nlayer": 5,
+  "pert_pad_id": null,
+  "pert_dim": null
 }