BioGeek committed on
Commit
cbf6244
·
verified ·
1 Parent(s): f0c8db2

Add instanovo-v1.1.0 model

Browse files
Files changed (3) hide show
  1. README.md +10 -0
  2. config.json +98 -0
  3. model.safetensors +3 -0
README.md ADDED
@@ -0,0 +1,10 @@
 
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - model_hub_mixin
4
+ - pytorch_model_hub_mixin
5
+ ---
6
+
7
+ This model has been pushed to the Hub using the [PyTorchModelHubMixin](https://huggingface.co/docs/huggingface_hub/package_reference/mixins#huggingface_hub.PyTorchModelHubMixin) integration:
8
+ - Code: [More Information Needed]
9
+ - Paper: [More Information Needed]
10
+ - Docs: [More Information Needed]
config.json ADDED
@@ -0,0 +1,98 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "blacklist": null,
3
+ "ckpt_interval": 100000,
4
+ "column_remapping": null,
5
+ "compile_model": true,
6
+ "console_logging_steps": 2000,
7
+ "conv_peak_encoder": false,
8
+ "dim_feedforward": 1024,
9
+ "dim_model": 768,
10
+ "dropout": 0.1,
11
+ "epochs": 30,
12
+ "fp16": true,
13
+ "grad_accumulation": 1,
14
+ "gradient_clip_val": 10.0,
15
+ "isotope_error_range": [
16
+ 0,
17
+ 1
18
+ ],
19
+ "lazy_loading": true,
20
+ "learning_rate": 5e-05,
21
+ "logger": null,
22
+ "max_charge": 10,
23
+ "max_iters": 3000000,
24
+ "max_length": 40,
25
+ "max_mz": 2500.0,
26
+ "max_shard_size": 1000000,
27
+ "min_intensity": 0.01,
28
+ "min_mz": 50.0,
29
+ "model_save_folder_path": "checkpoints/instanovo-extended-massivekb",
30
+ "n_beams": 5,
31
+ "n_gpu": 1,
32
+ "n_head": 16,
33
+ "n_layers": 9,
34
+ "n_peaks": 200,
35
+ "num_sanity_val_steps": 10,
36
+ "perform_data_checks": true,
37
+ "precursor_mass_tol": 50,
38
+ "predict_batch_size": 64,
39
+ "preshuffle_shards": true,
40
+ "remove_precursor_tol": 2.0,
41
+ "report_to": "neptune",
42
+ "residue_remapping": null,
43
+ "residues": {
44
+ "A": 71.037114,
45
+ "C": 103.009185,
46
+ "C[UNIMOD:4]": 160.030649,
47
+ "D": 115.026943,
48
+ "E": 129.042593,
49
+ "F": 147.068414,
50
+ "G": 57.021464,
51
+ "H": 137.058912,
52
+ "I": 113.084064,
53
+ "K": 128.094963,
54
+ "L": 113.084064,
55
+ "M": 131.040485,
56
+ "M[UNIMOD:35]": 147.0354,
57
+ "N": 114.042927,
58
+ "N[UNIMOD:7]": 115.026943,
59
+ "P": 97.052764,
60
+ "Q": 128.058578,
61
+ "Q[UNIMOD:7]": 129.042594,
62
+ "R": 156.101111,
63
+ "S": 87.032028,
64
+ "S[UNIMOD:21]": 166.998028,
65
+ "T": 101.04767,
66
+ "T[UNIMOD:21]": 181.01367,
67
+ "V": 99.068414,
68
+ "W": 186.079313,
69
+ "Y": 163.063329,
70
+ "Y[UNIMOD:21]": 243.029329,
71
+ "[UNIMOD:1]": 42.010565,
72
+ "[UNIMOD:385]": -17.026549,
73
+ "[UNIMOD:5]": 43.005814
74
+ },
75
+ "resume_checkpoint": null,
76
+ "run_name": "instanovo_acpt_base",
77
+ "save_model": true,
78
+ "save_weights_only": false,
79
+ "seed": 101,
80
+ "tb_summarywriter": "s3://dtu-denovo-s-2e6da747d6d34f62-outputs/output/8cbd543a-56cb-4866-a257-731cc32e822b/tensorboard/",
81
+ "tensorboard_logging_steps": 500,
82
+ "train_batch_size": 128,
83
+ "train_from_scratch": true,
84
+ "train_partition": null,
85
+ "train_path": "/mnt/instanovo-data-kyber/identity_splits_parquet/*/*-train-*.parquet",
86
+ "train_subset": 1.0,
87
+ "use_flash_attention": false,
88
+ "use_shards": true,
89
+ "val_check_interval": 1.0,
90
+ "valid_partition": null,
91
+ "valid_path": "/mnt/instanovo-data-kyber/identity_splits_parquet/*/*-valid-*.parquet",
92
+ "valid_subset": 0.01,
93
+ "valid_subset_of_train": null,
94
+ "validate_precursor_mass": false,
95
+ "verbose_loading": true,
96
+ "warmup_iters": 100000,
97
+ "weight_decay": 1e-05
98
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:194c19eca33744124fcb4164dd79e9d94adec7ba7d01a53151a054597895fba8
3
+ size 379123956