mgh6 committed on
Commit
0b8d33f
·
verified ·
1 Parent(s): 46aa461

Training in progress, epoch 1

Browse files
config.json CHANGED
@@ -1,21 +1,30 @@
1
  {
2
- "_name_or_path": "tattabio/gLM2_650M",
3
  "architectures": [
4
- "gLM2ForMaskedLM"
5
  ],
6
- "auto_map": {
7
- "AutoConfig": "configuration_glm2.gLM2Config",
8
- "AutoModel": "modeling_glm2.gLM2Model",
9
- "AutoModelForMaskedLM": "modeling_glm2.gLM2ForMaskedLM"
10
- },
11
- "depth": 33,
12
- "dim": 1280,
13
- "ffn_dim_multiplier": null,
14
- "heads": 20,
15
- "model_type": "gLM2",
16
- "norm_eps": 1e-05,
17
- "swiglu_multiple_of": 256,
 
 
 
 
 
 
 
18
  "torch_dtype": "float32",
19
  "transformers_version": "4.49.0",
20
- "vocab_size": 37
 
 
21
  }
 
1
  {
2
+ "_name_or_path": "facebook/esm2_t33_650M_UR50D",
3
  "architectures": [
4
+ "EsmForMaskedLM"
5
  ],
6
+ "attention_probs_dropout_prob": 0.0,
7
+ "classifier_dropout": null,
8
+ "emb_layer_norm_before": false,
9
+ "esmfold_config": null,
10
+ "hidden_act": "gelu",
11
+ "hidden_dropout_prob": 0.0,
12
+ "hidden_size": 1280,
13
+ "initializer_range": 0.02,
14
+ "intermediate_size": 5120,
15
+ "is_folding_model": false,
16
+ "layer_norm_eps": 1e-05,
17
+ "mask_token_id": 32,
18
+ "max_position_embeddings": 1026,
19
+ "model_type": "esm",
20
+ "num_attention_heads": 20,
21
+ "num_hidden_layers": 33,
22
+ "pad_token_id": 1,
23
+ "position_embedding_type": "rotary",
24
+ "token_dropout": true,
25
  "torch_dtype": "float32",
26
  "transformers_version": "4.49.0",
27
+ "use_cache": true,
28
+ "vocab_list": null,
29
+ "vocab_size": 33
30
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:60a8151bee68255d9064bbfdc2170764612ef8d251c1027fa3d7f12321916dbc
3
- size 2682482800
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:414be13553d235730cd6c247e44cbd6a06aedc9a3e32ed0e9d4ae9d408220e05
3
+ size 2609498088
runs/Mar04_19-02-49_torch-flash-large22-0-1/events.out.tfevents.1741114969.torch-flash-large22-0-1.331.0 CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ac8f300c7cd050539527e8820e8e2b20f4194aa69f208c6c0c4b425aeeec4080
3
- size 19278
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2f92739ce052064f7f335699dac84913908347d90079968a4812450d614c45f8
3
+ size 20724
runs/Mar04_22-41-26_torch-flash-large22-0-1/events.out.tfevents.1741128086.torch-flash-large22-0-1.2641.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4781b8c116c4a4932d79db74b7b8049c10347ff6bb6ea7b0e9d796cea03fb26b
3
+ size 4834
runs/Mar04_22-45-13_torch-flash-large22-0-1/events.out.tfevents.1741128313.torch-flash-large22-0-1.2923.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c6875e32f5baf652f0f41741750e06de6556027b0309a0eab0cf45eaefa778da
3
+ size 10223
runs/Mar04_22-46-17_torch-flash-large22-0-1/events.out.tfevents.1741128378.torch-flash-large22-0-1.3223.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:020255edf9d2ef047e9bdf706b286511bcd52aa1e6d22a2082a45d2d12fcc1d2
3
+ size 10223
runs/Mar04_22-47-36_torch-flash-large22-0-1/events.out.tfevents.1741128456.torch-flash-large22-0-1.3223.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4a2461360c0c587da2a9ed0d794f60ad9864a441dff92e60769a46957fe80ce1
3
+ size 10223
runs/Mar04_22-56-59_torch-flash-large22-0-1/events.out.tfevents.1741129019.torch-flash-large22-0-1.3223.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3879aa7c64121614f1e621b2fd310d1486dc6be48622143745707fee45bc4c65
3
+ size 10223
runs/Mar04_22-58-18_torch-flash-large22-0-1/events.out.tfevents.1741129098.torch-flash-large22-0-1.3223.3 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a854bd4e234531bb47351b92f677a328adc5f17d095af626f6d39be74e902a70
3
+ size 10223
runs/Mar07_21-08-56_torch-flash-large22-0-9/events.out.tfevents.1741381737.torch-flash-large22-0-9.466.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:922ba98da5c38505e773a1c258fb5362916c2d18865b2cebd66c58fb36704c8c
3
+ size 5105
runs/Mar07_21-11-48_torch-flash-large22-0-9/events.out.tfevents.1741381909.torch-flash-large22-0-9.679.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:262a1a64a492eea58d3d4768b88d6bf643a026dc9589f67062b8784d0e4b2865
3
+ size 5105
runs/Mar07_21-12-41_torch-flash-large22-0-9/events.out.tfevents.1741381962.torch-flash-large22-0-9.891.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61933e70ea7e1bcea417fe701b2b908457fdb183542a70f5297d0c2239cd00b3
3
+ size 5105
runs/Mar07_21-13-17_torch-flash-large22-0-9/events.out.tfevents.1741382040.torch-flash-large22-0-9.1038.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e747f0676a6456a562608085b640010656bbbe19c75df87530d5173d91987822
3
+ size 5105
runs/Mar07_21-19-47_torch-flash-large22-0-9/events.out.tfevents.1741382388.torch-flash-large22-0-9.1443.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4805a69faba6f8d41261516ff14cd4ae9bc7647fce0e997b10845387e4b462f5
3
+ size 6051
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:d60cd4fa81843b4806dea3364d37d3df9835095733d168d051c0b135e77b91aa
3
  size 5368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:497104d84493788ba6f9029b34e87263e741d66179363d27985c9e12854dd130
3
  size 5368